Morgan Funtowicz
committed on
Commit
·
922eee4
1
Parent(s):
960dd65
test(hfjobs): add instance type and size to deploy.json
Browse files
- .hfjobs/Dockerfile +3 -3
- .hfjobs/deploy.json +2 -1
.hfjobs/Dockerfile
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
FROM python:3.12
|
2 |
|
3 |
-
ENV ENDPOINT_URL="http://host.docker.internal:8000"
|
4 |
ENV ENDPOINT_API_KEY="undefined"
|
5 |
-
|
6 |
-
|
|
|
7 |
|
8 |
RUN --mount=type=bind,source=.hfjobs/requirements.txt,target=/opt/endpoint/tests/requirements.txt \
|
9 |
python -m pip install -r /opt/endpoint/tests/requirements.txt
|
|
|
1 |
FROM python:3.12
|
2 |
|
|
|
3 |
ENV ENDPOINT_API_KEY="undefined"
|
4 |
+
ARG ENDPOINT_URL="http://host.docker.internal:8000"
|
5 |
+
ARG ENDPOINT_NUM_SAMPLES=50
|
6 |
+
ARG ENDPOINT_TEST_SEED=31415926
|
7 |
|
8 |
RUN --mount=type=bind,source=.hfjobs/requirements.txt,target=/opt/endpoint/tests/requirements.txt \
|
9 |
python -m pip install -r /opt/endpoint/tests/requirements.txt
|
.hfjobs/deploy.json
CHANGED
@@ -1,6 +1,7 @@
|
|
1 |
{
|
2 |
"id": "deploy-whisper-vllm-gpu",
|
3 |
"description": "Build and deploy vLLM based Whisper on Inference Endpoint",
|
4 |
-
"
|
|
|
5 |
"model": "openai/whisper-large-v3-turbo"
|
6 |
}
|
|
|
1 |
{
|
2 |
"id": "deploy-whisper-vllm-gpu",
|
3 |
"description": "Build and deploy vLLM based Whisper on Inference Endpoint",
|
4 |
+
"instance_type": "nvidia-l4",
|
5 |
+
"instance_size": "x1",
|
6 |
"model": "openai/whisper-large-v3-turbo"
|
7 |
}
|