Morgan Funtowicz committed on
Commit
922eee4
·
1 Parent(s): 960dd65

test(hfjobs): add instance type and size to deploy.json

Browse files
Files changed (2) hide show
  1. .hfjobs/Dockerfile +3 -3
  2. .hfjobs/deploy.json +2 -1
.hfjobs/Dockerfile CHANGED
@@ -1,9 +1,9 @@
1
  FROM python:3.12
2
 
3
- ENV ENDPOINT_URL="http://host.docker.internal:8000"
4
  ENV ENDPOINT_API_KEY="undefined"
5
- ENV ENDPOINT_NUM_SAMPLES=50
6
- ENV ENDPOINT_TEST_SEED=31415926
 
7
 
8
  RUN --mount=type=bind,source=.hfjobs/requirements.txt,target=/opt/endpoint/tests/requirements.txt \
9
  python -m pip install -r /opt/endpoint/tests/requirements.txt
 
1
  FROM python:3.12
2
 
 
3
  ENV ENDPOINT_API_KEY="undefined"
4
+ ARG ENDPOINT_URL="http://host.docker.internal:8000"
5
+ ARG ENDPOINT_NUM_SAMPLES=50
6
+ ARG ENDPOINT_TEST_SEED=31415926
7
 
8
  RUN --mount=type=bind,source=.hfjobs/requirements.txt,target=/opt/endpoint/tests/requirements.txt \
9
  python -m pip install -r /opt/endpoint/tests/requirements.txt
.hfjobs/deploy.json CHANGED
@@ -1,6 +1,7 @@
1
  {
2
  "id": "deploy-whisper-vllm-gpu",
3
  "description": "Build and deploy vLLM based Whisper on Inference Endpoint",
4
- "hardware": "l4x1",
 
5
  "model": "openai/whisper-large-v3-turbo"
6
  }
 
1
  {
2
  "id": "deploy-whisper-vllm-gpu",
3
  "description": "Build and deploy vLLM based Whisper on Inference Endpoint",
4
+ "instance_type": "nvidia-l4",
5
+ "instance_size": "x1",
6
  "model": "openai/whisper-large-v3-turbo"
7
  }