Skip to content

Commit 388d760

Browse files
committed
added test
1 parent caa789d commit 388d760

File tree

1 file changed

+17
-0
lines changed

1 file changed

+17
-0
lines changed

src/recipe.yaml

Lines changed: 17 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -379,6 +379,23 @@
379 379
extra_labels:
380 380
openllm_alias: 70b
381 381
model_name: nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
382+
'llama3.1-nemotron:70b-instruct-fp16-TEST':
383+
project: vllm-chat
384+
service_config:
385+
name: llama3.1-nemotron
386+
traffic:
387+
timeout: 300
388+
resources:
389+
gpu: 2
390+
gpu_type: nvidia-a100-80gb
391+
engine_config:
392+
model: nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
393+
max_model_len: 128000
394+
tensor_parallel_size: 2
395+
extra_labels:
396+
openllm_alias: 70b
397+
model_name: nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
398+
382 399
'llama3.1:70b-instruct-awq-4bit':
383 400
project: vllm-chat
384 401
service_config:

0 commit comments

Comments
 (0)