File tree Expand file tree Collapse file tree 2 files changed +14
-1
lines changed
models/language/generation Expand file tree Collapse file tree 2 files changed +14
-1
lines changed Original file line number Diff line number Diff line change @@ -129,6 +129,18 @@ if [ $? -ne 0 ]; then
129129fi
130130echo " Test with granite-8b passed"
131131
132+ # used to check asynchronous scheduling
133+ echo " Testing GSM8K on granite-8b with async scheduling"
134+ echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 ASYNC_SCHEDULING=1 \
135+ pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
136+ VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 ASYNC_SCHEDULING=1 \
137+ pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
138+ if [ $? -ne 0 ]; then
139+ echo " Error: Test failed for granite-8b + async_scheduling" >&2
140+ exit -1
141+ fi
142+ echo " Test with granite-8b + async_scheduling passed"
143+
132144# used to check MLA + MOE
133145echo " Testing GSM8K on deepseek v2 lite"
134146# deepseek-R1
Original file line number Diff line number Diff line change @@ -23,10 +23,11 @@ def launch_lm_eval(eval_config):
2323 enforce_eager = os .environ .get ('ENFORCE_EAGER' , 'False' ).lower () in ['true' , '1' ]
2424 kv_cache_dtype = os .environ .get ('KV_CACHE_DTYPE' , None )
2525 task = eval_config .get ('tasks' , 'gsm8k' )
26+ async_scheduling = os .environ .get ('ASYNC_SCHEDULING' , 'False' ).lower () in ['true' , '1' ]
2627 model_args = {
2728 'pretrained' : eval_config ['model_name' ],
2829 'tensor_parallel_size' : tp_size ,
29- 'async_scheduling' : True ,
30+ 'async_scheduling' : async_scheduling ,
3031 'enforce_eager' : enforce_eager ,
3132 'enable_prefix_caching' : enable_apc ,
3233 'add_bos_token' : True ,
You can’t perform that action at this time.
0 commit comments