Skip to content

Commit fa3b2c0

Browse files
committed
Add ci
Signed-off-by: Tianmu Li <[email protected]>
1 parent ab4d28a commit fa3b2c0

File tree

2 files changed

+14
-1
lines changed

2 files changed

+14
-1
lines changed

tests/full_tests/ci_gsm8k_tests.sh

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -129,6 +129,18 @@ if [ $? -ne 0 ]; then
129129
fi
130130
echo "Test with granite-8b passed"
131131

132+
# used to check asynchronous scheduling
133+
echo "Testing GSM8K on granite-8b with async scheduling"
134+
echo VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 ASYNC_SCHEDULING=1 \
135+
pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
136+
VLLM_CONTIGUOUS_PA=False VLLM_SKIP_WARMUP=True PT_HPU_LAZY_MODE=1 VLLM_USE_V1=1 ASYNC_SCHEDULING=1 \
137+
pytest -v -s vllm-gaudi/tests/models/language/generation/test_common.py --model_card_path vllm-gaudi/tests/full_tests/model_cards/granite-8b.yaml
138+
if [ $? -ne 0 ]; then
139+
echo "Error: Test failed for granite-8b + async_scheduling" >&2
140+
exit -1
141+
fi
142+
echo "Test with granite-8b + async_scheduling passed"
143+
132144
# used to check MLA + MOE
133145
echo "Testing GSM8K on deepseek v2 lite"
134146
# deepseek-R1

tests/models/language/generation/test_common.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -23,10 +23,11 @@ def launch_lm_eval(eval_config):
2323
enforce_eager = os.environ.get('ENFORCE_EAGER', 'False').lower() in ['true', '1']
2424
kv_cache_dtype = os.environ.get('KV_CACHE_DTYPE', None)
2525
task = eval_config.get('tasks', 'gsm8k')
26+
async_scheduling = os.environ.get('ASYNC_SCHEDULING', 'False').lower() in ['true', '1']
2627
model_args = {
2728
'pretrained': eval_config['model_name'],
2829
'tensor_parallel_size': tp_size,
29-
'async_scheduling': True,
30+
'async_scheduling': async_scheduling,
3031
'enforce_eager': enforce_eager,
3132
'enable_prefix_caching': enable_apc,
3233
'add_bos_token': True,

0 commit comments

Comments
 (0)