@@ -571,44 +571,98 @@ steps:
571
571
572
572
# #### models test #####
573
573
574
- - label : Basic Models Test # 57min
575
- timeout_in_minutes : 75
574
# Initialization check for a small subset of models. The step depends on
# everything under vllm/ and on the initialization test file itself.
- label: Basic Models Tests (Initialization)
  timeout_in_minutes: 45
  mirror_hardwares: [amdexperimental]
  torch_nightly: true
  source_file_dependencies:
  - vllm/
  - tests/models/test_initialization.py
  commands:
  # Only the small-subset initialization test is selected here (by node id).
  - pytest -v -s models/test_initialization.py::test_can_initialize_small_subset
587
584
588
- - label : Language Models Test (Standard) # 35min
585
# Initialization tests for the models not covered by the small subset.
# The work is split into shards, one per parallel job (see `parallelism`).
- label: Basic Models Tests (Extra Initialization) %N
  timeout_in_minutes: 45
  mirror_hardwares: [amdexperimental]
  torch_nightly: true
  source_file_dependencies:
  - vllm/model_executor/models/
  - tests/models/test_initialization.py
  commands:
  # Only when vLLM model source is modified: test initialization of a large
  # subset of supported models (the complement of the small subset run by the
  # "Basic Models Tests (Initialization)" step). Also runs when the model
  # initialization test file itself is modified.
  #
  # Folded block scalar: the lines below are joined with single spaces into
  # one command string, so no trailing backslashes are used. Shard count and
  # shard id come from BUILDKITE_PARALLEL_JOB_COUNT / BUILDKITE_PARALLEL_JOB.
  - >-
    pytest -v -s models/test_initialization.py
    -k 'not test_can_initialize_small_subset'
    --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT
    --shard-id=$$BUILDKITE_PARALLEL_JOB
  parallelism: 2
601
+
602
# Remaining basic model tests (transformers, registry, utils, vision).
- label: Basic Models Tests (Other)
  timeout_in_minutes: 45
  mirror_hardwares: [amdexperimental]
  torch_nightly: true
  source_file_dependencies:
  - vllm/
  - tests/models/test_transformers.py
  - tests/models/test_registry.py
  - tests/models/test_utils.py
  - tests/models/test_vision.py
  commands:
  # All four test files are passed to a single pytest invocation.
  # Folded block scalar: the lines below are joined with single spaces into
  # one command string, so no trailing backslashes are used.
  - >-
    pytest -v -s models/test_transformers.py
    models/test_registry.py
    models/test_utils.py
    models/test_vision.py
617
+
618
# Standard language model tests, minus the tests marked slow_test.
- label: Language Models Tests (Standard)
  timeout_in_minutes: 25
  mirror_hardwares: [amdexperimental]
  torch_nightly: true
  source_file_dependencies:
  - vllm/
  - tests/models/language
  commands:
  # Print the installed torch-related packages into the job log.
  - pip freeze | grep -E 'torch'
  # Test standard language models, excluding a subset of slow tests.
  - pytest -v -s models/language -m 'core_model and (not slow_test)'
598
629
599
- - label : Language Models Test (Hybrid) # 35 min
630
# Slow subset of the standard language model tests, split into shards, one
# per parallel job (see `parallelism`).
- label: Language Models Tests (Extra Standard) %N
  timeout_in_minutes: 45
  mirror_hardwares: [amdexperimental]
  torch_nightly: true
  source_file_dependencies:
  - vllm/model_executor/models/
  - tests/models/language/pooling/test_embedding.py
  - tests/models/language/generation/test_common.py
  - tests/models/language/pooling/test_classification.py
  commands:
  # Shard the slow subset of standard language model tests. Only run when
  # model source is modified, or when the listed test files are modified.
  - pip freeze | grep -E 'torch'
  # Folded block scalar: the lines below are joined with single spaces into
  # one command string, so no trailing backslashes are used. Shard count and
  # shard id come from BUILDKITE_PARALLEL_JOB_COUNT / BUILDKITE_PARALLEL_JOB.
  - >-
    pytest -v -s models/language -m 'core_model and slow_test'
    --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT
    --shard-id=$$BUILDKITE_PARALLEL_JOB
  parallelism: 2
647
+
648
# Hybrid language model generation tests, split into shards, one per
# parallel job (see `parallelism`).
- label: Language Models Tests (Hybrid) %N
  timeout_in_minutes: 75
  mirror_hardwares: [amdexperimental]
  torch_nightly: true
  source_file_dependencies:
  - vllm/
  - tests/models/language/generation
  commands:
  # Install fast path packages for testing against transformers
  # Note: also needed to run plamo2 model in vLLM
  # NOTE(review): the package@tag suffixes were unreadable in the reviewed
  # copy; confirm mamba@v2.2.5 and causal-conv1d@v1.5.2 before merging.
  - uv pip install --system --no-build-isolation 'git+https://github.com/state-spaces/mamba@v2.2.5'
  - uv pip install --system --no-build-isolation 'git+https://github.com/Dao-AILab/causal-conv1d@v1.5.2'
  # Shard hybrid language model tests.
  # Folded block scalar: the lines below are joined with single spaces into
  # one command string, so no trailing backslashes are used. Shard count and
  # shard id come from BUILDKITE_PARALLEL_JOB_COUNT / BUILDKITE_PARALLEL_JOB.
  - >-
    pytest -v -s models/language/generation
    -m hybrid_model
    --num-shards=$$BUILDKITE_PARALLEL_JOB_COUNT
    --shard-id=$$BUILDKITE_PARALLEL_JOB
  parallelism: 2
612
666
613
667
- label : Language Models Test (Extended Generation) # 80min
614
668
timeout_in_minutes : 110
0 commit comments