@@ -4,98 +4,168 @@ stages:
4
4
steps :
5
5
- name : gsm8k_small_g3_tp1
6
6
flavor : g3
7
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-small.txt -t 1
7
+ command : >
8
+ cd .jenkins/lm-eval-harness &&
9
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
10
+ bash run-tests.sh -c configs/models-small.txt -t 1
8
11
- name : gsm8k_small_g3_tp2
9
12
flavor : g3.s
10
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-small.txt -t 2
13
+ command : >
14
+ cd .jenkins/lm-eval-harness &&
15
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
16
+ bash run-tests.sh -c configs/models-small.txt -t 2
11
17
- name : gsm8k_small_g2_tp1
12
18
flavor : g2
13
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-small.txt -t 1
19
+ command : >
20
+ cd .jenkins/lm-eval-harness &&
21
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
22
+ bash run-tests.sh -c configs/models-small.txt -t 1
14
23
- name : gsm8k_small_g2_tp2
15
24
flavor : g2.s
16
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-small.txt -t 2
25
+ command : >
26
+ cd .jenkins/lm-eval-harness &&
27
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
28
+ bash run-tests.sh -c configs/models-small.txt -t 2
17
29
- name : test_gsm8k_large_models
18
30
steps :
19
31
- name : gsm8k_large_g3_tp2
20
32
flavor : g3.s
21
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-large.txt -t 2
33
+ command : >
34
+ cd .jenkins/lm-eval-harness &&
35
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
36
+ bash run-tests.sh -c configs/models-large.txt -t 2
22
37
- name : gsm8k_large_g2_tp4
23
38
flavor : g2.m
24
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-large.txt -t 4
39
+ command : >
40
+ cd .jenkins/lm-eval-harness &&
41
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
42
+ bash run-tests.sh -c configs/models-large.txt -t 4
25
43
- name : test_gsm8k_fp8
26
44
steps :
27
45
- name : gsm8k_small_g3_tp1_fp8
28
46
flavor : g3
29
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-fp8.txt -t 1
47
+ command : >
48
+ cd .jenkins/lm-eval-harness &&
49
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
50
+ bash run-tests.sh -c configs/models-fp8.txt -t 1
30
51
- name : gsm8k_small_g3_tp2_fp8
31
52
flavor : g3.s
32
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-fp8.txt -t 2
53
+ command : >
54
+ cd .jenkins/lm-eval-harness &&
55
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
56
+ bash run-tests.sh -c configs/models-fp8.txt -t 2
33
57
- name : test_gsm8k_mss
34
58
steps :
35
59
- name : gsm8k_small_g3_tp1_mss
36
60
flavor : g3
37
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-mss.txt -t 1
61
+ command : >
62
+ cd .jenkins/lm-eval-harness &&
63
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
64
+ bash run-tests.sh -c configs/models-mss.txt -t 1
38
65
- name : gsm8k_small_g2_tp1_mss
39
66
flavor : g2
40
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-mss.txt -t 1
67
+ command : >
68
+ cd .jenkins/lm-eval-harness &&
69
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
70
+ bash run-tests.sh -c configs/models-mss.txt -t 1
41
71
- name : gsm8k_small_g3_tp2_mss
42
72
flavor : g3.s
43
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-mss.txt -t 2
73
+ command : >
74
+ cd .jenkins/lm-eval-harness &&
75
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
76
+ bash run-tests.sh -c configs/models-mss.txt -t 2
44
77
- name : gsm8k_small_g2_tp2_mss
45
78
flavor : g2.s
46
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-mss.txt -t 2
79
+ command : >
80
+ cd .jenkins/lm-eval-harness &&
81
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
82
+ bash run-tests.sh -c configs/models-mss.txt -t 2
47
83
- name : gsm8k_small_g2_tp1_spec_decode
48
84
flavor : g2
49
- command : cd .jenkins/lm-eval-harness && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-mss.txt -t 1
85
+ command : >
86
+ cd .jenkins/lm-eval-harness &&
87
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
88
+ bash run-tests.sh -c configs/models-mss.txt -t 1
50
89
- name : test_gsm8k_spec_decode
51
90
steps :
52
91
- name : gsm8k_small_g2_tp1_mlp_spec_decode
53
92
flavor : g2
54
- command : PT_HPU_LAZY_MODE=0 TORCH_COMPILE_DISABLE=true VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True pytest -v tests/spec_decode/e2e/test_mlp_correctness.py::test_mlp_e2e_greedy_correctness
93
+ command : >
94
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 TORCH_COMPILE_DISABLE=true VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True
95
+ pytest -v tests/spec_decode/e2e/test_mlp_correctness.py::test_mlp_e2e_greedy_correctness
55
96
- name : gsm8k_small_g2_tp1_medusa_spec_decode
56
97
flavor : g2
57
- command : PT_HPU_LAZY_MODE=0 TORCH_COMPILE_DISABLE=true VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True pytest -v tests/spec_decode/e2e/test_medusa_correctness.py::test_medusa_e2e_greedy_correctness
98
+ command : >
99
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 TORCH_COMPILE_DISABLE=true VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True
100
+ pytest -v tests/spec_decode/e2e/test_medusa_correctness.py::test_medusa_e2e_greedy_correctness
58
101
- name : gsm8k_small_g2_tp1_eagle_spec_decode
59
102
flavor : g2
60
- command : PT_HPU_LAZY_MODE=0 VLLM_COS_SIN_RECOMPUTE=true TORCH_COMPILE_DISABLE=true VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True pytest -v tests/spec_decode/e2e/test_eagle_correctness.py::test_eagle_e2e_greedy_correctness
103
+ command : >
104
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 VLLM_COS_SIN_RECOMPUTE=true TORCH_COMPILE_DISABLE=true VLLM_CONTIGUOUS_PA=false VLLM_SKIP_WARMUP=True
105
+ pytest -v tests/spec_decode/e2e/test_eagle_correctness.py::test_eagle_e2e_greedy_correctness
61
106
- name : tests_lora
62
107
steps :
63
108
- name : test_llama_lora
64
109
flavor : g2
65
- command : PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true pytest -v tests/lora/test_llama_hpu.py::test_llama_lora_1x
110
+ command : >
111
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true
112
+ pytest -v tests/lora/test_llama_hpu.py::test_llama_lora_1x
66
113
- name : test_multilora
67
114
flavor : g2
68
- command : PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true pytest -v tests/lora/test_multilora_hpu.py::test_llama_multilora_1x
115
+ command : >
116
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true
117
+ pytest -v tests/lora/test_multilora_hpu.py::test_llama_multilora_1x
69
118
# - name: test_long_context
70
119
# flavor: g2
71
- # command: PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true pytest -v tests/lora/test_long_context_hpu.py::test_quality
120
+ # command: VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true pytest -v tests/lora/test_long_context_hpu.py::test_quality
72
121
- name : tests_multimodal
73
122
steps :
74
123
- name : multimodal_small_g3_tp1
75
124
flavor : g3
76
- command : cd .jenkins/vision && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-small.txt -t 1
125
+ command : >
126
+ cd .jenkins/vision &&
127
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
128
+ bash run-tests.sh -c configs/models-small.txt -t 1
77
129
- name : multimodal_small_g3_tp2
78
130
flavor : g3.s
79
- command : cd .jenkins/vision && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-small.txt -t 2
131
+ command : >
132
+ cd .jenkins/vision &&
133
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
134
+ bash run-tests.sh -c configs/models-small.txt -t 2
80
135
- name : multimodal_small_g3_tp1_mss
81
136
flavor : g3
82
- command : cd .jenkins/vision && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-mss.txt -t 1
137
+ command : >
138
+ cd .jenkins/vision && VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
139
+ bash run-tests.sh -c configs/models-mss.txt -t 1
83
140
- name : multimodal_small_g3_tp2_mss
84
141
flavor : g3.s
85
- command : cd .jenkins/vision && PT_HPU_LAZY_MODE=0 bash run-tests.sh -c configs/models-mss.txt -t 2
142
+ command : >
143
+ cd .jenkins/vision &&
144
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
145
+ bash run-tests.sh -c configs/models-mss.txt -t 2
86
146
- name : tests_int4_quantization
87
147
steps :
88
148
- name : test_awq
89
149
flavor : g2
90
- command : PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true pytest -v tests/quantization/test_awq.py::test_awq
150
+ command : >
151
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true
152
+ pytest -v tests/quantization/test_awq.py::test_awq
91
153
- name : test_gptq
92
154
flavor : g2
93
- command : PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true pytest -v tests/quantization/test_gptq.py::test_gptq
155
+ command : >
156
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0 VLLM_SKIP_WARMUP=true
157
+ pytest -v tests/quantization/test_gptq.py::test_gptq
94
158
- name : tests_guided_decode
95
159
steps :
96
160
- name : test_lazy_outlines
97
161
flavor : g2
98
- command : export VLLM_SKIP_WARMUP=true && pip install -e tests/vllm_test_utils && PT_HPU_LAZY_MODE=0 pytest -v tests/entrypoints/llm/test_lazy_outlines.py -s -vvv --log-cli-level=INFO
162
+ command : >
163
+ export VLLM_SKIP_WARMUP=true && pip install -e tests/vllm_test_utils &&
164
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
165
+ pytest -v tests/entrypoints/llm/test_lazy_outlines.py -s -vvv --log-cli-level=INFO
99
166
- name : test_guided_generate
100
167
flavor : g2
101
- command : export VLLM_SKIP_WARMUP=true && pip install -e tests/vllm_test_utils && PT_HPU_LAZY_MODE=0 pytest -v tests/entrypoints/llm/test_guided_generate.py -s -vvv --log-cli-level=INFO
168
+ command : >
169
+ export VLLM_SKIP_WARMUP=true && pip install -e tests/vllm_test_utils &&
170
+ VLLM_T_COMPILE_FULLGRAPH=True PT_HPU_LAZY_MODE=0
171
+ pytest -v tests/entrypoints/llm/test_guided_generate.py -s -vvv --log-cli-level=INFO
0 commit comments