@@ -15,7 +15,7 @@ class TestFile:
15
15
"per-commit" : [
16
16
TestFile ("models/lora/test_lora.py" , 76 ),
17
17
TestFile ("models/lora/test_lora_backend.py" , 420 ),
18
- TestFile ("models/lora/test_multi_lora_backend.py" , 144 ),
18
+ TestFile ("models/lora/test_multi_lora_backend.py" , 60 ),
19
19
TestFile ("models/test_embedding_models.py" , 35 ),
20
20
TestFile ("models/test_generation_models.py" , 103 ),
21
21
TestFile ("models/test_grok_models.py" , 60 ),
@@ -28,15 +28,15 @@ class TestFile:
28
28
TestFile ("test_chunked_prefill.py" , 336 ),
29
29
TestFile ("test_eagle_infer.py" , 500 ),
30
30
TestFile ("test_ebnf_constrained.py" ),
31
- TestFile ("test_fp8_kernel.py" , 2 ),
31
+ TestFile ("test_fp8_kernel.py" , 8 ),
32
32
TestFile ("test_embedding_openai_server.py" , 36 ),
33
33
TestFile ("test_hidden_states.py" , 55 ),
34
- TestFile ("test_int8_kernel.py" , 1 ),
34
+ TestFile ("test_int8_kernel.py" , 8 ),
35
35
TestFile ("test_input_embeddings.py" , 38 ),
36
36
TestFile ("test_json_constrained.py" , 98 ),
37
37
TestFile ("test_large_max_new_tokens.py" , 41 ),
38
38
TestFile ("test_metrics.py" , 32 ),
39
- TestFile ("test_mla.py" , 92 ),
39
+ TestFile ("test_mla.py" , 162 ),
40
40
TestFile ("test_mla_deepseek_v3.py" , 221 ),
41
41
TestFile ("test_mla_int8_deepseek_v3.py" , 522 ),
42
42
TestFile ("test_mla_flashinfer.py" , 395 ),
@@ -68,23 +68,23 @@ class TestFile:
68
68
TestFile ("test_vertex_endpoint.py" , 31 ),
69
69
TestFile ("test_vision_chunked_prefill.py" , 223 ),
70
70
TestFile ("test_vlm_accuracy.py" , 60 ),
71
- TestFile ("test_vision_openai_server.py" , 344 ),
72
- TestFile ("test_fim_completion.py" , 120 ),
71
+ TestFile ("test_vision_openai_server.py" , 537 ),
72
+ TestFile ("test_fim_completion.py" , 40 ),
73
73
TestFile ("test_w8a8_quantization.py" , 46 ),
74
- TestFile ("test_eval_fp8_accuracy.py" , 172 ),
74
+ TestFile ("test_eval_fp8_accuracy.py" , 303 ),
75
75
TestFile ("test_create_kvindices.py" , 2 ),
76
76
TestFile ("test_hicache.py" , 60 ),
77
77
TestFile ("test_hicache_mla.py" , 90 ),
78
78
],
79
79
"per-commit-2-gpu" : [
80
+ TestFile ("models/lora/test_lora_tp.py" , 300 ),
80
81
TestFile ("test_data_parallelism.py" , 90 ),
81
82
TestFile ("test_dp_attention.py" , 90 ),
83
+ TestFile ("test_mla_tp.py" , 420 ),
84
+ TestFile ("test_moe_ep.py" , 220 ),
85
+ TestFile ("test_patch_torch.py" , 30 ),
82
86
TestFile ("test_update_weights_from_distributed.py" , 100 ),
83
87
TestFile ("test_verl_engine.py" , 100 ),
84
- TestFile ("test_patch_torch.py" , 30 ),
85
- TestFile ("test_moe_ep.py" , 220 ),
86
- TestFile ("test_mla_tp.py" , 420 ),
87
- TestFile ("test_lora_tp.py" , 300 ),
88
88
],
89
89
"nightly" : [
90
90
TestFile ("test_nightly_gsm8k_eval.py" ),
0 commit comments