File tree
21 files changed
+33
-33
lines changed- benchmarks
- csrc/mamba/causal_conv1d
- vllm
- attention
- backends
- mla
- ops
- benchmarks
- engine/output_processor
- entrypoints/openai/tool_parsers
- model_executor/layers/quantization/kernels/scaled_mm
- platforms
- reasoning
- third_party
- v1
- attention/backends/mla
- executor
- worker
21 files changed
+33
-33
lines changedDiff for: benchmarks/benchmark_serving.py
+2-2
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
921 | 921 |
| |
922 | 922 |
| |
923 | 923 |
| |
924 |
| - | |
| 924 | + | |
925 | 925 |
| |
926 | 926 |
| |
927 | 927 |
| |
928 | 928 |
| |
929 | 929 |
| |
930 | 930 |
| |
931 | 931 |
| |
932 |
| - | |
| 932 | + | |
933 | 933 |
| |
934 | 934 |
| |
935 | 935 |
| |
|
+2-2
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
963 | 963 |
| |
964 | 964 |
| |
965 | 965 |
| |
966 |
| - | |
| 966 | + | |
967 | 967 |
| |
968 | 968 |
| |
969 | 969 |
| |
970 | 970 |
| |
971 | 971 |
| |
972 | 972 |
| |
973 | 973 |
| |
974 |
| - | |
| 974 | + | |
975 | 975 |
| |
976 | 976 |
| |
977 | 977 |
| |
|
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
422 | 422 |
| |
423 | 423 |
| |
424 | 424 |
| |
425 |
| - | |
| 425 | + | |
426 | 426 |
| |
427 | 427 |
| |
428 | 428 |
| |
|
Diff for: vllm/attention/backends/flash_attn.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
326 | 326 |
| |
327 | 327 |
| |
328 | 328 |
| |
329 |
| - | |
| 329 | + | |
330 | 330 |
| |
331 | 331 |
| |
332 | 332 |
| |
|
Diff for: vllm/attention/backends/hpu_attn.py
+3-3
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
152 | 152 |
| |
153 | 153 |
| |
154 | 154 |
| |
155 |
| - | |
156 |
| - | |
| 155 | + | |
| 156 | + | |
157 | 157 |
| |
158 | 158 |
| |
159 |
| - | |
| 159 | + | |
160 | 160 |
| |
161 | 161 |
| |
162 | 162 |
| |
|
Diff for: vllm/attention/backends/mla/common.py
+3-3
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
83 | 83 |
| |
84 | 84 |
| |
85 | 85 |
| |
86 |
| - | |
87 |
| - | |
| 86 | + | |
| 87 | + | |
88 | 88 |
| |
89 | 89 |
| |
90 | 90 |
| |
| |||
667 | 667 |
| |
668 | 668 |
| |
669 | 669 |
| |
670 |
| - | |
| 670 | + | |
671 | 671 |
| |
672 | 672 |
| |
673 | 673 |
| |
|
Diff for: vllm/attention/backends/xformers.py
+3-3
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
414 | 414 |
| |
415 | 415 |
| |
416 | 416 |
| |
417 |
| - | |
418 |
| - | |
| 417 | + | |
| 418 | + | |
419 | 419 |
| |
420 | 420 |
| |
421 |
| - | |
| 421 | + | |
422 | 422 |
| |
423 | 423 |
| |
424 | 424 |
| |
|
Diff for: vllm/attention/ops/nki_flash_attn.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
446 | 446 |
| |
447 | 447 |
| |
448 | 448 |
| |
449 |
| - | |
| 449 | + | |
450 | 450 |
| |
451 | 451 |
| |
452 | 452 |
| |
|
Diff for: vllm/benchmarks/serve.py
+2-2
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
724 | 724 |
| |
725 | 725 |
| |
726 | 726 |
| |
727 |
| - | |
| 727 | + | |
728 | 728 |
| |
729 | 729 |
| |
730 | 730 |
| |
731 | 731 |
| |
732 | 732 |
| |
733 | 733 |
| |
734 |
| - | |
| 734 | + | |
735 | 735 |
| |
736 | 736 |
| |
737 | 737 |
| |
|
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
93 | 93 |
| |
94 | 94 |
| |
95 | 95 |
| |
96 |
| - | |
| 96 | + | |
97 | 97 |
| |
98 | 98 |
| |
99 | 99 |
| |
|
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
98 | 98 |
| |
99 | 99 |
| |
100 | 100 |
| |
101 |
| - | |
| 101 | + | |
102 | 102 |
| |
103 | 103 |
| |
104 | 104 |
| |
|
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
29 | 29 |
| |
30 | 30 |
| |
31 | 31 |
| |
32 |
| - | |
| 32 | + | |
33 | 33 |
| |
34 | 34 |
| |
35 | 35 |
| |
|
Diff for: vllm/platforms/cpu.py
+3-3
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
69 | 69 |
| |
70 | 70 |
| |
71 | 71 |
| |
72 |
| - | |
| 72 | + | |
73 | 73 |
| |
74 | 74 |
| |
75 |
| - | |
| 75 | + | |
76 | 76 |
| |
77 |
| - | |
| 77 | + | |
78 | 78 |
| |
79 | 79 |
| |
80 | 80 |
| |
|
Diff for: vllm/platforms/interface.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
231 | 231 |
| |
232 | 232 |
| |
233 | 233 |
| |
234 |
| - | |
| 234 | + | |
235 | 235 |
| |
236 | 236 |
| |
237 | 237 |
| |
|
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
60 | 60 |
| |
61 | 61 |
| |
62 | 62 |
| |
63 |
| - | |
| 63 | + | |
64 | 64 |
| |
65 | 65 |
| |
66 | 66 |
| |
|
Diff for: vllm/sampling_params.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
101 | 101 |
| |
102 | 102 |
| |
103 | 103 |
| |
104 |
| - | |
| 104 | + | |
105 | 105 |
| |
106 | 106 |
| |
107 | 107 |
| |
|
Diff for: vllm/third_party/pynvml.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
1119 | 1119 |
| |
1120 | 1120 |
| |
1121 | 1121 |
| |
1122 |
| - | |
| 1122 | + | |
1123 | 1123 |
| |
1124 | 1124 |
| |
1125 | 1125 |
| |
|
+2-2
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
83 | 83 |
| |
84 | 84 |
| |
85 | 85 |
| |
86 |
| - | |
87 |
| - | |
| 86 | + | |
| 87 | + | |
88 | 88 |
| |
89 | 89 |
| |
90 | 90 |
| |
|
Diff for: vllm/v1/executor/multiproc_executor.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
326 | 326 |
| |
327 | 327 |
| |
328 | 328 |
| |
329 |
| - | |
| 329 | + | |
330 | 330 |
| |
331 | 331 |
| |
332 | 332 |
| |
|
Diff for: vllm/v1/worker/gpu_model_runner.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
998 | 998 |
| |
999 | 999 |
| |
1000 | 1000 |
| |
1001 |
| - | |
| 1001 | + | |
1002 | 1002 |
| |
1003 | 1003 |
| |
1004 | 1004 |
| |
|
Diff for: vllm/v1/worker/tpu_model_runner.py
+1-1
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
652 | 652 |
| |
653 | 653 |
| |
654 | 654 |
| |
655 |
| - | |
| 655 | + | |
656 | 656 |
| |
657 | 657 |
| |
658 | 658 |
| |
|
0 commit comments