File tree
8 files changed
+255
-32
lines changed- csrc/quantization/cutlass_w8a8
- moe
- vllm/model_executor/layers/quantization/compressed_tensors
8 files changed
+255
-32
lines changedLines changed: 21 additions & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
577 | 577 |
| |
578 | 578 |
| |
579 | 579 |
| |
580 |
| - | |
| 580 | + | |
581 | 581 |
| |
582 | 582 |
| |
583 | 583 |
| |
| |||
595 | 595 |
| |
596 | 596 |
| |
597 | 597 |
| |
| 598 | + | |
| 599 | + | |
| 600 | + | |
| 601 | + | |
| 602 | + | |
| 603 | + | |
| 604 | + | |
| 605 | + | |
| 606 | + | |
| 607 | + | |
| 608 | + | |
| 609 | + | |
| 610 | + | |
| 611 | + | |
| 612 | + | |
| 613 | + | |
| 614 | + | |
| 615 | + | |
| 616 | + | |
| 617 | + | |
598 | 618 |
| |
599 | 619 |
| |
600 | 620 |
| |
|
Lines changed: 9 additions & 4 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
18 | 18 |
| |
19 | 19 |
| |
20 | 20 |
| |
21 |
| - | |
22 | 21 |
| |
23 | 22 |
| |
24 | 23 |
| |
| |||
33 | 32 |
| |
34 | 33 |
| |
35 | 34 |
| |
36 |
| - | |
| 35 | + | |
37 | 36 |
| |
38 | 37 |
| |
39 | 38 |
| |
| |||
43 | 42 |
| |
44 | 43 |
| |
45 | 44 |
| |
| 45 | + | |
46 | 46 |
| |
47 | 47 |
| |
48 | 48 |
| |
| |||
77 | 77 |
| |
78 | 78 |
| |
79 | 79 |
| |
80 |
| - | |
| 80 | + | |
81 | 81 |
| |
82 | 82 |
| |
83 | 83 |
| |
| |||
156 | 156 |
| |
157 | 157 |
| |
158 | 158 |
| |
| 159 | + | |
| 160 | + | |
| 161 | + | |
| 162 | + | |
| 163 | + | |
159 | 164 |
| |
160 | 165 |
| |
161 |
| - | |
| 166 | + | |
162 | 167 |
| |
163 | 168 |
| |
164 | 169 |
| |
|
Lines changed: 140 additions & 0 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
| 1 | + | |
| 2 | + | |
| 3 | + | |
| 4 | + | |
| 5 | + | |
| 6 | + | |
| 7 | + | |
| 8 | + | |
| 9 | + | |
| 10 | + | |
| 11 | + | |
| 12 | + | |
| 13 | + | |
| 14 | + | |
| 15 | + | |
| 16 | + | |
| 17 | + | |
| 18 | + | |
| 19 | + | |
| 20 | + | |
| 21 | + | |
| 22 | + | |
| 23 | + | |
| 24 | + | |
| 25 | + | |
| 26 | + | |
| 27 | + | |
| 28 | + | |
| 29 | + | |
| 30 | + | |
| 31 | + | |
| 32 | + | |
| 33 | + | |
| 34 | + | |
| 35 | + | |
| 36 | + | |
| 37 | + | |
| 38 | + | |
| 39 | + | |
| 40 | + | |
| 41 | + | |
| 42 | + | |
| 43 | + | |
| 44 | + | |
| 45 | + | |
| 46 | + | |
| 47 | + | |
| 48 | + | |
| 49 | + | |
| 50 | + | |
| 51 | + | |
| 52 | + | |
| 53 | + | |
| 54 | + | |
| 55 | + | |
| 56 | + | |
| 57 | + | |
| 58 | + | |
| 59 | + | |
| 60 | + | |
| 61 | + | |
| 62 | + | |
| 63 | + | |
| 64 | + | |
| 65 | + | |
| 66 | + | |
| 67 | + | |
| 68 | + | |
| 69 | + | |
| 70 | + | |
| 71 | + | |
| 72 | + | |
| 73 | + | |
| 74 | + | |
| 75 | + | |
| 76 | + | |
| 77 | + | |
| 78 | + | |
| 79 | + | |
| 80 | + | |
| 81 | + | |
| 82 | + | |
| 83 | + | |
| 84 | + | |
| 85 | + | |
| 86 | + | |
| 87 | + | |
| 88 | + | |
| 89 | + | |
| 90 | + | |
| 91 | + | |
| 92 | + | |
| 93 | + | |
| 94 | + | |
| 95 | + | |
| 96 | + | |
| 97 | + | |
| 98 | + | |
| 99 | + | |
| 100 | + | |
| 101 | + | |
| 102 | + | |
| 103 | + | |
| 104 | + | |
| 105 | + | |
| 106 | + | |
| 107 | + | |
| 108 | + | |
| 109 | + | |
| 110 | + | |
| 111 | + | |
| 112 | + | |
| 113 | + | |
| 114 | + | |
| 115 | + | |
| 116 | + | |
| 117 | + | |
| 118 | + | |
| 119 | + | |
| 120 | + | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
| 124 | + | |
| 125 | + | |
| 126 | + | |
| 127 | + | |
| 128 | + | |
| 129 | + | |
| 130 | + | |
| 131 | + | |
| 132 | + | |
| 133 | + | |
| 134 | + | |
| 135 | + | |
| 136 | + | |
| 137 | + | |
| 138 | + | |
| 139 | + | |
| 140 | + |
Lines changed: 17 additions & 13 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
21 | 21 |
| |
22 | 22 |
| |
23 | 23 |
| |
| 24 | + | |
24 | 25 |
| |
25 | 26 |
| |
26 |
| - | |
27 |
| - | |
| 27 | + | |
| 28 | + | |
28 | 29 |
| |
29 | 30 |
| |
30 | 31 |
| |
| |||
38 | 39 |
| |
39 | 40 |
| |
40 | 41 |
| |
| 42 | + | |
41 | 43 |
| |
42 | 44 |
| |
43 |
| - | |
44 |
| - | |
| 45 | + | |
| 46 | + | |
| 47 | + | |
45 | 48 |
| |
46 | 49 |
| |
47 | 50 |
| |
| |||
55 | 58 |
| |
56 | 59 |
| |
57 | 60 |
| |
| 61 | + | |
58 | 62 |
| |
59 | 63 |
| |
60 |
| - | |
61 |
| - | |
| 64 | + | |
| 65 | + | |
| 66 | + | |
62 | 67 |
| |
63 | 68 |
| |
64 | 69 |
| |
| |||
72 | 77 |
| |
73 | 78 |
| |
74 | 79 |
| |
| 80 | + | |
75 | 81 |
| |
76 | 82 |
| |
77 |
| - | |
78 |
| - | |
| 83 | + | |
| 84 | + | |
79 | 85 |
| |
80 | 86 |
| |
81 | 87 |
| |
| |||
89 | 95 |
| |
90 | 96 |
| |
91 | 97 |
| |
| 98 | + | |
92 | 99 |
| |
93 | 100 |
| |
94 |
| - | |
95 |
| - | |
| 101 | + | |
| 102 | + | |
96 | 103 |
| |
97 | 104 |
| |
98 | 105 |
| |
| |||
112 | 119 |
| |
113 | 120 |
| |
114 | 121 |
| |
115 |
| - | |
116 |
| - | |
117 |
| - | |
118 | 122 |
| |
119 | 123 |
| |
120 | 124 |
| |
|
Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
190 | 190 |
| |
191 | 191 |
| |
192 | 192 |
| |
193 |
| - | |
| 193 | + |
Lines changed: 34 additions & 11 deletions
Original file line number | Diff line number | Diff line change | |
---|---|---|---|
| |||
41 | 41 |
| |
42 | 42 |
| |
43 | 43 |
| |
| 44 | + | |
| 45 | + | |
| 46 | + | |
| 47 | + | |
| 48 | + | |
| 49 | + | |
| 50 | + | |
| 51 | + | |
| 52 | + | |
| 53 | + | |
44 | 54 |
| |
45 | 55 |
| |
46 | 56 |
| |
| |||
130 | 140 |
| |
131 | 141 |
| |
132 | 142 |
| |
133 |
| - | |
134 |
| - | |
135 |
| - | |
| 143 | + | |
136 | 144 |
| |
| 145 | + | |
| 146 | + | |
137 | 147 |
| |
138 | 148 |
| |
139 | 149 |
| |
140 | 150 |
| |
141 | 151 |
| |
142 | 152 |
| |
143 | 153 |
| |
144 |
| - | |
145 |
| - | |
| 154 | + | |
| 155 | + | |
146 | 156 |
| |
147 | 157 |
| |
148 |
| - | |
| 158 | + | |
| 159 | + | |
| 160 | + | |
| 161 | + | |
149 | 162 |
| |
150 | 163 |
| |
151 | 164 |
| |
| |||
234 | 247 |
| |
235 | 248 |
| |
236 | 249 |
| |
| 250 | + | |
| 251 | + | |
| 252 | + | |
| 253 | + | |
| 254 | + | |
| 255 | + | |
| 256 | + | |
| 257 | + | |
237 | 258 |
| |
238 |
| - | |
239 |
| - | |
240 |
| - | |
241 |
| - | |
| 259 | + | |
| 260 | + | |
| 261 | + | |
| 262 | + | |
| 263 | + | |
| 264 | + | |
242 | 265 |
| |
243 | 266 |
| |
244 | 267 |
| |
245 | 268 |
| |
246 |
| - | |
| 269 | + | |
247 | 270 |
| |
248 | 271 |
| |
249 | 272 |
| |
|
0 commit comments