Commit c1a9c83
[Model] Add BNB quantization support for Mllama (vllm-project#9720)
1 parent cf1e822 commit c1a9c83
File tree
3 files changed
+84
-12
lines changed- vllm/model_executor
- layers/quantization
- model_loader
- models
3 files changed
+84
-12
lines changed| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
3 | 3 | | |
4 | 4 | | |
5 | 5 | | |
| 6 | + | |
6 | 7 | | |
7 | 8 | | |
8 | 9 | | |
| |||
23 | 24 | | |
24 | 25 | | |
25 | 26 | | |
26 | | - | |
| 27 | + | |
27 | 28 | | |
28 | 29 | | |
29 | 30 | | |
| |||
34 | 35 | | |
35 | 36 | | |
36 | 37 | | |
37 | | - | |
| 38 | + | |
38 | 39 | | |
39 | 40 | | |
40 | 41 | | |
41 | | - | |
| 42 | + | |
| 43 | + | |
| 44 | + | |
| 45 | + | |
| 46 | + | |
42 | 47 | | |
43 | 48 | | |
44 | 49 | | |
| |||
102 | 107 | | |
103 | 108 | | |
104 | 109 | | |
105 | | - | |
| 110 | + | |
106 | 111 | | |
| 112 | + | |
| 113 | + | |
107 | 114 | | |
108 | 115 | | |
109 | 116 | | |
110 | 117 | | |
111 | 118 | | |
112 | 119 | | |
113 | 120 | | |
| 121 | + | |
| 122 | + | |
| 123 | + | |
| 124 | + | |
114 | 125 | | |
115 | 126 | | |
116 | 127 | | |
| |||
211 | 222 | | |
212 | 223 | | |
213 | 224 | | |
| 225 | + | |
| 226 | + | |
| 227 | + | |
| 228 | + | |
| 229 | + | |
214 | 230 | | |
215 | 231 | | |
216 | 232 | | |
| |||
265 | 281 | | |
266 | 282 | | |
267 | 283 | | |
| 284 | + | |
| 285 | + | |
| 286 | + | |
268 | 287 | | |
269 | 288 | | |
270 | 289 | | |
| |||
282 | 301 | | |
283 | 302 | | |
284 | 303 | | |
| 304 | + | |
| 305 | + | |
| 306 | + | |
| 307 | + | |
| 308 | + | |
285 | 309 | | |
286 | 310 | | |
287 | 311 | | |
| |||
310 | 334 | | |
311 | 335 | | |
312 | 336 | | |
| 337 | + | |
| 338 | + | |
| 339 | + | |
313 | 340 | | |
314 | 341 | | |
315 | 342 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
899 | 899 | | |
900 | 900 | | |
901 | 901 | | |
| 902 | + | |
| 903 | + | |
| 904 | + | |
| 905 | + | |
| 906 | + | |
| 907 | + | |
| 908 | + | |
| 909 | + | |
| 910 | + | |
| 911 | + | |
| 912 | + | |
| 913 | + | |
| 914 | + | |
902 | 915 | | |
903 | 916 | | |
904 | 917 | | |
| |||
912 | 925 | | |
913 | 926 | | |
914 | 927 | | |
915 | | - | |
| 928 | + | |
916 | 929 | | |
917 | 930 | | |
918 | 931 | | |
| |||
932 | 945 | | |
933 | 946 | | |
934 | 947 | | |
935 | | - | |
| 948 | + | |
936 | 949 | | |
937 | 950 | | |
938 | 951 | | |
| |||
956 | 969 | | |
957 | 970 | | |
958 | 971 | | |
959 | | - | |
| 972 | + | |
960 | 973 | | |
961 | 974 | | |
962 | 975 | | |
| |||
| Original file line number | Diff line number | Diff line change | |
|---|---|---|---|
| |||
325 | 325 | | |
326 | 326 | | |
327 | 327 | | |
328 | | - | |
| 328 | + | |
| 329 | + | |
| 330 | + | |
| 331 | + | |
329 | 332 | | |
330 | 333 | | |
331 | 334 | | |
| |||
341 | 344 | | |
342 | 345 | | |
343 | 346 | | |
| 347 | + | |
| 348 | + | |
344 | 349 | | |
345 | 350 | | |
346 | 351 | | |
347 | 352 | | |
348 | 353 | | |
349 | 354 | | |
| 355 | + | |
| 356 | + | |
350 | 357 | | |
351 | 358 | | |
352 | 359 | | |
| |||
393 | 400 | | |
394 | 401 | | |
395 | 402 | | |
396 | | - | |
| 403 | + | |
| 404 | + | |
397 | 405 | | |
398 | 406 | | |
399 | 407 | | |
| |||
1002 | 1010 | | |
1003 | 1011 | | |
1004 | 1012 | | |
| 1013 | + | |
1005 | 1014 | | |
1006 | 1015 | | |
1007 | 1016 | | |
| |||
1037 | 1046 | | |
1038 | 1047 | | |
1039 | 1048 | | |
| 1049 | + | |
| 1050 | + | |
| 1051 | + | |
| 1052 | + | |
| 1053 | + | |
| 1054 | + | |
| 1055 | + | |
| 1056 | + | |
| 1057 | + | |
| 1058 | + | |
| 1059 | + | |
| 1060 | + | |
| 1061 | + | |
| 1062 | + | |
| 1063 | + | |
| 1064 | + | |
| 1065 | + | |
| 1066 | + | |
| 1067 | + | |
| 1068 | + | |
1040 | 1069 | | |
1041 | 1070 | | |
1042 | 1071 | | |
| |||
1061 | 1090 | | |
1062 | 1091 | | |
1063 | 1092 | | |
1064 | | - | |
| 1093 | + | |
1065 | 1094 | | |
1066 | 1095 | | |
1067 | 1096 | | |
| 1097 | + | |
| 1098 | + | |
| 1099 | + | |
1068 | 1100 | | |
1069 | 1101 | | |
1070 | 1102 | | |
| |||
1128 | 1160 | | |
1129 | 1161 | | |
1130 | 1162 | | |
1131 | | - | |
| 1163 | + | |
1132 | 1164 | | |
1133 | 1165 | | |
1134 | 1166 | | |
| |||
1204 | 1236 | | |
1205 | 1237 | | |
1206 | 1238 | | |
1207 | | - | |
| 1239 | + | |
1208 | 1240 | | |
1209 | 1241 | | |
1210 | 1242 | | |
| |||
0 commit comments