zRzRzRzRzRzRzR
committed on
Commit
·
58009ba
1
Parent(s):
ad148df
final
Browse files- config.json +49 -1
config.json
CHANGED
@@ -193,14 +193,24 @@
|
|
193 |
"model.layers.8.mlp.gate",
|
194 |
"model.layers.9.mlp.gate",
|
195 |
"visual.blocks.15.mlp.gate_up_proj",
|
|
|
|
|
196 |
"visual.blocks.16.mlp.down_proj",
|
197 |
"visual.blocks.16.mlp.gate_up_proj",
|
|
|
|
|
198 |
"visual.blocks.17.mlp.down_proj",
|
199 |
"visual.blocks.17.mlp.gate_up_proj",
|
|
|
|
|
200 |
"visual.blocks.18.mlp.down_proj",
|
201 |
"visual.blocks.18.mlp.gate_up_proj",
|
|
|
|
|
202 |
"visual.blocks.19.mlp.down_proj",
|
203 |
"visual.blocks.19.mlp.gate_up_proj",
|
|
|
|
|
204 |
"visual.blocks.20.mlp.down_proj",
|
205 |
"visual.post_layernorm",
|
206 |
"model.layers.40.mlp.gate.e_score_correction_bias",
|
@@ -241,25 +251,43 @@
|
|
241 |
"model.layers.28.self_attn.v_proj.bias",
|
242 |
"model.layers.29.self_attn.v_proj.bias",
|
243 |
"visual.blocks.11.mlp.gate_up_proj",
|
|
|
|
|
244 |
"visual.blocks.5.mlp.gate_up_proj",
|
|
|
|
|
245 |
"visual.blocks.5.norm1",
|
246 |
"visual.blocks.6.mlp.gate_up_proj",
|
|
|
|
|
247 |
"visual.blocks.7.mlp.gate_up_proj",
|
|
|
|
|
248 |
"visual.blocks.8.mlp.gate_up_proj",
|
|
|
|
|
249 |
"visual.blocks.9.mlp.gate_up_proj",
|
|
|
|
|
250 |
"model.layers.22.mlp.gate.e_score_correction_bias",
|
251 |
"model.layers.10.mlp.gate.e_score_correction_bias",
|
252 |
"model.layers.11.mlp.gate.e_score_correction_bias",
|
253 |
"model.layers.12.mlp.gate.e_score_correction_bias",
|
254 |
"visual.blocks.12.mlp.down_proj",
|
255 |
"visual.blocks.12.mlp.gate_up_proj",
|
|
|
|
|
256 |
"model.layers.14.mlp.gate.e_score_correction_bias",
|
257 |
"model.layers.13.mlp.gate.e_score_correction_bias",
|
258 |
"model.layers.15.mlp.gate.e_score_correction_bias",
|
259 |
"visual.blocks.13.mlp.down_proj",
|
260 |
"visual.blocks.13.mlp.gate_up_proj",
|
|
|
|
|
261 |
"visual.blocks.14.mlp.down_proj",
|
262 |
"visual.blocks.14.mlp.gate_up_proj",
|
|
|
|
|
263 |
"visual.blocks.15.mlp.down_proj",
|
264 |
"model.embed_tokens",
|
265 |
"model.layers.10.input_layernorm",
|
@@ -377,14 +405,24 @@
|
|
377 |
"visual.blocks.8.norm2",
|
378 |
"visual.blocks.9.norm2",
|
379 |
"visual.blocks.20.mlp.gate_up_proj",
|
|
|
|
|
380 |
"visual.blocks.21.mlp.down_proj",
|
381 |
"visual.blocks.21.mlp.gate_up_proj",
|
|
|
|
|
382 |
"visual.blocks.22.mlp.down_proj",
|
383 |
"visual.blocks.22.mlp.gate_up_proj",
|
|
|
|
|
384 |
"visual.blocks.23.mlp.down_proj",
|
385 |
"visual.blocks.23.mlp.gate_up_proj",
|
|
|
|
|
386 |
"visual.blocks.10.mlp.down_proj",
|
387 |
"visual.blocks.10.mlp.gate_up_proj",
|
|
|
|
|
388 |
"visual.blocks.11.mlp.down_proj",
|
389 |
"visual.embeddings.position_embedding",
|
390 |
"model.layers.15.mlp.gate",
|
@@ -497,14 +535,24 @@
|
|
497 |
"visual.post_conv_layernorm",
|
498 |
"visual.blocks.0.mlp.down_proj",
|
499 |
"visual.blocks.0.mlp.gate_up_proj",
|
|
|
|
|
500 |
"visual.blocks.1.mlp.down_proj",
|
501 |
"visual.blocks.1.mlp.gate_up_proj",
|
|
|
|
|
502 |
"visual.blocks.2.mlp.down_proj",
|
503 |
"visual.blocks.2.mlp.gate_up_proj",
|
|
|
|
|
504 |
"visual.blocks.3.mlp.down_proj",
|
505 |
"visual.blocks.3.mlp.gate_up_proj",
|
|
|
|
|
506 |
"visual.blocks.4.mlp.down_proj",
|
507 |
"visual.blocks.4.mlp.gate_up_proj",
|
|
|
|
|
508 |
"visual.merger.post_projection_norm",
|
509 |
"visual.blocks.12.attn.proj",
|
510 |
"visual.blocks.13.attn.proj",
|
@@ -599,4 +647,4 @@
|
|
599 |
"quant_method": "compressed-tensors",
|
600 |
"quantization_status": "compressed"
|
601 |
}
|
602 |
-
}
|
|
|
193 |
"model.layers.8.mlp.gate",
|
194 |
"model.layers.9.mlp.gate",
|
195 |
"visual.blocks.15.mlp.gate_up_proj",
|
196 |
+
"visual.blocks.15.mlp.gate_proj",
|
197 |
+
"visual.blocks.15.mlp.up_proj",
|
198 |
"visual.blocks.16.mlp.down_proj",
|
199 |
"visual.blocks.16.mlp.gate_up_proj",
|
200 |
+
"visual.blocks.16.mlp.gate_proj",
|
201 |
+
"visual.blocks.16.mlp.up_proj",
|
202 |
"visual.blocks.17.mlp.down_proj",
|
203 |
"visual.blocks.17.mlp.gate_up_proj",
|
204 |
+
"visual.blocks.17.mlp.gate_proj",
|
205 |
+
"visual.blocks.17.mlp.up_proj",
|
206 |
"visual.blocks.18.mlp.down_proj",
|
207 |
"visual.blocks.18.mlp.gate_up_proj",
|
208 |
+
"visual.blocks.18.mlp.gate_proj",
|
209 |
+
"visual.blocks.18.mlp.up_proj",
|
210 |
"visual.blocks.19.mlp.down_proj",
|
211 |
"visual.blocks.19.mlp.gate_up_proj",
|
212 |
+
"visual.blocks.19.mlp.gate_proj",
|
213 |
+
"visual.blocks.19.mlp.up_proj",
|
214 |
"visual.blocks.20.mlp.down_proj",
|
215 |
"visual.post_layernorm",
|
216 |
"model.layers.40.mlp.gate.e_score_correction_bias",
|
|
|
251 |
"model.layers.28.self_attn.v_proj.bias",
|
252 |
"model.layers.29.self_attn.v_proj.bias",
|
253 |
"visual.blocks.11.mlp.gate_up_proj",
|
254 |
+
"visual.blocks.11.mlp.gate_proj",
|
255 |
+
"visual.blocks.11.mlp.up_proj",
|
256 |
"visual.blocks.5.mlp.gate_up_proj",
|
257 |
+
"visual.blocks.5.mlp.gate_proj",
|
258 |
+
"visual.blocks.5.mlp.up_proj",
|
259 |
"visual.blocks.5.norm1",
|
260 |
"visual.blocks.6.mlp.gate_up_proj",
|
261 |
+
"visual.blocks.6.mlp.gate_proj",
|
262 |
+
"visual.blocks.6.mlp.up_proj",
|
263 |
"visual.blocks.7.mlp.gate_up_proj",
|
264 |
+
"visual.blocks.7.mlp.gate_proj",
|
265 |
+
"visual.blocks.7.mlp.up_proj",
|
266 |
"visual.blocks.8.mlp.gate_up_proj",
|
267 |
+
"visual.blocks.8.mlp.gate_proj",
|
268 |
+
"visual.blocks.8.mlp.up_proj",
|
269 |
"visual.blocks.9.mlp.gate_up_proj",
|
270 |
+
"visual.blocks.9.mlp.gate_proj",
|
271 |
+
"visual.blocks.9.mlp.up_proj",
|
272 |
"model.layers.22.mlp.gate.e_score_correction_bias",
|
273 |
"model.layers.10.mlp.gate.e_score_correction_bias",
|
274 |
"model.layers.11.mlp.gate.e_score_correction_bias",
|
275 |
"model.layers.12.mlp.gate.e_score_correction_bias",
|
276 |
"visual.blocks.12.mlp.down_proj",
|
277 |
"visual.blocks.12.mlp.gate_up_proj",
|
278 |
+
"visual.blocks.12.mlp.gate_proj",
|
279 |
+
"visual.blocks.12.mlp.up_proj",
|
280 |
"model.layers.14.mlp.gate.e_score_correction_bias",
|
281 |
"model.layers.13.mlp.gate.e_score_correction_bias",
|
282 |
"model.layers.15.mlp.gate.e_score_correction_bias",
|
283 |
"visual.blocks.13.mlp.down_proj",
|
284 |
"visual.blocks.13.mlp.gate_up_proj",
|
285 |
+
"visual.blocks.13.mlp.gate_proj",
|
286 |
+
"visual.blocks.13.mlp.up_proj",
|
287 |
"visual.blocks.14.mlp.down_proj",
|
288 |
"visual.blocks.14.mlp.gate_up_proj",
|
289 |
+
"visual.blocks.14.mlp.gate_proj",
|
290 |
+
"visual.blocks.14.mlp.up_proj",
|
291 |
"visual.blocks.15.mlp.down_proj",
|
292 |
"model.embed_tokens",
|
293 |
"model.layers.10.input_layernorm",
|
|
|
405 |
"visual.blocks.8.norm2",
|
406 |
"visual.blocks.9.norm2",
|
407 |
"visual.blocks.20.mlp.gate_up_proj",
|
408 |
+
"visual.blocks.20.mlp.gate_proj",
|
409 |
+
"visual.blocks.20.mlp.up_proj",
|
410 |
"visual.blocks.21.mlp.down_proj",
|
411 |
"visual.blocks.21.mlp.gate_up_proj",
|
412 |
+
"visual.blocks.21.mlp.gate_proj",
|
413 |
+
"visual.blocks.21.mlp.up_proj",
|
414 |
"visual.blocks.22.mlp.down_proj",
|
415 |
"visual.blocks.22.mlp.gate_up_proj",
|
416 |
+
"visual.blocks.22.mlp.gate_proj",
|
417 |
+
"visual.blocks.22.mlp.up_proj",
|
418 |
"visual.blocks.23.mlp.down_proj",
|
419 |
"visual.blocks.23.mlp.gate_up_proj",
|
420 |
+
"visual.blocks.23.mlp.gate_proj",
|
421 |
+
"visual.blocks.23.mlp.up_proj",
|
422 |
"visual.blocks.10.mlp.down_proj",
|
423 |
"visual.blocks.10.mlp.gate_up_proj",
|
424 |
+
"visual.blocks.10.mlp.gate_proj",
|
425 |
+
"visual.blocks.10.mlp.up_proj",
|
426 |
"visual.blocks.11.mlp.down_proj",
|
427 |
"visual.embeddings.position_embedding",
|
428 |
"model.layers.15.mlp.gate",
|
|
|
535 |
"visual.post_conv_layernorm",
|
536 |
"visual.blocks.0.mlp.down_proj",
|
537 |
"visual.blocks.0.mlp.gate_up_proj",
|
538 |
+
"visual.blocks.0.mlp.gate_proj",
|
539 |
+
"visual.blocks.0.mlp.up_proj",
|
540 |
"visual.blocks.1.mlp.down_proj",
|
541 |
"visual.blocks.1.mlp.gate_up_proj",
|
542 |
+
"visual.blocks.1.mlp.gate_proj",
|
543 |
+
"visual.blocks.1.mlp.up_proj",
|
544 |
"visual.blocks.2.mlp.down_proj",
|
545 |
"visual.blocks.2.mlp.gate_up_proj",
|
546 |
+
"visual.blocks.2.mlp.gate_proj",
|
547 |
+
"visual.blocks.2.mlp.up_proj",
|
548 |
"visual.blocks.3.mlp.down_proj",
|
549 |
"visual.blocks.3.mlp.gate_up_proj",
|
550 |
+
"visual.blocks.3.mlp.gate_proj",
|
551 |
+
"visual.blocks.3.mlp.up_proj",
|
552 |
"visual.blocks.4.mlp.down_proj",
|
553 |
"visual.blocks.4.mlp.gate_up_proj",
|
554 |
+
"visual.blocks.4.mlp.gate_proj",
|
555 |
+
"visual.blocks.4.mlp.up_proj",
|
556 |
"visual.merger.post_projection_norm",
|
557 |
"visual.blocks.12.attn.proj",
|
558 |
"visual.blocks.13.attn.proj",
|
|
|
647 |
"quant_method": "compressed-tensors",
|
648 |
"quantization_status": "compressed"
|
649 |
}
|
650 |
+
}
|