zRzRzRzRzRzRzR commited on
Commit
58009ba
·
1 Parent(s): ad148df
Files changed (1) hide show
  1. config.json +49 -1
config.json CHANGED
@@ -193,14 +193,24 @@
193
  "model.layers.8.mlp.gate",
194
  "model.layers.9.mlp.gate",
195
  "visual.blocks.15.mlp.gate_up_proj",
 
 
196
  "visual.blocks.16.mlp.down_proj",
197
  "visual.blocks.16.mlp.gate_up_proj",
 
 
198
  "visual.blocks.17.mlp.down_proj",
199
  "visual.blocks.17.mlp.gate_up_proj",
 
 
200
  "visual.blocks.18.mlp.down_proj",
201
  "visual.blocks.18.mlp.gate_up_proj",
 
 
202
  "visual.blocks.19.mlp.down_proj",
203
  "visual.blocks.19.mlp.gate_up_proj",
 
 
204
  "visual.blocks.20.mlp.down_proj",
205
  "visual.post_layernorm",
206
  "model.layers.40.mlp.gate.e_score_correction_bias",
@@ -241,25 +251,43 @@
241
  "model.layers.28.self_attn.v_proj.bias",
242
  "model.layers.29.self_attn.v_proj.bias",
243
  "visual.blocks.11.mlp.gate_up_proj",
 
 
244
  "visual.blocks.5.mlp.gate_up_proj",
 
 
245
  "visual.blocks.5.norm1",
246
  "visual.blocks.6.mlp.gate_up_proj",
 
 
247
  "visual.blocks.7.mlp.gate_up_proj",
 
 
248
  "visual.blocks.8.mlp.gate_up_proj",
 
 
249
  "visual.blocks.9.mlp.gate_up_proj",
 
 
250
  "model.layers.22.mlp.gate.e_score_correction_bias",
251
  "model.layers.10.mlp.gate.e_score_correction_bias",
252
  "model.layers.11.mlp.gate.e_score_correction_bias",
253
  "model.layers.12.mlp.gate.e_score_correction_bias",
254
  "visual.blocks.12.mlp.down_proj",
255
  "visual.blocks.12.mlp.gate_up_proj",
 
 
256
  "model.layers.14.mlp.gate.e_score_correction_bias",
257
  "model.layers.13.mlp.gate.e_score_correction_bias",
258
  "model.layers.15.mlp.gate.e_score_correction_bias",
259
  "visual.blocks.13.mlp.down_proj",
260
  "visual.blocks.13.mlp.gate_up_proj",
 
 
261
  "visual.blocks.14.mlp.down_proj",
262
  "visual.blocks.14.mlp.gate_up_proj",
 
 
263
  "visual.blocks.15.mlp.down_proj",
264
  "model.embed_tokens",
265
  "model.layers.10.input_layernorm",
@@ -377,14 +405,24 @@
377
  "visual.blocks.8.norm2",
378
  "visual.blocks.9.norm2",
379
  "visual.blocks.20.mlp.gate_up_proj",
 
 
380
  "visual.blocks.21.mlp.down_proj",
381
  "visual.blocks.21.mlp.gate_up_proj",
 
 
382
  "visual.blocks.22.mlp.down_proj",
383
  "visual.blocks.22.mlp.gate_up_proj",
 
 
384
  "visual.blocks.23.mlp.down_proj",
385
  "visual.blocks.23.mlp.gate_up_proj",
 
 
386
  "visual.blocks.10.mlp.down_proj",
387
  "visual.blocks.10.mlp.gate_up_proj",
 
 
388
  "visual.blocks.11.mlp.down_proj",
389
  "visual.embeddings.position_embedding",
390
  "model.layers.15.mlp.gate",
@@ -497,14 +535,24 @@
497
  "visual.post_conv_layernorm",
498
  "visual.blocks.0.mlp.down_proj",
499
  "visual.blocks.0.mlp.gate_up_proj",
 
 
500
  "visual.blocks.1.mlp.down_proj",
501
  "visual.blocks.1.mlp.gate_up_proj",
 
 
502
  "visual.blocks.2.mlp.down_proj",
503
  "visual.blocks.2.mlp.gate_up_proj",
 
 
504
  "visual.blocks.3.mlp.down_proj",
505
  "visual.blocks.3.mlp.gate_up_proj",
 
 
506
  "visual.blocks.4.mlp.down_proj",
507
  "visual.blocks.4.mlp.gate_up_proj",
 
 
508
  "visual.merger.post_projection_norm",
509
  "visual.blocks.12.attn.proj",
510
  "visual.blocks.13.attn.proj",
@@ -599,4 +647,4 @@
599
  "quant_method": "compressed-tensors",
600
  "quantization_status": "compressed"
601
  }
602
- }
 
193
  "model.layers.8.mlp.gate",
194
  "model.layers.9.mlp.gate",
195
  "visual.blocks.15.mlp.gate_up_proj",
196
+ "visual.blocks.15.mlp.gate_proj",
197
+ "visual.blocks.15.mlp.up_proj",
198
  "visual.blocks.16.mlp.down_proj",
199
  "visual.blocks.16.mlp.gate_up_proj",
200
+ "visual.blocks.16.mlp.gate_proj",
201
+ "visual.blocks.16.mlp.up_proj",
202
  "visual.blocks.17.mlp.down_proj",
203
  "visual.blocks.17.mlp.gate_up_proj",
204
+ "visual.blocks.17.mlp.gate_proj",
205
+ "visual.blocks.17.mlp.up_proj",
206
  "visual.blocks.18.mlp.down_proj",
207
  "visual.blocks.18.mlp.gate_up_proj",
208
+ "visual.blocks.18.mlp.gate_proj",
209
+ "visual.blocks.18.mlp.up_proj",
210
  "visual.blocks.19.mlp.down_proj",
211
  "visual.blocks.19.mlp.gate_up_proj",
212
+ "visual.blocks.19.mlp.gate_proj",
213
+ "visual.blocks.19.mlp.up_proj",
214
  "visual.blocks.20.mlp.down_proj",
215
  "visual.post_layernorm",
216
  "model.layers.40.mlp.gate.e_score_correction_bias",
 
251
  "model.layers.28.self_attn.v_proj.bias",
252
  "model.layers.29.self_attn.v_proj.bias",
253
  "visual.blocks.11.mlp.gate_up_proj",
254
+ "visual.blocks.11.mlp.gate_proj",
255
+ "visual.blocks.11.mlp.up_proj",
256
  "visual.blocks.5.mlp.gate_up_proj",
257
+ "visual.blocks.5.mlp.gate_proj",
258
+ "visual.blocks.5.mlp.up_proj",
259
  "visual.blocks.5.norm1",
260
  "visual.blocks.6.mlp.gate_up_proj",
261
+ "visual.blocks.6.mlp.gate_proj",
262
+ "visual.blocks.6.mlp.up_proj",
263
  "visual.blocks.7.mlp.gate_up_proj",
264
+ "visual.blocks.7.mlp.gate_proj",
265
+ "visual.blocks.7.mlp.up_proj",
266
  "visual.blocks.8.mlp.gate_up_proj",
267
+ "visual.blocks.8.mlp.gate_proj",
268
+ "visual.blocks.8.mlp.up_proj",
269
  "visual.blocks.9.mlp.gate_up_proj",
270
+ "visual.blocks.9.mlp.gate_proj",
271
+ "visual.blocks.9.mlp.up_proj",
272
  "model.layers.22.mlp.gate.e_score_correction_bias",
273
  "model.layers.10.mlp.gate.e_score_correction_bias",
274
  "model.layers.11.mlp.gate.e_score_correction_bias",
275
  "model.layers.12.mlp.gate.e_score_correction_bias",
276
  "visual.blocks.12.mlp.down_proj",
277
  "visual.blocks.12.mlp.gate_up_proj",
278
+ "visual.blocks.12.mlp.gate_proj",
279
+ "visual.blocks.12.mlp.up_proj",
280
  "model.layers.14.mlp.gate.e_score_correction_bias",
281
  "model.layers.13.mlp.gate.e_score_correction_bias",
282
  "model.layers.15.mlp.gate.e_score_correction_bias",
283
  "visual.blocks.13.mlp.down_proj",
284
  "visual.blocks.13.mlp.gate_up_proj",
285
+ "visual.blocks.13.mlp.gate_proj",
286
+ "visual.blocks.13.mlp.up_proj",
287
  "visual.blocks.14.mlp.down_proj",
288
  "visual.blocks.14.mlp.gate_up_proj",
289
+ "visual.blocks.14.mlp.gate_proj",
290
+ "visual.blocks.14.mlp.up_proj",
291
  "visual.blocks.15.mlp.down_proj",
292
  "model.embed_tokens",
293
  "model.layers.10.input_layernorm",
 
405
  "visual.blocks.8.norm2",
406
  "visual.blocks.9.norm2",
407
  "visual.blocks.20.mlp.gate_up_proj",
408
+ "visual.blocks.20.mlp.gate_proj",
409
+ "visual.blocks.20.mlp.up_proj",
410
  "visual.blocks.21.mlp.down_proj",
411
  "visual.blocks.21.mlp.gate_up_proj",
412
+ "visual.blocks.21.mlp.gate_proj",
413
+ "visual.blocks.21.mlp.up_proj",
414
  "visual.blocks.22.mlp.down_proj",
415
  "visual.blocks.22.mlp.gate_up_proj",
416
+ "visual.blocks.22.mlp.gate_proj",
417
+ "visual.blocks.22.mlp.up_proj",
418
  "visual.blocks.23.mlp.down_proj",
419
  "visual.blocks.23.mlp.gate_up_proj",
420
+ "visual.blocks.23.mlp.gate_proj",
421
+ "visual.blocks.23.mlp.up_proj",
422
  "visual.blocks.10.mlp.down_proj",
423
  "visual.blocks.10.mlp.gate_up_proj",
424
+ "visual.blocks.10.mlp.gate_proj",
425
+ "visual.blocks.10.mlp.up_proj",
426
  "visual.blocks.11.mlp.down_proj",
427
  "visual.embeddings.position_embedding",
428
  "model.layers.15.mlp.gate",
 
535
  "visual.post_conv_layernorm",
536
  "visual.blocks.0.mlp.down_proj",
537
  "visual.blocks.0.mlp.gate_up_proj",
538
+ "visual.blocks.0.mlp.gate_proj",
539
+ "visual.blocks.0.mlp.up_proj",
540
  "visual.blocks.1.mlp.down_proj",
541
  "visual.blocks.1.mlp.gate_up_proj",
542
+ "visual.blocks.1.mlp.gate_proj",
543
+ "visual.blocks.1.mlp.up_proj",
544
  "visual.blocks.2.mlp.down_proj",
545
  "visual.blocks.2.mlp.gate_up_proj",
546
+ "visual.blocks.2.mlp.gate_proj",
547
+ "visual.blocks.2.mlp.up_proj",
548
  "visual.blocks.3.mlp.down_proj",
549
  "visual.blocks.3.mlp.gate_up_proj",
550
+ "visual.blocks.3.mlp.gate_proj",
551
+ "visual.blocks.3.mlp.up_proj",
552
  "visual.blocks.4.mlp.down_proj",
553
  "visual.blocks.4.mlp.gate_up_proj",
554
+ "visual.blocks.4.mlp.gate_proj",
555
+ "visual.blocks.4.mlp.up_proj",
556
  "visual.merger.post_projection_norm",
557
  "visual.blocks.12.attn.proj",
558
  "visual.blocks.13.attn.proj",
 
647
  "quant_method": "compressed-tensors",
648
  "quantization_status": "compressed"
649
  }
650
+ }