zRzRzRzRzRzRzR
commited on
Commit
·
58009ba
1
Parent(s):
ad148df
final
Browse files- config.json +49 -1
config.json
CHANGED
|
@@ -193,14 +193,24 @@
|
|
| 193 |
"model.layers.8.mlp.gate",
|
| 194 |
"model.layers.9.mlp.gate",
|
| 195 |
"visual.blocks.15.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 196 |
"visual.blocks.16.mlp.down_proj",
|
| 197 |
"visual.blocks.16.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 198 |
"visual.blocks.17.mlp.down_proj",
|
| 199 |
"visual.blocks.17.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 200 |
"visual.blocks.18.mlp.down_proj",
|
| 201 |
"visual.blocks.18.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 202 |
"visual.blocks.19.mlp.down_proj",
|
| 203 |
"visual.blocks.19.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 204 |
"visual.blocks.20.mlp.down_proj",
|
| 205 |
"visual.post_layernorm",
|
| 206 |
"model.layers.40.mlp.gate.e_score_correction_bias",
|
|
@@ -241,25 +251,43 @@
|
|
| 241 |
"model.layers.28.self_attn.v_proj.bias",
|
| 242 |
"model.layers.29.self_attn.v_proj.bias",
|
| 243 |
"visual.blocks.11.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 244 |
"visual.blocks.5.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 245 |
"visual.blocks.5.norm1",
|
| 246 |
"visual.blocks.6.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 247 |
"visual.blocks.7.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 248 |
"visual.blocks.8.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 249 |
"visual.blocks.9.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 250 |
"model.layers.22.mlp.gate.e_score_correction_bias",
|
| 251 |
"model.layers.10.mlp.gate.e_score_correction_bias",
|
| 252 |
"model.layers.11.mlp.gate.e_score_correction_bias",
|
| 253 |
"model.layers.12.mlp.gate.e_score_correction_bias",
|
| 254 |
"visual.blocks.12.mlp.down_proj",
|
| 255 |
"visual.blocks.12.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 256 |
"model.layers.14.mlp.gate.e_score_correction_bias",
|
| 257 |
"model.layers.13.mlp.gate.e_score_correction_bias",
|
| 258 |
"model.layers.15.mlp.gate.e_score_correction_bias",
|
| 259 |
"visual.blocks.13.mlp.down_proj",
|
| 260 |
"visual.blocks.13.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 261 |
"visual.blocks.14.mlp.down_proj",
|
| 262 |
"visual.blocks.14.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 263 |
"visual.blocks.15.mlp.down_proj",
|
| 264 |
"model.embed_tokens",
|
| 265 |
"model.layers.10.input_layernorm",
|
|
@@ -377,14 +405,24 @@
|
|
| 377 |
"visual.blocks.8.norm2",
|
| 378 |
"visual.blocks.9.norm2",
|
| 379 |
"visual.blocks.20.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 380 |
"visual.blocks.21.mlp.down_proj",
|
| 381 |
"visual.blocks.21.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 382 |
"visual.blocks.22.mlp.down_proj",
|
| 383 |
"visual.blocks.22.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 384 |
"visual.blocks.23.mlp.down_proj",
|
| 385 |
"visual.blocks.23.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 386 |
"visual.blocks.10.mlp.down_proj",
|
| 387 |
"visual.blocks.10.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 388 |
"visual.blocks.11.mlp.down_proj",
|
| 389 |
"visual.embeddings.position_embedding",
|
| 390 |
"model.layers.15.mlp.gate",
|
|
@@ -497,14 +535,24 @@
|
|
| 497 |
"visual.post_conv_layernorm",
|
| 498 |
"visual.blocks.0.mlp.down_proj",
|
| 499 |
"visual.blocks.0.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 500 |
"visual.blocks.1.mlp.down_proj",
|
| 501 |
"visual.blocks.1.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 502 |
"visual.blocks.2.mlp.down_proj",
|
| 503 |
"visual.blocks.2.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 504 |
"visual.blocks.3.mlp.down_proj",
|
| 505 |
"visual.blocks.3.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 506 |
"visual.blocks.4.mlp.down_proj",
|
| 507 |
"visual.blocks.4.mlp.gate_up_proj",
|
|
|
|
|
|
|
| 508 |
"visual.merger.post_projection_norm",
|
| 509 |
"visual.blocks.12.attn.proj",
|
| 510 |
"visual.blocks.13.attn.proj",
|
|
@@ -599,4 +647,4 @@
|
|
| 599 |
"quant_method": "compressed-tensors",
|
| 600 |
"quantization_status": "compressed"
|
| 601 |
}
|
| 602 |
-
}
|
|
|
|
| 193 |
"model.layers.8.mlp.gate",
|
| 194 |
"model.layers.9.mlp.gate",
|
| 195 |
"visual.blocks.15.mlp.gate_up_proj",
|
| 196 |
+
"visual.blocks.15.mlp.gate_proj",
|
| 197 |
+
"visual.blocks.15.mlp.up_proj",
|
| 198 |
"visual.blocks.16.mlp.down_proj",
|
| 199 |
"visual.blocks.16.mlp.gate_up_proj",
|
| 200 |
+
"visual.blocks.16.mlp.gate_proj",
|
| 201 |
+
"visual.blocks.16.mlp.up_proj",
|
| 202 |
"visual.blocks.17.mlp.down_proj",
|
| 203 |
"visual.blocks.17.mlp.gate_up_proj",
|
| 204 |
+
"visual.blocks.17.mlp.gate_proj",
|
| 205 |
+
"visual.blocks.17.mlp.up_proj",
|
| 206 |
"visual.blocks.18.mlp.down_proj",
|
| 207 |
"visual.blocks.18.mlp.gate_up_proj",
|
| 208 |
+
"visual.blocks.18.mlp.gate_proj",
|
| 209 |
+
"visual.blocks.18.mlp.up_proj",
|
| 210 |
"visual.blocks.19.mlp.down_proj",
|
| 211 |
"visual.blocks.19.mlp.gate_up_proj",
|
| 212 |
+
"visual.blocks.19.mlp.gate_proj",
|
| 213 |
+
"visual.blocks.19.mlp.up_proj",
|
| 214 |
"visual.blocks.20.mlp.down_proj",
|
| 215 |
"visual.post_layernorm",
|
| 216 |
"model.layers.40.mlp.gate.e_score_correction_bias",
|
|
|
|
| 251 |
"model.layers.28.self_attn.v_proj.bias",
|
| 252 |
"model.layers.29.self_attn.v_proj.bias",
|
| 253 |
"visual.blocks.11.mlp.gate_up_proj",
|
| 254 |
+
"visual.blocks.11.mlp.gate_proj",
|
| 255 |
+
"visual.blocks.11.mlp.up_proj",
|
| 256 |
"visual.blocks.5.mlp.gate_up_proj",
|
| 257 |
+
"visual.blocks.5.mlp.gate_proj",
|
| 258 |
+
"visual.blocks.5.mlp.up_proj",
|
| 259 |
"visual.blocks.5.norm1",
|
| 260 |
"visual.blocks.6.mlp.gate_up_proj",
|
| 261 |
+
"visual.blocks.6.mlp.gate_proj",
|
| 262 |
+
"visual.blocks.6.mlp.up_proj",
|
| 263 |
"visual.blocks.7.mlp.gate_up_proj",
|
| 264 |
+
"visual.blocks.7.mlp.gate_proj",
|
| 265 |
+
"visual.blocks.7.mlp.up_proj",
|
| 266 |
"visual.blocks.8.mlp.gate_up_proj",
|
| 267 |
+
"visual.blocks.8.mlp.gate_proj",
|
| 268 |
+
"visual.blocks.8.mlp.up_proj",
|
| 269 |
"visual.blocks.9.mlp.gate_up_proj",
|
| 270 |
+
"visual.blocks.9.mlp.gate_proj",
|
| 271 |
+
"visual.blocks.9.mlp.up_proj",
|
| 272 |
"model.layers.22.mlp.gate.e_score_correction_bias",
|
| 273 |
"model.layers.10.mlp.gate.e_score_correction_bias",
|
| 274 |
"model.layers.11.mlp.gate.e_score_correction_bias",
|
| 275 |
"model.layers.12.mlp.gate.e_score_correction_bias",
|
| 276 |
"visual.blocks.12.mlp.down_proj",
|
| 277 |
"visual.blocks.12.mlp.gate_up_proj",
|
| 278 |
+
"visual.blocks.12.mlp.gate_proj",
|
| 279 |
+
"visual.blocks.12.mlp.up_proj",
|
| 280 |
"model.layers.14.mlp.gate.e_score_correction_bias",
|
| 281 |
"model.layers.13.mlp.gate.e_score_correction_bias",
|
| 282 |
"model.layers.15.mlp.gate.e_score_correction_bias",
|
| 283 |
"visual.blocks.13.mlp.down_proj",
|
| 284 |
"visual.blocks.13.mlp.gate_up_proj",
|
| 285 |
+
"visual.blocks.13.mlp.gate_proj",
|
| 286 |
+
"visual.blocks.13.mlp.up_proj",
|
| 287 |
"visual.blocks.14.mlp.down_proj",
|
| 288 |
"visual.blocks.14.mlp.gate_up_proj",
|
| 289 |
+
"visual.blocks.14.mlp.gate_proj",
|
| 290 |
+
"visual.blocks.14.mlp.up_proj",
|
| 291 |
"visual.blocks.15.mlp.down_proj",
|
| 292 |
"model.embed_tokens",
|
| 293 |
"model.layers.10.input_layernorm",
|
|
|
|
| 405 |
"visual.blocks.8.norm2",
|
| 406 |
"visual.blocks.9.norm2",
|
| 407 |
"visual.blocks.20.mlp.gate_up_proj",
|
| 408 |
+
"visual.blocks.20.mlp.gate_proj",
|
| 409 |
+
"visual.blocks.20.mlp.up_proj",
|
| 410 |
"visual.blocks.21.mlp.down_proj",
|
| 411 |
"visual.blocks.21.mlp.gate_up_proj",
|
| 412 |
+
"visual.blocks.21.mlp.gate_proj",
|
| 413 |
+
"visual.blocks.21.mlp.up_proj",
|
| 414 |
"visual.blocks.22.mlp.down_proj",
|
| 415 |
"visual.blocks.22.mlp.gate_up_proj",
|
| 416 |
+
"visual.blocks.22.mlp.gate_proj",
|
| 417 |
+
"visual.blocks.22.mlp.up_proj",
|
| 418 |
"visual.blocks.23.mlp.down_proj",
|
| 419 |
"visual.blocks.23.mlp.gate_up_proj",
|
| 420 |
+
"visual.blocks.23.mlp.gate_proj",
|
| 421 |
+
"visual.blocks.23.mlp.up_proj",
|
| 422 |
"visual.blocks.10.mlp.down_proj",
|
| 423 |
"visual.blocks.10.mlp.gate_up_proj",
|
| 424 |
+
"visual.blocks.10.mlp.gate_proj",
|
| 425 |
+
"visual.blocks.10.mlp.up_proj",
|
| 426 |
"visual.blocks.11.mlp.down_proj",
|
| 427 |
"visual.embeddings.position_embedding",
|
| 428 |
"model.layers.15.mlp.gate",
|
|
|
|
| 535 |
"visual.post_conv_layernorm",
|
| 536 |
"visual.blocks.0.mlp.down_proj",
|
| 537 |
"visual.blocks.0.mlp.gate_up_proj",
|
| 538 |
+
"visual.blocks.0.mlp.gate_proj",
|
| 539 |
+
"visual.blocks.0.mlp.up_proj",
|
| 540 |
"visual.blocks.1.mlp.down_proj",
|
| 541 |
"visual.blocks.1.mlp.gate_up_proj",
|
| 542 |
+
"visual.blocks.1.mlp.gate_proj",
|
| 543 |
+
"visual.blocks.1.mlp.up_proj",
|
| 544 |
"visual.blocks.2.mlp.down_proj",
|
| 545 |
"visual.blocks.2.mlp.gate_up_proj",
|
| 546 |
+
"visual.blocks.2.mlp.gate_proj",
|
| 547 |
+
"visual.blocks.2.mlp.up_proj",
|
| 548 |
"visual.blocks.3.mlp.down_proj",
|
| 549 |
"visual.blocks.3.mlp.gate_up_proj",
|
| 550 |
+
"visual.blocks.3.mlp.gate_proj",
|
| 551 |
+
"visual.blocks.3.mlp.up_proj",
|
| 552 |
"visual.blocks.4.mlp.down_proj",
|
| 553 |
"visual.blocks.4.mlp.gate_up_proj",
|
| 554 |
+
"visual.blocks.4.mlp.gate_proj",
|
| 555 |
+
"visual.blocks.4.mlp.up_proj",
|
| 556 |
"visual.merger.post_projection_norm",
|
| 557 |
"visual.blocks.12.attn.proj",
|
| 558 |
"visual.blocks.13.attn.proj",
|
|
|
|
| 647 |
"quant_method": "compressed-tensors",
|
| 648 |
"quantization_status": "compressed"
|
| 649 |
}
|
| 650 |
+
}
|