Upload folder using huggingface_hub
Browse files- model-00001-of-00009.safetensors +2 -2
- model-00002-of-00009.safetensors +2 -2
- model-00003-of-00009.safetensors +2 -2
- model-00004-of-00009.safetensors +2 -2
- model-00005-of-00009.safetensors +2 -2
- model-00006-of-00009.safetensors +2 -2
- model-00007-of-00009.safetensors +2 -2
- model-00008-of-00009.safetensors +2 -2
- model-00009-of-00009.safetensors +2 -2
- model.safetensors.index.json +1 -82
model-00001-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d418a84d3f217a392b8be61a52b2709ebdb2e742e0a4d71f2cc5556758365cf2
|
| 3 |
+
size 4691828232
|
model-00002-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13218b59621b3bd998143d97e2454fce9005e972fb650a9e8e41d2ae5ed9e603
|
| 3 |
+
size 4972326544
|
model-00003-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e57fb00719ba2816dcb7099eefc47b52b138923ba21e1525a21997ccce6f54e4
|
| 3 |
+
size 4964462408
|
model-00004-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c9ff45e48754f8ed7f2617d7618a107ef906a678eb60af70c78401c6a6545d9c
|
| 3 |
+
size 4972326648
|
model-00005-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d721b5ce36d91d06cae02e0b01fc08ea984c4dc739d4d4814a2eac8354d5cf0c
|
| 3 |
+
size 4956602632
|
model-00006-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:15bbba410e206d7091385c8d5d44e5c62486c6ad06ab5f71ac257c07f6fa2a84
|
| 3 |
+
size 4972987488
|
model-00007-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81d39a1f2b14fe875436acf8bd4585dcfb1c293cc898c0f3406720471fedca8c
|
| 3 |
+
size 4972326600
|
model-00008-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc900ee1edd9b2b1ab3c67aeaab02952d2293e7af5ce097e97e0c592939105f3
|
| 3 |
+
size 4964462256
|
model-00009-of-00009.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a42af40a048dc16eb4959e76ae225923d5d315c633a158f40f0168eddb26a378
|
| 3 |
+
size 4193085520
|
model.safetensors.index.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
-
"total_size":
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"model.layers.15.mlp.gate.weight": "model-00001-of-00009.safetensors",
|
|
@@ -203,9 +203,6 @@
|
|
| 203 |
"model.layers.15.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 204 |
"model.layers.15.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 205 |
"model.layers.15.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
|
| 206 |
-
"model.layers.15.mlp.experts.64.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 207 |
-
"model.layers.15.mlp.experts.64.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 208 |
-
"model.layers.15.mlp.experts.64.gate_proj.weight": "model-00001-of-00009.safetensors",
|
| 209 |
"model.layers.15.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 210 |
"model.layers.15.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 211 |
"model.layers.15.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
|
|
@@ -407,9 +404,6 @@
|
|
| 407 |
"model.layers.20.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 408 |
"model.layers.20.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 409 |
"model.layers.20.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
|
| 410 |
-
"model.layers.20.mlp.experts.64.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 411 |
-
"model.layers.20.mlp.experts.64.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 412 |
-
"model.layers.20.mlp.experts.64.gate_proj.weight": "model-00001-of-00009.safetensors",
|
| 413 |
"model.layers.20.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 414 |
"model.layers.20.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 415 |
"model.layers.20.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
|
|
@@ -840,9 +834,6 @@
|
|
| 840 |
"model.layers.19.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 841 |
"model.layers.19.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 842 |
"model.layers.19.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
|
| 843 |
-
"model.layers.19.mlp.experts.64.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 844 |
-
"model.layers.19.mlp.experts.64.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 845 |
-
"model.layers.19.mlp.experts.64.gate_proj.weight": "model-00002-of-00009.safetensors",
|
| 846 |
"model.layers.19.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 847 |
"model.layers.19.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 848 |
"model.layers.19.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
@@ -1044,9 +1035,6 @@
|
|
| 1044 |
"model.layers.4.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1045 |
"model.layers.4.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1046 |
"model.layers.4.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
|
| 1047 |
-
"model.layers.4.mlp.experts.64.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1048 |
-
"model.layers.4.mlp.experts.64.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1049 |
-
"model.layers.4.mlp.experts.64.gate_proj.weight": "model-00002-of-00009.safetensors",
|
| 1050 |
"model.layers.4.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1051 |
"model.layers.4.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1052 |
"model.layers.4.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
@@ -1150,9 +1138,6 @@
|
|
| 1150 |
"model.layers.8.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1151 |
"model.layers.8.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1152 |
"model.layers.8.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
|
| 1153 |
-
"model.layers.8.mlp.experts.64.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1154 |
-
"model.layers.8.mlp.experts.64.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1155 |
-
"model.layers.8.mlp.experts.64.gate_proj.weight": "model-00002-of-00009.safetensors",
|
| 1156 |
"model.layers.8.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1157 |
"model.layers.8.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1158 |
"model.layers.8.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
@@ -1360,9 +1345,6 @@
|
|
| 1360 |
"model.layers.11.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1361 |
"model.layers.11.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1362 |
"model.layers.11.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
|
| 1363 |
-
"model.layers.11.mlp.experts.64.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1364 |
-
"model.layers.11.mlp.experts.64.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1365 |
-
"model.layers.11.mlp.experts.64.gate_proj.weight": "model-00003-of-00009.safetensors",
|
| 1366 |
"model.layers.11.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1367 |
"model.layers.11.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1368 |
"model.layers.11.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
@@ -1564,9 +1546,6 @@
|
|
| 1564 |
"model.layers.13.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1565 |
"model.layers.13.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1566 |
"model.layers.13.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
|
| 1567 |
-
"model.layers.13.mlp.experts.64.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1568 |
-
"model.layers.13.mlp.experts.64.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1569 |
-
"model.layers.13.mlp.experts.64.gate_proj.weight": "model-00003-of-00009.safetensors",
|
| 1570 |
"model.layers.13.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1571 |
"model.layers.13.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1572 |
"model.layers.13.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
@@ -1644,9 +1623,6 @@
|
|
| 1644 |
"model.layers.18.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1645 |
"model.layers.18.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1646 |
"model.layers.18.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
|
| 1647 |
-
"model.layers.18.mlp.experts.64.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1648 |
-
"model.layers.18.mlp.experts.64.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1649 |
-
"model.layers.18.mlp.experts.64.gate_proj.weight": "model-00003-of-00009.safetensors",
|
| 1650 |
"model.layers.18.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1651 |
"model.layers.18.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1652 |
"model.layers.18.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
@@ -2003,9 +1979,6 @@
|
|
| 2003 |
"model.layers.17.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2004 |
"model.layers.17.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2005 |
"model.layers.17.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
|
| 2006 |
-
"model.layers.17.mlp.experts.64.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2007 |
-
"model.layers.17.mlp.experts.64.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2008 |
-
"model.layers.17.mlp.experts.64.gate_proj.weight": "model-00004-of-00009.safetensors",
|
| 2009 |
"model.layers.17.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2010 |
"model.layers.17.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2011 |
"model.layers.17.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
@@ -2233,9 +2206,6 @@
|
|
| 2233 |
"model.layers.27.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2234 |
"model.layers.27.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2235 |
"model.layers.27.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
|
| 2236 |
-
"model.layers.27.mlp.experts.64.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2237 |
-
"model.layers.27.mlp.experts.64.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2238 |
-
"model.layers.27.mlp.experts.64.gate_proj.weight": "model-00004-of-00009.safetensors",
|
| 2239 |
"model.layers.27.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2240 |
"model.layers.27.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2241 |
"model.layers.27.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
@@ -2437,9 +2407,6 @@
|
|
| 2437 |
"model.layers.9.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2438 |
"model.layers.9.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2439 |
"model.layers.9.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
|
| 2440 |
-
"model.layers.9.mlp.experts.64.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2441 |
-
"model.layers.9.mlp.experts.64.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2442 |
-
"model.layers.9.mlp.experts.64.gate_proj.weight": "model-00004-of-00009.safetensors",
|
| 2443 |
"model.layers.9.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2444 |
"model.layers.9.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2445 |
"model.layers.9.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
@@ -2647,9 +2614,6 @@
|
|
| 2647 |
"model.layers.22.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2648 |
"model.layers.22.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2649 |
"model.layers.22.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 2650 |
-
"model.layers.22.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2651 |
-
"model.layers.22.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2652 |
-
"model.layers.22.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 2653 |
"model.layers.22.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2654 |
"model.layers.22.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2655 |
"model.layers.22.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
@@ -2847,9 +2811,6 @@
|
|
| 2847 |
"model.layers.24.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2848 |
"model.layers.24.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2849 |
"model.layers.24.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 2850 |
-
"model.layers.24.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2851 |
-
"model.layers.24.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2852 |
-
"model.layers.24.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 2853 |
"model.layers.24.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2854 |
"model.layers.24.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2855 |
"model.layers.24.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
@@ -2876,9 +2837,6 @@
|
|
| 2876 |
"model.layers.26.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2877 |
"model.layers.26.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2878 |
"model.layers.26.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 2879 |
-
"model.layers.26.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2880 |
-
"model.layers.26.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2881 |
-
"model.layers.26.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 2882 |
"model.layers.26.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2883 |
"model.layers.26.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2884 |
"model.layers.26.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
@@ -3080,9 +3038,6 @@
|
|
| 3080 |
"model.layers.6.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 3081 |
"model.layers.6.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 3082 |
"model.layers.6.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 3083 |
-
"model.layers.6.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 3084 |
-
"model.layers.6.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 3085 |
-
"model.layers.6.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
|
| 3086 |
"model.layers.6.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 3087 |
"model.layers.6.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 3088 |
"model.layers.6.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
@@ -3292,9 +3247,6 @@
|
|
| 3292 |
"model.layers.1.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3293 |
"model.layers.1.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3294 |
"model.layers.1.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
|
| 3295 |
-
"model.layers.1.mlp.experts.64.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3296 |
-
"model.layers.1.mlp.experts.64.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3297 |
-
"model.layers.1.mlp.experts.64.gate_proj.weight": "model-00006-of-00009.safetensors",
|
| 3298 |
"model.layers.1.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3299 |
"model.layers.1.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3300 |
"model.layers.1.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
@@ -3496,9 +3448,6 @@
|
|
| 3496 |
"model.layers.16.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3497 |
"model.layers.16.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3498 |
"model.layers.16.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
|
| 3499 |
-
"model.layers.16.mlp.experts.64.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3500 |
-
"model.layers.16.mlp.experts.64.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3501 |
-
"model.layers.16.mlp.experts.64.gate_proj.weight": "model-00006-of-00009.safetensors",
|
| 3502 |
"model.layers.16.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3503 |
"model.layers.16.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3504 |
"model.layers.16.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
@@ -3700,9 +3649,6 @@
|
|
| 3700 |
"model.layers.2.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3701 |
"model.layers.2.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3702 |
"model.layers.2.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
|
| 3703 |
-
"model.layers.2.mlp.experts.64.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3704 |
-
"model.layers.2.mlp.experts.64.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3705 |
-
"model.layers.2.mlp.experts.64.gate_proj.weight": "model-00006-of-00009.safetensors",
|
| 3706 |
"model.layers.2.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3707 |
"model.layers.2.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3708 |
"model.layers.2.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
@@ -3937,9 +3883,6 @@
|
|
| 3937 |
"model.layers.12.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 3938 |
"model.layers.12.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 3939 |
"model.layers.12.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
|
| 3940 |
-
"model.layers.12.mlp.experts.64.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 3941 |
-
"model.layers.12.mlp.experts.64.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 3942 |
-
"model.layers.12.mlp.experts.64.gate_proj.weight": "model-00007-of-00009.safetensors",
|
| 3943 |
"model.layers.12.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 3944 |
"model.layers.12.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 3945 |
"model.layers.12.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
@@ -4118,9 +4061,6 @@
|
|
| 4118 |
"model.layers.21.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4119 |
"model.layers.21.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4120 |
"model.layers.21.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
|
| 4121 |
-
"model.layers.21.mlp.experts.64.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4122 |
-
"model.layers.21.mlp.experts.64.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4123 |
-
"model.layers.21.mlp.experts.64.gate_proj.weight": "model-00007-of-00009.safetensors",
|
| 4124 |
"model.layers.21.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4125 |
"model.layers.21.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4126 |
"model.layers.21.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
@@ -4371,9 +4311,6 @@
|
|
| 4371 |
"model.layers.7.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4372 |
"model.layers.7.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4373 |
"model.layers.7.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
|
| 4374 |
-
"model.layers.7.mlp.experts.64.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4375 |
-
"model.layers.7.mlp.experts.64.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4376 |
-
"model.layers.7.mlp.experts.64.gate_proj.weight": "model-00007-of-00009.safetensors",
|
| 4377 |
"model.layers.7.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4378 |
"model.layers.7.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4379 |
"model.layers.7.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
@@ -4581,9 +4518,6 @@
|
|
| 4581 |
"model.layers.10.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4582 |
"model.layers.10.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4583 |
"model.layers.10.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
|
| 4584 |
-
"model.layers.10.mlp.experts.64.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4585 |
-
"model.layers.10.mlp.experts.64.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4586 |
-
"model.layers.10.mlp.experts.64.gate_proj.weight": "model-00008-of-00009.safetensors",
|
| 4587 |
"model.layers.10.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4588 |
"model.layers.10.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4589 |
"model.layers.10.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
@@ -4859,9 +4793,6 @@
|
|
| 4859 |
"model.layers.23.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4860 |
"model.layers.23.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4861 |
"model.layers.23.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
|
| 4862 |
-
"model.layers.23.mlp.experts.64.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4863 |
-
"model.layers.23.mlp.experts.64.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4864 |
-
"model.layers.23.mlp.experts.64.gate_proj.weight": "model-00008-of-00009.safetensors",
|
| 4865 |
"model.layers.23.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4866 |
"model.layers.23.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4867 |
"model.layers.23.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
@@ -5014,9 +4945,6 @@
|
|
| 5014 |
"model.layers.5.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 5015 |
"model.layers.5.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 5016 |
"model.layers.5.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
|
| 5017 |
-
"model.layers.5.mlp.experts.64.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 5018 |
-
"model.layers.5.mlp.experts.64.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 5019 |
-
"model.layers.5.mlp.experts.64.gate_proj.weight": "model-00008-of-00009.safetensors",
|
| 5020 |
"model.layers.5.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 5021 |
"model.layers.5.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 5022 |
"model.layers.5.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
@@ -5148,9 +5076,6 @@
|
|
| 5148 |
"model.layers.14.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5149 |
"model.layers.14.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5150 |
"model.layers.14.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
|
| 5151 |
-
"model.layers.14.mlp.experts.64.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5152 |
-
"model.layers.14.mlp.experts.64.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5153 |
-
"model.layers.14.mlp.experts.64.gate_proj.weight": "model-00009-of-00009.safetensors",
|
| 5154 |
"model.layers.14.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5155 |
"model.layers.14.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5156 |
"model.layers.14.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
@@ -5352,9 +5277,6 @@
|
|
| 5352 |
"model.layers.25.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5353 |
"model.layers.25.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5354 |
"model.layers.25.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
|
| 5355 |
-
"model.layers.25.mlp.experts.64.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5356 |
-
"model.layers.25.mlp.experts.64.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5357 |
-
"model.layers.25.mlp.experts.64.gate_proj.weight": "model-00009-of-00009.safetensors",
|
| 5358 |
"model.layers.25.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5359 |
"model.layers.25.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5360 |
"model.layers.25.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
@@ -5556,9 +5478,6 @@
|
|
| 5556 |
"model.layers.3.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5557 |
"model.layers.3.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5558 |
"model.layers.3.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
|
| 5559 |
-
"model.layers.3.mlp.experts.64.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5560 |
-
"model.layers.3.mlp.experts.64.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5561 |
-
"model.layers.3.mlp.experts.64.gate_proj.weight": "model-00009-of-00009.safetensors",
|
| 5562 |
"model.layers.3.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5563 |
"model.layers.3.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5564 |
"model.layers.3.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
|
|
| 1 |
{
|
| 2 |
"metadata": {
|
| 3 |
+
"total_size": 43659726592
|
| 4 |
},
|
| 5 |
"weight_map": {
|
| 6 |
"model.layers.15.mlp.gate.weight": "model-00001-of-00009.safetensors",
|
|
|
|
| 203 |
"model.layers.15.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 204 |
"model.layers.15.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 205 |
"model.layers.15.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 206 |
"model.layers.15.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 207 |
"model.layers.15.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 208 |
"model.layers.15.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
|
|
|
|
| 404 |
"model.layers.20.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 405 |
"model.layers.20.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 406 |
"model.layers.20.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 407 |
"model.layers.20.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
|
| 408 |
"model.layers.20.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
|
| 409 |
"model.layers.20.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
|
|
|
|
| 834 |
"model.layers.19.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 835 |
"model.layers.19.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 836 |
"model.layers.19.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 837 |
"model.layers.19.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 838 |
"model.layers.19.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 839 |
"model.layers.19.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
|
|
| 1035 |
"model.layers.4.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1036 |
"model.layers.4.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1037 |
"model.layers.4.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 1038 |
"model.layers.4.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1039 |
"model.layers.4.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1040 |
"model.layers.4.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
|
|
| 1138 |
"model.layers.8.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1139 |
"model.layers.8.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1140 |
"model.layers.8.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 1141 |
"model.layers.8.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
|
| 1142 |
"model.layers.8.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
|
| 1143 |
"model.layers.8.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
|
|
|
|
| 1345 |
"model.layers.11.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1346 |
"model.layers.11.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1347 |
"model.layers.11.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 1348 |
"model.layers.11.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1349 |
"model.layers.11.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1350 |
"model.layers.11.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
|
|
| 1546 |
"model.layers.13.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1547 |
"model.layers.13.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1548 |
"model.layers.13.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 1549 |
"model.layers.13.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1550 |
"model.layers.13.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1551 |
"model.layers.13.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
|
|
| 1623 |
"model.layers.18.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1624 |
"model.layers.18.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1625 |
"model.layers.18.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 1626 |
"model.layers.18.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
|
| 1627 |
"model.layers.18.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
|
| 1628 |
"model.layers.18.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
|
|
|
|
| 1979 |
"model.layers.17.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 1980 |
"model.layers.17.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 1981 |
"model.layers.17.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 1982 |
"model.layers.17.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 1983 |
"model.layers.17.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 1984 |
"model.layers.17.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
|
|
| 2206 |
"model.layers.27.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2207 |
"model.layers.27.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2208 |
"model.layers.27.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 2209 |
"model.layers.27.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2210 |
"model.layers.27.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2211 |
"model.layers.27.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
|
|
| 2407 |
"model.layers.9.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2408 |
"model.layers.9.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2409 |
"model.layers.9.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 2410 |
"model.layers.9.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
|
| 2411 |
"model.layers.9.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
|
| 2412 |
"model.layers.9.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
|
|
|
|
| 2614 |
"model.layers.22.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2615 |
"model.layers.22.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2616 |
"model.layers.22.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 2617 |
"model.layers.22.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2618 |
"model.layers.22.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2619 |
"model.layers.22.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
| 2811 |
"model.layers.24.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2812 |
"model.layers.24.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2813 |
"model.layers.24.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 2814 |
"model.layers.24.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2815 |
"model.layers.24.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2816 |
"model.layers.24.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
| 2837 |
"model.layers.26.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2838 |
"model.layers.26.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2839 |
"model.layers.26.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 2840 |
"model.layers.26.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 2841 |
"model.layers.26.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 2842 |
"model.layers.26.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
| 3038 |
"model.layers.6.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 3039 |
"model.layers.6.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 3040 |
"model.layers.6.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 3041 |
"model.layers.6.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
|
| 3042 |
"model.layers.6.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
|
| 3043 |
"model.layers.6.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
|
|
|
|
| 3247 |
"model.layers.1.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3248 |
"model.layers.1.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3249 |
"model.layers.1.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 3250 |
"model.layers.1.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3251 |
"model.layers.1.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3252 |
"model.layers.1.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
|
|
| 3448 |
"model.layers.16.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3449 |
"model.layers.16.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3450 |
"model.layers.16.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 3451 |
"model.layers.16.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3452 |
"model.layers.16.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3453 |
"model.layers.16.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
|
|
| 3649 |
"model.layers.2.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3650 |
"model.layers.2.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3651 |
"model.layers.2.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 3652 |
"model.layers.2.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
|
| 3653 |
"model.layers.2.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
|
| 3654 |
"model.layers.2.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
|
|
|
|
| 3883 |
"model.layers.12.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 3884 |
"model.layers.12.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 3885 |
"model.layers.12.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 3886 |
"model.layers.12.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 3887 |
"model.layers.12.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 3888 |
"model.layers.12.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
|
|
| 4061 |
"model.layers.21.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4062 |
"model.layers.21.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4063 |
"model.layers.21.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 4064 |
"model.layers.21.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4065 |
"model.layers.21.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4066 |
"model.layers.21.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
|
|
| 4311 |
"model.layers.7.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4312 |
"model.layers.7.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4313 |
"model.layers.7.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 4314 |
"model.layers.7.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
|
| 4315 |
"model.layers.7.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
|
| 4316 |
"model.layers.7.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
|
|
|
|
| 4518 |
"model.layers.10.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4519 |
"model.layers.10.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4520 |
"model.layers.10.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 4521 |
"model.layers.10.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4522 |
"model.layers.10.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4523 |
"model.layers.10.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
|
|
| 4793 |
"model.layers.23.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4794 |
"model.layers.23.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4795 |
"model.layers.23.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 4796 |
"model.layers.23.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4797 |
"model.layers.23.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4798 |
"model.layers.23.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
|
|
| 4945 |
"model.layers.5.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4946 |
"model.layers.5.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4947 |
"model.layers.5.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 4948 |
"model.layers.5.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
|
| 4949 |
"model.layers.5.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
|
| 4950 |
"model.layers.5.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
|
|
|
|
| 5076 |
"model.layers.14.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5077 |
"model.layers.14.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5078 |
"model.layers.14.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 5079 |
"model.layers.14.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5080 |
"model.layers.14.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5081 |
"model.layers.14.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
|
|
| 5277 |
"model.layers.25.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5278 |
"model.layers.25.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5279 |
"model.layers.25.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 5280 |
"model.layers.25.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5281 |
"model.layers.25.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5282 |
"model.layers.25.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
|
|
| 5478 |
"model.layers.3.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5479 |
"model.layers.3.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5480 |
"model.layers.3.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
|
|
|
|
|
|
|
|
|
|
| 5481 |
"model.layers.3.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
|
| 5482 |
"model.layers.3.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
|
| 5483 |
"model.layers.3.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
|