liaojc commited on
Commit
ccf7bd1
·
verified ·
1 Parent(s): 7053045

Upload folder using huggingface_hub

Browse files
model-00001-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dfd3960c50edbe96d7a2821636476d9dbcd28cb98a548fbf807ea341c497831f
3
- size 4707557616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d418a84d3f217a392b8be61a52b2709ebdb2e742e0a4d71f2cc5556758365cf2
3
+ size 4691828232
model-00002-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c39b70baff7c022dd9fbb23a23b4fff939264c991188c4e2125fd92a6402f7c9
3
- size 4995920616
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:13218b59621b3bd998143d97e2454fce9005e972fb650a9e8e41d2ae5ed9e603
3
+ size 4972326544
model-00003-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed1f016ca5954c1de2ca7f4eff6cd6cb72491963bffd0ab867fccb50bc3c1147
3
- size 4988056488
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e57fb00719ba2816dcb7099eefc47b52b138923ba21e1525a21997ccce6f54e4
3
+ size 4964462408
model-00004-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2503408d79a9eb1078250d73fd54cfab7029b95c76cf8e5cca92d3ca08823e62
3
- size 4995920728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9ff45e48754f8ed7f2617d7618a107ef906a678eb60af70c78401c6a6545d9c
3
+ size 4972326648
model-00005-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4f395f9c314ccb60cbfe052a8b3576515802e40769b3c9918cb609caecb55169
3
- size 4988061400
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d721b5ce36d91d06cae02e0b01fc08ea984c4dc739d4d4814a2eac8354d5cf0c
3
+ size 4956602632
model-00006-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94be392cde6b5cb00171f428a6c5e13ffb83c92a6ad766dedc9daa6c31e8e8cb
3
- size 4996581560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15bbba410e206d7091385c8d5d44e5c62486c6ad06ab5f71ac257c07f6fa2a84
3
+ size 4972987488
model-00007-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c6c2b24dfd4f10f4830473da040176a704b9ac0d809e927adf31180e447ccc37
3
- size 4995920672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81d39a1f2b14fe875436acf8bd4585dcfb1c293cc898c0f3406720471fedca8c
3
+ size 4972326600
model-00008-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6a3be133d4cd089a4ee185e316c69dc761e4642e952f2a73e616a240a1e34135
3
- size 4988056336
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cc900ee1edd9b2b1ab3c67aeaab02952d2293e7af5ce097e97e0c592939105f3
3
+ size 4964462256
model-00009-of-00009.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e7c23cd1f8709147fbcdd4d88ecd46b79ef7b2d8958571f92666706c3de7867e
3
- size 4216679584
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a42af40a048dc16eb4959e76ae225923d5d315c633a158f40f0168eddb26a378
3
+ size 4193085520
model.safetensors.index.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
  "metadata": {
3
- "total_size": 43872063232
4
  },
5
  "weight_map": {
6
  "model.layers.15.mlp.gate.weight": "model-00001-of-00009.safetensors",
@@ -203,9 +203,6 @@
203
  "model.layers.15.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
204
  "model.layers.15.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
205
  "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
206
- "model.layers.15.mlp.experts.64.down_proj.weight": "model-00001-of-00009.safetensors",
207
- "model.layers.15.mlp.experts.64.up_proj.weight": "model-00001-of-00009.safetensors",
208
- "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00001-of-00009.safetensors",
209
  "model.layers.15.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
210
  "model.layers.15.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
211
  "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
@@ -407,9 +404,6 @@
407
  "model.layers.20.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
408
  "model.layers.20.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
409
  "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
410
- "model.layers.20.mlp.experts.64.down_proj.weight": "model-00001-of-00009.safetensors",
411
- "model.layers.20.mlp.experts.64.up_proj.weight": "model-00001-of-00009.safetensors",
412
- "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00001-of-00009.safetensors",
413
  "model.layers.20.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
414
  "model.layers.20.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
415
  "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
@@ -840,9 +834,6 @@
840
  "model.layers.19.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
841
  "model.layers.19.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
842
  "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
843
- "model.layers.19.mlp.experts.64.down_proj.weight": "model-00002-of-00009.safetensors",
844
- "model.layers.19.mlp.experts.64.up_proj.weight": "model-00002-of-00009.safetensors",
845
- "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00002-of-00009.safetensors",
846
  "model.layers.19.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
847
  "model.layers.19.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
848
  "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
@@ -1044,9 +1035,6 @@
1044
  "model.layers.4.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
1045
  "model.layers.4.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
1046
  "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
1047
- "model.layers.4.mlp.experts.64.down_proj.weight": "model-00002-of-00009.safetensors",
1048
- "model.layers.4.mlp.experts.64.up_proj.weight": "model-00002-of-00009.safetensors",
1049
- "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00002-of-00009.safetensors",
1050
  "model.layers.4.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
1051
  "model.layers.4.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
1052
  "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
@@ -1150,9 +1138,6 @@
1150
  "model.layers.8.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
1151
  "model.layers.8.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
1152
  "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
1153
- "model.layers.8.mlp.experts.64.down_proj.weight": "model-00002-of-00009.safetensors",
1154
- "model.layers.8.mlp.experts.64.up_proj.weight": "model-00002-of-00009.safetensors",
1155
- "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00002-of-00009.safetensors",
1156
  "model.layers.8.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
1157
  "model.layers.8.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
1158
  "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
@@ -1360,9 +1345,6 @@
1360
  "model.layers.11.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
1361
  "model.layers.11.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
1362
  "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
1363
- "model.layers.11.mlp.experts.64.down_proj.weight": "model-00003-of-00009.safetensors",
1364
- "model.layers.11.mlp.experts.64.up_proj.weight": "model-00003-of-00009.safetensors",
1365
- "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00003-of-00009.safetensors",
1366
  "model.layers.11.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
1367
  "model.layers.11.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
1368
  "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
@@ -1564,9 +1546,6 @@
1564
  "model.layers.13.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
1565
  "model.layers.13.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
1566
  "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
1567
- "model.layers.13.mlp.experts.64.down_proj.weight": "model-00003-of-00009.safetensors",
1568
- "model.layers.13.mlp.experts.64.up_proj.weight": "model-00003-of-00009.safetensors",
1569
- "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00003-of-00009.safetensors",
1570
  "model.layers.13.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
1571
  "model.layers.13.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
1572
  "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
@@ -1644,9 +1623,6 @@
1644
  "model.layers.18.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
1645
  "model.layers.18.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
1646
  "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
1647
- "model.layers.18.mlp.experts.64.down_proj.weight": "model-00003-of-00009.safetensors",
1648
- "model.layers.18.mlp.experts.64.up_proj.weight": "model-00003-of-00009.safetensors",
1649
- "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00003-of-00009.safetensors",
1650
  "model.layers.18.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
1651
  "model.layers.18.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
1652
  "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
@@ -2003,9 +1979,6 @@
2003
  "model.layers.17.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
2004
  "model.layers.17.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
2005
  "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
2006
- "model.layers.17.mlp.experts.64.down_proj.weight": "model-00004-of-00009.safetensors",
2007
- "model.layers.17.mlp.experts.64.up_proj.weight": "model-00004-of-00009.safetensors",
2008
- "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00004-of-00009.safetensors",
2009
  "model.layers.17.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
2010
  "model.layers.17.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
2011
  "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
@@ -2233,9 +2206,6 @@
2233
  "model.layers.27.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
2234
  "model.layers.27.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
2235
  "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
2236
- "model.layers.27.mlp.experts.64.down_proj.weight": "model-00004-of-00009.safetensors",
2237
- "model.layers.27.mlp.experts.64.up_proj.weight": "model-00004-of-00009.safetensors",
2238
- "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00004-of-00009.safetensors",
2239
  "model.layers.27.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
2240
  "model.layers.27.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
2241
  "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
@@ -2437,9 +2407,6 @@
2437
  "model.layers.9.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
2438
  "model.layers.9.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
2439
  "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
2440
- "model.layers.9.mlp.experts.64.down_proj.weight": "model-00004-of-00009.safetensors",
2441
- "model.layers.9.mlp.experts.64.up_proj.weight": "model-00004-of-00009.safetensors",
2442
- "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00004-of-00009.safetensors",
2443
  "model.layers.9.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
2444
  "model.layers.9.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
2445
  "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
@@ -2647,9 +2614,6 @@
2647
  "model.layers.22.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
2648
  "model.layers.22.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
2649
  "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
2650
- "model.layers.22.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
2651
- "model.layers.22.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
2652
- "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
2653
  "model.layers.22.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
2654
  "model.layers.22.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
2655
  "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
@@ -2847,9 +2811,6 @@
2847
  "model.layers.24.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
2848
  "model.layers.24.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
2849
  "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
2850
- "model.layers.24.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
2851
- "model.layers.24.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
2852
- "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
2853
  "model.layers.24.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
2854
  "model.layers.24.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
2855
  "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
@@ -2876,9 +2837,6 @@
2876
  "model.layers.26.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
2877
  "model.layers.26.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
2878
  "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
2879
- "model.layers.26.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
2880
- "model.layers.26.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
2881
- "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
2882
  "model.layers.26.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
2883
  "model.layers.26.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
2884
  "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
@@ -3080,9 +3038,6 @@
3080
  "model.layers.6.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
3081
  "model.layers.6.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
3082
  "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
3083
- "model.layers.6.mlp.experts.64.down_proj.weight": "model-00005-of-00009.safetensors",
3084
- "model.layers.6.mlp.experts.64.up_proj.weight": "model-00005-of-00009.safetensors",
3085
- "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00005-of-00009.safetensors",
3086
  "model.layers.6.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
3087
  "model.layers.6.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
3088
  "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
@@ -3292,9 +3247,6 @@
3292
  "model.layers.1.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
3293
  "model.layers.1.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
3294
  "model.layers.1.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
3295
- "model.layers.1.mlp.experts.64.down_proj.weight": "model-00006-of-00009.safetensors",
3296
- "model.layers.1.mlp.experts.64.up_proj.weight": "model-00006-of-00009.safetensors",
3297
- "model.layers.1.mlp.experts.64.gate_proj.weight": "model-00006-of-00009.safetensors",
3298
  "model.layers.1.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
3299
  "model.layers.1.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
3300
  "model.layers.1.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
@@ -3496,9 +3448,6 @@
3496
  "model.layers.16.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
3497
  "model.layers.16.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
3498
  "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
3499
- "model.layers.16.mlp.experts.64.down_proj.weight": "model-00006-of-00009.safetensors",
3500
- "model.layers.16.mlp.experts.64.up_proj.weight": "model-00006-of-00009.safetensors",
3501
- "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00006-of-00009.safetensors",
3502
  "model.layers.16.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
3503
  "model.layers.16.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
3504
  "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
@@ -3700,9 +3649,6 @@
3700
  "model.layers.2.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
3701
  "model.layers.2.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
3702
  "model.layers.2.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
3703
- "model.layers.2.mlp.experts.64.down_proj.weight": "model-00006-of-00009.safetensors",
3704
- "model.layers.2.mlp.experts.64.up_proj.weight": "model-00006-of-00009.safetensors",
3705
- "model.layers.2.mlp.experts.64.gate_proj.weight": "model-00006-of-00009.safetensors",
3706
  "model.layers.2.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
3707
  "model.layers.2.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
3708
  "model.layers.2.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
@@ -3937,9 +3883,6 @@
3937
  "model.layers.12.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
3938
  "model.layers.12.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
3939
  "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
3940
- "model.layers.12.mlp.experts.64.down_proj.weight": "model-00007-of-00009.safetensors",
3941
- "model.layers.12.mlp.experts.64.up_proj.weight": "model-00007-of-00009.safetensors",
3942
- "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00007-of-00009.safetensors",
3943
  "model.layers.12.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
3944
  "model.layers.12.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
3945
  "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
@@ -4118,9 +4061,6 @@
4118
  "model.layers.21.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
4119
  "model.layers.21.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
4120
  "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
4121
- "model.layers.21.mlp.experts.64.down_proj.weight": "model-00007-of-00009.safetensors",
4122
- "model.layers.21.mlp.experts.64.up_proj.weight": "model-00007-of-00009.safetensors",
4123
- "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00007-of-00009.safetensors",
4124
  "model.layers.21.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
4125
  "model.layers.21.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
4126
  "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
@@ -4371,9 +4311,6 @@
4371
  "model.layers.7.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
4372
  "model.layers.7.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
4373
  "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
4374
- "model.layers.7.mlp.experts.64.down_proj.weight": "model-00007-of-00009.safetensors",
4375
- "model.layers.7.mlp.experts.64.up_proj.weight": "model-00007-of-00009.safetensors",
4376
- "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00007-of-00009.safetensors",
4377
  "model.layers.7.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
4378
  "model.layers.7.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
4379
  "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
@@ -4581,9 +4518,6 @@
4581
  "model.layers.10.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
4582
  "model.layers.10.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
4583
  "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
4584
- "model.layers.10.mlp.experts.64.down_proj.weight": "model-00008-of-00009.safetensors",
4585
- "model.layers.10.mlp.experts.64.up_proj.weight": "model-00008-of-00009.safetensors",
4586
- "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00008-of-00009.safetensors",
4587
  "model.layers.10.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
4588
  "model.layers.10.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
4589
  "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
@@ -4859,9 +4793,6 @@
4859
  "model.layers.23.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
4860
  "model.layers.23.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
4861
  "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
4862
- "model.layers.23.mlp.experts.64.down_proj.weight": "model-00008-of-00009.safetensors",
4863
- "model.layers.23.mlp.experts.64.up_proj.weight": "model-00008-of-00009.safetensors",
4864
- "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00008-of-00009.safetensors",
4865
  "model.layers.23.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
4866
  "model.layers.23.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
4867
  "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
@@ -5014,9 +4945,6 @@
5014
  "model.layers.5.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
5015
  "model.layers.5.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
5016
  "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
5017
- "model.layers.5.mlp.experts.64.down_proj.weight": "model-00008-of-00009.safetensors",
5018
- "model.layers.5.mlp.experts.64.up_proj.weight": "model-00008-of-00009.safetensors",
5019
- "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00008-of-00009.safetensors",
5020
  "model.layers.5.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
5021
  "model.layers.5.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
5022
  "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
@@ -5148,9 +5076,6 @@
5148
  "model.layers.14.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
5149
  "model.layers.14.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
5150
  "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
5151
- "model.layers.14.mlp.experts.64.down_proj.weight": "model-00009-of-00009.safetensors",
5152
- "model.layers.14.mlp.experts.64.up_proj.weight": "model-00009-of-00009.safetensors",
5153
- "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00009-of-00009.safetensors",
5154
  "model.layers.14.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
5155
  "model.layers.14.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
5156
  "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
@@ -5352,9 +5277,6 @@
5352
  "model.layers.25.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
5353
  "model.layers.25.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
5354
  "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
5355
- "model.layers.25.mlp.experts.64.down_proj.weight": "model-00009-of-00009.safetensors",
5356
- "model.layers.25.mlp.experts.64.up_proj.weight": "model-00009-of-00009.safetensors",
5357
- "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00009-of-00009.safetensors",
5358
  "model.layers.25.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
5359
  "model.layers.25.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
5360
  "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
@@ -5556,9 +5478,6 @@
5556
  "model.layers.3.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
5557
  "model.layers.3.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
5558
  "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
5559
- "model.layers.3.mlp.experts.64.down_proj.weight": "model-00009-of-00009.safetensors",
5560
- "model.layers.3.mlp.experts.64.up_proj.weight": "model-00009-of-00009.safetensors",
5561
- "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00009-of-00009.safetensors",
5562
  "model.layers.3.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
5563
  "model.layers.3.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
5564
  "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
 
1
  {
2
  "metadata": {
3
+ "total_size": 43659726592
4
  },
5
  "weight_map": {
6
  "model.layers.15.mlp.gate.weight": "model-00001-of-00009.safetensors",
 
203
  "model.layers.15.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
204
  "model.layers.15.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
205
  "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
 
 
 
206
  "model.layers.15.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
207
  "model.layers.15.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
208
  "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
 
404
  "model.layers.20.mlp.experts.63.down_proj.weight": "model-00001-of-00009.safetensors",
405
  "model.layers.20.mlp.experts.63.up_proj.weight": "model-00001-of-00009.safetensors",
406
  "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00001-of-00009.safetensors",
 
 
 
407
  "model.layers.20.mlp.experts.7.down_proj.weight": "model-00001-of-00009.safetensors",
408
  "model.layers.20.mlp.experts.7.up_proj.weight": "model-00001-of-00009.safetensors",
409
  "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00001-of-00009.safetensors",
 
834
  "model.layers.19.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
835
  "model.layers.19.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
836
  "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
 
 
 
837
  "model.layers.19.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
838
  "model.layers.19.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
839
  "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
 
1035
  "model.layers.4.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
1036
  "model.layers.4.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
1037
  "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
 
 
 
1038
  "model.layers.4.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
1039
  "model.layers.4.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
1040
  "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
 
1138
  "model.layers.8.mlp.experts.63.down_proj.weight": "model-00002-of-00009.safetensors",
1139
  "model.layers.8.mlp.experts.63.up_proj.weight": "model-00002-of-00009.safetensors",
1140
  "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00002-of-00009.safetensors",
 
 
 
1141
  "model.layers.8.mlp.experts.7.down_proj.weight": "model-00002-of-00009.safetensors",
1142
  "model.layers.8.mlp.experts.7.up_proj.weight": "model-00002-of-00009.safetensors",
1143
  "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00002-of-00009.safetensors",
 
1345
  "model.layers.11.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
1346
  "model.layers.11.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
1347
  "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
 
 
 
1348
  "model.layers.11.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
1349
  "model.layers.11.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
1350
  "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
 
1546
  "model.layers.13.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
1547
  "model.layers.13.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
1548
  "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
 
 
 
1549
  "model.layers.13.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
1550
  "model.layers.13.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
1551
  "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
 
1623
  "model.layers.18.mlp.experts.63.down_proj.weight": "model-00003-of-00009.safetensors",
1624
  "model.layers.18.mlp.experts.63.up_proj.weight": "model-00003-of-00009.safetensors",
1625
  "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00003-of-00009.safetensors",
 
 
 
1626
  "model.layers.18.mlp.experts.7.down_proj.weight": "model-00003-of-00009.safetensors",
1627
  "model.layers.18.mlp.experts.7.up_proj.weight": "model-00003-of-00009.safetensors",
1628
  "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00003-of-00009.safetensors",
 
1979
  "model.layers.17.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
1980
  "model.layers.17.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
1981
  "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
 
 
 
1982
  "model.layers.17.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
1983
  "model.layers.17.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
1984
  "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
 
2206
  "model.layers.27.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
2207
  "model.layers.27.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
2208
  "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
 
 
 
2209
  "model.layers.27.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
2210
  "model.layers.27.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
2211
  "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
 
2407
  "model.layers.9.mlp.experts.63.down_proj.weight": "model-00004-of-00009.safetensors",
2408
  "model.layers.9.mlp.experts.63.up_proj.weight": "model-00004-of-00009.safetensors",
2409
  "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00004-of-00009.safetensors",
 
 
 
2410
  "model.layers.9.mlp.experts.7.down_proj.weight": "model-00004-of-00009.safetensors",
2411
  "model.layers.9.mlp.experts.7.up_proj.weight": "model-00004-of-00009.safetensors",
2412
  "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00004-of-00009.safetensors",
 
2614
  "model.layers.22.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
2615
  "model.layers.22.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
2616
  "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
 
 
 
2617
  "model.layers.22.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
2618
  "model.layers.22.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
2619
  "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
 
2811
  "model.layers.24.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
2812
  "model.layers.24.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
2813
  "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
 
 
 
2814
  "model.layers.24.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
2815
  "model.layers.24.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
2816
  "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
 
2837
  "model.layers.26.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
2838
  "model.layers.26.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
2839
  "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
 
 
 
2840
  "model.layers.26.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
2841
  "model.layers.26.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
2842
  "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
 
3038
  "model.layers.6.mlp.experts.63.down_proj.weight": "model-00005-of-00009.safetensors",
3039
  "model.layers.6.mlp.experts.63.up_proj.weight": "model-00005-of-00009.safetensors",
3040
  "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00005-of-00009.safetensors",
 
 
 
3041
  "model.layers.6.mlp.experts.7.down_proj.weight": "model-00005-of-00009.safetensors",
3042
  "model.layers.6.mlp.experts.7.up_proj.weight": "model-00005-of-00009.safetensors",
3043
  "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00005-of-00009.safetensors",
 
3247
  "model.layers.1.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
3248
  "model.layers.1.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
3249
  "model.layers.1.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
 
 
 
3250
  "model.layers.1.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
3251
  "model.layers.1.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
3252
  "model.layers.1.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
 
3448
  "model.layers.16.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
3449
  "model.layers.16.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
3450
  "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
 
 
 
3451
  "model.layers.16.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
3452
  "model.layers.16.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
3453
  "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
 
3649
  "model.layers.2.mlp.experts.63.down_proj.weight": "model-00006-of-00009.safetensors",
3650
  "model.layers.2.mlp.experts.63.up_proj.weight": "model-00006-of-00009.safetensors",
3651
  "model.layers.2.mlp.experts.63.gate_proj.weight": "model-00006-of-00009.safetensors",
 
 
 
3652
  "model.layers.2.mlp.experts.7.down_proj.weight": "model-00006-of-00009.safetensors",
3653
  "model.layers.2.mlp.experts.7.up_proj.weight": "model-00006-of-00009.safetensors",
3654
  "model.layers.2.mlp.experts.7.gate_proj.weight": "model-00006-of-00009.safetensors",
 
3883
  "model.layers.12.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
3884
  "model.layers.12.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
3885
  "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
 
 
 
3886
  "model.layers.12.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
3887
  "model.layers.12.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
3888
  "model.layers.12.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
 
4061
  "model.layers.21.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
4062
  "model.layers.21.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
4063
  "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
 
 
 
4064
  "model.layers.21.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
4065
  "model.layers.21.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
4066
  "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
 
4311
  "model.layers.7.mlp.experts.63.down_proj.weight": "model-00007-of-00009.safetensors",
4312
  "model.layers.7.mlp.experts.63.up_proj.weight": "model-00007-of-00009.safetensors",
4313
  "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00007-of-00009.safetensors",
 
 
 
4314
  "model.layers.7.mlp.experts.7.down_proj.weight": "model-00007-of-00009.safetensors",
4315
  "model.layers.7.mlp.experts.7.up_proj.weight": "model-00007-of-00009.safetensors",
4316
  "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00007-of-00009.safetensors",
 
4518
  "model.layers.10.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
4519
  "model.layers.10.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
4520
  "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
 
 
 
4521
  "model.layers.10.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
4522
  "model.layers.10.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
4523
  "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
 
4793
  "model.layers.23.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
4794
  "model.layers.23.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
4795
  "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
 
 
 
4796
  "model.layers.23.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
4797
  "model.layers.23.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
4798
  "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
 
4945
  "model.layers.5.mlp.experts.63.down_proj.weight": "model-00008-of-00009.safetensors",
4946
  "model.layers.5.mlp.experts.63.up_proj.weight": "model-00008-of-00009.safetensors",
4947
  "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00008-of-00009.safetensors",
 
 
 
4948
  "model.layers.5.mlp.experts.7.down_proj.weight": "model-00008-of-00009.safetensors",
4949
  "model.layers.5.mlp.experts.7.up_proj.weight": "model-00008-of-00009.safetensors",
4950
  "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00008-of-00009.safetensors",
 
5076
  "model.layers.14.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
5077
  "model.layers.14.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
5078
  "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
 
 
 
5079
  "model.layers.14.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
5080
  "model.layers.14.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
5081
  "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
 
5277
  "model.layers.25.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
5278
  "model.layers.25.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
5279
  "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
 
 
 
5280
  "model.layers.25.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
5281
  "model.layers.25.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
5282
  "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",
 
5478
  "model.layers.3.mlp.experts.63.down_proj.weight": "model-00009-of-00009.safetensors",
5479
  "model.layers.3.mlp.experts.63.up_proj.weight": "model-00009-of-00009.safetensors",
5480
  "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00009-of-00009.safetensors",
 
 
 
5481
  "model.layers.3.mlp.experts.7.down_proj.weight": "model-00009-of-00009.safetensors",
5482
  "model.layers.3.mlp.experts.7.up_proj.weight": "model-00009-of-00009.safetensors",
5483
  "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00009-of-00009.safetensors",