| { | |
| "metadata": { | |
| "total_size": 3936644272 | |
| }, | |
| "weight_map": { | |
| "backbone.embeddings.weight": "model-00001-of-00010.safetensors", | |
| "backbone.norm_f.weight": "model-00001-of-00010.safetensors", | |
| "lm_head.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.A_log": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.D": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.dt_bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.conv1d.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.conv1d.bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.in_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.in_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.in_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.out_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.out_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.0.mixer.out_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.1.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.1.mixer.up_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.1.mixer.up_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.1.mixer.up_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.1.mixer.down_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.1.mixer.down_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.1.mixer.down_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.A_log": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.D": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.dt_bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.conv1d.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.conv1d.bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.in_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.in_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.in_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.out_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.out_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.2.mixer.out_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.3.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.3.mixer.up_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.3.mixer.up_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.3.mixer.up_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.3.mixer.down_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.3.mixer.down_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.3.mixer.down_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.A_log": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.D": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.dt_bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.conv1d.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.conv1d.bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.in_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.in_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.in_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.out_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.out_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.4.mixer.out_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.5.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.5.mixer.up_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.5.mixer.up_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.5.mixer.up_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.5.mixer.down_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.5.mixer.down_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.5.mixer.down_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.A_log": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.D": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.dt_bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.conv1d.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.conv1d.bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.in_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.in_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.in_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.out_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.out_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.6.mixer.out_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.A_log": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.D": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.dt_bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.conv1d.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.conv1d.bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.in_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.in_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.in_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.out_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.out_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.7.mixer.out_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.8.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.8.mixer.up_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.8.mixer.up_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.8.mixer.up_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.8.mixer.down_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.8.mixer.down_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.8.mixer.down_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.A_log": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.D": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.dt_bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.conv1d.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.conv1d.bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.in_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.in_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.in_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.out_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.out_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.9.mixer.out_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.10.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.10.mixer.up_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.10.mixer.up_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.10.mixer.up_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.10.mixer.down_proj.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.10.mixer.down_proj.weight_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.10.mixer.down_proj.input_scale": "model-00001-of-00010.safetensors", | |
| "backbone.layers.11.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.11.mixer.norm.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.11.mixer.A_log": "model-00001-of-00010.safetensors", | |
| "backbone.layers.11.mixer.D": "model-00001-of-00010.safetensors", | |
| "backbone.layers.11.mixer.dt_bias": "model-00001-of-00010.safetensors", | |
| "backbone.layers.11.mixer.conv1d.weight": "model-00001-of-00010.safetensors", | |
| "backbone.layers.11.mixer.conv1d.bias": "model-00001-of-00010.safetensors" | |
| } | |
| } |