clowman's picture
Upload folder using huggingface_hub
d6526e0 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.00572,0.01000,1.223
0,self_attn.v_proj,0.00005,0.01000,0.782
0,self_attn.q_proj,0.00837,0.01000,0.766
0,self_attn.o_proj,0.00000,0.01000,0.863
0,mlp.up_proj,0.00385,0.01000,0.919
0,mlp.gate_proj,0.00464,0.01000,0.759
0,mlp.down_proj,0.00002,0.01000,3.434
1,self_attn.k_proj,0.00399,0.01000,0.960
1,self_attn.v_proj,0.00016,0.01000,0.750
1,self_attn.q_proj,0.00714,0.01000,0.748
1,self_attn.o_proj,0.00001,0.01000,0.862
1,mlp.up_proj,0.00687,0.01000,0.916
1,mlp.gate_proj,0.00809,0.01000,0.761
1,mlp.down_proj,0.00025,0.01000,3.395
2,self_attn.k_proj,0.01956,0.01000,1.261
2,self_attn.v_proj,0.00085,0.01000,0.769
2,self_attn.q_proj,0.02965,0.01000,0.742
2,self_attn.o_proj,0.00002,0.01000,1.119
2,mlp.up_proj,0.01129,0.01000,0.915
2,mlp.gate_proj,0.01405,0.01000,0.744
2,mlp.down_proj,0.00008,0.01000,3.630
3,self_attn.k_proj,0.01597,0.01000,1.073
3,self_attn.v_proj,0.00146,0.01000,0.742
3,self_attn.q_proj,0.02837,0.01000,0.745
3,self_attn.o_proj,0.00003,0.01000,0.958
3,mlp.up_proj,0.01511,0.01000,0.924
3,mlp.gate_proj,0.02157,0.01000,0.766
3,mlp.down_proj,0.00014,0.01000,3.348
4,self_attn.k_proj,0.01460,0.01000,1.009
4,self_attn.v_proj,0.00140,0.01000,0.748
4,self_attn.q_proj,0.02542,0.01000,0.736
4,self_attn.o_proj,0.00008,0.01000,0.862
4,mlp.up_proj,0.01951,0.01000,0.905
4,mlp.gate_proj,0.03157,0.01000,0.750
4,mlp.down_proj,0.00025,0.01000,3.404
5,self_attn.k_proj,0.02427,0.01000,0.952
5,self_attn.v_proj,0.00142,0.01000,0.748
5,self_attn.q_proj,0.03766,0.01000,0.744
5,self_attn.o_proj,0.00010,0.01000,0.869
5,mlp.up_proj,0.02402,0.01000,0.937
5,mlp.gate_proj,0.03846,0.01000,0.758
5,mlp.down_proj,0.00036,0.01000,3.414
6,self_attn.k_proj,0.01964,0.01000,0.958
6,self_attn.v_proj,0.00161,0.01000,0.736
6,self_attn.q_proj,0.03495,0.01000,0.732
6,self_attn.o_proj,0.00016,0.01000,0.866
6,mlp.up_proj,0.02682,0.01000,0.966
6,mlp.gate_proj,0.04351,0.01000,0.805
6,mlp.down_proj,0.00046,0.01000,3.437
7,self_attn.k_proj,0.02019,0.01000,0.976
7,self_attn.v_proj,0.00174,0.01000,0.772
7,self_attn.q_proj,0.03369,0.01000,0.747
7,self_attn.o_proj,0.00024,0.01000,0.909
7,mlp.up_proj,0.03001,0.01000,0.915
7,mlp.gate_proj,0.04555,0.01000,0.804
7,mlp.down_proj,0.00056,0.01000,3.453
8,self_attn.k_proj,0.02674,0.01000,0.966
8,self_attn.v_proj,0.00239,0.01000,0.752
8,self_attn.q_proj,0.04336,0.01000,0.750
8,self_attn.o_proj,0.00034,0.01000,0.867
8,mlp.up_proj,0.03200,0.01000,0.926
8,mlp.gate_proj,0.04926,0.01000,0.756
8,mlp.down_proj,0.00061,0.01000,3.452
9,self_attn.k_proj,0.02576,0.01000,0.979
9,self_attn.v_proj,0.00334,0.01000,0.761
9,self_attn.q_proj,0.04328,0.01000,0.745
9,self_attn.o_proj,0.00042,0.01000,0.864
9,mlp.up_proj,0.03358,0.01000,0.914
9,mlp.gate_proj,0.05205,0.01000,0.755
9,mlp.down_proj,0.00065,0.01000,3.550
10,self_attn.k_proj,0.03109,0.01000,0.957
10,self_attn.v_proj,0.00260,0.01000,0.748
10,self_attn.q_proj,0.05052,0.01000,0.742
10,self_attn.o_proj,0.00038,0.01000,0.858
10,mlp.up_proj,0.03457,0.01000,0.912
10,mlp.gate_proj,0.04996,0.01000,0.752
10,mlp.down_proj,0.00068,0.01000,3.401
11,self_attn.k_proj,0.02801,0.01000,0.954
11,self_attn.v_proj,0.00261,0.01000,0.747
11,self_attn.q_proj,0.04387,0.01000,0.758
11,self_attn.o_proj,0.00040,0.01000,0.872
11,mlp.up_proj,0.03638,0.01000,0.918
11,mlp.gate_proj,0.05101,0.01000,0.781
11,mlp.down_proj,0.00073,0.01000,3.456
12,self_attn.k_proj,0.02175,0.01000,0.953
12,self_attn.v_proj,0.00309,0.01000,0.781
12,self_attn.q_proj,0.03811,0.01000,0.760
12,self_attn.o_proj,0.00047,0.01000,0.889
12,mlp.up_proj,0.03778,0.01000,0.916
12,mlp.gate_proj,0.05012,0.01000,0.780
12,mlp.down_proj,0.00083,0.01000,3.414
13,self_attn.k_proj,0.03227,0.01000,0.955
13,self_attn.v_proj,0.00338,0.01000,0.746
13,self_attn.q_proj,0.04979,0.01000,0.748
13,self_attn.o_proj,0.00058,0.01000,0.866
13,mlp.up_proj,0.04061,0.01000,0.915
13,mlp.gate_proj,0.05386,0.01000,0.753
13,mlp.down_proj,0.00096,0.01000,3.451
14,self_attn.k_proj,0.03492,0.01000,0.955
14,self_attn.v_proj,0.00362,0.01000,0.751
14,self_attn.q_proj,0.05149,0.01000,0.763
14,self_attn.o_proj,0.00068,0.01000,0.867
14,mlp.up_proj,0.04541,0.01000,0.916
14,mlp.gate_proj,0.06339,0.01000,0.753
14,mlp.down_proj,0.00120,0.01000,3.400
15,self_attn.k_proj,0.03256,0.01000,1.044
15,self_attn.v_proj,0.00452,0.01000,0.746
15,self_attn.q_proj,0.06113,0.01000,0.745
15,self_attn.o_proj,0.00075,0.01000,0.866
15,mlp.up_proj,0.04829,0.01000,1.117
15,mlp.gate_proj,0.07109,0.01000,0.948
15,mlp.down_proj,0.00144,0.01000,4.163
16,self_attn.k_proj,0.03448,0.01000,0.972
16,self_attn.v_proj,0.00408,0.01000,0.761
16,self_attn.q_proj,0.05693,0.01000,0.757
16,self_attn.o_proj,0.00059,0.01000,0.884
16,mlp.up_proj,0.05158,0.01000,0.942
16,mlp.gate_proj,0.08038,0.01000,0.771
16,mlp.down_proj,0.00155,0.01000,4.371
17,self_attn.k_proj,0.03758,0.01000,1.024
17,self_attn.v_proj,0.00455,0.01000,0.806
17,self_attn.q_proj,0.06028,0.01000,1.121
17,self_attn.o_proj,0.00050,0.01000,0.956
17,mlp.up_proj,0.05369,0.01000,1.232
17,mlp.gate_proj,0.08562,0.01000,1.101
17,mlp.down_proj,0.00176,0.01000,4.635
18,self_attn.k_proj,0.04196,0.01000,1.283
18,self_attn.v_proj,0.00469,0.01000,1.056
18,self_attn.q_proj,0.06148,0.01000,1.039
18,self_attn.o_proj,0.00034,0.01000,1.306
18,mlp.up_proj,0.05583,0.01000,1.184
18,mlp.gate_proj,0.09008,0.01000,1.041
18,mlp.down_proj,0.00172,0.01000,4.425
19,self_attn.k_proj,0.03756,0.01000,1.218
19,self_attn.v_proj,0.00505,0.01000,1.130
19,self_attn.q_proj,0.06241,0.01000,1.039
19,self_attn.o_proj,0.00031,0.01000,1.175
19,mlp.up_proj,0.05776,0.01000,1.240
19,mlp.gate_proj,0.09495,0.01000,1.135
19,mlp.down_proj,0.00182,0.01000,4.239
20,self_attn.k_proj,0.04167,0.01000,0.956
20,self_attn.v_proj,0.00561,0.01000,0.751
20,self_attn.q_proj,0.06523,0.01000,0.820
20,self_attn.o_proj,0.00040,0.01000,0.871
20,mlp.up_proj,0.06277,0.01000,0.924
20,mlp.gate_proj,0.10218,0.01000,0.759
20,mlp.down_proj,0.00201,0.01000,3.710
21,self_attn.k_proj,0.04118,0.01000,1.101
21,self_attn.v_proj,0.00618,0.01000,0.750
21,self_attn.q_proj,0.06289,0.01000,0.754
21,self_attn.o_proj,0.00045,0.01000,1.036
21,mlp.up_proj,0.06714,0.01000,1.057
21,mlp.gate_proj,0.11034,0.01000,0.902
21,mlp.down_proj,0.00234,0.01000,3.546
22,self_attn.k_proj,0.04402,0.01000,0.952
22,self_attn.v_proj,0.00732,0.01000,0.752
22,self_attn.q_proj,0.06415,0.01000,0.750
22,self_attn.o_proj,0.00046,0.01000,0.860
22,mlp.up_proj,0.07031,0.01000,0.923
22,mlp.gate_proj,0.11440,0.01000,0.757
22,mlp.down_proj,0.00240,0.01000,3.389
23,self_attn.k_proj,0.04254,0.01000,0.951
23,self_attn.v_proj,0.00793,0.01000,0.750
23,self_attn.q_proj,0.06684,0.01000,0.748
23,self_attn.o_proj,0.00035,0.01000,0.866
23,mlp.up_proj,0.07450,0.01000,0.917
23,mlp.gate_proj,0.12051,0.01000,0.753
23,mlp.down_proj,0.00254,0.01000,3.421
24,self_attn.k_proj,0.04258,0.01000,0.993
24,self_attn.v_proj,0.01002,0.01000,0.733
24,self_attn.q_proj,0.06728,0.01000,0.732
24,self_attn.o_proj,0.00044,0.01000,0.889
24,mlp.up_proj,0.07882,0.01000,0.915
24,mlp.gate_proj,0.12752,0.01000,0.755
24,mlp.down_proj,0.00270,0.01000,3.431
25,self_attn.k_proj,0.03998,0.01000,0.981
25,self_attn.v_proj,0.01046,0.01000,0.770
25,self_attn.q_proj,0.06746,0.01000,0.751
25,self_attn.o_proj,0.00044,0.01000,0.889
25,mlp.up_proj,0.08398,0.01000,0.910
25,mlp.gate_proj,0.13579,0.01000,0.752
25,mlp.down_proj,0.00297,0.01000,3.426
26,self_attn.k_proj,0.04234,0.01000,0.951
26,self_attn.v_proj,0.00950,0.01000,0.742
26,self_attn.q_proj,0.06494,0.01000,0.742
26,self_attn.o_proj,0.00066,0.01000,0.877
26,mlp.up_proj,0.08960,0.01000,0.917
26,mlp.gate_proj,0.14520,0.01000,0.755
26,mlp.down_proj,0.00334,0.01000,3.387
27,self_attn.k_proj,0.04629,0.01000,0.948
27,self_attn.v_proj,0.01406,0.01000,0.744
27,self_attn.q_proj,0.06788,0.01000,0.744
27,self_attn.o_proj,0.00078,0.01000,0.862
27,mlp.up_proj,0.09763,0.01000,0.934
27,mlp.gate_proj,0.15711,0.01000,0.776
27,mlp.down_proj,0.00393,0.01000,3.412
28,self_attn.k_proj,0.03655,0.01000,0.966
28,self_attn.v_proj,0.01233,0.01000,0.750
28,self_attn.q_proj,0.06297,0.01000,0.743
28,self_attn.o_proj,0.00146,0.01000,0.874
28,mlp.up_proj,0.10832,0.01000,0.983
28,mlp.gate_proj,0.16666,0.01000,0.768
28,mlp.down_proj,0.00508,0.01000,3.436
29,self_attn.k_proj,0.03799,0.01000,0.946
29,self_attn.v_proj,0.01470,0.01000,0.748
29,self_attn.q_proj,0.06669,0.01000,0.748
29,self_attn.o_proj,0.00120,0.01000,0.872
29,mlp.up_proj,0.11543,0.01000,0.915
29,mlp.gate_proj,0.16996,0.01000,0.752
29,mlp.down_proj,0.00667,0.01000,3.694
30,self_attn.k_proj,0.03873,0.01000,1.102
30,self_attn.v_proj,0.02061,0.01000,0.752
30,self_attn.q_proj,0.06170,0.01000,0.754
30,self_attn.o_proj,0.00225,0.01000,0.871
30,mlp.up_proj,0.12185,0.01000,0.926
30,mlp.gate_proj,0.18361,0.01000,0.766
30,mlp.down_proj,0.01061,0.01000,3.467
31,self_attn.k_proj,0.02776,0.01000,0.957
31,self_attn.v_proj,0.01209,0.01000,0.749
31,self_attn.q_proj,0.05268,0.01000,0.754
31,self_attn.o_proj,0.00419,0.01000,0.871
31,mlp.up_proj,0.11449,0.01000,0.919
31,mlp.gate_proj,0.16690,0.01000,0.761
31,mlp.down_proj,0.02763,0.01000,3.674