File size: 9,067 Bytes
6986a6a |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 |
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.0000432854,0.05000,1.766
0,self_attn.v_proj,0.0000049972,0.05000,1.793
0,self_attn.q_proj,0.0001757931,0.05000,1.798
0,self_attn.o_proj,0.0000108898,0.05000,0.778
0,mlp.up_proj,0.0003301854,0.05000,1.146
0,mlp.gate_proj,0.0007666261,0.05000,1.183
0,mlp.down_proj,0.0000141513,0.05000,5.336
1,self_attn.k_proj,0.0000358306,0.05000,1.767
1,self_attn.q_proj,0.0001356997,0.05000,1.789
1,self_attn.v_proj,0.0000092715,0.05000,1.792
1,self_attn.o_proj,0.0000043125,0.05000,0.785
1,mlp.up_proj,0.0068297327,0.05000,1.161
1,mlp.gate_proj,0.0110956548,0.05000,1.184
1,mlp.down_proj,0.0000095164,0.05000,5.333
2,self_attn.k_proj,0.0000858678,0.05000,1.750
2,self_attn.v_proj,0.0000151014,0.05000,1.786
2,self_attn.q_proj,0.0003180285,0.05000,1.790
2,self_attn.o_proj,0.0000078531,0.05000,0.777
2,mlp.up_proj,0.0060570274,0.05000,1.143
2,mlp.gate_proj,0.0098869666,0.05000,1.177
2,mlp.down_proj,0.0000373999,0.05000,5.348
3,self_attn.k_proj,0.0000810958,0.05000,1.771
3,self_attn.q_proj,0.0003177889,0.05000,1.790
3,self_attn.v_proj,0.0000203367,0.05000,1.792
3,self_attn.o_proj,0.0000193827,0.05000,0.780
3,mlp.up_proj,0.0127348766,0.05000,1.154
3,mlp.gate_proj,0.0171400174,0.05000,1.185
3,mlp.down_proj,0.0021732034,0.05000,5.357
4,self_attn.k_proj,0.0001399196,0.05000,1.776
4,self_attn.q_proj,0.0006156289,0.05000,1.794
4,self_attn.v_proj,0.0000480736,0.05000,1.796
4,self_attn.o_proj,0.0000394140,0.05000,0.788
4,mlp.up_proj,0.0090971480,0.05000,1.153
4,mlp.gate_proj,0.0135318746,0.05000,1.185
4,mlp.down_proj,0.0023862841,0.05000,5.319
5,self_attn.k_proj,0.0001325996,0.05000,1.784
5,self_attn.q_proj,0.0006572159,0.05000,1.797
5,self_attn.v_proj,0.0000548861,0.05000,1.799
5,self_attn.o_proj,0.0000599871,0.05000,0.795
5,mlp.up_proj,0.0147371594,0.05000,1.171
5,mlp.gate_proj,0.0186996124,0.05000,1.195
5,mlp.down_proj,0.0002437168,0.05000,5.403
6,self_attn.k_proj,0.0000885772,0.05000,1.742
6,self_attn.v_proj,0.0000421790,0.05000,1.777
6,self_attn.q_proj,0.0004314109,0.05000,1.783
6,self_attn.o_proj,0.0000446818,0.05000,0.794
6,mlp.up_proj,0.0026338197,0.05000,1.157
6,mlp.gate_proj,0.0037542884,0.05000,1.188
6,mlp.down_proj,0.0000997583,0.05000,5.390
7,self_attn.k_proj,0.0000925571,0.05000,1.789
7,self_attn.q_proj,0.0005228582,0.05000,1.802
7,self_attn.v_proj,0.0000846739,0.05000,1.804
7,self_attn.o_proj,0.0000540034,0.05000,0.791
7,mlp.up_proj,0.0021272203,0.05000,1.164
7,mlp.gate_proj,0.0023616219,0.05000,1.187
7,mlp.down_proj,0.0001141313,0.05000,5.314
8,self_attn.k_proj,0.0001738771,0.05000,1.777
8,self_attn.v_proj,0.0000707547,0.05000,1.794
8,self_attn.q_proj,0.0007570342,0.05000,1.799
8,self_attn.o_proj,0.0000702879,0.05000,0.788
8,mlp.up_proj,0.0023392382,0.05000,1.160
8,mlp.gate_proj,0.0024381351,0.05000,1.184
8,mlp.down_proj,0.0001141036,0.05000,5.359
9,self_attn.k_proj,0.0001255440,0.05000,1.747
9,self_attn.v_proj,0.0001075853,0.05000,1.781
9,self_attn.q_proj,0.0006896859,0.05000,1.785
9,self_attn.o_proj,0.0000752609,0.05000,0.778
9,mlp.up_proj,0.0046194003,0.05000,1.152
9,mlp.gate_proj,0.0072552940,0.05000,1.185
9,mlp.down_proj,0.0001435438,0.05000,5.375
10,self_attn.v_proj,0.0000711022,0.05000,1.815
10,self_attn.k_proj,0.0001285309,0.05000,1.819
10,self_attn.q_proj,0.0006438414,0.05000,1.842
10,self_attn.o_proj,0.0000531726,0.05000,0.780
10,mlp.up_proj,0.0023653700,0.05000,1.150
10,mlp.gate_proj,0.0026815632,0.05000,1.183
10,mlp.down_proj,0.0000887731,0.05000,5.373
11,self_attn.k_proj,0.0001696957,0.05000,1.778
11,self_attn.v_proj,0.0000648065,0.05000,1.797
11,self_attn.q_proj,0.0007402942,0.05000,1.801
11,self_attn.o_proj,0.0000742858,0.05000,0.783
11,mlp.up_proj,0.0021493328,0.05000,1.163
11,mlp.gate_proj,0.0022600763,0.05000,1.190
11,mlp.down_proj,0.0002429208,0.05000,5.360
12,self_attn.k_proj,0.0001913924,0.05000,1.775
12,self_attn.v_proj,0.0000848261,0.05000,1.794
12,self_attn.q_proj,0.0008414217,0.05000,1.799
12,self_attn.o_proj,0.0000603520,0.05000,0.791
12,mlp.up_proj,0.0021892047,0.05000,1.165
12,mlp.gate_proj,0.0021619192,0.05000,1.188
12,mlp.down_proj,0.0000992026,0.05000,5.388
13,self_attn.k_proj,0.0001764100,0.05000,1.783
13,self_attn.v_proj,0.0001123422,0.05000,1.800
13,self_attn.q_proj,0.0009153854,0.05000,1.803
13,self_attn.o_proj,0.0000794259,0.05000,0.789
13,mlp.up_proj,0.0022109749,0.05000,1.161
13,mlp.gate_proj,0.0023554429,0.05000,1.187
13,mlp.down_proj,0.0000893284,0.05000,5.370
14,self_attn.k_proj,0.0002561925,0.05000,1.782
14,self_attn.v_proj,0.0001154645,0.05000,1.787
14,self_attn.q_proj,0.0013007666,0.05000,1.813
14,self_attn.o_proj,0.0001204233,0.05000,0.781
14,mlp.up_proj,0.0025638388,0.05000,1.145
14,mlp.gate_proj,0.0025896619,0.05000,1.171
14,mlp.down_proj,0.0000961390,0.05000,5.339
15,self_attn.k_proj,0.0002411058,0.05000,1.771
15,self_attn.v_proj,0.0001010086,0.05000,1.779
15,self_attn.q_proj,0.0010763963,0.05000,1.806
15,self_attn.o_proj,0.0001248457,0.05000,0.779
15,mlp.up_proj,0.0025943129,0.05000,1.146
15,mlp.gate_proj,0.0025343251,0.05000,1.173
15,mlp.down_proj,0.0001141996,0.05000,5.327
16,self_attn.k_proj,0.0002437389,0.05000,1.762
16,self_attn.v_proj,0.0001444091,0.05000,1.778
16,self_attn.q_proj,0.0012326450,0.05000,1.798
16,self_attn.o_proj,0.0001986508,0.05000,0.780
16,mlp.up_proj,0.0028457921,0.05000,1.147
16,mlp.gate_proj,0.0027699758,0.05000,1.172
16,mlp.down_proj,0.0001097131,0.05000,5.343
17,self_attn.k_proj,0.0002372200,0.05000,1.779
17,self_attn.v_proj,0.0001644637,0.05000,1.785
17,self_attn.q_proj,0.0013344949,0.05000,1.804
17,self_attn.o_proj,0.0001687157,0.05000,0.777
17,mlp.up_proj,0.0034605139,0.05000,1.152
17,mlp.gate_proj,0.0032823749,0.05000,1.177
17,mlp.down_proj,0.0001509321,0.05000,5.323
18,self_attn.k_proj,0.0001887011,0.05000,1.765
18,self_attn.v_proj,0.0001808350,0.05000,1.779
18,self_attn.q_proj,0.0010705749,0.05000,1.801
18,self_attn.o_proj,0.0001657871,0.05000,0.783
18,mlp.up_proj,0.0040642183,0.05000,1.148
18,mlp.gate_proj,0.0037679110,0.05000,1.174
18,mlp.down_proj,0.0002181015,0.05000,5.336
19,self_attn.k_proj,0.0002055513,0.05000,1.769
19,self_attn.v_proj,0.0002454614,0.05000,1.785
19,self_attn.q_proj,0.0013781268,0.05000,1.805
19,self_attn.o_proj,0.0002243668,0.05000,0.781
19,mlp.up_proj,0.0046072615,0.05000,1.154
19,mlp.gate_proj,0.0044774732,0.05000,1.177
19,mlp.down_proj,0.0002187767,0.05000,5.333
20,self_attn.k_proj,0.0002085851,0.05000,1.772
20,self_attn.v_proj,0.0002610162,0.05000,1.786
20,self_attn.q_proj,0.0013019970,0.05000,1.806
20,self_attn.o_proj,0.0001514216,0.05000,0.781
20,mlp.up_proj,0.0054252240,0.05000,1.148
20,mlp.gate_proj,0.0051634870,0.05000,1.173
20,mlp.down_proj,0.0003712054,0.05000,5.326
21,self_attn.k_proj,0.0002118031,0.05000,1.759
21,self_attn.v_proj,0.0003764736,0.05000,1.772
21,self_attn.q_proj,0.0015059532,0.05000,1.788
21,self_attn.o_proj,0.0004255283,0.05000,0.782
21,mlp.up_proj,0.0066461328,0.05000,1.147
21,mlp.gate_proj,0.0066254139,0.05000,1.174
21,mlp.down_proj,0.0005992475,0.05000,5.317
22,self_attn.k_proj,0.0002988659,0.05000,1.769
22,self_attn.v_proj,0.0005736383,0.05000,1.783
22,self_attn.q_proj,0.0021297575,0.05000,1.807
22,self_attn.o_proj,0.0004206545,0.05000,0.780
22,mlp.up_proj,0.0094454406,0.05000,1.151
22,mlp.gate_proj,0.0092535556,0.05000,1.175
22,mlp.down_proj,0.0008095826,0.05000,5.324
23,self_attn.k_proj,0.0003835323,0.05000,1.771
23,self_attn.v_proj,0.0007766295,0.05000,1.785
23,self_attn.q_proj,0.0024568439,0.05000,1.806
23,self_attn.o_proj,0.0008100346,0.05000,0.780
23,mlp.up_proj,0.0125601661,0.05000,1.148
23,mlp.gate_proj,0.0126166713,0.05000,1.174
23,mlp.down_proj,0.0009607696,0.05000,5.323
24,self_attn.k_proj,0.0003131202,0.05000,1.760
24,self_attn.v_proj,0.0008387528,0.05000,1.777
24,self_attn.q_proj,0.0022884397,0.05000,1.799
24,self_attn.o_proj,0.0006900308,0.05000,0.784
24,mlp.up_proj,0.0137791785,0.05000,1.152
24,mlp.gate_proj,0.0128174114,0.05000,1.177
24,mlp.down_proj,0.0013900608,0.05000,5.345
25,self_attn.k_proj,0.0003696309,0.05000,1.796
25,self_attn.v_proj,0.0014799064,0.05000,1.798
25,self_attn.q_proj,0.0027035042,0.05000,1.818
25,self_attn.o_proj,0.0010714627,0.05000,0.780
25,mlp.up_proj,0.0188588492,0.05000,1.149
25,mlp.gate_proj,0.0167194957,0.05000,1.181
25,mlp.down_proj,0.0112290785,0.05000,5.347
26,self_attn.k_proj,0.0005632932,0.05000,1.775
26,self_attn.v_proj,0.0039053194,0.05000,1.784
26,self_attn.q_proj,0.0044603734,0.05000,1.806
26,self_attn.o_proj,0.0024405535,0.05000,0.786
26,mlp.up_proj,0.0201260808,0.05000,1.157
26,mlp.gate_proj,0.0176544122,0.05000,1.180
26,mlp.down_proj,0.0254254744,0.05000,5.332
27,self_attn.k_proj,0.0007584638,0.05000,1.767
27,self_attn.v_proj,0.0063212753,0.05000,1.781
27,self_attn.q_proj,0.0070051274,0.05000,1.795
27,self_attn.o_proj,0.0045859847,0.05000,0.785
27,mlp.up_proj,0.0242716040,0.05000,1.155
27,mlp.gate_proj,0.0231725800,0.05000,1.181
27,mlp.down_proj,0.0212887442,0.05000,5.341
|