File size: 8,675 Bytes
9fb036e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 |
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.13902166,0.10000,1.339
0,self_attn.v_proj,0.00411488,0.10000,1.143
0,self_attn.q_proj,0.25420425,0.10000,1.155
0,self_attn.o_proj,0.00059406,0.10000,1.136
0,mlp.up_proj,0.14385145,0.10000,1.159
0,mlp.gate_proj,0.16117708,0.10000,1.159
0,mlp.down_proj,0.00199381,0.10000,3.209
1,self_attn.k_proj,0.15608716,0.10000,1.148
1,self_attn.v_proj,0.01423703,0.10000,1.135
1,self_attn.q_proj,0.25583876,0.10000,1.170
1,self_attn.o_proj,0.00460686,0.10000,1.147
1,mlp.up_proj,0.17664601,0.10000,1.164
1,mlp.gate_proj,0.20205935,0.10000,1.165
1,mlp.down_proj,0.26540963,0.10000,3.208
2,self_attn.k_proj,0.64143051,0.10000,1.128
2,self_attn.v_proj,0.05575921,0.10000,1.158
2,self_attn.q_proj,1.00400524,0.10000,1.152
2,self_attn.o_proj,0.00137172,0.10000,1.143
2,mlp.up_proj,0.32489484,0.10000,1.170
2,mlp.gate_proj,0.38338157,0.10000,1.164
2,mlp.down_proj,0.00555915,0.10000,3.210
3,self_attn.k_proj,0.46079177,0.10000,1.171
3,self_attn.v_proj,0.07834912,0.10000,1.138
3,self_attn.q_proj,0.82779565,0.10000,1.202
3,self_attn.o_proj,0.00174203,0.10000,1.153
3,mlp.up_proj,0.43483363,0.10000,1.178
3,mlp.gate_proj,0.57168456,0.10000,1.179
3,mlp.down_proj,0.00857076,0.10000,3.169
4,self_attn.k_proj,0.41968606,0.10000,1.149
4,self_attn.v_proj,0.07420651,0.10000,1.145
4,self_attn.q_proj,0.79865553,0.10000,1.182
4,self_attn.o_proj,0.00336127,0.10000,1.152
4,mlp.up_proj,0.49365585,0.10000,1.170
4,mlp.gate_proj,0.74100946,0.10000,1.165
4,mlp.down_proj,0.01335056,0.10000,3.186
5,self_attn.k_proj,0.65282072,0.10000,1.149
5,self_attn.v_proj,0.06885923,0.10000,1.151
5,self_attn.q_proj,1.06100185,0.10000,1.155
5,self_attn.o_proj,0.00436050,0.10000,1.144
5,mlp.up_proj,0.57540012,0.10000,1.172
5,mlp.gate_proj,0.81276573,0.10000,1.161
5,mlp.down_proj,0.01836273,0.10000,3.199
6,self_attn.k_proj,0.52795381,0.10000,1.151
6,self_attn.v_proj,0.07394283,0.10000,1.149
6,self_attn.q_proj,0.96784992,0.10000,1.144
6,self_attn.o_proj,0.00695068,0.10000,1.164
6,mlp.up_proj,0.62315580,0.10000,1.172
6,mlp.gate_proj,0.86376086,0.10000,1.164
6,mlp.down_proj,0.02160461,0.10000,3.193
7,self_attn.k_proj,0.51381869,0.10000,1.151
7,self_attn.v_proj,0.07086828,0.10000,1.147
7,self_attn.q_proj,0.85494958,0.10000,1.166
7,self_attn.o_proj,0.00933906,0.10000,1.160
7,mlp.up_proj,0.65060491,0.10000,1.170
7,mlp.gate_proj,0.83545278,0.10000,1.173
7,mlp.down_proj,0.02384820,0.10000,3.197
8,self_attn.k_proj,0.61009663,0.10000,1.146
8,self_attn.v_proj,0.08485761,0.10000,1.139
8,self_attn.q_proj,1.03384483,0.10000,1.152
8,self_attn.o_proj,0.01181837,0.10000,1.154
8,mlp.up_proj,0.67781304,0.10000,1.169
8,mlp.gate_proj,0.88280136,0.10000,1.168
8,mlp.down_proj,0.02553345,0.10000,3.172
9,self_attn.k_proj,0.61209971,0.10000,1.146
9,self_attn.v_proj,0.10749650,0.10000,1.145
9,self_attn.q_proj,1.03778622,0.10000,1.154
9,self_attn.o_proj,0.01342493,0.10000,1.153
9,mlp.up_proj,0.69132690,0.10000,1.173
9,mlp.gate_proj,0.86247390,0.10000,1.180
9,mlp.down_proj,0.02601313,0.10000,3.203
10,self_attn.k_proj,0.62474133,0.10000,1.157
10,self_attn.v_proj,0.08401376,0.10000,1.167
10,self_attn.q_proj,1.04063724,0.10000,1.166
10,self_attn.o_proj,0.01185641,0.10000,1.143
10,mlp.up_proj,0.72412362,0.10000,1.161
10,mlp.gate_proj,0.84645346,0.10000,1.195
10,mlp.down_proj,0.02780603,0.10000,3.182
11,self_attn.k_proj,0.51180097,0.10000,1.144
11,self_attn.v_proj,0.10558044,0.10000,1.152
11,self_attn.q_proj,0.91123513,0.10000,1.180
11,self_attn.o_proj,0.01549722,0.10000,1.154
11,mlp.up_proj,0.77185845,0.10000,1.166
11,mlp.gate_proj,0.85984341,0.10000,1.184
11,mlp.down_proj,0.03146418,0.10000,3.171
12,self_attn.k_proj,0.74853297,0.10000,1.143
12,self_attn.v_proj,0.11227088,0.10000,1.136
12,self_attn.q_proj,1.25926862,0.10000,1.154
12,self_attn.o_proj,0.01763893,0.10000,1.146
12,mlp.up_proj,0.81915410,0.10000,1.155
12,mlp.gate_proj,0.89613688,0.10000,1.158
12,mlp.down_proj,0.03564403,0.10000,3.175
13,self_attn.k_proj,0.75234242,0.10000,1.142
13,self_attn.v_proj,0.11938924,0.10000,1.146
13,self_attn.q_proj,1.17813722,0.10000,1.163
13,self_attn.o_proj,0.02167543,0.10000,1.147
13,mlp.up_proj,0.89836866,0.10000,1.167
13,mlp.gate_proj,1.01834695,0.10000,1.158
13,mlp.down_proj,0.04383968,0.10000,3.189
14,self_attn.k_proj,0.68150638,0.10000,1.140
14,self_attn.v_proj,0.13524983,0.10000,1.150
14,self_attn.q_proj,1.37748688,0.10000,1.155
14,self_attn.o_proj,0.02483580,0.10000,1.203
14,mlp.up_proj,0.97236985,0.10000,1.158
14,mlp.gate_proj,1.12228150,0.10000,1.172
14,mlp.down_proj,0.05535022,0.10000,3.189
15,self_attn.k_proj,0.75259839,0.10000,1.153
15,self_attn.v_proj,0.14126670,0.10000,1.156
15,self_attn.q_proj,1.38710701,0.10000,1.150
15,self_attn.o_proj,0.01717166,0.10000,1.137
15,mlp.up_proj,0.98969074,0.10000,1.166
15,mlp.gate_proj,1.24946946,0.10000,1.163
15,mlp.down_proj,0.06018501,0.10000,3.230
16,self_attn.k_proj,0.83249243,0.10000,1.144
16,self_attn.v_proj,0.14333684,0.10000,1.148
16,self_attn.q_proj,1.42057782,0.10000,1.151
16,self_attn.o_proj,0.01254638,0.10000,1.153
16,mlp.up_proj,1.03370025,0.10000,1.162
16,mlp.gate_proj,1.35148522,0.10000,1.177
16,mlp.down_proj,0.06047480,0.10000,3.258
17,self_attn.k_proj,0.76570194,0.10000,1.139
17,self_attn.v_proj,0.15113925,0.10000,1.163
17,self_attn.q_proj,1.40730178,0.10000,1.176
17,self_attn.o_proj,0.01126649,0.10000,1.145
17,mlp.up_proj,1.09815854,0.10000,1.167
17,mlp.gate_proj,1.45470468,0.10000,1.174
17,mlp.down_proj,0.06544407,0.10000,3.206
18,self_attn.k_proj,0.84666482,0.10000,1.130
18,self_attn.v_proj,0.17572731,0.10000,1.171
18,self_attn.q_proj,1.52004973,0.10000,1.167
18,self_attn.o_proj,0.01051633,0.10000,1.148
18,mlp.up_proj,1.19301062,0.10000,1.171
18,mlp.gate_proj,1.55704117,0.10000,1.168
18,mlp.down_proj,0.07174794,0.10000,3.164
19,self_attn.k_proj,0.83629734,0.10000,1.140
19,self_attn.v_proj,0.18202185,0.10000,1.152
19,self_attn.q_proj,1.44164488,0.10000,1.156
19,self_attn.o_proj,0.01828037,0.10000,1.145
19,mlp.up_proj,1.30551202,0.10000,1.149
19,mlp.gate_proj,1.66621888,0.10000,1.162
19,mlp.down_proj,0.08933399,0.10000,3.197
20,self_attn.k_proj,0.86651410,0.10000,1.139
20,self_attn.v_proj,0.22740557,0.10000,1.140
20,self_attn.q_proj,1.52156200,0.10000,1.155
20,self_attn.o_proj,0.01467473,0.10000,1.143
20,mlp.up_proj,1.37747804,0.10000,1.166
20,mlp.gate_proj,1.69420732,0.10000,1.174
20,mlp.down_proj,0.09297852,0.10000,3.169
21,self_attn.k_proj,0.82437217,0.10000,1.135
21,self_attn.v_proj,0.28204440,0.10000,1.148
21,self_attn.q_proj,1.49503875,0.10000,1.158
21,self_attn.o_proj,0.01584026,0.10000,1.172
21,mlp.up_proj,1.49381587,0.10000,1.175
21,mlp.gate_proj,1.84704486,0.10000,1.158
21,mlp.down_proj,0.10311377,0.10000,3.164
22,self_attn.k_proj,0.78454527,0.10000,1.143
22,self_attn.v_proj,0.29480893,0.10000,1.138
22,self_attn.q_proj,1.51049621,0.10000,1.143
22,self_attn.o_proj,0.01483698,0.10000,1.151
22,mlp.up_proj,1.63850020,0.10000,1.167
22,mlp.gate_proj,2.04142903,0.10000,1.162
22,mlp.down_proj,0.11971325,0.10000,3.147
23,self_attn.k_proj,0.87311951,0.10000,1.153
23,self_attn.v_proj,0.28546786,0.10000,1.147
23,self_attn.q_proj,1.49267762,0.10000,1.151
23,self_attn.o_proj,0.02627072,0.10000,1.140
23,mlp.up_proj,1.81052402,0.10000,1.160
23,mlp.gate_proj,2.34182375,0.10000,1.169
23,mlp.down_proj,0.13955892,0.10000,3.240
24,self_attn.k_proj,0.92957858,0.10000,1.165
24,self_attn.v_proj,0.40332459,0.10000,1.144
24,self_attn.q_proj,1.61930737,0.10000,1.166
24,self_attn.o_proj,0.03366064,0.10000,1.142
24,mlp.up_proj,2.02484539,0.10000,1.160
24,mlp.gate_proj,2.67931360,0.10000,1.162
24,mlp.down_proj,0.16569229,0.10000,3.165
25,self_attn.k_proj,0.80799884,0.10000,1.146
25,self_attn.v_proj,0.40075913,0.10000,1.159
25,self_attn.q_proj,1.61817187,0.10000,1.174
25,self_attn.o_proj,0.03860076,0.10000,1.139
25,mlp.up_proj,2.23846866,0.10000,1.163
25,mlp.gate_proj,2.93024124,0.10000,1.177
25,mlp.down_proj,0.21674625,0.10000,3.197
26,self_attn.k_proj,0.77650310,0.10000,1.149
26,self_attn.v_proj,0.49124430,0.10000,1.140
26,self_attn.q_proj,1.45946094,0.10000,1.154
26,self_attn.o_proj,0.07463339,0.10000,1.131
26,mlp.up_proj,2.32856115,0.10000,1.159
26,mlp.gate_proj,3.08885019,0.10000,1.171
26,mlp.down_proj,0.29293505,0.10000,3.180
27,self_attn.k_proj,0.58231013,0.10000,1.137
27,self_attn.v_proj,0.33187094,0.10000,1.127
27,self_attn.q_proj,1.15255964,0.10000,1.151
27,self_attn.o_proj,0.14841482,0.10000,1.150
27,mlp.up_proj,2.35349909,0.10000,1.161
27,mlp.gate_proj,2.82487768,0.10000,1.156
27,mlp.down_proj,0.67249798,0.10000,3.171
|