File size: 8,675 Bytes
9fb036e
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.13902166,0.10000,1.339
0,self_attn.v_proj,0.00411488,0.10000,1.143
0,self_attn.q_proj,0.25420425,0.10000,1.155
0,self_attn.o_proj,0.00059406,0.10000,1.136
0,mlp.up_proj,0.14385145,0.10000,1.159
0,mlp.gate_proj,0.16117708,0.10000,1.159
0,mlp.down_proj,0.00199381,0.10000,3.209
1,self_attn.k_proj,0.15608716,0.10000,1.148
1,self_attn.v_proj,0.01423703,0.10000,1.135
1,self_attn.q_proj,0.25583876,0.10000,1.170
1,self_attn.o_proj,0.00460686,0.10000,1.147
1,mlp.up_proj,0.17664601,0.10000,1.164
1,mlp.gate_proj,0.20205935,0.10000,1.165
1,mlp.down_proj,0.26540963,0.10000,3.208
2,self_attn.k_proj,0.64143051,0.10000,1.128
2,self_attn.v_proj,0.05575921,0.10000,1.158
2,self_attn.q_proj,1.00400524,0.10000,1.152
2,self_attn.o_proj,0.00137172,0.10000,1.143
2,mlp.up_proj,0.32489484,0.10000,1.170
2,mlp.gate_proj,0.38338157,0.10000,1.164
2,mlp.down_proj,0.00555915,0.10000,3.210
3,self_attn.k_proj,0.46079177,0.10000,1.171
3,self_attn.v_proj,0.07834912,0.10000,1.138
3,self_attn.q_proj,0.82779565,0.10000,1.202
3,self_attn.o_proj,0.00174203,0.10000,1.153
3,mlp.up_proj,0.43483363,0.10000,1.178
3,mlp.gate_proj,0.57168456,0.10000,1.179
3,mlp.down_proj,0.00857076,0.10000,3.169
4,self_attn.k_proj,0.41968606,0.10000,1.149
4,self_attn.v_proj,0.07420651,0.10000,1.145
4,self_attn.q_proj,0.79865553,0.10000,1.182
4,self_attn.o_proj,0.00336127,0.10000,1.152
4,mlp.up_proj,0.49365585,0.10000,1.170
4,mlp.gate_proj,0.74100946,0.10000,1.165
4,mlp.down_proj,0.01335056,0.10000,3.186
5,self_attn.k_proj,0.65282072,0.10000,1.149
5,self_attn.v_proj,0.06885923,0.10000,1.151
5,self_attn.q_proj,1.06100185,0.10000,1.155
5,self_attn.o_proj,0.00436050,0.10000,1.144
5,mlp.up_proj,0.57540012,0.10000,1.172
5,mlp.gate_proj,0.81276573,0.10000,1.161
5,mlp.down_proj,0.01836273,0.10000,3.199
6,self_attn.k_proj,0.52795381,0.10000,1.151
6,self_attn.v_proj,0.07394283,0.10000,1.149
6,self_attn.q_proj,0.96784992,0.10000,1.144
6,self_attn.o_proj,0.00695068,0.10000,1.164
6,mlp.up_proj,0.62315580,0.10000,1.172
6,mlp.gate_proj,0.86376086,0.10000,1.164
6,mlp.down_proj,0.02160461,0.10000,3.193
7,self_attn.k_proj,0.51381869,0.10000,1.151
7,self_attn.v_proj,0.07086828,0.10000,1.147
7,self_attn.q_proj,0.85494958,0.10000,1.166
7,self_attn.o_proj,0.00933906,0.10000,1.160
7,mlp.up_proj,0.65060491,0.10000,1.170
7,mlp.gate_proj,0.83545278,0.10000,1.173
7,mlp.down_proj,0.02384820,0.10000,3.197
8,self_attn.k_proj,0.61009663,0.10000,1.146
8,self_attn.v_proj,0.08485761,0.10000,1.139
8,self_attn.q_proj,1.03384483,0.10000,1.152
8,self_attn.o_proj,0.01181837,0.10000,1.154
8,mlp.up_proj,0.67781304,0.10000,1.169
8,mlp.gate_proj,0.88280136,0.10000,1.168
8,mlp.down_proj,0.02553345,0.10000,3.172
9,self_attn.k_proj,0.61209971,0.10000,1.146
9,self_attn.v_proj,0.10749650,0.10000,1.145
9,self_attn.q_proj,1.03778622,0.10000,1.154
9,self_attn.o_proj,0.01342493,0.10000,1.153
9,mlp.up_proj,0.69132690,0.10000,1.173
9,mlp.gate_proj,0.86247390,0.10000,1.180
9,mlp.down_proj,0.02601313,0.10000,3.203
10,self_attn.k_proj,0.62474133,0.10000,1.157
10,self_attn.v_proj,0.08401376,0.10000,1.167
10,self_attn.q_proj,1.04063724,0.10000,1.166
10,self_attn.o_proj,0.01185641,0.10000,1.143
10,mlp.up_proj,0.72412362,0.10000,1.161
10,mlp.gate_proj,0.84645346,0.10000,1.195
10,mlp.down_proj,0.02780603,0.10000,3.182
11,self_attn.k_proj,0.51180097,0.10000,1.144
11,self_attn.v_proj,0.10558044,0.10000,1.152
11,self_attn.q_proj,0.91123513,0.10000,1.180
11,self_attn.o_proj,0.01549722,0.10000,1.154
11,mlp.up_proj,0.77185845,0.10000,1.166
11,mlp.gate_proj,0.85984341,0.10000,1.184
11,mlp.down_proj,0.03146418,0.10000,3.171
12,self_attn.k_proj,0.74853297,0.10000,1.143
12,self_attn.v_proj,0.11227088,0.10000,1.136
12,self_attn.q_proj,1.25926862,0.10000,1.154
12,self_attn.o_proj,0.01763893,0.10000,1.146
12,mlp.up_proj,0.81915410,0.10000,1.155
12,mlp.gate_proj,0.89613688,0.10000,1.158
12,mlp.down_proj,0.03564403,0.10000,3.175
13,self_attn.k_proj,0.75234242,0.10000,1.142
13,self_attn.v_proj,0.11938924,0.10000,1.146
13,self_attn.q_proj,1.17813722,0.10000,1.163
13,self_attn.o_proj,0.02167543,0.10000,1.147
13,mlp.up_proj,0.89836866,0.10000,1.167
13,mlp.gate_proj,1.01834695,0.10000,1.158
13,mlp.down_proj,0.04383968,0.10000,3.189
14,self_attn.k_proj,0.68150638,0.10000,1.140
14,self_attn.v_proj,0.13524983,0.10000,1.150
14,self_attn.q_proj,1.37748688,0.10000,1.155
14,self_attn.o_proj,0.02483580,0.10000,1.203
14,mlp.up_proj,0.97236985,0.10000,1.158
14,mlp.gate_proj,1.12228150,0.10000,1.172
14,mlp.down_proj,0.05535022,0.10000,3.189
15,self_attn.k_proj,0.75259839,0.10000,1.153
15,self_attn.v_proj,0.14126670,0.10000,1.156
15,self_attn.q_proj,1.38710701,0.10000,1.150
15,self_attn.o_proj,0.01717166,0.10000,1.137
15,mlp.up_proj,0.98969074,0.10000,1.166
15,mlp.gate_proj,1.24946946,0.10000,1.163
15,mlp.down_proj,0.06018501,0.10000,3.230
16,self_attn.k_proj,0.83249243,0.10000,1.144
16,self_attn.v_proj,0.14333684,0.10000,1.148
16,self_attn.q_proj,1.42057782,0.10000,1.151
16,self_attn.o_proj,0.01254638,0.10000,1.153
16,mlp.up_proj,1.03370025,0.10000,1.162
16,mlp.gate_proj,1.35148522,0.10000,1.177
16,mlp.down_proj,0.06047480,0.10000,3.258
17,self_attn.k_proj,0.76570194,0.10000,1.139
17,self_attn.v_proj,0.15113925,0.10000,1.163
17,self_attn.q_proj,1.40730178,0.10000,1.176
17,self_attn.o_proj,0.01126649,0.10000,1.145
17,mlp.up_proj,1.09815854,0.10000,1.167
17,mlp.gate_proj,1.45470468,0.10000,1.174
17,mlp.down_proj,0.06544407,0.10000,3.206
18,self_attn.k_proj,0.84666482,0.10000,1.130
18,self_attn.v_proj,0.17572731,0.10000,1.171
18,self_attn.q_proj,1.52004973,0.10000,1.167
18,self_attn.o_proj,0.01051633,0.10000,1.148
18,mlp.up_proj,1.19301062,0.10000,1.171
18,mlp.gate_proj,1.55704117,0.10000,1.168
18,mlp.down_proj,0.07174794,0.10000,3.164
19,self_attn.k_proj,0.83629734,0.10000,1.140
19,self_attn.v_proj,0.18202185,0.10000,1.152
19,self_attn.q_proj,1.44164488,0.10000,1.156
19,self_attn.o_proj,0.01828037,0.10000,1.145
19,mlp.up_proj,1.30551202,0.10000,1.149
19,mlp.gate_proj,1.66621888,0.10000,1.162
19,mlp.down_proj,0.08933399,0.10000,3.197
20,self_attn.k_proj,0.86651410,0.10000,1.139
20,self_attn.v_proj,0.22740557,0.10000,1.140
20,self_attn.q_proj,1.52156200,0.10000,1.155
20,self_attn.o_proj,0.01467473,0.10000,1.143
20,mlp.up_proj,1.37747804,0.10000,1.166
20,mlp.gate_proj,1.69420732,0.10000,1.174
20,mlp.down_proj,0.09297852,0.10000,3.169
21,self_attn.k_proj,0.82437217,0.10000,1.135
21,self_attn.v_proj,0.28204440,0.10000,1.148
21,self_attn.q_proj,1.49503875,0.10000,1.158
21,self_attn.o_proj,0.01584026,0.10000,1.172
21,mlp.up_proj,1.49381587,0.10000,1.175
21,mlp.gate_proj,1.84704486,0.10000,1.158
21,mlp.down_proj,0.10311377,0.10000,3.164
22,self_attn.k_proj,0.78454527,0.10000,1.143
22,self_attn.v_proj,0.29480893,0.10000,1.138
22,self_attn.q_proj,1.51049621,0.10000,1.143
22,self_attn.o_proj,0.01483698,0.10000,1.151
22,mlp.up_proj,1.63850020,0.10000,1.167
22,mlp.gate_proj,2.04142903,0.10000,1.162
22,mlp.down_proj,0.11971325,0.10000,3.147
23,self_attn.k_proj,0.87311951,0.10000,1.153
23,self_attn.v_proj,0.28546786,0.10000,1.147
23,self_attn.q_proj,1.49267762,0.10000,1.151
23,self_attn.o_proj,0.02627072,0.10000,1.140
23,mlp.up_proj,1.81052402,0.10000,1.160
23,mlp.gate_proj,2.34182375,0.10000,1.169
23,mlp.down_proj,0.13955892,0.10000,3.240
24,self_attn.k_proj,0.92957858,0.10000,1.165
24,self_attn.v_proj,0.40332459,0.10000,1.144
24,self_attn.q_proj,1.61930737,0.10000,1.166
24,self_attn.o_proj,0.03366064,0.10000,1.142
24,mlp.up_proj,2.02484539,0.10000,1.160
24,mlp.gate_proj,2.67931360,0.10000,1.162
24,mlp.down_proj,0.16569229,0.10000,3.165
25,self_attn.k_proj,0.80799884,0.10000,1.146
25,self_attn.v_proj,0.40075913,0.10000,1.159
25,self_attn.q_proj,1.61817187,0.10000,1.174
25,self_attn.o_proj,0.03860076,0.10000,1.139
25,mlp.up_proj,2.23846866,0.10000,1.163
25,mlp.gate_proj,2.93024124,0.10000,1.177
25,mlp.down_proj,0.21674625,0.10000,3.197
26,self_attn.k_proj,0.77650310,0.10000,1.149
26,self_attn.v_proj,0.49124430,0.10000,1.140
26,self_attn.q_proj,1.45946094,0.10000,1.154
26,self_attn.o_proj,0.07463339,0.10000,1.131
26,mlp.up_proj,2.32856115,0.10000,1.159
26,mlp.gate_proj,3.08885019,0.10000,1.171
26,mlp.down_proj,0.29293505,0.10000,3.180
27,self_attn.k_proj,0.58231013,0.10000,1.137
27,self_attn.v_proj,0.33187094,0.10000,1.127
27,self_attn.q_proj,1.15255964,0.10000,1.151
27,self_attn.o_proj,0.14841482,0.10000,1.150
27,mlp.up_proj,2.35349909,0.10000,1.161
27,mlp.gate_proj,2.82487768,0.10000,1.156
27,mlp.down_proj,0.67249798,0.10000,3.171