|
layer,module,loss,samples,damp,time
|
|
0,self_attn.k_proj,0.30323729,0.01500,1.376
|
|
0,self_attn.v_proj,0.00081456,0.01500,1.134
|
|
0,self_attn.q_proj,0.50177538,0.01500,1.143
|
|
0,self_attn.o_proj,0.00410974,0.01500,1.150
|
|
0,mlp.up_proj,0.87140083,0.01500,1.140
|
|
0,mlp.gate_proj,0.88596356,0.01500,1.168
|
|
0,mlp.down_proj,3.59487438,0.01500,2.880
|
|
1,self_attn.k_proj,1.79021871,0.01500,1.075
|
|
1,self_attn.v_proj,0.08866195,0.01500,1.081
|
|
1,self_attn.q_proj,2.48720980,0.01500,1.146
|
|
1,self_attn.o_proj,0.79290819,0.01500,1.133
|
|
1,mlp.up_proj,0.70214444,0.01500,1.135
|
|
1,mlp.gate_proj,0.79838932,0.01500,1.136
|
|
1,mlp.down_proj,2.23402882,0.01500,2.897
|
|
2,self_attn.k_proj,1.86278677,0.01500,1.109
|
|
2,self_attn.v_proj,0.19091517,0.01500,1.116
|
|
2,self_attn.q_proj,1.61090231,0.01500,1.166
|
|
2,self_attn.o_proj,0.63032722,0.01500,1.121
|
|
2,mlp.up_proj,0.84249359,0.01500,1.134
|
|
2,mlp.gate_proj,0.95266348,0.01500,1.129
|
|
2,mlp.down_proj,157.33862305,0.01500,2.853
|
|
3,self_attn.k_proj,1.13371205,0.01500,1.070
|
|
3,self_attn.v_proj,0.19112220,0.01500,1.130
|
|
3,self_attn.q_proj,1.95455039,0.01500,1.110
|
|
3,self_attn.o_proj,0.43849713,0.01500,1.116
|
|
3,mlp.up_proj,0.91409326,0.01500,1.126
|
|
3,mlp.gate_proj,1.00409079,0.01500,1.135
|
|
3,mlp.down_proj,12.42405319,0.01500,2.883
|
|
4,self_attn.k_proj,0.87567437,0.01500,1.108
|
|
4,self_attn.v_proj,0.14826132,0.01500,1.070
|
|
4,self_attn.q_proj,2.46379852,0.01500,1.138
|
|
4,self_attn.o_proj,0.33942133,0.01500,1.126
|
|
4,mlp.up_proj,1.05060482,0.01500,1.138
|
|
4,mlp.gate_proj,1.17461491,0.01500,1.132
|
|
4,mlp.down_proj,1.44320405,0.01500,2.879
|
|
5,self_attn.k_proj,1.32893443,0.01500,1.075
|
|
5,self_attn.v_proj,0.17556122,0.01500,1.062
|
|
5,self_attn.q_proj,2.47826910,0.01500,1.112
|
|
5,self_attn.o_proj,0.59731841,0.01500,1.113
|
|
5,mlp.up_proj,1.13487399,0.01500,1.148
|
|
5,mlp.gate_proj,1.18413568,0.01500,1.135
|
|
5,mlp.down_proj,1.55033576,0.01500,2.881
|
|
6,self_attn.k_proj,1.86866426,0.01500,1.072
|
|
6,self_attn.v_proj,0.21436407,0.01500,1.075
|
|
6,self_attn.q_proj,2.72684455,0.01500,1.111
|
|
6,self_attn.o_proj,0.75209558,0.01500,1.127
|
|
6,mlp.up_proj,1.31616020,0.01500,1.132
|
|
6,mlp.gate_proj,1.32581091,0.01500,1.139
|
|
6,mlp.down_proj,2.13556457,0.01500,2.880
|
|
7,self_attn.k_proj,1.53838611,0.01500,1.087
|
|
7,self_attn.v_proj,0.22950518,0.01500,1.071
|
|
7,self_attn.q_proj,1.99251246,0.01500,1.109
|
|
7,self_attn.o_proj,0.50463128,0.01500,1.118
|
|
7,mlp.up_proj,1.58821356,0.01500,1.125
|
|
7,mlp.gate_proj,1.58579147,0.01500,1.147
|
|
7,mlp.down_proj,13.17560577,0.01500,2.849
|
|
8,self_attn.k_proj,0.73372823,0.01500,1.068
|
|
8,self_attn.v_proj,0.23304689,0.01500,1.088
|
|
8,self_attn.q_proj,2.41669130,0.01500,1.118
|
|
8,self_attn.o_proj,0.46610335,0.01500,1.116
|
|
8,mlp.up_proj,1.65750051,0.01500,1.136
|
|
8,mlp.gate_proj,1.56000757,0.01500,1.156
|
|
8,mlp.down_proj,8.41586971,0.01500,2.874
|
|
9,self_attn.k_proj,1.64468992,0.01500,1.094
|
|
9,self_attn.v_proj,0.18850568,0.01500,1.094
|
|
9,self_attn.q_proj,1.78751516,0.01500,1.112
|
|
9,self_attn.o_proj,1.78545237,0.01500,1.117
|
|
9,mlp.up_proj,1.77682400,0.01500,1.127
|
|
9,mlp.gate_proj,1.57283258,0.01500,1.141
|
|
9,mlp.down_proj,14.36819839,0.01500,2.873
|
|
10,self_attn.k_proj,1.32247448,0.01500,1.061
|
|
10,self_attn.v_proj,0.22332871,0.01500,1.074
|
|
10,self_attn.q_proj,1.70967674,0.01500,1.109
|
|
10,self_attn.o_proj,2.30593014,0.01500,1.119
|
|
10,mlp.up_proj,2.46851778,0.01500,1.129
|
|
10,mlp.gate_proj,2.33083105,0.01500,1.137
|
|
10,mlp.down_proj,17.56273270,0.01500,2.857
|
|
11,self_attn.k_proj,1.05880129,0.01500,1.068
|
|
11,self_attn.v_proj,0.20641716,0.01500,1.074
|
|
11,self_attn.q_proj,2.14066696,0.01500,1.111
|
|
11,self_attn.o_proj,2.36638355,0.01500,1.138
|
|
11,mlp.up_proj,2.62533450,0.01500,1.126
|
|
11,mlp.gate_proj,2.36855841,0.01500,1.117
|
|
11,mlp.down_proj,36624136.00000000,0.01500,2.888
|
|
12,self_attn.k_proj,0.60637605,0.01500,1.081
|
|
12,self_attn.v_proj,0.20556667,0.01500,1.108
|
|
12,self_attn.q_proj,6.41779613,0.01500,1.111
|
|
12,self_attn.o_proj,1.40109611,0.01500,1.119
|
|
12,mlp.up_proj,10.91535950,0.01500,1.132
|
|
12,mlp.gate_proj,4.99505901,0.01500,1.146
|
|
12,mlp.down_proj,9760.42968750,0.01500,2.909
|
|
13,self_attn.k_proj,2.24922800,0.01500,1.082
|
|
13,self_attn.v_proj,0.27756080,0.01500,1.086
|
|
13,self_attn.q_proj,7.30099392,0.01500,1.109
|
|
13,self_attn.o_proj,2.96828890,0.01500,1.118
|
|
13,mlp.up_proj,2.91019154,0.01500,1.123
|
|
13,mlp.gate_proj,6.23261738,0.01500,1.141
|
|
13,mlp.down_proj,6.46631765,0.01500,2.860
|
|
14,self_attn.k_proj,0.69264430,0.01500,1.071
|
|
14,self_attn.v_proj,0.51544046,0.01500,1.091
|
|
14,self_attn.q_proj,3.18851161,0.01500,1.131
|
|
14,self_attn.o_proj,1.25791931,0.01500,1.127
|
|
14,mlp.up_proj,2.58898783,0.01500,1.112
|
|
14,mlp.gate_proj,5.24106836,0.01500,1.133
|
|
14,mlp.down_proj,9.01900768,0.01500,2.851
|
|
15,self_attn.k_proj,0.67096651,0.01500,1.094
|
|
15,self_attn.v_proj,0.36131397,0.01500,1.112
|
|
15,self_attn.q_proj,3.81791139,0.01500,1.097
|
|
15,self_attn.o_proj,2.25381660,0.01500,1.114
|
|
15,mlp.up_proj,2.34244204,0.01500,1.116
|
|
15,mlp.gate_proj,4.29145336,0.01500,1.132
|
|
15,mlp.down_proj,7.26017952,0.01500,2.923
|
|
16,self_attn.k_proj,0.64388847,0.01500,1.060
|
|
16,self_attn.v_proj,0.34459960,0.01500,1.078
|
|
16,self_attn.q_proj,4.61652613,0.01500,1.101
|
|
16,self_attn.o_proj,1.88339543,0.01500,1.119
|
|
16,mlp.up_proj,2.72254467,0.01500,1.121
|
|
16,mlp.gate_proj,3.13850927,0.01500,1.119
|
|
16,mlp.down_proj,6.84692860,0.01500,2.887
|
|
17,self_attn.k_proj,0.55838877,0.01500,1.057
|
|
17,self_attn.v_proj,0.51657593,0.01500,1.071
|
|
17,self_attn.q_proj,4.33557653,0.01500,1.092
|
|
17,self_attn.o_proj,2.56168294,0.01500,1.126
|
|
17,mlp.up_proj,3.06461382,0.01500,1.110
|
|
17,mlp.gate_proj,3.21341205,0.01500,1.114
|
|
17,mlp.down_proj,7.29544258,0.01500,2.854
|
|
18,self_attn.k_proj,0.68149984,0.01500,1.102
|
|
18,self_attn.v_proj,1.32401478,0.01500,1.124
|
|
18,self_attn.q_proj,7.70216036,0.01500,1.098
|
|
18,self_attn.o_proj,2.28013134,0.01500,1.119
|
|
18,mlp.up_proj,3.90698004,0.01500,1.116
|
|
18,mlp.gate_proj,4.11436844,0.01500,1.152
|
|
18,mlp.down_proj,11.87063789,0.01500,2.870
|
|
19,self_attn.k_proj,0.65415150,0.01500,1.066
|
|
19,self_attn.v_proj,0.53765559,0.01500,1.075
|
|
19,self_attn.q_proj,6.70729065,0.01500,1.112
|
|
19,self_attn.o_proj,3.07730746,0.01500,1.132
|
|
19,mlp.up_proj,3.57759047,0.01500,1.119
|
|
19,mlp.gate_proj,5.04411411,0.01500,1.120
|
|
19,mlp.down_proj,13.49418736,0.01500,2.850
|
|
20,self_attn.k_proj,0.45334548,0.01500,1.062
|
|
20,self_attn.v_proj,1.12238181,0.01500,1.083
|
|
20,self_attn.q_proj,5.45634222,0.01500,1.106
|
|
20,self_attn.o_proj,2.11403751,0.01500,1.122
|
|
20,mlp.up_proj,3.80852771,0.01500,1.123
|
|
20,mlp.gate_proj,4.78546810,0.01500,1.129
|
|
20,mlp.down_proj,15.71007252,0.01500,2.860
|
|
21,self_attn.k_proj,0.67353952,0.01500,1.056
|
|
21,self_attn.v_proj,0.74522316,0.01500,1.084
|
|
21,self_attn.q_proj,4.39328623,0.01500,1.095
|
|
21,self_attn.o_proj,2.93690538,0.01500,1.109
|
|
21,mlp.up_proj,4.77232122,0.01500,1.108
|
|
21,mlp.gate_proj,5.83200645,0.01500,1.138
|
|
21,mlp.down_proj,19.96510315,0.01500,2.825
|
|
22,self_attn.k_proj,0.63552809,0.01500,1.060
|
|
22,self_attn.v_proj,1.77812839,0.01500,1.101
|
|
22,self_attn.q_proj,6.14302778,0.01500,1.112
|
|
22,self_attn.o_proj,3.85619378,0.01500,1.108
|
|
22,mlp.up_proj,5.24628830,0.01500,1.106
|
|
22,mlp.gate_proj,8.02893066,0.01500,1.106
|
|
22,mlp.down_proj,24.18618774,0.01500,2.823
|
|
23,self_attn.k_proj,0.82243836,0.01500,1.073
|
|
23,self_attn.v_proj,2.90332031,0.01500,1.065
|
|
23,self_attn.q_proj,9.50726032,0.01500,1.098
|
|
23,self_attn.o_proj,8.13974857,0.01500,1.113
|
|
23,mlp.up_proj,5.42801857,0.01500,1.099
|
|
23,mlp.gate_proj,10.77536011,0.01500,1.128
|
|
23,mlp.down_proj,29.22331047,0.01500,2.812
|
|
24,self_attn.k_proj,0.60857439,0.01500,1.061
|
|
24,self_attn.v_proj,1.17702281,0.01500,1.069
|
|
24,self_attn.q_proj,6.26180887,0.01500,1.110
|
|
24,self_attn.o_proj,4.30931950,0.01500,1.096
|
|
24,mlp.up_proj,5.46759701,0.01500,1.095
|
|
24,mlp.gate_proj,10.43561554,0.01500,1.102
|
|
24,mlp.down_proj,31.56058502,0.01500,2.808
|
|
25,self_attn.k_proj,0.78283930,0.01500,1.041
|
|
25,self_attn.v_proj,1.24567127,0.01500,1.058
|
|
25,self_attn.q_proj,4.97283077,0.01500,1.095
|
|
25,self_attn.o_proj,5.16120386,0.01500,1.105
|
|
25,mlp.up_proj,6.94152546,0.01500,1.102
|
|
25,mlp.gate_proj,9.48820877,0.01500,1.099
|
|
25,mlp.down_proj,37.16706085,0.01500,2.802
|
|
26,self_attn.k_proj,0.95313138,0.01500,1.052
|
|
26,self_attn.v_proj,1.37231970,0.01500,1.054
|
|
26,self_attn.q_proj,6.39235163,0.01500,1.087
|
|
26,self_attn.o_proj,5.90192604,0.01500,1.090
|
|
26,mlp.up_proj,12.41309357,0.01500,1.094
|
|
26,mlp.gate_proj,9.54691982,0.01500,1.093
|
|
26,mlp.down_proj,37.73841095,0.01500,2.798
|
|
27,self_attn.k_proj,0.49448842,0.01500,1.041
|
|
27,self_attn.v_proj,0.81519926,0.01500,1.044
|
|
27,self_attn.q_proj,5.96102524,0.01500,1.087
|
|
27,self_attn.o_proj,5.79659319,0.01500,1.101
|
|
27,mlp.up_proj,14.86005974,0.01500,1.099
|
|
27,mlp.gate_proj,29.81634903,0.01500,1.100
|
|
27,mlp.down_proj,702.13244629,0.01500,2.865
|
|
28,self_attn.k_proj,0.60215271,0.01500,1.045
|
|
28,self_attn.v_proj,1.07407022,0.01500,1.044
|
|
28,self_attn.q_proj,7.19515991,0.01500,1.075
|
|
28,self_attn.o_proj,6.81128788,0.01500,1.090
|
|
28,mlp.up_proj,28.30822754,0.01500,1.100
|
|
28,mlp.gate_proj,35.86479950,0.01500,1.100
|
|
28,mlp.down_proj,33054578.00000000,0.01500,2.789
|
|
29,self_attn.k_proj,0.62672096,0.01500,1.042
|
|
29,self_attn.v_proj,0.87135106,0.01500,1.051
|
|
29,self_attn.q_proj,12.68386078,0.01500,1.077
|
|
29,self_attn.o_proj,41.61279678,0.01500,1.103
|
|
29,mlp.up_proj,224.53115845,0.01500,1.092
|
|
29,mlp.gate_proj,142.67680359,0.01500,1.107
|
|
29,mlp.down_proj,10202.70410156,0.01500,2.805
|
|
|