SmolLM-135M_gptq_g32_4bit / quant_log.csv
JustJaro's picture
Add files using upload-large-folder tool
c9a730b verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.30323729,0.01500,1.376
0,self_attn.v_proj,0.00081456,0.01500,1.134
0,self_attn.q_proj,0.50177538,0.01500,1.143
0,self_attn.o_proj,0.00410974,0.01500,1.150
0,mlp.up_proj,0.87140083,0.01500,1.140
0,mlp.gate_proj,0.88596356,0.01500,1.168
0,mlp.down_proj,3.59487438,0.01500,2.880
1,self_attn.k_proj,1.79021871,0.01500,1.075
1,self_attn.v_proj,0.08866195,0.01500,1.081
1,self_attn.q_proj,2.48720980,0.01500,1.146
1,self_attn.o_proj,0.79290819,0.01500,1.133
1,mlp.up_proj,0.70214444,0.01500,1.135
1,mlp.gate_proj,0.79838932,0.01500,1.136
1,mlp.down_proj,2.23402882,0.01500,2.897
2,self_attn.k_proj,1.86278677,0.01500,1.109
2,self_attn.v_proj,0.19091517,0.01500,1.116
2,self_attn.q_proj,1.61090231,0.01500,1.166
2,self_attn.o_proj,0.63032722,0.01500,1.121
2,mlp.up_proj,0.84249359,0.01500,1.134
2,mlp.gate_proj,0.95266348,0.01500,1.129
2,mlp.down_proj,157.33862305,0.01500,2.853
3,self_attn.k_proj,1.13371205,0.01500,1.070
3,self_attn.v_proj,0.19112220,0.01500,1.130
3,self_attn.q_proj,1.95455039,0.01500,1.110
3,self_attn.o_proj,0.43849713,0.01500,1.116
3,mlp.up_proj,0.91409326,0.01500,1.126
3,mlp.gate_proj,1.00409079,0.01500,1.135
3,mlp.down_proj,12.42405319,0.01500,2.883
4,self_attn.k_proj,0.87567437,0.01500,1.108
4,self_attn.v_proj,0.14826132,0.01500,1.070
4,self_attn.q_proj,2.46379852,0.01500,1.138
4,self_attn.o_proj,0.33942133,0.01500,1.126
4,mlp.up_proj,1.05060482,0.01500,1.138
4,mlp.gate_proj,1.17461491,0.01500,1.132
4,mlp.down_proj,1.44320405,0.01500,2.879
5,self_attn.k_proj,1.32893443,0.01500,1.075
5,self_attn.v_proj,0.17556122,0.01500,1.062
5,self_attn.q_proj,2.47826910,0.01500,1.112
5,self_attn.o_proj,0.59731841,0.01500,1.113
5,mlp.up_proj,1.13487399,0.01500,1.148
5,mlp.gate_proj,1.18413568,0.01500,1.135
5,mlp.down_proj,1.55033576,0.01500,2.881
6,self_attn.k_proj,1.86866426,0.01500,1.072
6,self_attn.v_proj,0.21436407,0.01500,1.075
6,self_attn.q_proj,2.72684455,0.01500,1.111
6,self_attn.o_proj,0.75209558,0.01500,1.127
6,mlp.up_proj,1.31616020,0.01500,1.132
6,mlp.gate_proj,1.32581091,0.01500,1.139
6,mlp.down_proj,2.13556457,0.01500,2.880
7,self_attn.k_proj,1.53838611,0.01500,1.087
7,self_attn.v_proj,0.22950518,0.01500,1.071
7,self_attn.q_proj,1.99251246,0.01500,1.109
7,self_attn.o_proj,0.50463128,0.01500,1.118
7,mlp.up_proj,1.58821356,0.01500,1.125
7,mlp.gate_proj,1.58579147,0.01500,1.147
7,mlp.down_proj,13.17560577,0.01500,2.849
8,self_attn.k_proj,0.73372823,0.01500,1.068
8,self_attn.v_proj,0.23304689,0.01500,1.088
8,self_attn.q_proj,2.41669130,0.01500,1.118
8,self_attn.o_proj,0.46610335,0.01500,1.116
8,mlp.up_proj,1.65750051,0.01500,1.136
8,mlp.gate_proj,1.56000757,0.01500,1.156
8,mlp.down_proj,8.41586971,0.01500,2.874
9,self_attn.k_proj,1.64468992,0.01500,1.094
9,self_attn.v_proj,0.18850568,0.01500,1.094
9,self_attn.q_proj,1.78751516,0.01500,1.112
9,self_attn.o_proj,1.78545237,0.01500,1.117
9,mlp.up_proj,1.77682400,0.01500,1.127
9,mlp.gate_proj,1.57283258,0.01500,1.141
9,mlp.down_proj,14.36819839,0.01500,2.873
10,self_attn.k_proj,1.32247448,0.01500,1.061
10,self_attn.v_proj,0.22332871,0.01500,1.074
10,self_attn.q_proj,1.70967674,0.01500,1.109
10,self_attn.o_proj,2.30593014,0.01500,1.119
10,mlp.up_proj,2.46851778,0.01500,1.129
10,mlp.gate_proj,2.33083105,0.01500,1.137
10,mlp.down_proj,17.56273270,0.01500,2.857
11,self_attn.k_proj,1.05880129,0.01500,1.068
11,self_attn.v_proj,0.20641716,0.01500,1.074
11,self_attn.q_proj,2.14066696,0.01500,1.111
11,self_attn.o_proj,2.36638355,0.01500,1.138
11,mlp.up_proj,2.62533450,0.01500,1.126
11,mlp.gate_proj,2.36855841,0.01500,1.117
11,mlp.down_proj,36624136.00000000,0.01500,2.888
12,self_attn.k_proj,0.60637605,0.01500,1.081
12,self_attn.v_proj,0.20556667,0.01500,1.108
12,self_attn.q_proj,6.41779613,0.01500,1.111
12,self_attn.o_proj,1.40109611,0.01500,1.119
12,mlp.up_proj,10.91535950,0.01500,1.132
12,mlp.gate_proj,4.99505901,0.01500,1.146
12,mlp.down_proj,9760.42968750,0.01500,2.909
13,self_attn.k_proj,2.24922800,0.01500,1.082
13,self_attn.v_proj,0.27756080,0.01500,1.086
13,self_attn.q_proj,7.30099392,0.01500,1.109
13,self_attn.o_proj,2.96828890,0.01500,1.118
13,mlp.up_proj,2.91019154,0.01500,1.123
13,mlp.gate_proj,6.23261738,0.01500,1.141
13,mlp.down_proj,6.46631765,0.01500,2.860
14,self_attn.k_proj,0.69264430,0.01500,1.071
14,self_attn.v_proj,0.51544046,0.01500,1.091
14,self_attn.q_proj,3.18851161,0.01500,1.131
14,self_attn.o_proj,1.25791931,0.01500,1.127
14,mlp.up_proj,2.58898783,0.01500,1.112
14,mlp.gate_proj,5.24106836,0.01500,1.133
14,mlp.down_proj,9.01900768,0.01500,2.851
15,self_attn.k_proj,0.67096651,0.01500,1.094
15,self_attn.v_proj,0.36131397,0.01500,1.112
15,self_attn.q_proj,3.81791139,0.01500,1.097
15,self_attn.o_proj,2.25381660,0.01500,1.114
15,mlp.up_proj,2.34244204,0.01500,1.116
15,mlp.gate_proj,4.29145336,0.01500,1.132
15,mlp.down_proj,7.26017952,0.01500,2.923
16,self_attn.k_proj,0.64388847,0.01500,1.060
16,self_attn.v_proj,0.34459960,0.01500,1.078
16,self_attn.q_proj,4.61652613,0.01500,1.101
16,self_attn.o_proj,1.88339543,0.01500,1.119
16,mlp.up_proj,2.72254467,0.01500,1.121
16,mlp.gate_proj,3.13850927,0.01500,1.119
16,mlp.down_proj,6.84692860,0.01500,2.887
17,self_attn.k_proj,0.55838877,0.01500,1.057
17,self_attn.v_proj,0.51657593,0.01500,1.071
17,self_attn.q_proj,4.33557653,0.01500,1.092
17,self_attn.o_proj,2.56168294,0.01500,1.126
17,mlp.up_proj,3.06461382,0.01500,1.110
17,mlp.gate_proj,3.21341205,0.01500,1.114
17,mlp.down_proj,7.29544258,0.01500,2.854
18,self_attn.k_proj,0.68149984,0.01500,1.102
18,self_attn.v_proj,1.32401478,0.01500,1.124
18,self_attn.q_proj,7.70216036,0.01500,1.098
18,self_attn.o_proj,2.28013134,0.01500,1.119
18,mlp.up_proj,3.90698004,0.01500,1.116
18,mlp.gate_proj,4.11436844,0.01500,1.152
18,mlp.down_proj,11.87063789,0.01500,2.870
19,self_attn.k_proj,0.65415150,0.01500,1.066
19,self_attn.v_proj,0.53765559,0.01500,1.075
19,self_attn.q_proj,6.70729065,0.01500,1.112
19,self_attn.o_proj,3.07730746,0.01500,1.132
19,mlp.up_proj,3.57759047,0.01500,1.119
19,mlp.gate_proj,5.04411411,0.01500,1.120
19,mlp.down_proj,13.49418736,0.01500,2.850
20,self_attn.k_proj,0.45334548,0.01500,1.062
20,self_attn.v_proj,1.12238181,0.01500,1.083
20,self_attn.q_proj,5.45634222,0.01500,1.106
20,self_attn.o_proj,2.11403751,0.01500,1.122
20,mlp.up_proj,3.80852771,0.01500,1.123
20,mlp.gate_proj,4.78546810,0.01500,1.129
20,mlp.down_proj,15.71007252,0.01500,2.860
21,self_attn.k_proj,0.67353952,0.01500,1.056
21,self_attn.v_proj,0.74522316,0.01500,1.084
21,self_attn.q_proj,4.39328623,0.01500,1.095
21,self_attn.o_proj,2.93690538,0.01500,1.109
21,mlp.up_proj,4.77232122,0.01500,1.108
21,mlp.gate_proj,5.83200645,0.01500,1.138
21,mlp.down_proj,19.96510315,0.01500,2.825
22,self_attn.k_proj,0.63552809,0.01500,1.060
22,self_attn.v_proj,1.77812839,0.01500,1.101
22,self_attn.q_proj,6.14302778,0.01500,1.112
22,self_attn.o_proj,3.85619378,0.01500,1.108
22,mlp.up_proj,5.24628830,0.01500,1.106
22,mlp.gate_proj,8.02893066,0.01500,1.106
22,mlp.down_proj,24.18618774,0.01500,2.823
23,self_attn.k_proj,0.82243836,0.01500,1.073
23,self_attn.v_proj,2.90332031,0.01500,1.065
23,self_attn.q_proj,9.50726032,0.01500,1.098
23,self_attn.o_proj,8.13974857,0.01500,1.113
23,mlp.up_proj,5.42801857,0.01500,1.099
23,mlp.gate_proj,10.77536011,0.01500,1.128
23,mlp.down_proj,29.22331047,0.01500,2.812
24,self_attn.k_proj,0.60857439,0.01500,1.061
24,self_attn.v_proj,1.17702281,0.01500,1.069
24,self_attn.q_proj,6.26180887,0.01500,1.110
24,self_attn.o_proj,4.30931950,0.01500,1.096
24,mlp.up_proj,5.46759701,0.01500,1.095
24,mlp.gate_proj,10.43561554,0.01500,1.102
24,mlp.down_proj,31.56058502,0.01500,2.808
25,self_attn.k_proj,0.78283930,0.01500,1.041
25,self_attn.v_proj,1.24567127,0.01500,1.058
25,self_attn.q_proj,4.97283077,0.01500,1.095
25,self_attn.o_proj,5.16120386,0.01500,1.105
25,mlp.up_proj,6.94152546,0.01500,1.102
25,mlp.gate_proj,9.48820877,0.01500,1.099
25,mlp.down_proj,37.16706085,0.01500,2.802
26,self_attn.k_proj,0.95313138,0.01500,1.052
26,self_attn.v_proj,1.37231970,0.01500,1.054
26,self_attn.q_proj,6.39235163,0.01500,1.087
26,self_attn.o_proj,5.90192604,0.01500,1.090
26,mlp.up_proj,12.41309357,0.01500,1.094
26,mlp.gate_proj,9.54691982,0.01500,1.093
26,mlp.down_proj,37.73841095,0.01500,2.798
27,self_attn.k_proj,0.49448842,0.01500,1.041
27,self_attn.v_proj,0.81519926,0.01500,1.044
27,self_attn.q_proj,5.96102524,0.01500,1.087
27,self_attn.o_proj,5.79659319,0.01500,1.101
27,mlp.up_proj,14.86005974,0.01500,1.099
27,mlp.gate_proj,29.81634903,0.01500,1.100
27,mlp.down_proj,702.13244629,0.01500,2.865
28,self_attn.k_proj,0.60215271,0.01500,1.045
28,self_attn.v_proj,1.07407022,0.01500,1.044
28,self_attn.q_proj,7.19515991,0.01500,1.075
28,self_attn.o_proj,6.81128788,0.01500,1.090
28,mlp.up_proj,28.30822754,0.01500,1.100
28,mlp.gate_proj,35.86479950,0.01500,1.100
28,mlp.down_proj,33054578.00000000,0.01500,2.789
29,self_attn.k_proj,0.62672096,0.01500,1.042
29,self_attn.v_proj,0.87135106,0.01500,1.051
29,self_attn.q_proj,12.68386078,0.01500,1.077
29,self_attn.o_proj,41.61279678,0.01500,1.103
29,mlp.up_proj,224.53115845,0.01500,1.092
29,mlp.gate_proj,142.67680359,0.01500,1.107
29,mlp.down_proj,10202.70410156,0.01500,2.805