|
layer,module,loss,samples,damp,time
|
|
0,self_attn.k_proj,0.0000000243,0.05000,1.346
|
|
0,self_attn.v_proj,0.0000000040,0.05000,1.044
|
|
0,self_attn.q_proj,0.0000000903,0.05000,1.080
|
|
0,self_attn.o_proj,0.0000000000,0.05000,1.098
|
|
0,mlp.gate_proj,0.0000000940,0.05000,1.349
|
|
0,mlp.up_proj,0.0000000836,0.05000,1.323
|
|
0,mlp.down_proj,0.0000000001,0.05000,4.570
|
|
1,self_attn.k_proj,0.0000001356,0.05000,1.074
|
|
1,self_attn.v_proj,0.0000000265,0.05000,1.093
|
|
1,self_attn.q_proj,0.0000002987,0.05000,1.117
|
|
1,self_attn.o_proj,0.0000000001,0.05000,1.154
|
|
1,mlp.gate_proj,0.0000003163,0.05000,1.123
|
|
1,mlp.up_proj,0.0000002789,0.05000,1.105
|
|
1,mlp.down_proj,0.0000000908,0.05000,4.407
|
|
2,self_attn.k_proj,0.0000009065,0.05000,1.114
|
|
2,self_attn.v_proj,0.0000000839,0.05000,1.056
|
|
2,self_attn.q_proj,0.0000016890,0.05000,1.104
|
|
2,self_attn.o_proj,0.0000000001,0.05000,1.082
|
|
2,mlp.gate_proj,0.0000006744,0.05000,1.100
|
|
2,mlp.up_proj,0.0000005911,0.05000,1.105
|
|
2,mlp.down_proj,0.0000000003,0.05000,4.560
|
|
3,self_attn.k_proj,0.0000006056,0.05000,1.147
|
|
3,self_attn.v_proj,0.0000000826,0.05000,1.076
|
|
3,self_attn.q_proj,0.0000011741,0.05000,1.094
|
|
3,self_attn.o_proj,0.0000000001,0.05000,1.081
|
|
3,mlp.gate_proj,0.0000011593,0.05000,1.104
|
|
3,mlp.up_proj,0.0000010041,0.05000,1.086
|
|
3,mlp.down_proj,0.0000000005,0.05000,4.424
|
|
4,self_attn.k_proj,0.0000008699,0.05000,1.165
|
|
4,self_attn.v_proj,0.0000001383,0.05000,1.057
|
|
4,self_attn.q_proj,0.0000018787,0.05000,1.104
|
|
4,self_attn.o_proj,0.0000000002,0.05000,1.063
|
|
4,mlp.gate_proj,0.0000017767,0.05000,1.102
|
|
4,mlp.up_proj,0.0000014464,0.05000,1.073
|
|
4,mlp.down_proj,0.0000000010,0.05000,4.394
|
|
5,self_attn.k_proj,0.0000011964,0.05000,1.125
|
|
5,self_attn.v_proj,0.0000001727,0.05000,1.074
|
|
5,self_attn.q_proj,0.0000026247,0.05000,1.063
|
|
5,self_attn.o_proj,0.0000000004,0.05000,1.098
|
|
5,mlp.gate_proj,0.0000026750,0.05000,1.144
|
|
5,mlp.up_proj,0.0000020422,0.05000,1.143
|
|
5,mlp.down_proj,0.0000000018,0.05000,4.481
|
|
6,self_attn.k_proj,0.0000012233,0.05000,1.092
|
|
6,self_attn.v_proj,0.0000001751,0.05000,1.063
|
|
6,self_attn.q_proj,0.0000025896,0.05000,1.096
|
|
6,self_attn.o_proj,0.0000000005,0.05000,1.093
|
|
6,mlp.gate_proj,0.0000033022,0.05000,1.108
|
|
6,mlp.up_proj,0.0000025730,0.05000,1.122
|
|
6,mlp.down_proj,0.0000000026,0.05000,4.475
|
|
7,self_attn.k_proj,0.0000015788,0.05000,1.092
|
|
7,self_attn.v_proj,0.0000002271,0.05000,1.053
|
|
7,self_attn.q_proj,0.0000032580,0.05000,1.086
|
|
7,self_attn.o_proj,0.0000000009,0.05000,1.101
|
|
7,mlp.gate_proj,0.0000040918,0.05000,1.105
|
|
7,mlp.up_proj,0.0000031199,0.05000,1.098
|
|
7,mlp.down_proj,0.0000000035,0.05000,4.402
|
|
8,self_attn.k_proj,0.0000013194,0.05000,1.116
|
|
8,self_attn.v_proj,0.0000002595,0.05000,1.085
|
|
8,self_attn.q_proj,0.0000028454,0.05000,1.102
|
|
8,self_attn.o_proj,0.0000000011,0.05000,1.071
|
|
8,mlp.gate_proj,0.0000046629,0.05000,1.125
|
|
8,mlp.up_proj,0.0000036305,0.05000,1.095
|
|
8,mlp.down_proj,0.0000000043,0.05000,4.342
|
|
9,self_attn.k_proj,0.0000019476,0.05000,1.046
|
|
9,self_attn.v_proj,0.0000003167,0.05000,1.053
|
|
9,self_attn.q_proj,0.0000040997,0.05000,1.078
|
|
9,self_attn.o_proj,0.0000000013,0.05000,1.072
|
|
9,mlp.gate_proj,0.0000050292,0.05000,1.109
|
|
9,mlp.up_proj,0.0000040537,0.05000,1.096
|
|
9,mlp.down_proj,0.0000000050,0.05000,4.360
|
|
10,self_attn.k_proj,0.0000017725,0.05000,1.063
|
|
10,self_attn.v_proj,0.0000002921,0.05000,1.088
|
|
10,self_attn.q_proj,0.0000036800,0.05000,1.225
|
|
10,self_attn.o_proj,0.0000000018,0.05000,1.099
|
|
10,mlp.gate_proj,0.0000052495,0.05000,1.118
|
|
10,mlp.up_proj,0.0000043227,0.05000,1.088
|
|
10,mlp.down_proj,0.0000000060,0.05000,4.511
|
|
11,self_attn.k_proj,0.0000021077,0.05000,1.058
|
|
11,self_attn.v_proj,0.0000004395,0.05000,1.063
|
|
11,self_attn.q_proj,0.0000045010,0.05000,1.069
|
|
11,self_attn.o_proj,0.0000000029,0.05000,1.066
|
|
11,mlp.gate_proj,0.0000057856,0.05000,1.111
|
|
11,mlp.up_proj,0.0000048466,0.05000,1.083
|
|
11,mlp.down_proj,0.0000000072,0.05000,4.406
|
|
12,self_attn.k_proj,0.0000027316,0.05000,1.064
|
|
12,self_attn.v_proj,0.0000004806,0.05000,1.100
|
|
12,self_attn.q_proj,0.0000059322,0.05000,1.121
|
|
12,self_attn.o_proj,0.0000000029,0.05000,1.075
|
|
12,mlp.gate_proj,0.0000064971,0.05000,1.098
|
|
12,mlp.up_proj,0.0000055545,0.05000,1.127
|
|
12,mlp.down_proj,0.0000000088,0.05000,4.425
|
|
13,self_attn.k_proj,0.0000024133,0.05000,1.064
|
|
13,self_attn.v_proj,0.0000005040,0.05000,1.064
|
|
13,self_attn.q_proj,0.0000049132,0.05000,1.111
|
|
13,self_attn.o_proj,0.0000000038,0.05000,1.058
|
|
13,mlp.gate_proj,0.0000072860,0.05000,1.325
|
|
13,mlp.up_proj,0.0000064150,0.05000,1.165
|
|
13,mlp.down_proj,0.0000000112,0.05000,4.474
|
|
14,self_attn.k_proj,0.0000024321,0.05000,1.054
|
|
14,self_attn.v_proj,0.0000008004,0.05000,1.082
|
|
14,self_attn.q_proj,0.0000056635,0.05000,1.112
|
|
14,self_attn.o_proj,0.0000000058,0.05000,1.097
|
|
14,mlp.gate_proj,0.0000083033,0.05000,1.100
|
|
14,mlp.up_proj,0.0000073240,0.05000,1.117
|
|
14,mlp.down_proj,0.0000000147,0.05000,4.616
|
|
15,self_attn.k_proj,0.0000032265,0.05000,1.105
|
|
15,self_attn.v_proj,0.0000009160,0.05000,1.047
|
|
15,self_attn.q_proj,0.0000071495,0.05000,1.086
|
|
15,self_attn.o_proj,0.0000000060,0.05000,1.086
|
|
15,mlp.gate_proj,0.0000098523,0.05000,1.120
|
|
15,mlp.up_proj,0.0000083736,0.05000,1.130
|
|
15,mlp.down_proj,0.0000000185,0.05000,4.463
|
|
16,self_attn.k_proj,0.0000031272,0.05000,1.091
|
|
16,self_attn.v_proj,0.0000009370,0.05000,1.104
|
|
16,self_attn.q_proj,0.0000068247,0.05000,1.105
|
|
16,self_attn.o_proj,0.0000000068,0.05000,1.062
|
|
16,mlp.gate_proj,0.0000123035,0.05000,1.140
|
|
16,mlp.up_proj,0.0000099590,0.05000,1.118
|
|
16,mlp.down_proj,0.0000000257,0.05000,4.493
|
|
17,self_attn.k_proj,0.0000025959,0.05000,1.102
|
|
17,self_attn.v_proj,0.0000008746,0.05000,1.019
|
|
17,self_attn.q_proj,0.0000061843,0.05000,1.097
|
|
17,self_attn.o_proj,0.0000000070,0.05000,1.062
|
|
17,mlp.gate_proj,0.0000143714,0.05000,1.106
|
|
17,mlp.up_proj,0.0000116310,0.05000,1.075
|
|
17,mlp.down_proj,0.0000000354,0.05000,4.374
|
|
18,self_attn.k_proj,0.0000031679,0.05000,1.108
|
|
18,self_attn.v_proj,0.0000010451,0.05000,1.063
|
|
18,self_attn.q_proj,0.0000077381,0.05000,1.101
|
|
18,self_attn.o_proj,0.0000000081,0.05000,1.116
|
|
18,mlp.gate_proj,0.0000163663,0.05000,1.183
|
|
18,mlp.up_proj,0.0000131605,0.05000,1.079
|
|
18,mlp.down_proj,0.0000000498,0.05000,4.473
|
|
19,self_attn.k_proj,0.0000032494,0.05000,1.097
|
|
19,self_attn.v_proj,0.0000012439,0.05000,1.052
|
|
19,self_attn.q_proj,0.0000074487,0.05000,1.106
|
|
19,self_attn.o_proj,0.0000000095,0.05000,1.069
|
|
19,mlp.gate_proj,0.0000187246,0.05000,1.102
|
|
19,mlp.up_proj,0.0000147143,0.05000,1.099
|
|
19,mlp.down_proj,0.0000000669,0.05000,4.367
|
|
20,self_attn.k_proj,0.0000034868,0.05000,1.079
|
|
20,self_attn.v_proj,0.0000013987,0.05000,1.067
|
|
20,self_attn.q_proj,0.0000081005,0.05000,1.068
|
|
20,self_attn.o_proj,0.0000000096,0.05000,1.068
|
|
20,mlp.gate_proj,0.0000216847,0.05000,1.121
|
|
20,mlp.up_proj,0.0000165116,0.05000,1.085
|
|
20,mlp.down_proj,0.0000000704,0.05000,4.444
|
|
21,self_attn.k_proj,0.0000034291,0.05000,1.102
|
|
21,self_attn.v_proj,0.0000015221,0.05000,1.075
|
|
21,self_attn.q_proj,0.0000080014,0.05000,1.108
|
|
21,self_attn.o_proj,0.0000000102,0.05000,1.090
|
|
21,mlp.gate_proj,0.0000261188,0.05000,1.127
|
|
21,mlp.up_proj,0.0000185324,0.05000,1.129
|
|
21,mlp.down_proj,0.0000000756,0.05000,4.455
|
|
22,self_attn.k_proj,0.0000032560,0.05000,1.095
|
|
22,self_attn.v_proj,0.0000016688,0.05000,1.114
|
|
22,self_attn.q_proj,0.0000078390,0.05000,1.093
|
|
22,self_attn.o_proj,0.0000000073,0.05000,1.072
|
|
22,mlp.gate_proj,0.0000279689,0.05000,1.113
|
|
22,mlp.up_proj,0.0000200703,0.05000,1.082
|
|
22,mlp.down_proj,0.0000000813,0.05000,4.367
|
|
23,self_attn.k_proj,0.0000031836,0.05000,1.087
|
|
23,self_attn.v_proj,0.0000016718,0.05000,1.033
|
|
23,self_attn.q_proj,0.0000079744,0.05000,1.077
|
|
23,self_attn.o_proj,0.0000000097,0.05000,1.138
|
|
23,mlp.gate_proj,0.0000311143,0.05000,1.119
|
|
23,mlp.up_proj,0.0000222295,0.05000,1.104
|
|
23,mlp.down_proj,0.0000000910,0.05000,4.489
|
|
24,self_attn.k_proj,0.0000037302,0.05000,1.076
|
|
24,self_attn.v_proj,0.0000019298,0.05000,1.046
|
|
24,self_attn.q_proj,0.0000092244,0.05000,1.073
|
|
24,self_attn.o_proj,0.0000000099,0.05000,1.096
|
|
24,mlp.gate_proj,0.0000349600,0.05000,1.102
|
|
24,mlp.up_proj,0.0000245547,0.05000,1.057
|
|
24,mlp.down_proj,0.0000000984,0.05000,4.411
|
|
25,self_attn.k_proj,0.0000035627,0.05000,1.108
|
|
25,self_attn.v_proj,0.0000022298,0.05000,1.061
|
|
25,self_attn.q_proj,0.0000092782,0.05000,1.120
|
|
25,self_attn.o_proj,0.0000000102,0.05000,1.109
|
|
25,mlp.gate_proj,0.0000381017,0.05000,1.124
|
|
25,mlp.up_proj,0.0000269863,0.05000,1.131
|
|
25,mlp.down_proj,0.0000001128,0.05000,4.506
|
|
26,self_attn.k_proj,0.0000033970,0.05000,1.119
|
|
26,self_attn.v_proj,0.0000023643,0.05000,1.134
|
|
26,self_attn.q_proj,0.0000088182,0.05000,1.124
|
|
26,self_attn.o_proj,0.0000000131,0.05000,1.094
|
|
26,mlp.gate_proj,0.0000397645,0.05000,1.222
|
|
26,mlp.up_proj,0.0000291584,0.05000,1.126
|
|
26,mlp.down_proj,0.0000001288,0.05000,4.435
|
|
27,self_attn.k_proj,0.0000032655,0.05000,1.078
|
|
27,self_attn.v_proj,0.0000021690,0.05000,1.054
|
|
27,self_attn.q_proj,0.0000090136,0.05000,1.098
|
|
27,self_attn.o_proj,0.0000000146,0.05000,1.074
|
|
27,mlp.gate_proj,0.0000431077,0.05000,1.092
|
|
27,mlp.up_proj,0.0000319081,0.05000,1.129
|
|
27,mlp.down_proj,0.0000001526,0.05000,4.389
|
|
28,self_attn.k_proj,0.0000033885,0.05000,1.079
|
|
28,self_attn.v_proj,0.0000031190,0.05000,1.050
|
|
28,self_attn.q_proj,0.0000090153,0.05000,1.100
|
|
28,self_attn.o_proj,0.0000000257,0.05000,1.092
|
|
28,mlp.gate_proj,0.0000462653,0.05000,1.106
|
|
28,mlp.up_proj,0.0000354446,0.05000,1.100
|
|
28,mlp.down_proj,0.0000002016,0.05000,4.429
|
|
29,self_attn.k_proj,0.0000032734,0.05000,1.080
|
|
29,self_attn.v_proj,0.0000044012,0.05000,1.043
|
|
29,self_attn.q_proj,0.0000103499,0.05000,1.089
|
|
29,self_attn.o_proj,0.0000000528,0.05000,1.084
|
|
29,mlp.gate_proj,0.0000452730,0.05000,1.120
|
|
29,mlp.up_proj,0.0000361531,0.05000,1.125
|
|
29,mlp.down_proj,0.0000002568,0.05000,4.422
|
|
30,self_attn.k_proj,0.0000033870,0.05000,1.224
|
|
30,self_attn.v_proj,0.0000048556,0.05000,1.072
|
|
30,self_attn.q_proj,0.0000102100,0.05000,1.077
|
|
30,self_attn.o_proj,0.0000000454,0.05000,1.065
|
|
30,mlp.gate_proj,0.0000465985,0.05000,1.123
|
|
30,mlp.up_proj,0.0000379377,0.05000,1.112
|
|
30,mlp.down_proj,0.0000003248,0.05000,4.327
|
|
31,self_attn.k_proj,0.0000031314,0.05000,1.107
|
|
31,self_attn.v_proj,0.0000050672,0.05000,1.026
|
|
31,self_attn.q_proj,0.0000093823,0.05000,1.097
|
|
31,self_attn.o_proj,0.0000000755,0.05000,1.084
|
|
31,mlp.gate_proj,0.0000427195,0.05000,1.119
|
|
31,mlp.up_proj,0.0000335756,0.05000,1.123
|
|
31,mlp.down_proj,0.0000004450,0.05000,4.457
|
|
|