wanzhenchn's picture
Add files using upload-large-folder tool
863a5a6 verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00155976,0.01000,1.062
0,self_attn.v_proj,0.00025913,0.01000,0.787
0,self_attn.q_proj,0.00719704,0.01000,0.787
0,self_attn.o_proj,0.00054527,0.01000,0.788
0,mlp.up_proj,0.01172396,0.01000,1.031
0,mlp.gate_proj,0.05030622,0.01000,0.789
0,mlp.down_proj,0.00242973,0.01000,5.240
1,self_attn.k_proj,0.00112853,0.01000,0.799
1,self_attn.v_proj,0.00027177,0.01000,0.784
1,self_attn.q_proj,0.00409606,0.01000,0.787
1,self_attn.o_proj,0.00012127,0.01000,0.794
1,mlp.up_proj,0.16570595,0.01000,1.101
1,mlp.gate_proj,0.24966781,0.01000,0.792
1,mlp.down_proj,0.00164500,0.01000,5.814
2,self_attn.k_proj,0.00335347,0.01000,0.799
2,self_attn.v_proj,0.00058709,0.01000,0.785
2,self_attn.q_proj,0.01229042,0.01000,0.787
2,self_attn.o_proj,0.00026304,0.01000,0.793
2,mlp.up_proj,0.17873849,0.01000,0.842
2,mlp.gate_proj,0.27987424,0.01000,0.789
2,mlp.down_proj,0.00199898,0.01000,5.365
3,self_attn.k_proj,0.00343811,0.01000,0.800
3,self_attn.v_proj,0.00084825,0.01000,0.789
3,self_attn.q_proj,0.01284988,0.01000,0.789
3,self_attn.o_proj,0.00098652,0.01000,0.793
3,mlp.up_proj,0.40582055,0.01000,1.387
3,mlp.gate_proj,0.51479346,0.01000,0.789
3,mlp.down_proj,0.00173161,0.01250,5.484
4,self_attn.k_proj,0.00593009,0.01000,0.797
4,self_attn.v_proj,0.00177643,0.01000,0.784
4,self_attn.q_proj,0.02622460,0.01000,0.786
4,self_attn.o_proj,0.00066147,0.01000,0.791
4,mlp.up_proj,0.32957339,0.01000,0.886
4,mlp.gate_proj,0.46538600,0.01000,0.788
4,mlp.down_proj,0.00381376,0.01250,5.721
5,self_attn.k_proj,0.00514847,0.01000,0.799
5,self_attn.v_proj,0.00198115,0.01000,0.785
5,self_attn.q_proj,0.02455240,0.01000,0.783
5,self_attn.o_proj,0.00062956,0.01000,0.791
5,mlp.up_proj,0.47762388,0.01000,1.405
5,mlp.gate_proj,0.56400013,0.01000,0.787
5,mlp.down_proj,0.00257655,0.01000,5.255
6,self_attn.k_proj,0.00314261,0.01000,0.800
6,self_attn.v_proj,0.00155135,0.01000,0.784
6,self_attn.q_proj,0.01539165,0.01000,0.784
6,self_attn.o_proj,0.00091197,0.01000,0.788
6,mlp.up_proj,0.09667324,0.01000,1.931
6,mlp.gate_proj,0.13307354,0.01000,0.786
6,mlp.down_proj,0.00632601,0.01000,5.067
7,self_attn.k_proj,0.00304140,0.01000,0.798
7,self_attn.v_proj,0.00270048,0.01000,0.782
7,self_attn.q_proj,0.01698850,0.01000,0.784
7,self_attn.o_proj,0.00212090,0.01000,0.790
7,mlp.up_proj,0.08855421,0.01000,1.009
7,mlp.gate_proj,0.09552005,0.01000,0.785
7,mlp.down_proj,0.01180775,0.01000,4.990
8,self_attn.k_proj,0.00608621,0.01000,0.791
8,self_attn.v_proj,0.00238760,0.01000,0.780
8,self_attn.q_proj,0.02694480,0.01000,0.783
8,self_attn.o_proj,0.00259366,0.01000,0.790
8,mlp.up_proj,0.10740142,0.01000,1.080
8,mlp.gate_proj,0.10944308,0.01000,0.789
8,mlp.down_proj,0.01293161,0.01000,5.047
9,self_attn.k_proj,0.00471512,0.01000,0.801
9,self_attn.v_proj,0.00388974,0.01000,0.789
9,self_attn.q_proj,0.02587198,0.01000,0.782
9,self_attn.o_proj,0.00469003,0.01000,0.790
9,mlp.up_proj,0.20957302,0.01000,0.854
9,mlp.gate_proj,0.32561457,0.01000,0.788
9,mlp.down_proj,0.01337012,0.01000,5.412
10,self_attn.k_proj,0.00471528,0.01000,0.792
10,self_attn.v_proj,0.00264271,0.01000,0.781
10,self_attn.q_proj,0.02393553,0.01000,0.784
10,self_attn.o_proj,0.00264381,0.01000,0.788
10,mlp.up_proj,0.12181626,0.01000,0.950
10,mlp.gate_proj,0.13350184,0.01000,0.786
10,mlp.down_proj,0.01278039,0.01000,5.173
11,self_attn.k_proj,0.00577600,0.01000,0.792
11,self_attn.v_proj,0.00224589,0.01000,0.788
11,self_attn.q_proj,0.02511147,0.01000,0.786
11,self_attn.o_proj,0.00350016,0.01000,0.793
11,mlp.up_proj,0.11557153,0.01000,1.499
11,mlp.gate_proj,0.11823536,0.01000,0.798
11,mlp.down_proj,0.01270626,0.01000,4.847
12,self_attn.k_proj,0.00642343,0.01000,0.791
12,self_attn.v_proj,0.00316933,0.01000,0.781
12,self_attn.q_proj,0.02910189,0.01000,0.782
12,self_attn.o_proj,0.00412563,0.01000,0.789
12,mlp.up_proj,0.11880670,0.01000,1.194
12,mlp.gate_proj,0.11504072,0.01000,0.784
12,mlp.down_proj,0.01432998,0.01000,5.186
13,self_attn.k_proj,0.00591280,0.01000,0.794
13,self_attn.v_proj,0.00406316,0.01000,0.782
13,self_attn.q_proj,0.03183017,0.01000,0.784
13,self_attn.o_proj,0.00672564,0.01000,0.788
13,mlp.up_proj,0.11748554,0.01000,1.138
13,mlp.gate_proj,0.12213729,0.01000,0.788
13,mlp.down_proj,0.01387714,0.01000,5.608
14,self_attn.k_proj,0.00827686,0.01000,0.793
14,self_attn.v_proj,0.00373706,0.01000,0.781
14,self_attn.q_proj,0.04359435,0.01000,0.782
14,self_attn.o_proj,0.00580014,0.01000,0.788
14,mlp.up_proj,0.12862808,0.01000,0.996
14,mlp.gate_proj,0.12646139,0.01000,0.784
14,mlp.down_proj,0.01575416,0.01000,5.376
15,self_attn.k_proj,0.00811000,0.01000,0.800
15,self_attn.v_proj,0.00342697,0.01000,0.786
15,self_attn.q_proj,0.03669517,0.01000,0.785
15,self_attn.o_proj,0.00433463,0.01000,0.795
15,mlp.up_proj,0.12033606,0.01000,1.124
15,mlp.gate_proj,0.11524273,0.01000,0.791
15,mlp.down_proj,0.01562963,0.01000,6.173
16,self_attn.k_proj,0.00680479,0.01000,0.802
16,self_attn.v_proj,0.00406550,0.01000,0.787
16,self_attn.q_proj,0.03531701,0.01000,0.789
16,self_attn.o_proj,0.00676867,0.01000,0.795
16,mlp.up_proj,0.12406420,0.01000,0.953
16,mlp.gate_proj,0.11881709,0.01000,0.793
16,mlp.down_proj,0.01533428,0.01000,5.114
17,self_attn.k_proj,0.00725654,0.01000,0.797
17,self_attn.v_proj,0.00513020,0.01000,0.787
17,self_attn.q_proj,0.04127063,0.01000,0.787
17,self_attn.o_proj,0.00535848,0.01000,0.794
17,mlp.up_proj,0.14923008,0.01000,1.520
17,mlp.gate_proj,0.13929732,0.01000,0.793
17,mlp.down_proj,0.02103773,0.01000,5.127
18,self_attn.k_proj,0.00559972,0.01000,0.793
18,self_attn.v_proj,0.00583129,0.01000,0.782
18,self_attn.q_proj,0.03417122,0.01000,0.786
18,self_attn.o_proj,0.00802413,0.01000,0.788
18,mlp.up_proj,0.16005410,0.01000,0.985
18,mlp.gate_proj,0.14732890,0.01000,0.787
18,mlp.down_proj,0.02358853,0.01000,5.221
19,self_attn.k_proj,0.00579194,0.01000,0.793
19,self_attn.v_proj,0.00709500,0.01000,0.794
19,self_attn.q_proj,0.04169997,0.01000,0.787
19,self_attn.o_proj,0.00951104,0.01000,0.789
19,mlp.up_proj,0.17972152,0.01000,0.977
19,mlp.gate_proj,0.17223045,0.01000,0.793
19,mlp.down_proj,0.02714180,0.01000,5.023
20,self_attn.k_proj,0.00632930,0.01000,0.795
20,self_attn.v_proj,0.00811989,0.01000,0.784
20,self_attn.q_proj,0.04095495,0.01000,0.781
20,self_attn.o_proj,0.00566612,0.01000,0.788
20,mlp.up_proj,0.23348106,0.01000,0.937
20,mlp.gate_proj,0.22367485,0.01000,0.790
20,mlp.down_proj,0.05051873,0.01000,4.768
21,self_attn.k_proj,0.00692819,0.01000,0.809
21,self_attn.v_proj,0.01324287,0.01000,0.788
21,self_attn.q_proj,0.04916327,0.01000,0.798
21,self_attn.o_proj,0.02447969,0.01000,0.794
21,mlp.up_proj,0.31292075,0.01000,1.066
21,mlp.gate_proj,0.31510034,0.01000,0.784
21,mlp.down_proj,0.08189526,0.01000,4.754
22,self_attn.k_proj,0.00977395,0.01000,0.792
22,self_attn.v_proj,0.02283857,0.01000,0.783
22,self_attn.q_proj,0.07048599,0.01000,0.783
22,self_attn.o_proj,0.01367442,0.01000,0.791
22,mlp.up_proj,0.44392323,0.01000,1.053
22,mlp.gate_proj,0.44063938,0.01000,0.789
22,mlp.down_proj,0.14277048,0.01000,4.906
23,self_attn.k_proj,0.01447038,0.01000,0.807
23,self_attn.v_proj,0.03571455,0.01000,0.781
23,self_attn.q_proj,0.09172702,0.01000,0.789
23,self_attn.o_proj,0.03269874,0.01000,0.789
23,mlp.up_proj,0.62939668,0.01000,0.919
23,mlp.gate_proj,0.64281553,0.01000,0.785
23,mlp.down_proj,0.18784148,0.01000,5.470
24,self_attn.k_proj,0.01122671,0.01000,0.792
24,self_attn.v_proj,0.03257178,0.01000,0.781
24,self_attn.q_proj,0.08136713,0.01000,0.781
24,self_attn.o_proj,0.02107349,0.01000,0.785
24,mlp.up_proj,0.70693624,0.01000,1.003
24,mlp.gate_proj,0.66957319,0.01000,0.787
24,mlp.down_proj,0.24456905,0.01000,5.619
25,self_attn.k_proj,0.01374814,0.01000,0.803
25,self_attn.v_proj,0.05573160,0.01000,0.796
25,self_attn.q_proj,0.09728207,0.01000,0.790
25,self_attn.o_proj,0.03103936,0.01000,0.794
25,mlp.up_proj,0.92647898,0.01000,1.010
25,mlp.gate_proj,0.83161688,0.01000,0.787
25,mlp.down_proj,0.36596623,0.01000,5.688
26,self_attn.k_proj,0.01927220,0.01000,0.792
26,self_attn.v_proj,0.12979600,0.01000,0.781
26,self_attn.q_proj,0.15226346,0.01000,0.782
26,self_attn.o_proj,0.04822129,0.01000,0.787
26,mlp.up_proj,0.93774641,0.01000,0.959
26,mlp.gate_proj,0.82602507,0.01000,0.786
26,mlp.down_proj,0.00001807,0.01250,5.688
27,self_attn.k_proj,0.02325345,0.01000,0.799
27,self_attn.v_proj,0.19028476,0.01000,0.783
27,self_attn.q_proj,0.23687175,0.01000,0.791
27,self_attn.o_proj,0.06330681,0.01000,0.793
27,mlp.up_proj,1.18985558,0.01000,0.799
27,mlp.gate_proj,1.13962555,0.01000,0.799
27,mlp.down_proj,1.16460204,0.01000,4.988