chentianqi's picture
Add files using upload-large-folder tool
d5b0d72 verified
layer,module,loss,damp,time
0,attn_out,0.46341,0.01000,0.954
0,k_proj,0.34266,0.01000,0.776
0,v_proj,0.20672,0.01000,0.765
0,q_proj,0.35039,0.01000,0.767
0,ff_proj,0.13190,0.01000,0.781
0,up_proj,0.12847,0.01000,0.780
0,ff_out,0.01228,0.01000,3.181
1,attn_out,0.01194,0.01000,0.770
1,k_proj,0.23597,0.01000,0.771
1,v_proj,0.09884,0.01000,0.771
1,q_proj,0.20662,0.01000,0.769
1,ff_proj,0.20367,0.01000,0.784
1,up_proj,0.19539,0.01000,0.781
1,ff_out,0.02346,0.01000,3.186
2,attn_out,0.01837,0.01000,0.777
2,k_proj,0.54666,0.01000,0.769
2,v_proj,0.15541,0.01000,0.773
2,q_proj,0.48452,0.01000,0.774
2,ff_proj,0.48127,0.01000,0.787
2,up_proj,0.46108,0.01000,0.786
2,ff_out,0.07804,0.01000,3.186
3,attn_out,0.03099,0.01000,0.772
3,k_proj,0.38418,0.01000,0.769
3,v_proj,0.19304,0.01000,0.771
3,q_proj,0.35970,0.01000,0.769
3,ff_proj,1.27731,0.01000,0.784
3,up_proj,1.22143,0.01000,0.782
3,ff_out,0.20094,0.01000,3.188
4,attn_out,0.12638,0.01000,0.773
4,k_proj,0.83292,0.01000,0.770
4,v_proj,0.38806,0.01000,0.772
4,q_proj,0.77561,0.01000,0.773
4,ff_proj,2.68135,0.01000,0.783
4,up_proj,2.55238,0.01000,0.786
4,ff_out,0.38676,0.01000,3.189
5,attn_out,0.16436,0.01000,0.769
5,k_proj,1.79130,0.01000,0.777
5,v_proj,0.82750,0.01000,0.768
5,q_proj,1.64704,0.01000,0.769
5,ff_proj,4.76394,0.01000,0.783
5,up_proj,4.49322,0.01000,0.782
5,ff_out,0.58687,0.01000,3.194
6,attn_out,0.20771,0.01000,0.780
6,k_proj,2.01228,0.01000,0.767
6,v_proj,1.03743,0.01000,0.768
6,q_proj,1.89607,0.01000,0.771
6,ff_proj,6.48302,0.01000,0.782
6,up_proj,6.10663,0.01000,0.784
6,ff_out,0.74378,0.01000,3.192
7,attn_out,0.36060,0.01000,0.771
7,k_proj,4.17220,0.01000,0.774
7,v_proj,2.44076,0.01000,0.768
7,q_proj,4.06058,0.01000,0.774
7,ff_proj,9.79079,0.01000,0.783
7,up_proj,9.06263,0.01000,0.783
7,ff_out,1.07243,0.01000,3.186
8,attn_out,0.39326,0.01000,0.787
8,k_proj,3.43061,0.01000,0.795
8,v_proj,2.17513,0.01000,0.789
8,q_proj,3.33074,0.01000,0.787
8,ff_proj,13.66650,0.01000,0.787
8,up_proj,12.39581,0.01000,0.783
8,ff_out,1.46948,0.01000,3.188
9,attn_out,0.44965,0.01000,0.768
9,k_proj,3.89497,0.01000,0.769
9,v_proj,2.59796,0.01000,0.769
9,q_proj,3.78964,0.01000,0.768
9,ff_proj,15.71218,0.01000,0.781
9,up_proj,14.43543,0.01000,0.783
9,ff_out,1.73658,0.01000,3.185
10,attn_out,0.70652,0.01000,0.771
10,k_proj,9.19544,0.01000,0.768
10,v_proj,5.84565,0.01000,0.769
10,q_proj,9.08747,0.01000,0.769
10,ff_proj,18.82842,0.01000,0.780
10,up_proj,17.43126,0.01000,0.784
10,ff_out,2.19000,0.01000,3.186
11,attn_out,0.86296,0.01000,0.772
11,k_proj,5.60106,0.01000,0.769
11,v_proj,3.91052,0.01000,0.770
11,q_proj,5.47517,0.01000,0.768
11,ff_proj,20.85402,0.01000,0.785
11,up_proj,19.44729,0.01000,0.786
11,ff_out,2.66935,0.01000,3.186
12,attn_out,1.22999,0.01000,0.768
12,k_proj,7.09898,0.01000,0.768
12,v_proj,5.29340,0.01000,0.770
12,q_proj,6.99607,0.01000,0.771
12,ff_proj,20.98769,0.01000,0.785
12,up_proj,20.04654,0.01000,0.781
12,ff_out,3.13588,0.01000,3.187
13,attn_out,2.20784,0.01000,0.770
13,k_proj,12.16435,0.01000,0.766
13,v_proj,9.20147,0.01000,0.775
13,q_proj,12.00730,0.01000,0.767
13,ff_proj,25.78384,0.01000,0.782
13,up_proj,24.78483,0.01000,0.788
13,ff_out,3.97851,0.01000,3.193
14,attn_out,2.15204,0.01000,0.771
14,k_proj,9.78138,0.01000,0.769
14,v_proj,7.98051,0.01000,0.771
14,q_proj,9.64774,0.01000,0.771
14,ff_proj,28.72415,0.01000,0.782
14,up_proj,28.31051,0.01000,0.780
14,ff_out,4.65950,0.01000,3.189
15,attn_out,2.43048,0.01000,0.772
15,k_proj,10.99642,0.01000,0.769
15,v_proj,9.12490,0.01000,0.769
15,q_proj,10.80180,0.01000,0.774
15,ff_proj,26.85725,0.01000,0.785
15,up_proj,27.94277,0.01000,0.788
15,ff_out,5.20905,0.01000,3.193
16,attn_out,3.47777,0.01000,0.782
16,k_proj,15.06714,0.01000,0.770
16,v_proj,13.86565,0.01000,0.768
16,q_proj,14.89437,0.01000,0.772
16,ff_proj,32.00780,0.01000,0.783
16,up_proj,33.22430,0.01000,0.782
16,ff_out,5.62781,0.01000,3.191
17,attn_out,4.15703,0.01000,0.773
17,k_proj,14.72787,0.01000,0.767
17,v_proj,13.57190,0.01000,0.769
17,q_proj,14.44084,0.01000,0.770
17,ff_proj,33.70467,0.01000,0.781
17,up_proj,36.58906,0.01000,0.781
17,ff_out,6.80083,0.01000,3.191
18,attn_out,4.32158,0.01000,0.770
18,k_proj,14.62437,0.01000,0.770
18,v_proj,14.06934,0.01000,0.769
18,q_proj,14.27620,0.01000,0.770
18,ff_proj,34.71724,0.01000,0.782
18,up_proj,39.04211,0.01000,0.783
18,ff_out,7.68221,0.01000,3.191
19,attn_out,4.92948,0.01000,0.768
19,k_proj,17.51657,0.01000,0.773
19,v_proj,17.43266,0.01000,0.770
19,q_proj,17.24541,0.01000,0.772
19,ff_proj,37.16630,0.01000,0.782
19,up_proj,43.14838,0.01000,0.782
19,ff_out,9.42345,0.01000,3.188
20,attn_out,6.12879,0.01000,0.769
20,k_proj,15.77261,0.01000,0.772
20,v_proj,17.70500,0.01000,0.769
20,q_proj,15.46614,0.01000,0.772
20,ff_proj,37.29077,0.01000,0.786
20,up_proj,44.48997,0.01000,0.784
20,ff_out,10.20414,0.01000,3.192
21,attn_out,6.42759,0.01000,0.768
21,k_proj,17.71529,0.01000,0.769
21,v_proj,20.06910,0.01000,0.771
21,q_proj,17.42245,0.01000,0.771
21,ff_proj,41.39098,0.01000,0.783
21,up_proj,50.89703,0.01000,0.784
21,ff_out,12.42898,0.01000,3.199
22,attn_out,7.56994,0.01000,0.768
22,k_proj,19.16720,0.01000,0.770
22,v_proj,25.46598,0.01000,0.770
22,q_proj,18.93143,0.01000,0.768
22,ff_proj,45.91537,0.01000,0.783
22,up_proj,57.92929,0.01000,0.786
22,ff_out,14.98442,0.01000,3.194
23,attn_out,7.94560,0.01000,0.771
23,k_proj,19.21059,0.01000,0.767
23,v_proj,25.61421,0.01000,0.770
23,q_proj,19.07206,0.01000,0.767
23,ff_proj,52.68341,0.01000,0.787
23,up_proj,69.04587,0.01000,0.785
23,ff_out,20.84775,0.01000,3.205
24,attn_out,9.99096,0.01000,0.778
24,k_proj,18.64584,0.01000,0.769
24,v_proj,27.92673,0.01000,0.780
24,q_proj,18.41230,0.01000,0.768
24,ff_proj,56.93608,0.01000,0.783
24,up_proj,76.87387,0.01000,0.792
24,ff_out,27.15800,0.01000,3.193
25,attn_out,12.65934,0.01000,0.769
25,k_proj,20.20930,0.01000,0.770
25,v_proj,34.10970,0.01000,0.768
25,q_proj,20.15265,0.01000,0.769
25,ff_proj,64.59988,0.01000,0.780
25,up_proj,83.80959,0.01000,0.782
25,ff_out,35.60532,0.01000,3.190
26,attn_out,13.90159,0.01000,0.772
26,k_proj,19.57176,0.01000,0.771
26,v_proj,38.59014,0.01000,0.770
26,q_proj,19.55781,0.01000,0.770
26,ff_proj,79.34944,0.01000,0.785
26,up_proj,100.75468,0.01000,0.783
26,ff_out,47.41343,0.01000,3.191
27,attn_out,14.04380,0.01000,0.772
27,k_proj,21.52296,0.01000,0.772
27,v_proj,49.67180,0.01000,0.773
27,q_proj,21.66185,0.01000,0.772
27,ff_proj,88.83227,0.01000,0.786
27,up_proj,109.52364,0.01000,0.783
27,ff_out,67.93266,0.01000,3.197
28,attn_out,18.71825,0.01000,0.773
28,k_proj,21.00661,0.01000,0.771
28,v_proj,54.85551,0.01000,0.771
28,q_proj,21.08429,0.01000,0.771
28,ff_proj,97.04969,0.01000,0.784
28,up_proj,116.35686,0.01000,0.785
28,ff_out,68.13924,0.01000,3.191
29,attn_out,17.44988,0.01000,0.774
29,k_proj,19.76582,0.01000,0.770
29,v_proj,61.01070,0.01000,0.770
29,q_proj,19.79408,0.01000,0.766
29,ff_proj,103.81013,0.01000,0.785
29,up_proj,125.43891,0.01000,0.784
29,ff_out,69.22803,0.01000,3.194
30,attn_out,28.99095,0.01000,0.771
30,k_proj,21.20842,0.01000,0.771
30,v_proj,90.21648,0.01000,0.769
30,q_proj,21.18415,0.01000,0.772
30,ff_proj,114.58118,0.01000,0.783
30,up_proj,136.53314,0.01000,0.784
30,ff_out,81.22633,0.01000,3.211
31,attn_out,73.61667,0.01000,0.772
31,k_proj,23.93774,0.01000,0.776
31,v_proj,113.72330,0.01000,0.773
31,q_proj,24.07770,0.01000,0.775
31,ff_proj,127.92827,0.01000,0.795
31,up_proj,148.89145,0.01000,0.796
31,ff_out,233.53690,0.01000,3.204