|
layer,module,loss,damp,time
|
|
0,self_attn.k_proj,0.02492,0.01000,0.525
|
|
0,self_attn.v_proj,0.00294,0.01000,0.311
|
|
0,self_attn.q_proj,0.11607,0.01000,0.311
|
|
0,self_attn.o_proj,0.01075,0.01000,0.317
|
|
0,mlp.up_proj,0.06281,0.01000,0.376
|
|
0,mlp.gate_proj,0.08242,0.01000,0.377
|
|
0,mlp.down_proj,0.01717,0.01000,1.851
|
|
1,self_attn.k_proj,0.00611,0.01000,0.304
|
|
1,self_attn.v_proj,0.00105,0.01000,0.301
|
|
1,self_attn.q_proj,0.02166,0.01000,0.359
|
|
1,self_attn.o_proj,0.00488,0.01000,0.301
|
|
1,mlp.up_proj,33.61324,0.01000,0.384
|
|
1,mlp.gate_proj,44.10564,0.01000,0.382
|
|
1,mlp.down_proj,86.37712,0.01150,1.933
|
|
2,self_attn.k_proj,0.00515,0.01000,0.312
|
|
2,self_attn.v_proj,0.00131,0.01000,0.312
|
|
2,self_attn.q_proj,0.02350,0.01000,0.317
|
|
2,self_attn.o_proj,0.00436,0.01000,0.303
|
|
2,mlp.up_proj,3.17318,0.01000,0.392
|
|
2,mlp.gate_proj,3.04438,0.01000,0.389
|
|
2,mlp.down_proj,0.36477,0.01000,1.829
|
|
3,self_attn.k_proj,0.01766,0.01000,0.312
|
|
3,self_attn.v_proj,0.00325,0.01000,0.305
|
|
3,self_attn.q_proj,0.08171,0.01000,0.303
|
|
3,self_attn.o_proj,0.00389,0.01000,0.315
|
|
3,mlp.up_proj,2.92035,0.01000,0.380
|
|
3,mlp.gate_proj,3.56493,0.01000,0.386
|
|
3,mlp.down_proj,0.36580,0.01000,1.840
|
|
4,self_attn.k_proj,0.01346,0.01000,0.309
|
|
4,self_attn.v_proj,0.00445,0.01000,0.347
|
|
4,self_attn.q_proj,0.06788,0.01000,0.315
|
|
4,self_attn.o_proj,0.00535,0.01000,0.307
|
|
4,mlp.up_proj,2.09246,0.01000,0.372
|
|
4,mlp.gate_proj,3.32133,0.01000,0.373
|
|
4,mlp.down_proj,0.02293,0.01000,1.794
|
|
5,self_attn.k_proj,0.02415,0.01000,0.342
|
|
5,self_attn.v_proj,0.01077,0.01000,0.345
|
|
5,self_attn.q_proj,0.13446,0.01000,0.330
|
|
5,self_attn.o_proj,0.00286,0.01000,0.323
|
|
5,mlp.up_proj,3.12070,0.01000,0.376
|
|
5,mlp.gate_proj,4.24052,0.01000,0.375
|
|
5,mlp.down_proj,0.01281,0.01000,1.890
|
|
6,self_attn.k_proj,0.01575,0.01000,0.310
|
|
6,self_attn.v_proj,0.00902,0.01000,0.301
|
|
6,self_attn.q_proj,0.09437,0.01000,0.309
|
|
6,self_attn.o_proj,0.00904,0.01000,0.304
|
|
6,mlp.up_proj,3.62089,0.01000,0.376
|
|
6,mlp.gate_proj,4.67842,0.01000,0.377
|
|
6,mlp.down_proj,302.13599,0.01150,2.812
|
|
7,self_attn.k_proj,0.01845,0.01000,0.309
|
|
7,self_attn.v_proj,0.01332,0.01000,0.310
|
|
7,self_attn.q_proj,0.13009,0.01000,0.308
|
|
7,self_attn.o_proj,0.01129,0.01000,0.308
|
|
7,mlp.up_proj,2.63705,0.01000,0.377
|
|
7,mlp.gate_proj,3.50084,0.01000,0.383
|
|
7,mlp.down_proj,0.07220,0.01000,1.813
|
|
8,self_attn.k_proj,0.02072,0.01000,0.305
|
|
8,self_attn.v_proj,0.01378,0.01000,0.318
|
|
8,self_attn.q_proj,0.13361,0.01000,0.318
|
|
8,self_attn.o_proj,0.00984,0.01000,0.311
|
|
8,mlp.up_proj,2.40017,0.01000,0.375
|
|
8,mlp.gate_proj,3.57831,0.01000,0.373
|
|
8,mlp.down_proj,0.02811,0.01000,1.850
|
|
9,self_attn.k_proj,0.02001,0.01000,0.318
|
|
9,self_attn.v_proj,0.01114,0.01000,0.318
|
|
9,self_attn.q_proj,0.11113,0.01000,0.315
|
|
9,self_attn.o_proj,0.01068,0.01000,0.328
|
|
9,mlp.up_proj,2.04662,0.01000,0.380
|
|
9,mlp.gate_proj,3.31668,0.01000,0.377
|
|
9,mlp.down_proj,0.03126,0.01000,1.837
|
|
10,self_attn.k_proj,0.01916,0.01000,0.307
|
|
10,self_attn.v_proj,0.01567,0.01000,0.308
|
|
10,self_attn.q_proj,0.13137,0.01000,0.310
|
|
10,self_attn.o_proj,0.00836,0.01000,0.317
|
|
10,mlp.up_proj,1.37735,0.01000,0.386
|
|
10,mlp.gate_proj,2.27834,0.01000,0.376
|
|
10,mlp.down_proj,0.03523,0.01000,1.833
|
|
11,self_attn.k_proj,0.01605,0.01000,0.331
|
|
11,self_attn.v_proj,0.01337,0.01000,0.322
|
|
11,self_attn.q_proj,0.10693,0.01000,0.338
|
|
11,self_attn.o_proj,0.01003,0.01000,0.329
|
|
11,mlp.up_proj,0.65090,0.01000,0.377
|
|
11,mlp.gate_proj,0.93052,0.01000,0.381
|
|
11,mlp.down_proj,0.04017,0.01000,1.842
|
|
12,self_attn.k_proj,0.01832,0.01000,0.322
|
|
12,self_attn.v_proj,0.01308,0.01000,0.319
|
|
12,self_attn.q_proj,0.11686,0.01000,0.327
|
|
12,self_attn.o_proj,0.01222,0.01000,0.326
|
|
12,mlp.up_proj,0.74295,0.01000,0.385
|
|
12,mlp.gate_proj,1.08469,0.01000,0.384
|
|
12,mlp.down_proj,0.03477,0.01000,1.865
|
|
13,self_attn.k_proj,0.02904,0.01000,0.309
|
|
13,self_attn.v_proj,0.01042,0.01000,0.303
|
|
13,self_attn.q_proj,0.15010,0.01000,0.308
|
|
13,self_attn.o_proj,0.01055,0.01000,0.314
|
|
13,mlp.up_proj,0.46377,0.01000,0.379
|
|
13,mlp.gate_proj,0.48896,0.01000,0.393
|
|
13,mlp.down_proj,0.02837,0.01000,1.906
|
|
14,self_attn.k_proj,0.01903,0.01000,0.317
|
|
14,self_attn.v_proj,0.01184,0.01000,0.312
|
|
14,self_attn.q_proj,0.12252,0.01000,0.326
|
|
14,self_attn.o_proj,0.01461,0.01000,0.315
|
|
14,mlp.up_proj,0.44762,0.01000,0.384
|
|
14,mlp.gate_proj,0.47111,0.01000,0.388
|
|
14,mlp.down_proj,0.03708,0.01000,1.885
|
|
15,self_attn.k_proj,0.01979,0.01000,0.323
|
|
15,self_attn.v_proj,0.01177,0.01000,0.314
|
|
15,self_attn.q_proj,0.12753,0.01000,0.325
|
|
15,self_attn.o_proj,0.01587,0.01000,0.318
|
|
15,mlp.up_proj,0.41492,0.01000,0.395
|
|
15,mlp.gate_proj,0.39752,0.01000,0.381
|
|
15,mlp.down_proj,0.02674,0.01000,1.862
|
|
16,self_attn.k_proj,0.02060,0.01000,0.328
|
|
16,self_attn.v_proj,0.01169,0.01000,0.320
|
|
16,self_attn.q_proj,0.12014,0.01000,0.323
|
|
16,self_attn.o_proj,0.01013,0.01000,0.317
|
|
16,mlp.up_proj,0.40758,0.01000,0.388
|
|
16,mlp.gate_proj,0.42216,0.01000,0.417
|
|
16,mlp.down_proj,0.04034,0.01000,1.877
|
|
17,self_attn.k_proj,0.02709,0.01000,0.335
|
|
17,self_attn.v_proj,0.01575,0.01000,0.361
|
|
17,self_attn.q_proj,0.16969,0.01000,0.478
|
|
17,self_attn.o_proj,0.01246,0.01000,0.313
|
|
17,mlp.up_proj,0.37242,0.01000,0.378
|
|
17,mlp.gate_proj,0.36916,0.01000,0.391
|
|
17,mlp.down_proj,0.08583,0.01000,1.857
|
|
18,self_attn.k_proj,0.01850,0.01000,0.334
|
|
18,self_attn.v_proj,0.01267,0.01000,0.316
|
|
18,self_attn.q_proj,0.12267,0.01000,0.315
|
|
18,self_attn.o_proj,0.02005,0.01000,0.313
|
|
18,mlp.up_proj,0.37420,0.01000,0.392
|
|
18,mlp.gate_proj,0.38857,0.01000,0.396
|
|
18,mlp.down_proj,0.02179,0.01000,1.844
|
|
19,self_attn.k_proj,0.02543,0.01000,0.317
|
|
19,self_attn.v_proj,0.01350,0.01000,0.313
|
|
19,self_attn.q_proj,0.14413,0.01000,0.321
|
|
19,self_attn.o_proj,0.01953,0.01000,0.315
|
|
19,mlp.up_proj,0.36482,0.01000,0.378
|
|
19,mlp.gate_proj,0.35452,0.01000,0.394
|
|
19,mlp.down_proj,0.02073,0.01000,1.884
|
|
20,self_attn.k_proj,0.02436,0.01000,0.309
|
|
20,self_attn.v_proj,0.02385,0.01000,0.318
|
|
20,self_attn.q_proj,0.21024,0.01000,0.308
|
|
20,self_attn.o_proj,0.01820,0.01000,0.310
|
|
20,mlp.up_proj,0.37739,0.01000,0.404
|
|
20,mlp.gate_proj,0.36945,0.01000,0.392
|
|
20,mlp.down_proj,0.02357,0.01000,1.824
|
|
21,self_attn.k_proj,0.02344,0.01000,0.311
|
|
21,self_attn.v_proj,0.01694,0.01000,0.320
|
|
21,self_attn.q_proj,0.14892,0.01000,0.330
|
|
21,self_attn.o_proj,0.01645,0.01000,0.315
|
|
21,mlp.up_proj,0.38584,0.01000,0.376
|
|
21,mlp.gate_proj,0.41318,0.01000,0.392
|
|
21,mlp.down_proj,0.02412,0.01000,1.811
|
|
22,self_attn.k_proj,0.02461,0.01000,0.320
|
|
22,self_attn.v_proj,0.02272,0.01000,0.325
|
|
22,self_attn.q_proj,0.17470,0.01000,0.319
|
|
22,self_attn.o_proj,0.01448,0.01000,0.326
|
|
22,mlp.up_proj,0.40653,0.01000,0.389
|
|
22,mlp.gate_proj,0.41927,0.01000,0.392
|
|
22,mlp.down_proj,0.02593,0.01000,1.867
|
|
23,self_attn.k_proj,0.02775,0.01000,0.329
|
|
23,self_attn.v_proj,0.01436,0.01000,0.327
|
|
23,self_attn.q_proj,0.17269,0.01000,0.326
|
|
23,self_attn.o_proj,0.03151,0.01000,0.322
|
|
23,mlp.up_proj,0.45256,0.01000,0.372
|
|
23,mlp.gate_proj,0.43746,0.01000,0.378
|
|
23,mlp.down_proj,0.03640,0.01000,1.848
|
|
24,self_attn.k_proj,0.02138,0.01000,0.307
|
|
24,self_attn.v_proj,0.01727,0.01000,0.315
|
|
24,self_attn.q_proj,0.15001,0.01000,0.318
|
|
24,self_attn.o_proj,0.02432,0.01000,0.317
|
|
24,mlp.up_proj,0.49747,0.01000,0.380
|
|
24,mlp.gate_proj,0.48546,0.01000,0.405
|
|
24,mlp.down_proj,0.03852,0.01000,1.867
|
|
25,self_attn.k_proj,0.02145,0.01000,0.333
|
|
25,self_attn.v_proj,0.03011,0.01000,0.333
|
|
25,self_attn.q_proj,0.22257,0.01000,0.327
|
|
25,self_attn.o_proj,0.04651,0.01000,0.311
|
|
25,mlp.up_proj,0.55227,0.01000,0.392
|
|
25,mlp.gate_proj,0.53969,0.01000,0.394
|
|
25,mlp.down_proj,0.05975,0.01000,1.855
|
|
26,self_attn.k_proj,0.02050,0.01000,0.312
|
|
26,self_attn.v_proj,0.02565,0.01000,0.318
|
|
26,self_attn.q_proj,0.15829,0.01000,0.314
|
|
26,self_attn.o_proj,0.01995,0.01000,0.327
|
|
26,mlp.up_proj,0.66442,0.01000,0.378
|
|
26,mlp.gate_proj,0.61777,0.01000,0.383
|
|
26,mlp.down_proj,0.07678,0.01000,1.835
|
|
27,self_attn.k_proj,0.02527,0.01000,0.327
|
|
27,self_attn.v_proj,0.04113,0.01000,0.319
|
|
27,self_attn.q_proj,0.28250,0.01000,0.333
|
|
27,self_attn.o_proj,0.05472,0.01000,0.340
|
|
27,mlp.up_proj,0.74296,0.01000,0.388
|
|
27,mlp.gate_proj,0.72095,0.01000,0.383
|
|
27,mlp.down_proj,0.11280,0.01000,1.855
|
|
28,self_attn.k_proj,0.02487,0.01000,0.321
|
|
28,self_attn.v_proj,0.03989,0.01000,0.321
|
|
28,self_attn.q_proj,0.21990,0.01000,0.314
|
|
28,self_attn.o_proj,0.08156,0.01000,0.318
|
|
28,mlp.up_proj,0.86934,0.01000,0.380
|
|
28,mlp.gate_proj,0.85854,0.01000,0.394
|
|
28,mlp.down_proj,0.11322,0.01000,1.859
|
|
29,self_attn.k_proj,0.02944,0.01000,0.311
|
|
29,self_attn.v_proj,0.03956,0.01000,0.308
|
|
29,self_attn.q_proj,0.23179,0.01000,0.315
|
|
29,self_attn.o_proj,0.03262,0.01000,0.318
|
|
29,mlp.up_proj,1.05190,0.01000,0.377
|
|
29,mlp.gate_proj,1.02274,0.01000,0.378
|
|
29,mlp.down_proj,0.24230,0.01000,1.872
|
|
30,self_attn.k_proj,0.02382,0.01000,0.323
|
|
30,self_attn.v_proj,0.06437,0.01000,0.302
|
|
30,self_attn.q_proj,0.26883,0.01000,0.308
|
|
30,self_attn.o_proj,0.03537,0.01000,0.304
|
|
30,mlp.up_proj,1.76454,0.01000,0.376
|
|
30,mlp.gate_proj,1.63980,0.01000,0.386
|
|
30,mlp.down_proj,3.21348,0.01000,1.915
|
|
31,self_attn.k_proj,0.02542,0.01000,0.320
|
|
31,self_attn.v_proj,0.05646,0.01000,0.314
|
|
31,self_attn.q_proj,0.26133,0.01000,0.309
|
|
31,self_attn.o_proj,0.11226,0.01000,0.309
|
|
31,mlp.up_proj,1.65549,0.01000,0.379
|
|
31,mlp.gate_proj,1.43243,0.01000,0.385
|
|
31,mlp.down_proj,0.53940,0.01000,1.823
|
|
32,self_attn.k_proj,0.03259,0.01000,0.314
|
|
32,self_attn.v_proj,0.12466,0.01000,0.308
|
|
32,self_attn.q_proj,0.37828,0.01000,0.313
|
|
32,self_attn.o_proj,0.25247,0.01000,0.305
|
|
32,mlp.up_proj,1.61365,0.01000,0.378
|
|
32,mlp.gate_proj,1.40892,0.01000,0.372
|
|
32,mlp.down_proj,0.40446,0.01000,1.793
|
|
33,self_attn.k_proj,0.03303,0.01000,0.312
|
|
33,self_attn.v_proj,0.36150,0.01000,0.305
|
|
33,self_attn.q_proj,0.40468,0.01000,0.306
|
|
33,self_attn.o_proj,0.69143,0.01000,0.304
|
|
33,mlp.up_proj,1.46704,0.01000,0.394
|
|
33,mlp.gate_proj,1.19369,0.01000,0.383
|
|
33,mlp.down_proj,0.65678,0.01000,1.861
|
|
34,self_attn.k_proj,0.02516,0.01000,0.309
|
|
34,self_attn.v_proj,0.07476,0.01000,0.313
|
|
34,self_attn.q_proj,0.22417,0.01000,0.326
|
|
34,self_attn.o_proj,0.16745,0.01000,0.321
|
|
34,mlp.up_proj,1.71218,0.01000,0.383
|
|
34,mlp.gate_proj,1.46625,0.01000,0.390
|
|
34,mlp.down_proj,0.62922,0.01000,1.861
|
|
35,self_attn.k_proj,0.02152,0.01000,0.298
|
|
35,self_attn.v_proj,0.06205,0.01000,0.314
|
|
35,self_attn.q_proj,0.20710,0.01000,0.316
|
|
35,self_attn.o_proj,0.14783,0.01000,0.304
|
|
35,mlp.up_proj,2.95869,0.01000,0.378
|
|
35,mlp.gate_proj,2.88873,0.01000,0.387
|
|
35,mlp.down_proj,3.13214,0.01000,1.831
|
|
|