3v324v23's picture
init
8545fab
layer,module,loss,damp,time
0,self_attn.k_proj,0.02492,0.01000,0.525
0,self_attn.v_proj,0.00294,0.01000,0.311
0,self_attn.q_proj,0.11607,0.01000,0.311
0,self_attn.o_proj,0.01075,0.01000,0.317
0,mlp.up_proj,0.06281,0.01000,0.376
0,mlp.gate_proj,0.08242,0.01000,0.377
0,mlp.down_proj,0.01717,0.01000,1.851
1,self_attn.k_proj,0.00611,0.01000,0.304
1,self_attn.v_proj,0.00105,0.01000,0.301
1,self_attn.q_proj,0.02166,0.01000,0.359
1,self_attn.o_proj,0.00488,0.01000,0.301
1,mlp.up_proj,33.61324,0.01000,0.384
1,mlp.gate_proj,44.10564,0.01000,0.382
1,mlp.down_proj,86.37712,0.01150,1.933
2,self_attn.k_proj,0.00515,0.01000,0.312
2,self_attn.v_proj,0.00131,0.01000,0.312
2,self_attn.q_proj,0.02350,0.01000,0.317
2,self_attn.o_proj,0.00436,0.01000,0.303
2,mlp.up_proj,3.17318,0.01000,0.392
2,mlp.gate_proj,3.04438,0.01000,0.389
2,mlp.down_proj,0.36477,0.01000,1.829
3,self_attn.k_proj,0.01766,0.01000,0.312
3,self_attn.v_proj,0.00325,0.01000,0.305
3,self_attn.q_proj,0.08171,0.01000,0.303
3,self_attn.o_proj,0.00389,0.01000,0.315
3,mlp.up_proj,2.92035,0.01000,0.380
3,mlp.gate_proj,3.56493,0.01000,0.386
3,mlp.down_proj,0.36580,0.01000,1.840
4,self_attn.k_proj,0.01346,0.01000,0.309
4,self_attn.v_proj,0.00445,0.01000,0.347
4,self_attn.q_proj,0.06788,0.01000,0.315
4,self_attn.o_proj,0.00535,0.01000,0.307
4,mlp.up_proj,2.09246,0.01000,0.372
4,mlp.gate_proj,3.32133,0.01000,0.373
4,mlp.down_proj,0.02293,0.01000,1.794
5,self_attn.k_proj,0.02415,0.01000,0.342
5,self_attn.v_proj,0.01077,0.01000,0.345
5,self_attn.q_proj,0.13446,0.01000,0.330
5,self_attn.o_proj,0.00286,0.01000,0.323
5,mlp.up_proj,3.12070,0.01000,0.376
5,mlp.gate_proj,4.24052,0.01000,0.375
5,mlp.down_proj,0.01281,0.01000,1.890
6,self_attn.k_proj,0.01575,0.01000,0.310
6,self_attn.v_proj,0.00902,0.01000,0.301
6,self_attn.q_proj,0.09437,0.01000,0.309
6,self_attn.o_proj,0.00904,0.01000,0.304
6,mlp.up_proj,3.62089,0.01000,0.376
6,mlp.gate_proj,4.67842,0.01000,0.377
6,mlp.down_proj,302.13599,0.01150,2.812
7,self_attn.k_proj,0.01845,0.01000,0.309
7,self_attn.v_proj,0.01332,0.01000,0.310
7,self_attn.q_proj,0.13009,0.01000,0.308
7,self_attn.o_proj,0.01129,0.01000,0.308
7,mlp.up_proj,2.63705,0.01000,0.377
7,mlp.gate_proj,3.50084,0.01000,0.383
7,mlp.down_proj,0.07220,0.01000,1.813
8,self_attn.k_proj,0.02072,0.01000,0.305
8,self_attn.v_proj,0.01378,0.01000,0.318
8,self_attn.q_proj,0.13361,0.01000,0.318
8,self_attn.o_proj,0.00984,0.01000,0.311
8,mlp.up_proj,2.40017,0.01000,0.375
8,mlp.gate_proj,3.57831,0.01000,0.373
8,mlp.down_proj,0.02811,0.01000,1.850
9,self_attn.k_proj,0.02001,0.01000,0.318
9,self_attn.v_proj,0.01114,0.01000,0.318
9,self_attn.q_proj,0.11113,0.01000,0.315
9,self_attn.o_proj,0.01068,0.01000,0.328
9,mlp.up_proj,2.04662,0.01000,0.380
9,mlp.gate_proj,3.31668,0.01000,0.377
9,mlp.down_proj,0.03126,0.01000,1.837
10,self_attn.k_proj,0.01916,0.01000,0.307
10,self_attn.v_proj,0.01567,0.01000,0.308
10,self_attn.q_proj,0.13137,0.01000,0.310
10,self_attn.o_proj,0.00836,0.01000,0.317
10,mlp.up_proj,1.37735,0.01000,0.386
10,mlp.gate_proj,2.27834,0.01000,0.376
10,mlp.down_proj,0.03523,0.01000,1.833
11,self_attn.k_proj,0.01605,0.01000,0.331
11,self_attn.v_proj,0.01337,0.01000,0.322
11,self_attn.q_proj,0.10693,0.01000,0.338
11,self_attn.o_proj,0.01003,0.01000,0.329
11,mlp.up_proj,0.65090,0.01000,0.377
11,mlp.gate_proj,0.93052,0.01000,0.381
11,mlp.down_proj,0.04017,0.01000,1.842
12,self_attn.k_proj,0.01832,0.01000,0.322
12,self_attn.v_proj,0.01308,0.01000,0.319
12,self_attn.q_proj,0.11686,0.01000,0.327
12,self_attn.o_proj,0.01222,0.01000,0.326
12,mlp.up_proj,0.74295,0.01000,0.385
12,mlp.gate_proj,1.08469,0.01000,0.384
12,mlp.down_proj,0.03477,0.01000,1.865
13,self_attn.k_proj,0.02904,0.01000,0.309
13,self_attn.v_proj,0.01042,0.01000,0.303
13,self_attn.q_proj,0.15010,0.01000,0.308
13,self_attn.o_proj,0.01055,0.01000,0.314
13,mlp.up_proj,0.46377,0.01000,0.379
13,mlp.gate_proj,0.48896,0.01000,0.393
13,mlp.down_proj,0.02837,0.01000,1.906
14,self_attn.k_proj,0.01903,0.01000,0.317
14,self_attn.v_proj,0.01184,0.01000,0.312
14,self_attn.q_proj,0.12252,0.01000,0.326
14,self_attn.o_proj,0.01461,0.01000,0.315
14,mlp.up_proj,0.44762,0.01000,0.384
14,mlp.gate_proj,0.47111,0.01000,0.388
14,mlp.down_proj,0.03708,0.01000,1.885
15,self_attn.k_proj,0.01979,0.01000,0.323
15,self_attn.v_proj,0.01177,0.01000,0.314
15,self_attn.q_proj,0.12753,0.01000,0.325
15,self_attn.o_proj,0.01587,0.01000,0.318
15,mlp.up_proj,0.41492,0.01000,0.395
15,mlp.gate_proj,0.39752,0.01000,0.381
15,mlp.down_proj,0.02674,0.01000,1.862
16,self_attn.k_proj,0.02060,0.01000,0.328
16,self_attn.v_proj,0.01169,0.01000,0.320
16,self_attn.q_proj,0.12014,0.01000,0.323
16,self_attn.o_proj,0.01013,0.01000,0.317
16,mlp.up_proj,0.40758,0.01000,0.388
16,mlp.gate_proj,0.42216,0.01000,0.417
16,mlp.down_proj,0.04034,0.01000,1.877
17,self_attn.k_proj,0.02709,0.01000,0.335
17,self_attn.v_proj,0.01575,0.01000,0.361
17,self_attn.q_proj,0.16969,0.01000,0.478
17,self_attn.o_proj,0.01246,0.01000,0.313
17,mlp.up_proj,0.37242,0.01000,0.378
17,mlp.gate_proj,0.36916,0.01000,0.391
17,mlp.down_proj,0.08583,0.01000,1.857
18,self_attn.k_proj,0.01850,0.01000,0.334
18,self_attn.v_proj,0.01267,0.01000,0.316
18,self_attn.q_proj,0.12267,0.01000,0.315
18,self_attn.o_proj,0.02005,0.01000,0.313
18,mlp.up_proj,0.37420,0.01000,0.392
18,mlp.gate_proj,0.38857,0.01000,0.396
18,mlp.down_proj,0.02179,0.01000,1.844
19,self_attn.k_proj,0.02543,0.01000,0.317
19,self_attn.v_proj,0.01350,0.01000,0.313
19,self_attn.q_proj,0.14413,0.01000,0.321
19,self_attn.o_proj,0.01953,0.01000,0.315
19,mlp.up_proj,0.36482,0.01000,0.378
19,mlp.gate_proj,0.35452,0.01000,0.394
19,mlp.down_proj,0.02073,0.01000,1.884
20,self_attn.k_proj,0.02436,0.01000,0.309
20,self_attn.v_proj,0.02385,0.01000,0.318
20,self_attn.q_proj,0.21024,0.01000,0.308
20,self_attn.o_proj,0.01820,0.01000,0.310
20,mlp.up_proj,0.37739,0.01000,0.404
20,mlp.gate_proj,0.36945,0.01000,0.392
20,mlp.down_proj,0.02357,0.01000,1.824
21,self_attn.k_proj,0.02344,0.01000,0.311
21,self_attn.v_proj,0.01694,0.01000,0.320
21,self_attn.q_proj,0.14892,0.01000,0.330
21,self_attn.o_proj,0.01645,0.01000,0.315
21,mlp.up_proj,0.38584,0.01000,0.376
21,mlp.gate_proj,0.41318,0.01000,0.392
21,mlp.down_proj,0.02412,0.01000,1.811
22,self_attn.k_proj,0.02461,0.01000,0.320
22,self_attn.v_proj,0.02272,0.01000,0.325
22,self_attn.q_proj,0.17470,0.01000,0.319
22,self_attn.o_proj,0.01448,0.01000,0.326
22,mlp.up_proj,0.40653,0.01000,0.389
22,mlp.gate_proj,0.41927,0.01000,0.392
22,mlp.down_proj,0.02593,0.01000,1.867
23,self_attn.k_proj,0.02775,0.01000,0.329
23,self_attn.v_proj,0.01436,0.01000,0.327
23,self_attn.q_proj,0.17269,0.01000,0.326
23,self_attn.o_proj,0.03151,0.01000,0.322
23,mlp.up_proj,0.45256,0.01000,0.372
23,mlp.gate_proj,0.43746,0.01000,0.378
23,mlp.down_proj,0.03640,0.01000,1.848
24,self_attn.k_proj,0.02138,0.01000,0.307
24,self_attn.v_proj,0.01727,0.01000,0.315
24,self_attn.q_proj,0.15001,0.01000,0.318
24,self_attn.o_proj,0.02432,0.01000,0.317
24,mlp.up_proj,0.49747,0.01000,0.380
24,mlp.gate_proj,0.48546,0.01000,0.405
24,mlp.down_proj,0.03852,0.01000,1.867
25,self_attn.k_proj,0.02145,0.01000,0.333
25,self_attn.v_proj,0.03011,0.01000,0.333
25,self_attn.q_proj,0.22257,0.01000,0.327
25,self_attn.o_proj,0.04651,0.01000,0.311
25,mlp.up_proj,0.55227,0.01000,0.392
25,mlp.gate_proj,0.53969,0.01000,0.394
25,mlp.down_proj,0.05975,0.01000,1.855
26,self_attn.k_proj,0.02050,0.01000,0.312
26,self_attn.v_proj,0.02565,0.01000,0.318
26,self_attn.q_proj,0.15829,0.01000,0.314
26,self_attn.o_proj,0.01995,0.01000,0.327
26,mlp.up_proj,0.66442,0.01000,0.378
26,mlp.gate_proj,0.61777,0.01000,0.383
26,mlp.down_proj,0.07678,0.01000,1.835
27,self_attn.k_proj,0.02527,0.01000,0.327
27,self_attn.v_proj,0.04113,0.01000,0.319
27,self_attn.q_proj,0.28250,0.01000,0.333
27,self_attn.o_proj,0.05472,0.01000,0.340
27,mlp.up_proj,0.74296,0.01000,0.388
27,mlp.gate_proj,0.72095,0.01000,0.383
27,mlp.down_proj,0.11280,0.01000,1.855
28,self_attn.k_proj,0.02487,0.01000,0.321
28,self_attn.v_proj,0.03989,0.01000,0.321
28,self_attn.q_proj,0.21990,0.01000,0.314
28,self_attn.o_proj,0.08156,0.01000,0.318
28,mlp.up_proj,0.86934,0.01000,0.380
28,mlp.gate_proj,0.85854,0.01000,0.394
28,mlp.down_proj,0.11322,0.01000,1.859
29,self_attn.k_proj,0.02944,0.01000,0.311
29,self_attn.v_proj,0.03956,0.01000,0.308
29,self_attn.q_proj,0.23179,0.01000,0.315
29,self_attn.o_proj,0.03262,0.01000,0.318
29,mlp.up_proj,1.05190,0.01000,0.377
29,mlp.gate_proj,1.02274,0.01000,0.378
29,mlp.down_proj,0.24230,0.01000,1.872
30,self_attn.k_proj,0.02382,0.01000,0.323
30,self_attn.v_proj,0.06437,0.01000,0.302
30,self_attn.q_proj,0.26883,0.01000,0.308
30,self_attn.o_proj,0.03537,0.01000,0.304
30,mlp.up_proj,1.76454,0.01000,0.376
30,mlp.gate_proj,1.63980,0.01000,0.386
30,mlp.down_proj,3.21348,0.01000,1.915
31,self_attn.k_proj,0.02542,0.01000,0.320
31,self_attn.v_proj,0.05646,0.01000,0.314
31,self_attn.q_proj,0.26133,0.01000,0.309
31,self_attn.o_proj,0.11226,0.01000,0.309
31,mlp.up_proj,1.65549,0.01000,0.379
31,mlp.gate_proj,1.43243,0.01000,0.385
31,mlp.down_proj,0.53940,0.01000,1.823
32,self_attn.k_proj,0.03259,0.01000,0.314
32,self_attn.v_proj,0.12466,0.01000,0.308
32,self_attn.q_proj,0.37828,0.01000,0.313
32,self_attn.o_proj,0.25247,0.01000,0.305
32,mlp.up_proj,1.61365,0.01000,0.378
32,mlp.gate_proj,1.40892,0.01000,0.372
32,mlp.down_proj,0.40446,0.01000,1.793
33,self_attn.k_proj,0.03303,0.01000,0.312
33,self_attn.v_proj,0.36150,0.01000,0.305
33,self_attn.q_proj,0.40468,0.01000,0.306
33,self_attn.o_proj,0.69143,0.01000,0.304
33,mlp.up_proj,1.46704,0.01000,0.394
33,mlp.gate_proj,1.19369,0.01000,0.383
33,mlp.down_proj,0.65678,0.01000,1.861
34,self_attn.k_proj,0.02516,0.01000,0.309
34,self_attn.v_proj,0.07476,0.01000,0.313
34,self_attn.q_proj,0.22417,0.01000,0.326
34,self_attn.o_proj,0.16745,0.01000,0.321
34,mlp.up_proj,1.71218,0.01000,0.383
34,mlp.gate_proj,1.46625,0.01000,0.390
34,mlp.down_proj,0.62922,0.01000,1.861
35,self_attn.k_proj,0.02152,0.01000,0.298
35,self_attn.v_proj,0.06205,0.01000,0.314
35,self_attn.q_proj,0.20710,0.01000,0.316
35,self_attn.o_proj,0.14783,0.01000,0.304
35,mlp.up_proj,2.95869,0.01000,0.378
35,mlp.gate_proj,2.88873,0.01000,0.387
35,mlp.down_proj,3.13214,0.01000,1.831