|
layer,module,loss,samples,damp,time
|
|
0,self_attn.k_proj,0.00006717,0.01000,0.743
|
|
0,self_attn.v_proj,0.00000782,0.01000,0.540
|
|
0,self_attn.q_proj,0.00026253,0.01000,0.537
|
|
0,self_attn.o_proj,0.00008649,0.01000,0.538
|
|
0,mlp.up_proj,0.00024544,0.01000,0.564
|
|
0,mlp.gate_proj,0.00042476,0.01000,0.558
|
|
0,mlp.down_proj,304.70507812,0.01250,4.287
|
|
1,self_attn.k_proj,0.00003458,0.01000,0.543
|
|
1,self_attn.v_proj,0.00001160,0.01000,0.540
|
|
1,self_attn.q_proj,0.00012922,0.01000,0.539
|
|
1,self_attn.o_proj,0.00001389,0.01000,0.540
|
|
1,mlp.up_proj,0.00507102,0.01000,0.564
|
|
1,mlp.gate_proj,0.00740672,0.01000,0.561
|
|
1,mlp.down_proj,201.20426941,0.01250,4.277
|
|
2,self_attn.k_proj,0.00002051,0.01000,0.545
|
|
2,self_attn.v_proj,0.00000462,0.01000,0.542
|
|
2,self_attn.q_proj,0.00008908,0.01000,0.541
|
|
2,self_attn.o_proj,0.00002082,0.01000,0.540
|
|
2,mlp.up_proj,0.00323103,0.01000,0.564
|
|
2,mlp.gate_proj,0.00482144,0.01000,0.559
|
|
2,mlp.down_proj,265.71157837,0.01250,4.258
|
|
3,self_attn.k_proj,0.00003836,0.01000,0.542
|
|
3,self_attn.v_proj,0.00001136,0.01000,0.542
|
|
3,self_attn.q_proj,0.00017052,0.01000,0.537
|
|
3,self_attn.o_proj,0.00010798,0.01000,0.541
|
|
3,mlp.up_proj,0.01222713,0.01000,0.562
|
|
3,mlp.gate_proj,0.01548911,0.01000,0.558
|
|
3,mlp.down_proj,0.12992305,0.01250,4.263
|
|
4,self_attn.k_proj,0.00000324,0.01000,0.543
|
|
4,self_attn.v_proj,0.00000160,0.01000,0.538
|
|
4,self_attn.q_proj,0.00001570,0.01000,0.539
|
|
4,self_attn.o_proj,0.00000409,0.01000,0.540
|
|
4,mlp.up_proj,0.00579107,0.01000,0.564
|
|
4,mlp.gate_proj,0.00821990,0.01000,0.562
|
|
4,mlp.down_proj,0.17879479,0.01250,4.295
|
|
5,self_attn.k_proj,0.00000587,0.01000,0.542
|
|
5,self_attn.v_proj,0.00000278,0.01000,0.539
|
|
5,self_attn.q_proj,0.00002992,0.01000,0.543
|
|
5,self_attn.o_proj,0.00000610,0.01000,0.544
|
|
5,mlp.up_proj,0.01783431,0.01000,0.566
|
|
5,mlp.gate_proj,0.02152922,0.01000,0.562
|
|
5,mlp.down_proj,7.94002533,0.01250,4.278
|
|
6,self_attn.k_proj,0.00000566,0.01000,0.546
|
|
6,self_attn.v_proj,0.00000298,0.01000,0.543
|
|
6,self_attn.q_proj,0.00002906,0.01000,0.545
|
|
6,self_attn.o_proj,0.00000604,0.01000,0.543
|
|
6,mlp.up_proj,0.00136981,0.01000,0.563
|
|
6,mlp.gate_proj,0.00192878,0.01000,0.563
|
|
6,mlp.down_proj,29.80362320,0.01250,4.302
|
|
7,self_attn.k_proj,0.00000723,0.01000,0.543
|
|
7,self_attn.v_proj,0.00000818,0.01000,0.543
|
|
7,self_attn.q_proj,0.00004528,0.01000,0.540
|
|
7,self_attn.o_proj,0.00000810,0.01000,0.542
|
|
7,mlp.up_proj,0.00104278,0.01000,0.565
|
|
7,mlp.gate_proj,0.00117535,0.01000,0.562
|
|
7,mlp.down_proj,73.25530243,0.01250,4.280
|
|
8,self_attn.k_proj,0.00000813,0.01000,0.540
|
|
8,self_attn.v_proj,0.00000380,0.01000,0.538
|
|
8,self_attn.q_proj,0.00003767,0.01000,0.538
|
|
8,self_attn.o_proj,0.00001477,0.01000,0.540
|
|
8,mlp.up_proj,0.00108770,0.01000,0.566
|
|
8,mlp.gate_proj,0.00114401,0.01000,0.563
|
|
8,mlp.down_proj,118.72260284,0.01250,4.273
|
|
9,self_attn.k_proj,0.00000741,0.01000,0.545
|
|
9,self_attn.v_proj,0.00000789,0.01000,0.543
|
|
9,self_attn.q_proj,0.00004401,0.01000,0.542
|
|
9,self_attn.o_proj,0.00001458,0.01000,0.540
|
|
9,mlp.up_proj,0.00241637,0.01000,0.562
|
|
9,mlp.gate_proj,0.00358828,0.01000,0.560
|
|
9,mlp.down_proj,20.12282372,0.01250,4.280
|
|
10,self_attn.k_proj,0.00000835,0.01000,0.544
|
|
10,self_attn.v_proj,0.00000538,0.01000,0.541
|
|
10,self_attn.q_proj,0.00004422,0.01000,0.542
|
|
10,self_attn.o_proj,0.00001159,0.01000,0.542
|
|
10,mlp.up_proj,0.00074800,0.01000,0.565
|
|
10,mlp.gate_proj,0.00083565,0.01000,0.561
|
|
10,mlp.down_proj,351.15560913,0.01250,4.264
|
|
11,self_attn.k_proj,0.00001277,0.01000,0.546
|
|
11,self_attn.v_proj,0.00000565,0.01000,0.541
|
|
11,self_attn.q_proj,0.00006044,0.01000,0.540
|
|
11,self_attn.o_proj,0.00001777,0.01000,0.540
|
|
11,mlp.up_proj,0.00086147,0.01000,0.564
|
|
11,mlp.gate_proj,0.00089606,0.01000,0.565
|
|
11,mlp.down_proj,4.85732031,0.01250,4.274
|
|
12,self_attn.k_proj,0.00001361,0.01000,0.541
|
|
12,self_attn.v_proj,0.00000723,0.01000,0.538
|
|
12,self_attn.q_proj,0.00006449,0.01000,0.538
|
|
12,self_attn.o_proj,0.00001664,0.01000,0.539
|
|
12,mlp.up_proj,0.00072561,0.01000,0.563
|
|
12,mlp.gate_proj,0.00070967,0.01000,0.566
|
|
12,mlp.down_proj,84.20599365,0.01250,4.295
|
|
13,self_attn.k_proj,0.00002183,0.01000,0.545
|
|
13,self_attn.v_proj,0.00001649,0.01000,0.539
|
|
13,self_attn.q_proj,0.00011990,0.01000,0.540
|
|
13,self_attn.o_proj,0.00001876,0.01000,0.541
|
|
13,mlp.up_proj,0.00052857,0.01000,0.566
|
|
13,mlp.gate_proj,0.00055504,0.01000,0.563
|
|
13,mlp.down_proj,434.47857666,0.01250,4.278
|
|
14,self_attn.k_proj,0.00001691,0.01000,0.546
|
|
14,self_attn.v_proj,0.00000920,0.01000,0.541
|
|
14,self_attn.q_proj,0.00008929,0.01000,0.539
|
|
14,self_attn.o_proj,0.00002732,0.01000,0.539
|
|
14,mlp.up_proj,0.00055212,0.01000,0.566
|
|
14,mlp.gate_proj,0.00054635,0.01000,0.562
|
|
14,mlp.down_proj,410.56881714,0.01250,4.284
|
|
15,self_attn.k_proj,0.00004251,0.01000,0.548
|
|
15,self_attn.v_proj,0.00002116,0.01000,0.545
|
|
15,self_attn.q_proj,0.00020286,0.01000,0.546
|
|
15,self_attn.o_proj,0.00002885,0.01000,0.542
|
|
15,mlp.up_proj,0.00051129,0.01000,0.566
|
|
15,mlp.gate_proj,0.00048951,0.01000,0.564
|
|
15,mlp.down_proj,815.28625488,0.01250,4.290
|
|
16,self_attn.k_proj,0.00002103,0.01000,0.546
|
|
16,self_attn.v_proj,0.00001660,0.01000,0.541
|
|
16,self_attn.q_proj,0.00011751,0.01000,0.541
|
|
16,self_attn.o_proj,0.00002044,0.01000,0.540
|
|
16,mlp.up_proj,0.00043137,0.01000,0.574
|
|
16,mlp.gate_proj,0.00041475,0.01000,0.562
|
|
16,mlp.down_proj,1187.52331543,0.01250,4.284
|
|
17,self_attn.k_proj,0.00002322,0.01000,0.547
|
|
17,self_attn.v_proj,0.00001877,0.01000,0.542
|
|
17,self_attn.q_proj,0.00013999,0.01000,0.543
|
|
17,self_attn.o_proj,0.00003512,0.01000,0.543
|
|
17,mlp.up_proj,0.00046121,0.01000,0.567
|
|
17,mlp.gate_proj,0.00043173,0.01000,0.565
|
|
17,mlp.down_proj,972.71276855,0.01250,4.288
|
|
18,self_attn.k_proj,0.00001954,0.01000,0.549
|
|
18,self_attn.v_proj,0.00002303,0.01000,0.546
|
|
18,self_attn.q_proj,0.00011826,0.01000,0.543
|
|
18,self_attn.o_proj,0.00003064,0.01000,0.544
|
|
18,mlp.up_proj,0.00046868,0.01000,0.569
|
|
18,mlp.gate_proj,0.00043091,0.01000,0.563
|
|
18,mlp.down_proj,463.82571411,0.01250,4.275
|
|
19,self_attn.k_proj,0.00001841,0.01000,0.543
|
|
19,self_attn.v_proj,0.00002542,0.01000,0.540
|
|
19,self_attn.q_proj,0.00012729,0.01000,0.538
|
|
19,self_attn.o_proj,0.00003190,0.01000,0.538
|
|
19,mlp.up_proj,0.00048951,0.01000,0.566
|
|
19,mlp.gate_proj,0.00047259,0.01000,0.562
|
|
19,mlp.down_proj,430.34570312,0.01250,4.288
|
|
20,self_attn.k_proj,0.00001788,0.01000,0.546
|
|
20,self_attn.v_proj,0.00002601,0.01000,0.543
|
|
20,self_attn.q_proj,0.00011715,0.01000,0.538
|
|
20,self_attn.o_proj,0.00003250,0.01000,0.539
|
|
20,mlp.up_proj,0.00057619,0.01000,0.565
|
|
20,mlp.gate_proj,0.00055857,0.01000,0.562
|
|
20,mlp.down_proj,46.70051575,0.01250,4.290
|
|
21,self_attn.k_proj,0.00001234,0.01000,0.546
|
|
21,self_attn.v_proj,0.00002742,0.01000,0.543
|
|
21,self_attn.q_proj,0.00009824,0.01000,0.543
|
|
21,self_attn.o_proj,0.00004398,0.01000,0.540
|
|
21,mlp.up_proj,0.00063331,0.01000,0.571
|
|
21,mlp.gate_proj,0.00064088,0.01000,0.567
|
|
21,mlp.down_proj,202.07145691,0.01250,4.289
|
|
22,self_attn.k_proj,0.00001307,0.01000,0.544
|
|
22,self_attn.v_proj,0.00003479,0.01000,0.541
|
|
22,self_attn.q_proj,0.00011022,0.01000,0.540
|
|
22,self_attn.o_proj,0.00004273,0.01000,0.542
|
|
22,mlp.up_proj,0.00103869,0.01000,0.571
|
|
22,mlp.gate_proj,0.00103481,0.01000,0.563
|
|
22,mlp.down_proj,94.00750732,0.01250,4.299
|
|
23,self_attn.k_proj,0.00001350,0.01000,0.546
|
|
23,self_attn.v_proj,0.00003311,0.01000,0.543
|
|
23,self_attn.q_proj,0.00010460,0.01000,0.542
|
|
23,self_attn.o_proj,0.00008125,0.01000,0.542
|
|
23,mlp.up_proj,0.00153192,0.01000,0.567
|
|
23,mlp.gate_proj,0.00151269,0.01000,0.564
|
|
23,mlp.down_proj,37.44200134,0.01250,4.282
|
|
24,self_attn.k_proj,0.00001306,0.01000,0.548
|
|
24,self_attn.v_proj,0.00004170,0.01000,0.543
|
|
24,self_attn.q_proj,0.00010361,0.01000,0.540
|
|
24,self_attn.o_proj,0.00009263,0.01000,0.540
|
|
24,mlp.up_proj,0.00185848,0.01000,0.567
|
|
24,mlp.gate_proj,0.00169903,0.01000,0.562
|
|
24,mlp.down_proj,7.99997807,0.01250,4.296
|
|
25,self_attn.k_proj,0.00001203,0.01000,0.547
|
|
25,self_attn.v_proj,0.00005703,0.01000,0.542
|
|
25,self_attn.q_proj,0.00010856,0.01000,0.540
|
|
25,self_attn.o_proj,0.00011315,0.01000,0.542
|
|
25,mlp.up_proj,0.00322402,0.01000,0.567
|
|
25,mlp.gate_proj,0.00282585,0.01000,0.562
|
|
25,mlp.down_proj,1.47514915,0.01250,4.288
|
|
26,self_attn.k_proj,0.00001247,0.01000,0.545
|
|
26,self_attn.v_proj,0.00007589,0.01000,0.542
|
|
26,self_attn.q_proj,0.00010745,0.01000,0.541
|
|
26,self_attn.o_proj,0.00023876,0.01000,0.542
|
|
26,mlp.up_proj,0.01456263,0.01000,0.568
|
|
26,mlp.gate_proj,0.01264119,0.01000,0.564
|
|
26,mlp.down_proj,6.14609051,0.01000,3.593
|
|
27,self_attn.k_proj,0.00026983,0.01000,0.545
|
|
27,self_attn.v_proj,0.00129112,0.01000,0.542
|
|
27,self_attn.q_proj,0.00255784,0.01000,0.542
|
|
27,self_attn.o_proj,0.03490701,0.01000,0.541
|
|
27,mlp.up_proj,0.02056599,0.01000,0.566
|
|
27,mlp.gate_proj,0.01958771,0.01000,0.563
|
|
27,mlp.down_proj,0.06864744,0.01250,4.293
|
|
|