|
layer,module,loss,damp,time
|
|
0,self_attn.k_proj,0.00006715,0.01000,0.718
|
|
0,self_attn.v_proj,0.00000780,0.01000,0.514
|
|
0,self_attn.q_proj,0.00026270,0.01000,0.516
|
|
0,self_attn.o_proj,0.00008650,0.01000,0.518
|
|
0,mlp.up_proj,0.00024506,0.01000,0.542
|
|
0,mlp.gate_proj,0.00042573,0.01000,0.535
|
|
0,mlp.down_proj,304.12640381,0.01250,4.190
|
|
1,self_attn.k_proj,0.00003489,0.01000,0.517
|
|
1,self_attn.v_proj,0.00001167,0.01000,0.511
|
|
1,self_attn.q_proj,0.00013022,0.01000,0.513
|
|
1,self_attn.o_proj,0.00001387,0.01000,0.520
|
|
1,mlp.up_proj,0.00507348,0.01000,0.547
|
|
1,mlp.gate_proj,0.00740717,0.01000,0.539
|
|
1,mlp.down_proj,205.67033386,0.01250,4.144
|
|
2,self_attn.k_proj,0.00002055,0.01000,0.513
|
|
2,self_attn.v_proj,0.00000462,0.01000,0.510
|
|
2,self_attn.q_proj,0.00008936,0.01000,0.509
|
|
2,self_attn.o_proj,0.00002058,0.01000,0.511
|
|
2,mlp.up_proj,0.00318930,0.01000,0.536
|
|
2,mlp.gate_proj,0.00475867,0.01000,0.532
|
|
2,mlp.down_proj,258.93670654,0.01250,4.158
|
|
3,self_attn.k_proj,0.00003845,0.01000,0.514
|
|
3,self_attn.v_proj,0.00001134,0.01000,0.510
|
|
3,self_attn.q_proj,0.00017001,0.01000,0.509
|
|
3,self_attn.o_proj,0.00010790,0.01000,0.508
|
|
3,mlp.up_proj,0.01201856,0.01000,0.543
|
|
3,mlp.gate_proj,0.01521150,0.01000,0.531
|
|
3,mlp.down_proj,0.13716114,0.01250,4.141
|
|
4,self_attn.k_proj,0.00000328,0.01000,0.516
|
|
4,self_attn.v_proj,0.00000161,0.01000,0.512
|
|
4,self_attn.q_proj,0.00001588,0.01000,0.509
|
|
4,self_attn.o_proj,0.00000415,0.01000,0.511
|
|
4,mlp.up_proj,0.00581097,0.01000,0.537
|
|
4,mlp.gate_proj,0.00825511,0.01000,0.533
|
|
4,mlp.down_proj,0.17886887,0.01250,4.135
|
|
5,self_attn.k_proj,0.00000587,0.01000,0.520
|
|
5,self_attn.v_proj,0.00000279,0.01000,0.516
|
|
5,self_attn.q_proj,0.00002999,0.01000,0.525
|
|
5,self_attn.o_proj,0.00000599,0.01000,0.554
|
|
5,mlp.up_proj,0.01785859,0.01000,0.544
|
|
5,mlp.gate_proj,0.02156129,0.01000,0.542
|
|
5,mlp.down_proj,7.14856195,0.01250,4.134
|
|
6,self_attn.k_proj,0.00000563,0.01000,0.512
|
|
6,self_attn.v_proj,0.00000298,0.01000,0.512
|
|
6,self_attn.q_proj,0.00002899,0.01000,0.513
|
|
6,self_attn.o_proj,0.00000588,0.01000,0.514
|
|
6,mlp.up_proj,0.00137024,0.01000,0.539
|
|
6,mlp.gate_proj,0.00192763,0.01000,0.536
|
|
6,mlp.down_proj,29.77047348,0.01250,4.173
|
|
7,self_attn.k_proj,0.00000720,0.01000,0.518
|
|
7,self_attn.v_proj,0.00000816,0.01000,0.517
|
|
7,self_attn.q_proj,0.00004514,0.01000,0.515
|
|
7,self_attn.o_proj,0.00000802,0.01000,0.511
|
|
7,mlp.up_proj,0.00104425,0.01000,0.541
|
|
7,mlp.gate_proj,0.00117585,0.01000,0.538
|
|
7,mlp.down_proj,72.96322632,0.01250,4.139
|
|
8,self_attn.k_proj,0.00000808,0.01000,0.514
|
|
8,self_attn.v_proj,0.00000379,0.01000,0.511
|
|
8,self_attn.q_proj,0.00003749,0.01000,0.511
|
|
8,self_attn.o_proj,0.00001481,0.01000,0.509
|
|
8,mlp.up_proj,0.00108723,0.01000,0.536
|
|
8,mlp.gate_proj,0.00114396,0.01000,0.534
|
|
8,mlp.down_proj,118.67788696,0.01250,4.132
|
|
9,self_attn.k_proj,0.00000740,0.01000,0.520
|
|
9,self_attn.v_proj,0.00000784,0.01000,0.516
|
|
9,self_attn.q_proj,0.00004375,0.01000,0.513
|
|
9,self_attn.o_proj,0.00001444,0.01000,0.518
|
|
9,mlp.up_proj,0.00241198,0.01000,0.540
|
|
9,mlp.gate_proj,0.00358187,0.01000,0.535
|
|
9,mlp.down_proj,20.16089630,0.01250,4.150
|
|
10,self_attn.k_proj,0.00000830,0.01000,0.518
|
|
10,self_attn.v_proj,0.00000535,0.01000,0.515
|
|
10,self_attn.q_proj,0.00004396,0.01000,0.515
|
|
10,self_attn.o_proj,0.00001136,0.01000,0.516
|
|
10,mlp.up_proj,0.00074554,0.01000,0.538
|
|
10,mlp.gate_proj,0.00083315,0.01000,0.537
|
|
10,mlp.down_proj,353.91262817,0.01250,4.127
|
|
11,self_attn.k_proj,0.00001261,0.01000,0.515
|
|
11,self_attn.v_proj,0.00000557,0.01000,0.511
|
|
11,self_attn.q_proj,0.00005965,0.01000,0.511
|
|
11,self_attn.o_proj,0.00001752,0.01000,0.512
|
|
11,mlp.up_proj,0.00085733,0.01000,0.537
|
|
11,mlp.gate_proj,0.00089207,0.01000,0.534
|
|
11,mlp.down_proj,4.76699162,0.01250,4.146
|
|
12,self_attn.k_proj,0.00001338,0.01000,0.517
|
|
12,self_attn.v_proj,0.00000711,0.01000,0.513
|
|
12,self_attn.q_proj,0.00006364,0.01000,0.513
|
|
12,self_attn.o_proj,0.00001614,0.01000,0.518
|
|
12,mlp.up_proj,0.00072253,0.01000,0.539
|
|
12,mlp.gate_proj,0.00070775,0.01000,0.536
|
|
12,mlp.down_proj,84.15060425,0.01250,4.142
|
|
13,self_attn.k_proj,0.00002151,0.01000,0.519
|
|
13,self_attn.v_proj,0.00001624,0.01000,0.521
|
|
13,self_attn.q_proj,0.00011856,0.01000,0.520
|
|
13,self_attn.o_proj,0.00001842,0.01000,0.520
|
|
13,mlp.up_proj,0.00052484,0.01000,0.543
|
|
13,mlp.gate_proj,0.00055117,0.01000,0.538
|
|
13,mlp.down_proj,433.72549438,0.01250,4.137
|
|
14,self_attn.k_proj,0.00001664,0.01000,0.521
|
|
14,self_attn.v_proj,0.00000903,0.01000,0.515
|
|
14,self_attn.q_proj,0.00008787,0.01000,0.513
|
|
14,self_attn.o_proj,0.00002697,0.01000,0.515
|
|
14,mlp.up_proj,0.00054731,0.01000,0.540
|
|
14,mlp.gate_proj,0.00054132,0.01000,0.537
|
|
14,mlp.down_proj,434.25894165,0.01250,4.187
|
|
15,self_attn.k_proj,0.00004199,0.01000,0.523
|
|
15,self_attn.v_proj,0.00002103,0.01000,0.524
|
|
15,self_attn.q_proj,0.00020090,0.01000,0.520
|
|
15,self_attn.o_proj,0.00002861,0.01000,0.519
|
|
15,mlp.up_proj,0.00050712,0.01000,0.545
|
|
15,mlp.gate_proj,0.00048530,0.01000,0.544
|
|
15,mlp.down_proj,825.07031250,0.01250,4.188
|
|
16,self_attn.k_proj,0.00002080,0.01000,0.521
|
|
16,self_attn.v_proj,0.00001646,0.01000,0.517
|
|
16,self_attn.q_proj,0.00011679,0.01000,0.515
|
|
16,self_attn.o_proj,0.00001977,0.01000,0.518
|
|
16,mlp.up_proj,0.00042822,0.01000,0.541
|
|
16,mlp.gate_proj,0.00041165,0.01000,0.539
|
|
16,mlp.down_proj,1216.13427734,0.01250,4.141
|
|
17,self_attn.k_proj,0.00002302,0.01000,0.518
|
|
17,self_attn.v_proj,0.00001865,0.01000,0.515
|
|
17,self_attn.q_proj,0.00013881,0.01000,0.511
|
|
17,self_attn.o_proj,0.00003463,0.01000,0.512
|
|
17,mlp.up_proj,0.00045801,0.01000,0.535
|
|
17,mlp.gate_proj,0.00042881,0.01000,0.533
|
|
17,mlp.down_proj,1000.17590332,0.01250,4.154
|
|
18,self_attn.k_proj,0.00001940,0.01000,0.518
|
|
18,self_attn.v_proj,0.00002290,0.01000,0.515
|
|
18,self_attn.q_proj,0.00011717,0.01000,0.513
|
|
18,self_attn.o_proj,0.00002894,0.01000,0.514
|
|
18,mlp.up_proj,0.00046425,0.01000,0.541
|
|
18,mlp.gate_proj,0.00042691,0.01000,0.538
|
|
18,mlp.down_proj,494.97500610,0.01250,4.136
|
|
19,self_attn.k_proj,0.00001817,0.01000,0.519
|
|
19,self_attn.v_proj,0.00002528,0.01000,0.515
|
|
19,self_attn.q_proj,0.00012607,0.01000,0.517
|
|
19,self_attn.o_proj,0.00003120,0.01000,0.517
|
|
19,mlp.up_proj,0.00048594,0.01000,0.540
|
|
19,mlp.gate_proj,0.00046907,0.01000,0.538
|
|
19,mlp.down_proj,443.67700195,0.01250,4.201
|
|
20,self_attn.k_proj,0.00001768,0.01000,0.516
|
|
20,self_attn.v_proj,0.00002585,0.01000,0.513
|
|
20,self_attn.q_proj,0.00011644,0.01000,0.512
|
|
20,self_attn.o_proj,0.00003165,0.01000,0.512
|
|
20,mlp.up_proj,0.00057360,0.01000,0.536
|
|
20,mlp.gate_proj,0.00055578,0.01000,0.533
|
|
20,mlp.down_proj,45.72077942,0.01250,4.162
|
|
21,self_attn.k_proj,0.00001222,0.01000,0.516
|
|
21,self_attn.v_proj,0.00002728,0.01000,0.514
|
|
21,self_attn.q_proj,0.00009766,0.01000,0.512
|
|
21,self_attn.o_proj,0.00004468,0.01000,0.512
|
|
21,mlp.up_proj,0.00063293,0.01000,0.541
|
|
21,mlp.gate_proj,0.00064172,0.01000,0.538
|
|
21,mlp.down_proj,206.07777405,0.01250,4.161
|
|
22,self_attn.k_proj,0.00001299,0.01000,0.515
|
|
22,self_attn.v_proj,0.00003446,0.01000,0.512
|
|
22,self_attn.q_proj,0.00011036,0.01000,0.511
|
|
22,self_attn.o_proj,0.00004398,0.01000,0.511
|
|
22,mlp.up_proj,0.00103744,0.01000,0.536
|
|
22,mlp.gate_proj,0.00103252,0.01000,0.534
|
|
22,mlp.down_proj,92.18318939,0.01250,4.143
|
|
23,self_attn.k_proj,0.00001359,0.01000,0.517
|
|
23,self_attn.v_proj,0.00003331,0.01000,0.513
|
|
23,self_attn.q_proj,0.00010572,0.01000,0.514
|
|
23,self_attn.o_proj,0.00008590,0.01000,0.514
|
|
23,mlp.up_proj,0.00153257,0.01000,0.537
|
|
23,mlp.gate_proj,0.00151383,0.01000,0.535
|
|
23,mlp.down_proj,36.93452454,0.01250,4.153
|
|
24,self_attn.k_proj,0.00001319,0.01000,0.519
|
|
24,self_attn.v_proj,0.00004230,0.01000,0.515
|
|
24,self_attn.q_proj,0.00010442,0.01000,0.514
|
|
24,self_attn.o_proj,0.00009598,0.01000,0.516
|
|
24,mlp.up_proj,0.00185951,0.01000,0.538
|
|
24,mlp.gate_proj,0.00170149,0.01000,0.536
|
|
24,mlp.down_proj,8.04627609,0.01250,4.140
|
|
25,self_attn.k_proj,0.00001232,0.01000,0.521
|
|
25,self_attn.v_proj,0.00005826,0.01000,0.515
|
|
25,self_attn.q_proj,0.00011131,0.01000,0.515
|
|
25,self_attn.o_proj,0.00012100,0.01000,0.516
|
|
25,mlp.up_proj,0.00324263,0.01000,0.537
|
|
25,mlp.gate_proj,0.00284433,0.01000,0.533
|
|
25,mlp.down_proj,1.74767351,0.01250,4.181
|
|
26,self_attn.k_proj,0.00001294,0.01000,0.519
|
|
26,self_attn.v_proj,0.00007807,0.01000,0.516
|
|
26,self_attn.q_proj,0.00011034,0.01000,0.514
|
|
26,self_attn.o_proj,0.00027705,0.01000,0.516
|
|
26,mlp.up_proj,0.01450638,0.01000,0.542
|
|
26,mlp.gate_proj,0.01259876,0.01000,0.538
|
|
26,mlp.down_proj,5.78889465,0.01000,3.461
|
|
27,self_attn.k_proj,0.00026575,0.01000,0.517
|
|
27,self_attn.v_proj,0.00128777,0.01000,0.513
|
|
27,self_attn.q_proj,0.00252120,0.01000,0.513
|
|
27,self_attn.o_proj,0.03436147,0.01000,0.513
|
|
27,mlp.up_proj,0.01967174,0.01000,0.538
|
|
27,mlp.gate_proj,0.01874932,0.01000,0.537
|
|
27,mlp.down_proj,0.07177597,0.01250,4.151
|
|
|