dmeck's picture
Upload folder using huggingface_hub
0e24342 verified
layer,module,loss,damp,time
0,self_attn.k_proj,0.00006715,0.01000,0.718
0,self_attn.v_proj,0.00000780,0.01000,0.514
0,self_attn.q_proj,0.00026270,0.01000,0.516
0,self_attn.o_proj,0.00008650,0.01000,0.518
0,mlp.up_proj,0.00024506,0.01000,0.542
0,mlp.gate_proj,0.00042573,0.01000,0.535
0,mlp.down_proj,304.12640381,0.01250,4.190
1,self_attn.k_proj,0.00003489,0.01000,0.517
1,self_attn.v_proj,0.00001167,0.01000,0.511
1,self_attn.q_proj,0.00013022,0.01000,0.513
1,self_attn.o_proj,0.00001387,0.01000,0.520
1,mlp.up_proj,0.00507348,0.01000,0.547
1,mlp.gate_proj,0.00740717,0.01000,0.539
1,mlp.down_proj,205.67033386,0.01250,4.144
2,self_attn.k_proj,0.00002055,0.01000,0.513
2,self_attn.v_proj,0.00000462,0.01000,0.510
2,self_attn.q_proj,0.00008936,0.01000,0.509
2,self_attn.o_proj,0.00002058,0.01000,0.511
2,mlp.up_proj,0.00318930,0.01000,0.536
2,mlp.gate_proj,0.00475867,0.01000,0.532
2,mlp.down_proj,258.93670654,0.01250,4.158
3,self_attn.k_proj,0.00003845,0.01000,0.514
3,self_attn.v_proj,0.00001134,0.01000,0.510
3,self_attn.q_proj,0.00017001,0.01000,0.509
3,self_attn.o_proj,0.00010790,0.01000,0.508
3,mlp.up_proj,0.01201856,0.01000,0.543
3,mlp.gate_proj,0.01521150,0.01000,0.531
3,mlp.down_proj,0.13716114,0.01250,4.141
4,self_attn.k_proj,0.00000328,0.01000,0.516
4,self_attn.v_proj,0.00000161,0.01000,0.512
4,self_attn.q_proj,0.00001588,0.01000,0.509
4,self_attn.o_proj,0.00000415,0.01000,0.511
4,mlp.up_proj,0.00581097,0.01000,0.537
4,mlp.gate_proj,0.00825511,0.01000,0.533
4,mlp.down_proj,0.17886887,0.01250,4.135
5,self_attn.k_proj,0.00000587,0.01000,0.520
5,self_attn.v_proj,0.00000279,0.01000,0.516
5,self_attn.q_proj,0.00002999,0.01000,0.525
5,self_attn.o_proj,0.00000599,0.01000,0.554
5,mlp.up_proj,0.01785859,0.01000,0.544
5,mlp.gate_proj,0.02156129,0.01000,0.542
5,mlp.down_proj,7.14856195,0.01250,4.134
6,self_attn.k_proj,0.00000563,0.01000,0.512
6,self_attn.v_proj,0.00000298,0.01000,0.512
6,self_attn.q_proj,0.00002899,0.01000,0.513
6,self_attn.o_proj,0.00000588,0.01000,0.514
6,mlp.up_proj,0.00137024,0.01000,0.539
6,mlp.gate_proj,0.00192763,0.01000,0.536
6,mlp.down_proj,29.77047348,0.01250,4.173
7,self_attn.k_proj,0.00000720,0.01000,0.518
7,self_attn.v_proj,0.00000816,0.01000,0.517
7,self_attn.q_proj,0.00004514,0.01000,0.515
7,self_attn.o_proj,0.00000802,0.01000,0.511
7,mlp.up_proj,0.00104425,0.01000,0.541
7,mlp.gate_proj,0.00117585,0.01000,0.538
7,mlp.down_proj,72.96322632,0.01250,4.139
8,self_attn.k_proj,0.00000808,0.01000,0.514
8,self_attn.v_proj,0.00000379,0.01000,0.511
8,self_attn.q_proj,0.00003749,0.01000,0.511
8,self_attn.o_proj,0.00001481,0.01000,0.509
8,mlp.up_proj,0.00108723,0.01000,0.536
8,mlp.gate_proj,0.00114396,0.01000,0.534
8,mlp.down_proj,118.67788696,0.01250,4.132
9,self_attn.k_proj,0.00000740,0.01000,0.520
9,self_attn.v_proj,0.00000784,0.01000,0.516
9,self_attn.q_proj,0.00004375,0.01000,0.513
9,self_attn.o_proj,0.00001444,0.01000,0.518
9,mlp.up_proj,0.00241198,0.01000,0.540
9,mlp.gate_proj,0.00358187,0.01000,0.535
9,mlp.down_proj,20.16089630,0.01250,4.150
10,self_attn.k_proj,0.00000830,0.01000,0.518
10,self_attn.v_proj,0.00000535,0.01000,0.515
10,self_attn.q_proj,0.00004396,0.01000,0.515
10,self_attn.o_proj,0.00001136,0.01000,0.516
10,mlp.up_proj,0.00074554,0.01000,0.538
10,mlp.gate_proj,0.00083315,0.01000,0.537
10,mlp.down_proj,353.91262817,0.01250,4.127
11,self_attn.k_proj,0.00001261,0.01000,0.515
11,self_attn.v_proj,0.00000557,0.01000,0.511
11,self_attn.q_proj,0.00005965,0.01000,0.511
11,self_attn.o_proj,0.00001752,0.01000,0.512
11,mlp.up_proj,0.00085733,0.01000,0.537
11,mlp.gate_proj,0.00089207,0.01000,0.534
11,mlp.down_proj,4.76699162,0.01250,4.146
12,self_attn.k_proj,0.00001338,0.01000,0.517
12,self_attn.v_proj,0.00000711,0.01000,0.513
12,self_attn.q_proj,0.00006364,0.01000,0.513
12,self_attn.o_proj,0.00001614,0.01000,0.518
12,mlp.up_proj,0.00072253,0.01000,0.539
12,mlp.gate_proj,0.00070775,0.01000,0.536
12,mlp.down_proj,84.15060425,0.01250,4.142
13,self_attn.k_proj,0.00002151,0.01000,0.519
13,self_attn.v_proj,0.00001624,0.01000,0.521
13,self_attn.q_proj,0.00011856,0.01000,0.520
13,self_attn.o_proj,0.00001842,0.01000,0.520
13,mlp.up_proj,0.00052484,0.01000,0.543
13,mlp.gate_proj,0.00055117,0.01000,0.538
13,mlp.down_proj,433.72549438,0.01250,4.137
14,self_attn.k_proj,0.00001664,0.01000,0.521
14,self_attn.v_proj,0.00000903,0.01000,0.515
14,self_attn.q_proj,0.00008787,0.01000,0.513
14,self_attn.o_proj,0.00002697,0.01000,0.515
14,mlp.up_proj,0.00054731,0.01000,0.540
14,mlp.gate_proj,0.00054132,0.01000,0.537
14,mlp.down_proj,434.25894165,0.01250,4.187
15,self_attn.k_proj,0.00004199,0.01000,0.523
15,self_attn.v_proj,0.00002103,0.01000,0.524
15,self_attn.q_proj,0.00020090,0.01000,0.520
15,self_attn.o_proj,0.00002861,0.01000,0.519
15,mlp.up_proj,0.00050712,0.01000,0.545
15,mlp.gate_proj,0.00048530,0.01000,0.544
15,mlp.down_proj,825.07031250,0.01250,4.188
16,self_attn.k_proj,0.00002080,0.01000,0.521
16,self_attn.v_proj,0.00001646,0.01000,0.517
16,self_attn.q_proj,0.00011679,0.01000,0.515
16,self_attn.o_proj,0.00001977,0.01000,0.518
16,mlp.up_proj,0.00042822,0.01000,0.541
16,mlp.gate_proj,0.00041165,0.01000,0.539
16,mlp.down_proj,1216.13427734,0.01250,4.141
17,self_attn.k_proj,0.00002302,0.01000,0.518
17,self_attn.v_proj,0.00001865,0.01000,0.515
17,self_attn.q_proj,0.00013881,0.01000,0.511
17,self_attn.o_proj,0.00003463,0.01000,0.512
17,mlp.up_proj,0.00045801,0.01000,0.535
17,mlp.gate_proj,0.00042881,0.01000,0.533
17,mlp.down_proj,1000.17590332,0.01250,4.154
18,self_attn.k_proj,0.00001940,0.01000,0.518
18,self_attn.v_proj,0.00002290,0.01000,0.515
18,self_attn.q_proj,0.00011717,0.01000,0.513
18,self_attn.o_proj,0.00002894,0.01000,0.514
18,mlp.up_proj,0.00046425,0.01000,0.541
18,mlp.gate_proj,0.00042691,0.01000,0.538
18,mlp.down_proj,494.97500610,0.01250,4.136
19,self_attn.k_proj,0.00001817,0.01000,0.519
19,self_attn.v_proj,0.00002528,0.01000,0.515
19,self_attn.q_proj,0.00012607,0.01000,0.517
19,self_attn.o_proj,0.00003120,0.01000,0.517
19,mlp.up_proj,0.00048594,0.01000,0.540
19,mlp.gate_proj,0.00046907,0.01000,0.538
19,mlp.down_proj,443.67700195,0.01250,4.201
20,self_attn.k_proj,0.00001768,0.01000,0.516
20,self_attn.v_proj,0.00002585,0.01000,0.513
20,self_attn.q_proj,0.00011644,0.01000,0.512
20,self_attn.o_proj,0.00003165,0.01000,0.512
20,mlp.up_proj,0.00057360,0.01000,0.536
20,mlp.gate_proj,0.00055578,0.01000,0.533
20,mlp.down_proj,45.72077942,0.01250,4.162
21,self_attn.k_proj,0.00001222,0.01000,0.516
21,self_attn.v_proj,0.00002728,0.01000,0.514
21,self_attn.q_proj,0.00009766,0.01000,0.512
21,self_attn.o_proj,0.00004468,0.01000,0.512
21,mlp.up_proj,0.00063293,0.01000,0.541
21,mlp.gate_proj,0.00064172,0.01000,0.538
21,mlp.down_proj,206.07777405,0.01250,4.161
22,self_attn.k_proj,0.00001299,0.01000,0.515
22,self_attn.v_proj,0.00003446,0.01000,0.512
22,self_attn.q_proj,0.00011036,0.01000,0.511
22,self_attn.o_proj,0.00004398,0.01000,0.511
22,mlp.up_proj,0.00103744,0.01000,0.536
22,mlp.gate_proj,0.00103252,0.01000,0.534
22,mlp.down_proj,92.18318939,0.01250,4.143
23,self_attn.k_proj,0.00001359,0.01000,0.517
23,self_attn.v_proj,0.00003331,0.01000,0.513
23,self_attn.q_proj,0.00010572,0.01000,0.514
23,self_attn.o_proj,0.00008590,0.01000,0.514
23,mlp.up_proj,0.00153257,0.01000,0.537
23,mlp.gate_proj,0.00151383,0.01000,0.535
23,mlp.down_proj,36.93452454,0.01250,4.153
24,self_attn.k_proj,0.00001319,0.01000,0.519
24,self_attn.v_proj,0.00004230,0.01000,0.515
24,self_attn.q_proj,0.00010442,0.01000,0.514
24,self_attn.o_proj,0.00009598,0.01000,0.516
24,mlp.up_proj,0.00185951,0.01000,0.538
24,mlp.gate_proj,0.00170149,0.01000,0.536
24,mlp.down_proj,8.04627609,0.01250,4.140
25,self_attn.k_proj,0.00001232,0.01000,0.521
25,self_attn.v_proj,0.00005826,0.01000,0.515
25,self_attn.q_proj,0.00011131,0.01000,0.515
25,self_attn.o_proj,0.00012100,0.01000,0.516
25,mlp.up_proj,0.00324263,0.01000,0.537
25,mlp.gate_proj,0.00284433,0.01000,0.533
25,mlp.down_proj,1.74767351,0.01250,4.181
26,self_attn.k_proj,0.00001294,0.01000,0.519
26,self_attn.v_proj,0.00007807,0.01000,0.516
26,self_attn.q_proj,0.00011034,0.01000,0.514
26,self_attn.o_proj,0.00027705,0.01000,0.516
26,mlp.up_proj,0.01450638,0.01000,0.542
26,mlp.gate_proj,0.01259876,0.01000,0.538
26,mlp.down_proj,5.78889465,0.01000,3.461
27,self_attn.k_proj,0.00026575,0.01000,0.517
27,self_attn.v_proj,0.00128777,0.01000,0.513
27,self_attn.q_proj,0.00252120,0.01000,0.513
27,self_attn.o_proj,0.03436147,0.01000,0.513
27,mlp.up_proj,0.01967174,0.01000,0.538
27,mlp.gate_proj,0.01874932,0.01000,0.537
27,mlp.down_proj,0.07177597,0.01250,4.151