dmeck's picture
Upload folder using huggingface_hub
1ae3779 verified
layer,module,loss,samples,damp,time
0,self_attn.k_proj,0.00006717,0.01000,0.743
0,self_attn.v_proj,0.00000782,0.01000,0.540
0,self_attn.q_proj,0.00026253,0.01000,0.537
0,self_attn.o_proj,0.00008649,0.01000,0.538
0,mlp.up_proj,0.00024544,0.01000,0.564
0,mlp.gate_proj,0.00042476,0.01000,0.558
0,mlp.down_proj,304.70507812,0.01250,4.287
1,self_attn.k_proj,0.00003458,0.01000,0.543
1,self_attn.v_proj,0.00001160,0.01000,0.540
1,self_attn.q_proj,0.00012922,0.01000,0.539
1,self_attn.o_proj,0.00001389,0.01000,0.540
1,mlp.up_proj,0.00507102,0.01000,0.564
1,mlp.gate_proj,0.00740672,0.01000,0.561
1,mlp.down_proj,201.20426941,0.01250,4.277
2,self_attn.k_proj,0.00002051,0.01000,0.545
2,self_attn.v_proj,0.00000462,0.01000,0.542
2,self_attn.q_proj,0.00008908,0.01000,0.541
2,self_attn.o_proj,0.00002082,0.01000,0.540
2,mlp.up_proj,0.00323103,0.01000,0.564
2,mlp.gate_proj,0.00482144,0.01000,0.559
2,mlp.down_proj,265.71157837,0.01250,4.258
3,self_attn.k_proj,0.00003836,0.01000,0.542
3,self_attn.v_proj,0.00001136,0.01000,0.542
3,self_attn.q_proj,0.00017052,0.01000,0.537
3,self_attn.o_proj,0.00010798,0.01000,0.541
3,mlp.up_proj,0.01222713,0.01000,0.562
3,mlp.gate_proj,0.01548911,0.01000,0.558
3,mlp.down_proj,0.12992305,0.01250,4.263
4,self_attn.k_proj,0.00000324,0.01000,0.543
4,self_attn.v_proj,0.00000160,0.01000,0.538
4,self_attn.q_proj,0.00001570,0.01000,0.539
4,self_attn.o_proj,0.00000409,0.01000,0.540
4,mlp.up_proj,0.00579107,0.01000,0.564
4,mlp.gate_proj,0.00821990,0.01000,0.562
4,mlp.down_proj,0.17879479,0.01250,4.295
5,self_attn.k_proj,0.00000587,0.01000,0.542
5,self_attn.v_proj,0.00000278,0.01000,0.539
5,self_attn.q_proj,0.00002992,0.01000,0.543
5,self_attn.o_proj,0.00000610,0.01000,0.544
5,mlp.up_proj,0.01783431,0.01000,0.566
5,mlp.gate_proj,0.02152922,0.01000,0.562
5,mlp.down_proj,7.94002533,0.01250,4.278
6,self_attn.k_proj,0.00000566,0.01000,0.546
6,self_attn.v_proj,0.00000298,0.01000,0.543
6,self_attn.q_proj,0.00002906,0.01000,0.545
6,self_attn.o_proj,0.00000604,0.01000,0.543
6,mlp.up_proj,0.00136981,0.01000,0.563
6,mlp.gate_proj,0.00192878,0.01000,0.563
6,mlp.down_proj,29.80362320,0.01250,4.302
7,self_attn.k_proj,0.00000723,0.01000,0.543
7,self_attn.v_proj,0.00000818,0.01000,0.543
7,self_attn.q_proj,0.00004528,0.01000,0.540
7,self_attn.o_proj,0.00000810,0.01000,0.542
7,mlp.up_proj,0.00104278,0.01000,0.565
7,mlp.gate_proj,0.00117535,0.01000,0.562
7,mlp.down_proj,73.25530243,0.01250,4.280
8,self_attn.k_proj,0.00000813,0.01000,0.540
8,self_attn.v_proj,0.00000380,0.01000,0.538
8,self_attn.q_proj,0.00003767,0.01000,0.538
8,self_attn.o_proj,0.00001477,0.01000,0.540
8,mlp.up_proj,0.00108770,0.01000,0.566
8,mlp.gate_proj,0.00114401,0.01000,0.563
8,mlp.down_proj,118.72260284,0.01250,4.273
9,self_attn.k_proj,0.00000741,0.01000,0.545
9,self_attn.v_proj,0.00000789,0.01000,0.543
9,self_attn.q_proj,0.00004401,0.01000,0.542
9,self_attn.o_proj,0.00001458,0.01000,0.540
9,mlp.up_proj,0.00241637,0.01000,0.562
9,mlp.gate_proj,0.00358828,0.01000,0.560
9,mlp.down_proj,20.12282372,0.01250,4.280
10,self_attn.k_proj,0.00000835,0.01000,0.544
10,self_attn.v_proj,0.00000538,0.01000,0.541
10,self_attn.q_proj,0.00004422,0.01000,0.542
10,self_attn.o_proj,0.00001159,0.01000,0.542
10,mlp.up_proj,0.00074800,0.01000,0.565
10,mlp.gate_proj,0.00083565,0.01000,0.561
10,mlp.down_proj,351.15560913,0.01250,4.264
11,self_attn.k_proj,0.00001277,0.01000,0.546
11,self_attn.v_proj,0.00000565,0.01000,0.541
11,self_attn.q_proj,0.00006044,0.01000,0.540
11,self_attn.o_proj,0.00001777,0.01000,0.540
11,mlp.up_proj,0.00086147,0.01000,0.564
11,mlp.gate_proj,0.00089606,0.01000,0.565
11,mlp.down_proj,4.85732031,0.01250,4.274
12,self_attn.k_proj,0.00001361,0.01000,0.541
12,self_attn.v_proj,0.00000723,0.01000,0.538
12,self_attn.q_proj,0.00006449,0.01000,0.538
12,self_attn.o_proj,0.00001664,0.01000,0.539
12,mlp.up_proj,0.00072561,0.01000,0.563
12,mlp.gate_proj,0.00070967,0.01000,0.566
12,mlp.down_proj,84.20599365,0.01250,4.295
13,self_attn.k_proj,0.00002183,0.01000,0.545
13,self_attn.v_proj,0.00001649,0.01000,0.539
13,self_attn.q_proj,0.00011990,0.01000,0.540
13,self_attn.o_proj,0.00001876,0.01000,0.541
13,mlp.up_proj,0.00052857,0.01000,0.566
13,mlp.gate_proj,0.00055504,0.01000,0.563
13,mlp.down_proj,434.47857666,0.01250,4.278
14,self_attn.k_proj,0.00001691,0.01000,0.546
14,self_attn.v_proj,0.00000920,0.01000,0.541
14,self_attn.q_proj,0.00008929,0.01000,0.539
14,self_attn.o_proj,0.00002732,0.01000,0.539
14,mlp.up_proj,0.00055212,0.01000,0.566
14,mlp.gate_proj,0.00054635,0.01000,0.562
14,mlp.down_proj,410.56881714,0.01250,4.284
15,self_attn.k_proj,0.00004251,0.01000,0.548
15,self_attn.v_proj,0.00002116,0.01000,0.545
15,self_attn.q_proj,0.00020286,0.01000,0.546
15,self_attn.o_proj,0.00002885,0.01000,0.542
15,mlp.up_proj,0.00051129,0.01000,0.566
15,mlp.gate_proj,0.00048951,0.01000,0.564
15,mlp.down_proj,815.28625488,0.01250,4.290
16,self_attn.k_proj,0.00002103,0.01000,0.546
16,self_attn.v_proj,0.00001660,0.01000,0.541
16,self_attn.q_proj,0.00011751,0.01000,0.541
16,self_attn.o_proj,0.00002044,0.01000,0.540
16,mlp.up_proj,0.00043137,0.01000,0.574
16,mlp.gate_proj,0.00041475,0.01000,0.562
16,mlp.down_proj,1187.52331543,0.01250,4.284
17,self_attn.k_proj,0.00002322,0.01000,0.547
17,self_attn.v_proj,0.00001877,0.01000,0.542
17,self_attn.q_proj,0.00013999,0.01000,0.543
17,self_attn.o_proj,0.00003512,0.01000,0.543
17,mlp.up_proj,0.00046121,0.01000,0.567
17,mlp.gate_proj,0.00043173,0.01000,0.565
17,mlp.down_proj,972.71276855,0.01250,4.288
18,self_attn.k_proj,0.00001954,0.01000,0.549
18,self_attn.v_proj,0.00002303,0.01000,0.546
18,self_attn.q_proj,0.00011826,0.01000,0.543
18,self_attn.o_proj,0.00003064,0.01000,0.544
18,mlp.up_proj,0.00046868,0.01000,0.569
18,mlp.gate_proj,0.00043091,0.01000,0.563
18,mlp.down_proj,463.82571411,0.01250,4.275
19,self_attn.k_proj,0.00001841,0.01000,0.543
19,self_attn.v_proj,0.00002542,0.01000,0.540
19,self_attn.q_proj,0.00012729,0.01000,0.538
19,self_attn.o_proj,0.00003190,0.01000,0.538
19,mlp.up_proj,0.00048951,0.01000,0.566
19,mlp.gate_proj,0.00047259,0.01000,0.562
19,mlp.down_proj,430.34570312,0.01250,4.288
20,self_attn.k_proj,0.00001788,0.01000,0.546
20,self_attn.v_proj,0.00002601,0.01000,0.543
20,self_attn.q_proj,0.00011715,0.01000,0.538
20,self_attn.o_proj,0.00003250,0.01000,0.539
20,mlp.up_proj,0.00057619,0.01000,0.565
20,mlp.gate_proj,0.00055857,0.01000,0.562
20,mlp.down_proj,46.70051575,0.01250,4.290
21,self_attn.k_proj,0.00001234,0.01000,0.546
21,self_attn.v_proj,0.00002742,0.01000,0.543
21,self_attn.q_proj,0.00009824,0.01000,0.543
21,self_attn.o_proj,0.00004398,0.01000,0.540
21,mlp.up_proj,0.00063331,0.01000,0.571
21,mlp.gate_proj,0.00064088,0.01000,0.567
21,mlp.down_proj,202.07145691,0.01250,4.289
22,self_attn.k_proj,0.00001307,0.01000,0.544
22,self_attn.v_proj,0.00003479,0.01000,0.541
22,self_attn.q_proj,0.00011022,0.01000,0.540
22,self_attn.o_proj,0.00004273,0.01000,0.542
22,mlp.up_proj,0.00103869,0.01000,0.571
22,mlp.gate_proj,0.00103481,0.01000,0.563
22,mlp.down_proj,94.00750732,0.01250,4.299
23,self_attn.k_proj,0.00001350,0.01000,0.546
23,self_attn.v_proj,0.00003311,0.01000,0.543
23,self_attn.q_proj,0.00010460,0.01000,0.542
23,self_attn.o_proj,0.00008125,0.01000,0.542
23,mlp.up_proj,0.00153192,0.01000,0.567
23,mlp.gate_proj,0.00151269,0.01000,0.564
23,mlp.down_proj,37.44200134,0.01250,4.282
24,self_attn.k_proj,0.00001306,0.01000,0.548
24,self_attn.v_proj,0.00004170,0.01000,0.543
24,self_attn.q_proj,0.00010361,0.01000,0.540
24,self_attn.o_proj,0.00009263,0.01000,0.540
24,mlp.up_proj,0.00185848,0.01000,0.567
24,mlp.gate_proj,0.00169903,0.01000,0.562
24,mlp.down_proj,7.99997807,0.01250,4.296
25,self_attn.k_proj,0.00001203,0.01000,0.547
25,self_attn.v_proj,0.00005703,0.01000,0.542
25,self_attn.q_proj,0.00010856,0.01000,0.540
25,self_attn.o_proj,0.00011315,0.01000,0.542
25,mlp.up_proj,0.00322402,0.01000,0.567
25,mlp.gate_proj,0.00282585,0.01000,0.562
25,mlp.down_proj,1.47514915,0.01250,4.288
26,self_attn.k_proj,0.00001247,0.01000,0.545
26,self_attn.v_proj,0.00007589,0.01000,0.542
26,self_attn.q_proj,0.00010745,0.01000,0.541
26,self_attn.o_proj,0.00023876,0.01000,0.542
26,mlp.up_proj,0.01456263,0.01000,0.568
26,mlp.gate_proj,0.01264119,0.01000,0.564
26,mlp.down_proj,6.14609051,0.01000,3.593
27,self_attn.k_proj,0.00026983,0.01000,0.545
27,self_attn.v_proj,0.00129112,0.01000,0.542
27,self_attn.q_proj,0.00255784,0.01000,0.542
27,self_attn.o_proj,0.03490701,0.01000,0.541
27,mlp.up_proj,0.02056599,0.01000,0.566
27,mlp.gate_proj,0.01958771,0.01000,0.563
27,mlp.down_proj,0.06864744,0.01250,4.293