Abdohaaland's picture
Upload folder using huggingface_hub
414df82 verified
layer,module,loss,damp,time
0,self_attn.qkv_proj,0.0000037035,0.05000,1.695
0,self_attn.o_proj,0.0000001912,0.05000,0.993
0,mlp.up_proj,0.0000102369,0.05000,2.424
0,mlp.gate_proj,0.0000107023,0.05000,2.453
0,mlp.down_proj,0.0000007776,0.05000,2.854
1,self_attn.qkv_proj,0.0000286602,0.05000,1.281
1,self_attn.o_proj,0.0000004302,0.05000,1.073
1,mlp.gate_proj,0.0000156239,0.05000,2.984
1,mlp.up_proj,0.0000145528,0.05000,3.031
1,mlp.down_proj,0.0000015817,0.05000,3.079
2,self_attn.qkv_proj,0.0000670091,0.05000,1.059
2,self_attn.o_proj,0.0000003938,0.05000,1.070
2,mlp.up_proj,0.0000224096,0.05000,2.395
2,mlp.gate_proj,0.0000242441,0.05000,2.416
2,mlp.down_proj,0.0000015780,0.05000,2.917
3,self_attn.qkv_proj,0.0000974988,0.05000,1.073
3,self_attn.o_proj,0.0000007507,0.05000,1.034
3,mlp.up_proj,0.0000273527,0.05000,2.420
3,mlp.gate_proj,0.0000303579,0.05000,2.439
3,mlp.down_proj,0.0002998998,0.05000,2.971
4,self_attn.qkv_proj,0.0000910987,0.05000,1.059
4,self_attn.o_proj,0.0000010523,0.05000,1.028
4,mlp.up_proj,0.0000352418,0.05000,2.337
4,mlp.gate_proj,0.0000410384,0.05000,2.362
4,mlp.down_proj,0.0000039988,0.05000,2.978
5,self_attn.qkv_proj,0.0001155192,0.05000,1.047
5,self_attn.o_proj,0.0000016719,0.05000,1.026
5,mlp.gate_proj,0.0000496211,0.05000,2.362
5,mlp.up_proj,0.0000416632,0.05000,2.390
5,mlp.down_proj,0.0000057624,0.05000,3.039
6,self_attn.qkv_proj,0.0000936164,0.05000,1.020
6,self_attn.o_proj,0.0000023169,0.05000,1.018
6,mlp.gate_proj,0.0000478458,0.05000,2.404
6,mlp.up_proj,0.0000420634,0.05000,2.419
6,mlp.down_proj,0.0000064274,0.05000,3.008
7,self_attn.qkv_proj,0.0001384777,0.05000,1.049
7,self_attn.o_proj,0.0000026701,0.05000,1.038
7,mlp.gate_proj,0.0000488039,0.05000,2.357
7,mlp.up_proj,0.0000447177,0.05000,2.384
7,mlp.down_proj,0.0000080068,0.05000,2.957
8,self_attn.qkv_proj,0.0001268911,0.05000,1.066
8,self_attn.o_proj,0.0000035567,0.05000,1.000
8,mlp.gate_proj,0.0000463068,0.05000,2.386
8,mlp.up_proj,0.0000451744,0.05000,2.408
8,mlp.down_proj,0.0000082719,0.05000,2.994
9,self_attn.qkv_proj,0.0001118555,0.05000,1.019
9,self_attn.o_proj,0.0000036070,0.05000,1.045
9,mlp.up_proj,0.0000490196,0.05000,2.307
9,mlp.gate_proj,0.0000489556,0.05000,2.306
9,mlp.down_proj,0.0000078682,0.05000,2.932
10,self_attn.qkv_proj,0.0001195859,0.05000,1.039
10,self_attn.o_proj,0.0000053637,0.05000,1.004
10,mlp.gate_proj,0.0000508104,0.05000,2.384
10,mlp.up_proj,0.0000506414,0.05000,2.403
10,mlp.down_proj,0.0000088444,0.05000,2.987
11,self_attn.qkv_proj,0.0001189149,0.05000,1.026
11,self_attn.o_proj,0.0000047267,0.05000,1.049
11,mlp.up_proj,0.0000525891,0.05000,2.311
11,mlp.gate_proj,0.0000505481,0.05000,2.330
11,mlp.down_proj,0.0000090989,0.05000,3.007
12,self_attn.qkv_proj,0.0001222839,0.05000,1.036
12,self_attn.o_proj,0.0000046178,0.05000,1.048
12,mlp.up_proj,0.0000535870,0.05000,2.276
12,mlp.gate_proj,0.0000492890,0.05000,2.301
12,mlp.down_proj,0.0000108105,0.05000,2.947
13,self_attn.qkv_proj,0.0001456172,0.05000,1.026
13,self_attn.o_proj,0.0000059778,0.05000,1.031
13,mlp.gate_proj,0.0000507735,0.05000,2.282
13,mlp.up_proj,0.0000571203,0.05000,2.302
13,mlp.down_proj,0.0000114501,0.05000,2.939
14,self_attn.qkv_proj,0.0001290736,0.05000,1.052
14,self_attn.o_proj,0.0000053882,0.05000,1.012
14,mlp.gate_proj,0.0000560465,0.05000,2.260
14,mlp.up_proj,0.0000626098,0.05000,2.263
14,mlp.down_proj,0.0000130744,0.05000,2.974
15,self_attn.qkv_proj,0.0001434816,0.05000,1.038
15,self_attn.o_proj,0.0000051712,0.05000,1.004
15,mlp.up_proj,0.0000692544,0.05000,2.446
15,mlp.gate_proj,0.0000621178,0.05000,2.473
15,mlp.down_proj,0.0000150576,0.05000,2.920
16,self_attn.qkv_proj,0.0001369979,0.05000,1.019
16,self_attn.o_proj,0.0000090328,0.05000,1.007
16,mlp.gate_proj,0.0000653503,0.05000,2.323
16,mlp.up_proj,0.0000734144,0.05000,2.352
16,mlp.down_proj,0.0000200746,0.05000,2.964
17,self_attn.qkv_proj,0.0001395030,0.05000,1.015
17,self_attn.o_proj,0.0000068804,0.05000,1.013
17,mlp.gate_proj,0.0000694652,0.05000,2.324
17,mlp.up_proj,0.0000789464,0.05000,2.343
17,mlp.down_proj,0.0000242481,0.05000,2.968
18,self_attn.qkv_proj,0.0001378879,0.05000,1.040
18,self_attn.o_proj,0.0000118515,0.05000,1.062
18,mlp.up_proj,0.0000885018,0.05000,2.303
18,mlp.gate_proj,0.0000787926,0.05000,2.330
18,mlp.down_proj,0.0000361241,0.05000,2.967
19,self_attn.qkv_proj,0.0001587094,0.05000,1.029
19,self_attn.o_proj,0.0000144369,0.05000,1.015
19,mlp.gate_proj,0.0000868370,0.05000,2.312
19,mlp.up_proj,0.0000961948,0.05000,2.332
19,mlp.down_proj,0.0000418560,0.05000,2.953
20,self_attn.qkv_proj,0.0001532980,0.05000,1.032
20,self_attn.o_proj,0.0000176382,0.05000,1.009
20,mlp.gate_proj,0.0001063069,0.05000,2.306
20,mlp.up_proj,0.0001176227,0.05000,2.338
20,mlp.down_proj,0.0000541321,0.05000,2.950
21,self_attn.qkv_proj,0.0001821614,0.05000,1.026
21,self_attn.o_proj,0.0000128516,0.05000,1.015
21,mlp.up_proj,0.0001266831,0.05000,2.502
21,mlp.gate_proj,0.0001130891,0.05000,2.516
21,mlp.down_proj,0.0000670870,0.05000,3.011
22,self_attn.qkv_proj,0.0001746809,0.05000,1.028
22,self_attn.o_proj,0.0000238040,0.05000,1.043
22,mlp.up_proj,0.0001363046,0.05000,2.250
22,mlp.gate_proj,0.0001202949,0.05000,2.275
22,mlp.down_proj,0.0000788939,0.05000,2.992
23,self_attn.qkv_proj,0.0001925415,0.05000,1.013
23,self_attn.o_proj,0.0000102084,0.05000,1.015
23,mlp.gate_proj,0.0001299220,0.05000,2.277
23,mlp.up_proj,0.0001462273,0.05000,2.299
23,mlp.down_proj,0.0000795165,0.05000,2.962
24,self_attn.qkv_proj,0.0002069782,0.05000,1.031
24,self_attn.o_proj,0.0000115072,0.05000,1.051
24,mlp.gate_proj,0.0001396862,0.05000,2.344
24,mlp.up_proj,0.0001586309,0.05000,2.348
24,mlp.down_proj,0.0000930914,0.05000,2.952
25,self_attn.qkv_proj,0.0002230113,0.05000,1.052
25,self_attn.o_proj,0.0000204678,0.05000,0.996
25,mlp.gate_proj,0.0001546881,0.05000,2.336
25,mlp.up_proj,0.0001761131,0.05000,2.359
25,mlp.down_proj,0.0001077607,0.05000,2.968
26,self_attn.qkv_proj,0.0001977103,0.05000,1.014
26,self_attn.o_proj,0.0000338197,0.05000,1.015
26,mlp.up_proj,0.0001833882,0.05000,2.316
26,mlp.gate_proj,0.0001614466,0.05000,2.336
26,mlp.down_proj,0.0001312572,0.05000,2.941
27,self_attn.qkv_proj,0.0001965278,0.05000,1.011
27,self_attn.o_proj,0.0000231340,0.05000,1.005
27,mlp.gate_proj,0.0001804944,0.05000,2.462
27,mlp.up_proj,0.0002018597,0.05000,2.477
27,mlp.down_proj,0.0001707861,0.05000,2.984
28,self_attn.qkv_proj,0.0002510537,0.05000,1.017
28,self_attn.o_proj,0.0000287529,0.05000,1.024
28,mlp.up_proj,0.0002194517,0.05000,2.276
28,mlp.gate_proj,0.0002030963,0.05000,2.300
28,mlp.down_proj,0.0002290906,0.05000,2.962
29,self_attn.qkv_proj,0.0002273341,0.05000,1.045
29,self_attn.o_proj,0.0000351872,0.05000,1.027
29,mlp.gate_proj,0.0002264227,0.05000,2.352
29,mlp.up_proj,0.0002236534,0.05000,2.373
29,mlp.down_proj,0.0003785557,0.05000,2.977
30,self_attn.qkv_proj,0.0001608474,0.05000,1.024
30,self_attn.o_proj,0.0000363605,0.05000,1.023
30,mlp.gate_proj,0.0002430771,0.05000,2.505
30,mlp.up_proj,0.0002131529,0.05000,2.513
30,mlp.down_proj,0.0014835209,0.05000,2.926
31,self_attn.qkv_proj,0.0000034551,0.05000,1.074
31,self_attn.o_proj,0.0000042867,0.05000,1.011
31,mlp.gate_proj,0.0001017404,0.05000,2.333
31,mlp.up_proj,0.0000593105,0.05000,2.351
31,mlp.down_proj,0.0004770287,0.05000,2.931