File size: 7,379 Bytes
414df82 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 | layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000037035,0.05000,1.695
0,self_attn.o_proj,0.0000001912,0.05000,0.993
0,mlp.up_proj,0.0000102369,0.05000,2.424
0,mlp.gate_proj,0.0000107023,0.05000,2.453
0,mlp.down_proj,0.0000007776,0.05000,2.854
1,self_attn.qkv_proj,0.0000286602,0.05000,1.281
1,self_attn.o_proj,0.0000004302,0.05000,1.073
1,mlp.gate_proj,0.0000156239,0.05000,2.984
1,mlp.up_proj,0.0000145528,0.05000,3.031
1,mlp.down_proj,0.0000015817,0.05000,3.079
2,self_attn.qkv_proj,0.0000670091,0.05000,1.059
2,self_attn.o_proj,0.0000003938,0.05000,1.070
2,mlp.up_proj,0.0000224096,0.05000,2.395
2,mlp.gate_proj,0.0000242441,0.05000,2.416
2,mlp.down_proj,0.0000015780,0.05000,2.917
3,self_attn.qkv_proj,0.0000974988,0.05000,1.073
3,self_attn.o_proj,0.0000007507,0.05000,1.034
3,mlp.up_proj,0.0000273527,0.05000,2.420
3,mlp.gate_proj,0.0000303579,0.05000,2.439
3,mlp.down_proj,0.0002998998,0.05000,2.971
4,self_attn.qkv_proj,0.0000910987,0.05000,1.059
4,self_attn.o_proj,0.0000010523,0.05000,1.028
4,mlp.up_proj,0.0000352418,0.05000,2.337
4,mlp.gate_proj,0.0000410384,0.05000,2.362
4,mlp.down_proj,0.0000039988,0.05000,2.978
5,self_attn.qkv_proj,0.0001155192,0.05000,1.047
5,self_attn.o_proj,0.0000016719,0.05000,1.026
5,mlp.gate_proj,0.0000496211,0.05000,2.362
5,mlp.up_proj,0.0000416632,0.05000,2.390
5,mlp.down_proj,0.0000057624,0.05000,3.039
6,self_attn.qkv_proj,0.0000936164,0.05000,1.020
6,self_attn.o_proj,0.0000023169,0.05000,1.018
6,mlp.gate_proj,0.0000478458,0.05000,2.404
6,mlp.up_proj,0.0000420634,0.05000,2.419
6,mlp.down_proj,0.0000064274,0.05000,3.008
7,self_attn.qkv_proj,0.0001384777,0.05000,1.049
7,self_attn.o_proj,0.0000026701,0.05000,1.038
7,mlp.gate_proj,0.0000488039,0.05000,2.357
7,mlp.up_proj,0.0000447177,0.05000,2.384
7,mlp.down_proj,0.0000080068,0.05000,2.957
8,self_attn.qkv_proj,0.0001268911,0.05000,1.066
8,self_attn.o_proj,0.0000035567,0.05000,1.000
8,mlp.gate_proj,0.0000463068,0.05000,2.386
8,mlp.up_proj,0.0000451744,0.05000,2.408
8,mlp.down_proj,0.0000082719,0.05000,2.994
9,self_attn.qkv_proj,0.0001118555,0.05000,1.019
9,self_attn.o_proj,0.0000036070,0.05000,1.045
9,mlp.up_proj,0.0000490196,0.05000,2.307
9,mlp.gate_proj,0.0000489556,0.05000,2.306
9,mlp.down_proj,0.0000078682,0.05000,2.932
10,self_attn.qkv_proj,0.0001195859,0.05000,1.039
10,self_attn.o_proj,0.0000053637,0.05000,1.004
10,mlp.gate_proj,0.0000508104,0.05000,2.384
10,mlp.up_proj,0.0000506414,0.05000,2.403
10,mlp.down_proj,0.0000088444,0.05000,2.987
11,self_attn.qkv_proj,0.0001189149,0.05000,1.026
11,self_attn.o_proj,0.0000047267,0.05000,1.049
11,mlp.up_proj,0.0000525891,0.05000,2.311
11,mlp.gate_proj,0.0000505481,0.05000,2.330
11,mlp.down_proj,0.0000090989,0.05000,3.007
12,self_attn.qkv_proj,0.0001222839,0.05000,1.036
12,self_attn.o_proj,0.0000046178,0.05000,1.048
12,mlp.up_proj,0.0000535870,0.05000,2.276
12,mlp.gate_proj,0.0000492890,0.05000,2.301
12,mlp.down_proj,0.0000108105,0.05000,2.947
13,self_attn.qkv_proj,0.0001456172,0.05000,1.026
13,self_attn.o_proj,0.0000059778,0.05000,1.031
13,mlp.gate_proj,0.0000507735,0.05000,2.282
13,mlp.up_proj,0.0000571203,0.05000,2.302
13,mlp.down_proj,0.0000114501,0.05000,2.939
14,self_attn.qkv_proj,0.0001290736,0.05000,1.052
14,self_attn.o_proj,0.0000053882,0.05000,1.012
14,mlp.gate_proj,0.0000560465,0.05000,2.260
14,mlp.up_proj,0.0000626098,0.05000,2.263
14,mlp.down_proj,0.0000130744,0.05000,2.974
15,self_attn.qkv_proj,0.0001434816,0.05000,1.038
15,self_attn.o_proj,0.0000051712,0.05000,1.004
15,mlp.up_proj,0.0000692544,0.05000,2.446
15,mlp.gate_proj,0.0000621178,0.05000,2.473
15,mlp.down_proj,0.0000150576,0.05000,2.920
16,self_attn.qkv_proj,0.0001369979,0.05000,1.019
16,self_attn.o_proj,0.0000090328,0.05000,1.007
16,mlp.gate_proj,0.0000653503,0.05000,2.323
16,mlp.up_proj,0.0000734144,0.05000,2.352
16,mlp.down_proj,0.0000200746,0.05000,2.964
17,self_attn.qkv_proj,0.0001395030,0.05000,1.015
17,self_attn.o_proj,0.0000068804,0.05000,1.013
17,mlp.gate_proj,0.0000694652,0.05000,2.324
17,mlp.up_proj,0.0000789464,0.05000,2.343
17,mlp.down_proj,0.0000242481,0.05000,2.968
18,self_attn.qkv_proj,0.0001378879,0.05000,1.040
18,self_attn.o_proj,0.0000118515,0.05000,1.062
18,mlp.up_proj,0.0000885018,0.05000,2.303
18,mlp.gate_proj,0.0000787926,0.05000,2.330
18,mlp.down_proj,0.0000361241,0.05000,2.967
19,self_attn.qkv_proj,0.0001587094,0.05000,1.029
19,self_attn.o_proj,0.0000144369,0.05000,1.015
19,mlp.gate_proj,0.0000868370,0.05000,2.312
19,mlp.up_proj,0.0000961948,0.05000,2.332
19,mlp.down_proj,0.0000418560,0.05000,2.953
20,self_attn.qkv_proj,0.0001532980,0.05000,1.032
20,self_attn.o_proj,0.0000176382,0.05000,1.009
20,mlp.gate_proj,0.0001063069,0.05000,2.306
20,mlp.up_proj,0.0001176227,0.05000,2.338
20,mlp.down_proj,0.0000541321,0.05000,2.950
21,self_attn.qkv_proj,0.0001821614,0.05000,1.026
21,self_attn.o_proj,0.0000128516,0.05000,1.015
21,mlp.up_proj,0.0001266831,0.05000,2.502
21,mlp.gate_proj,0.0001130891,0.05000,2.516
21,mlp.down_proj,0.0000670870,0.05000,3.011
22,self_attn.qkv_proj,0.0001746809,0.05000,1.028
22,self_attn.o_proj,0.0000238040,0.05000,1.043
22,mlp.up_proj,0.0001363046,0.05000,2.250
22,mlp.gate_proj,0.0001202949,0.05000,2.275
22,mlp.down_proj,0.0000788939,0.05000,2.992
23,self_attn.qkv_proj,0.0001925415,0.05000,1.013
23,self_attn.o_proj,0.0000102084,0.05000,1.015
23,mlp.gate_proj,0.0001299220,0.05000,2.277
23,mlp.up_proj,0.0001462273,0.05000,2.299
23,mlp.down_proj,0.0000795165,0.05000,2.962
24,self_attn.qkv_proj,0.0002069782,0.05000,1.031
24,self_attn.o_proj,0.0000115072,0.05000,1.051
24,mlp.gate_proj,0.0001396862,0.05000,2.344
24,mlp.up_proj,0.0001586309,0.05000,2.348
24,mlp.down_proj,0.0000930914,0.05000,2.952
25,self_attn.qkv_proj,0.0002230113,0.05000,1.052
25,self_attn.o_proj,0.0000204678,0.05000,0.996
25,mlp.gate_proj,0.0001546881,0.05000,2.336
25,mlp.up_proj,0.0001761131,0.05000,2.359
25,mlp.down_proj,0.0001077607,0.05000,2.968
26,self_attn.qkv_proj,0.0001977103,0.05000,1.014
26,self_attn.o_proj,0.0000338197,0.05000,1.015
26,mlp.up_proj,0.0001833882,0.05000,2.316
26,mlp.gate_proj,0.0001614466,0.05000,2.336
26,mlp.down_proj,0.0001312572,0.05000,2.941
27,self_attn.qkv_proj,0.0001965278,0.05000,1.011
27,self_attn.o_proj,0.0000231340,0.05000,1.005
27,mlp.gate_proj,0.0001804944,0.05000,2.462
27,mlp.up_proj,0.0002018597,0.05000,2.477
27,mlp.down_proj,0.0001707861,0.05000,2.984
28,self_attn.qkv_proj,0.0002510537,0.05000,1.017
28,self_attn.o_proj,0.0000287529,0.05000,1.024
28,mlp.up_proj,0.0002194517,0.05000,2.276
28,mlp.gate_proj,0.0002030963,0.05000,2.300
28,mlp.down_proj,0.0002290906,0.05000,2.962
29,self_attn.qkv_proj,0.0002273341,0.05000,1.045
29,self_attn.o_proj,0.0000351872,0.05000,1.027
29,mlp.gate_proj,0.0002264227,0.05000,2.352
29,mlp.up_proj,0.0002236534,0.05000,2.373
29,mlp.down_proj,0.0003785557,0.05000,2.977
30,self_attn.qkv_proj,0.0001608474,0.05000,1.024
30,self_attn.o_proj,0.0000363605,0.05000,1.023
30,mlp.gate_proj,0.0002430771,0.05000,2.505
30,mlp.up_proj,0.0002131529,0.05000,2.513
30,mlp.down_proj,0.0014835209,0.05000,2.926
31,self_attn.qkv_proj,0.0000034551,0.05000,1.074
31,self_attn.o_proj,0.0000042867,0.05000,1.011
31,mlp.gate_proj,0.0001017404,0.05000,2.333
31,mlp.up_proj,0.0000593105,0.05000,2.351
31,mlp.down_proj,0.0004770287,0.05000,2.931
|