File size: 7,379 Bytes
53bb6fd | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 | layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000029929,0.05000,1.589
0,self_attn.o_proj,0.0000001045,0.05000,0.964
0,mlp.gate_proj,0.0000063314,0.05000,2.138
0,mlp.up_proj,0.0000059726,0.05000,2.171
0,mlp.down_proj,0.0000001969,0.05000,2.824
1,self_attn.qkv_proj,0.0000177958,0.05000,1.157
1,self_attn.o_proj,0.0000001157,0.05000,1.036
1,mlp.gate_proj,0.0000088358,0.05000,2.975
1,mlp.up_proj,0.0000080169,0.05000,3.019
1,mlp.down_proj,0.0000003500,0.05000,2.972
2,self_attn.qkv_proj,0.0000283670,0.05000,1.035
2,self_attn.o_proj,0.0000001541,0.05000,1.075
2,mlp.gate_proj,0.0000087870,0.05000,2.253
2,mlp.up_proj,0.0000078665,0.05000,2.265
2,mlp.down_proj,0.0000003255,0.05000,2.942
3,self_attn.qkv_proj,0.0000338127,0.05000,1.005
3,self_attn.o_proj,0.0000003137,0.05000,1.011
3,mlp.gate_proj,0.0000158869,0.05000,2.163
3,mlp.up_proj,0.0000136104,0.05000,2.196
3,mlp.down_proj,0.0000427317,0.05000,2.914
4,self_attn.qkv_proj,0.0000373079,0.05000,1.048
4,self_attn.o_proj,0.0000003564,0.05000,0.996
4,mlp.up_proj,0.0000131388,0.05000,2.286
4,mlp.gate_proj,0.0000163559,0.05000,2.303
4,mlp.down_proj,0.0000009839,0.05000,2.888
5,self_attn.qkv_proj,0.0000445573,0.05000,1.013
5,self_attn.o_proj,0.0000005962,0.05000,1.023
5,mlp.gate_proj,0.0000180498,0.05000,2.378
5,mlp.up_proj,0.0000140669,0.05000,2.414
5,mlp.down_proj,0.0000012192,0.05000,2.923
6,self_attn.qkv_proj,0.0000341724,0.05000,1.010
6,self_attn.o_proj,0.0000011619,0.05000,1.020
6,mlp.gate_proj,0.0000183702,0.05000,2.365
6,mlp.up_proj,0.0000152781,0.05000,2.367
6,mlp.down_proj,0.0000016868,0.05000,2.890
7,self_attn.qkv_proj,0.0000553964,0.05000,1.012
7,self_attn.o_proj,0.0000007415,0.05000,0.993
7,mlp.gate_proj,0.0000174044,0.05000,2.255
7,mlp.up_proj,0.0000152908,0.05000,2.276
7,mlp.down_proj,0.0000016985,0.05000,2.981
8,self_attn.qkv_proj,0.0000495149,0.05000,1.002
8,self_attn.o_proj,0.0000006034,0.05000,0.999
8,mlp.gate_proj,0.0000178227,0.05000,2.266
8,mlp.up_proj,0.0000171840,0.05000,2.289
8,mlp.down_proj,0.0000018485,0.05000,2.960
9,self_attn.qkv_proj,0.0000430816,0.05000,1.006
9,self_attn.o_proj,0.0000009036,0.05000,1.081
9,mlp.gate_proj,0.0000173485,0.05000,2.280
9,mlp.up_proj,0.0000173551,0.05000,2.298
9,mlp.down_proj,0.0000018817,0.05000,2.903
10,self_attn.qkv_proj,0.0000433983,0.05000,1.010
10,self_attn.o_proj,0.0000012253,0.05000,1.009
10,mlp.up_proj,0.0000191325,0.05000,2.302
10,mlp.gate_proj,0.0000193263,0.05000,2.319
10,mlp.down_proj,0.0000021741,0.05000,2.882
11,self_attn.qkv_proj,0.0000463978,0.05000,1.046
11,self_attn.o_proj,0.0000018500,0.05000,0.981
11,mlp.up_proj,0.0000213888,0.05000,2.286
11,mlp.gate_proj,0.0000202338,0.05000,2.311
11,mlp.down_proj,0.0000025080,0.05000,2.888
12,self_attn.qkv_proj,0.0000507519,0.05000,1.118
12,self_attn.o_proj,0.0000016432,0.05000,1.053
12,mlp.gate_proj,0.0000210578,0.05000,2.404
12,mlp.up_proj,0.0000233956,0.05000,2.436
12,mlp.down_proj,0.0000030367,0.05000,3.036
13,self_attn.qkv_proj,0.0000660197,0.05000,1.024
13,self_attn.o_proj,0.0000018919,0.05000,1.027
13,mlp.gate_proj,0.0000217064,0.05000,2.295
13,mlp.up_proj,0.0000255225,0.05000,2.312
13,mlp.down_proj,0.0000033143,0.05000,2.927
14,self_attn.qkv_proj,0.0000574443,0.05000,0.995
14,self_attn.o_proj,0.0000015500,0.05000,1.016
14,mlp.up_proj,0.0000290123,0.05000,2.244
14,mlp.gate_proj,0.0000248531,0.05000,2.264
14,mlp.down_proj,0.0000037807,0.05000,2.944
15,self_attn.qkv_proj,0.0000651020,0.05000,1.009
15,self_attn.o_proj,0.0000026469,0.05000,1.033
15,mlp.up_proj,0.0000307608,0.05000,2.212
15,mlp.gate_proj,0.0000263729,0.05000,2.240
15,mlp.down_proj,0.0000042095,0.05000,2.912
16,self_attn.qkv_proj,0.0000577900,0.05000,1.016
16,self_attn.o_proj,0.0000031993,0.05000,1.026
16,mlp.up_proj,0.0000332469,0.05000,2.312
16,mlp.gate_proj,0.0000283605,0.05000,2.331
16,mlp.down_proj,0.0000052141,0.05000,2.921
17,self_attn.qkv_proj,0.0000622398,0.05000,1.017
17,self_attn.o_proj,0.0000029537,0.05000,1.056
17,mlp.gate_proj,0.0000317461,0.05000,2.302
17,mlp.up_proj,0.0000378686,0.05000,2.327
17,mlp.down_proj,0.0000068786,0.05000,2.916
18,self_attn.qkv_proj,0.0000657631,0.05000,1.011
18,self_attn.o_proj,0.0000065101,0.05000,1.037
18,mlp.up_proj,0.0000418297,0.05000,2.208
18,mlp.gate_proj,0.0000357805,0.05000,2.237
18,mlp.down_proj,0.0000089543,0.05000,2.894
19,self_attn.qkv_proj,0.0000770983,0.05000,1.020
19,self_attn.o_proj,0.0000077340,0.05000,1.028
19,mlp.up_proj,0.0000444914,0.05000,2.382
19,mlp.gate_proj,0.0000386684,0.05000,2.380
19,mlp.down_proj,0.0000109362,0.05000,2.911
20,self_attn.qkv_proj,0.0000740929,0.05000,1.003
20,self_attn.o_proj,0.0000081113,0.05000,0.986
20,mlp.gate_proj,0.0000472041,0.05000,2.307
20,mlp.up_proj,0.0000543119,0.05000,2.330
20,mlp.down_proj,0.0000145892,0.05000,2.990
21,self_attn.qkv_proj,0.0000857731,0.05000,1.021
21,self_attn.o_proj,0.0000068950,0.05000,0.998
21,mlp.up_proj,0.0000586656,0.05000,2.283
21,mlp.gate_proj,0.0000500638,0.05000,2.313
21,mlp.down_proj,0.0000176288,0.05000,2.957
22,self_attn.qkv_proj,0.0000867742,0.05000,1.019
22,self_attn.o_proj,0.0000102738,0.05000,0.996
22,mlp.up_proj,0.0000663261,0.05000,2.281
22,mlp.gate_proj,0.0000555567,0.05000,2.303
22,mlp.down_proj,0.0000202035,0.05000,2.910
23,self_attn.qkv_proj,0.0000962782,0.05000,1.005
23,self_attn.o_proj,0.0000096911,0.05000,1.009
23,mlp.up_proj,0.0000733566,0.05000,2.193
23,mlp.gate_proj,0.0000619966,0.05000,2.214
23,mlp.down_proj,0.0000254390,0.05000,2.972
24,self_attn.qkv_proj,0.0001047326,0.05000,1.043
24,self_attn.o_proj,0.0000094759,0.05000,0.995
24,mlp.up_proj,0.0000819970,0.05000,2.187
24,mlp.gate_proj,0.0000681171,0.05000,2.217
24,mlp.down_proj,0.0000320756,0.05000,2.875
25,self_attn.qkv_proj,0.0001196687,0.05000,1.032
25,self_attn.o_proj,0.0000178841,0.05000,0.992
25,mlp.gate_proj,0.0000786205,0.05000,2.282
25,mlp.up_proj,0.0000949818,0.05000,2.302
25,mlp.down_proj,0.0000417770,0.05000,2.970
26,self_attn.qkv_proj,0.0001117620,0.05000,1.023
26,self_attn.o_proj,0.0000252745,0.05000,0.996
26,mlp.up_proj,0.0001003381,0.05000,2.225
26,mlp.gate_proj,0.0000833383,0.05000,2.252
26,mlp.down_proj,0.0000515722,0.05000,2.924
27,self_attn.qkv_proj,0.0001086565,0.05000,1.016
27,self_attn.o_proj,0.0000264664,0.05000,0.999
27,mlp.up_proj,0.0001091925,0.05000,2.223
27,mlp.gate_proj,0.0000928646,0.05000,2.222
27,mlp.down_proj,0.0000621013,0.05000,2.919
28,self_attn.qkv_proj,0.0001426622,0.05000,1.013
28,self_attn.o_proj,0.0000346105,0.05000,0.997
28,mlp.up_proj,0.0001217435,0.05000,2.149
28,mlp.gate_proj,0.0001090677,0.05000,2.162
28,mlp.down_proj,0.0000804849,0.05000,2.925
29,self_attn.qkv_proj,0.0001282340,0.05000,1.021
29,self_attn.o_proj,0.0000445930,0.05000,1.029
29,mlp.up_proj,0.0001171631,0.05000,2.218
29,mlp.gate_proj,0.0001193069,0.05000,2.254
29,mlp.down_proj,0.0000950395,0.05000,2.887
30,self_attn.qkv_proj,0.0001681025,0.05000,0.995
30,self_attn.o_proj,0.0000827839,0.05000,1.008
30,mlp.up_proj,0.0002124111,0.05000,2.299
30,mlp.gate_proj,0.0002344202,0.05000,2.309
30,mlp.down_proj,1.6844320378,0.05000,2.899
31,self_attn.qkv_proj,0.0000036079,0.05000,1.055
31,self_attn.o_proj,0.0000053948,0.05000,1.004
31,mlp.gate_proj,0.0000985641,0.05000,2.237
31,mlp.up_proj,0.0000607404,0.05000,2.259
31,mlp.down_proj,0.0000745720,0.05000,2.906
|