File size: 7,379 Bytes
a2d6e86 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 | layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000234433,0.05000,1.515
0,self_attn.o_proj,0.0000012551,0.05000,0.936
0,mlp.up_proj,0.0000740401,0.05000,2.474
0,mlp.gate_proj,0.0000768478,0.05000,2.490
0,mlp.down_proj,0.0000051061,0.05000,2.818
1,self_attn.qkv_proj,0.0001699547,0.05000,1.280
1,self_attn.o_proj,0.0000034763,0.05000,1.143
1,mlp.up_proj,0.0001173471,0.05000,2.850
1,mlp.gate_proj,0.0001244575,0.05000,2.885
1,mlp.down_proj,0.0000244783,0.05000,2.984
2,self_attn.qkv_proj,0.0004539477,0.05000,1.043
2,self_attn.o_proj,0.0000030893,0.05000,1.040
2,mlp.gate_proj,0.0001873295,0.05000,2.737
2,mlp.up_proj,0.0001750478,0.05000,2.793
2,mlp.down_proj,0.0000109788,0.05000,2.954
3,self_attn.qkv_proj,0.0006435827,0.05000,1.123
3,self_attn.o_proj,0.0000069274,0.05000,1.466
3,mlp.gate_proj,0.0002680054,0.05000,2.202
3,mlp.up_proj,0.0002448218,0.05000,2.228
3,mlp.down_proj,0.0319495132,0.05000,2.865
4,self_attn.qkv_proj,0.0006558018,0.05000,1.006
4,self_attn.o_proj,0.0000090045,0.05000,1.075
4,mlp.gate_proj,0.0003298683,0.05000,2.266
4,mlp.up_proj,0.0002895112,0.05000,2.286
4,mlp.down_proj,0.0000298855,0.05000,2.908
5,self_attn.qkv_proj,0.0007604120,0.05000,1.000
5,self_attn.o_proj,0.0000106954,0.05000,0.994
5,mlp.gate_proj,0.0003911948,0.05000,2.291
5,mlp.up_proj,0.0003372076,0.05000,2.310
5,mlp.down_proj,0.0000409930,0.05000,2.908
6,self_attn.qkv_proj,0.0006467403,0.05000,1.010
6,self_attn.o_proj,0.0000139023,0.05000,1.011
6,mlp.up_proj,0.0003379441,0.05000,2.350
6,mlp.gate_proj,0.0003750805,0.05000,2.376
6,mlp.down_proj,0.0000462578,0.05000,2.866
7,self_attn.qkv_proj,0.0009227887,0.05000,1.002
7,self_attn.o_proj,0.0000164297,0.05000,1.034
7,mlp.up_proj,0.0003586256,0.05000,2.228
7,mlp.gate_proj,0.0003832810,0.05000,2.231
7,mlp.down_proj,0.0000597295,0.05000,2.858
8,self_attn.qkv_proj,0.0008569787,0.05000,1.008
8,self_attn.o_proj,0.0000230205,0.05000,0.988
8,mlp.gate_proj,0.0003839790,0.05000,2.448
8,mlp.up_proj,0.0003800165,0.05000,2.468
8,mlp.down_proj,0.0000743382,0.05000,2.908
9,self_attn.qkv_proj,0.0007942334,0.05000,1.002
9,self_attn.o_proj,0.0000246915,0.05000,0.993
9,mlp.up_proj,0.0004031824,0.05000,2.326
9,mlp.gate_proj,0.0003977984,0.05000,2.348
9,mlp.down_proj,0.0000619588,0.05000,2.897
10,self_attn.qkv_proj,0.0008438398,0.05000,1.008
10,self_attn.o_proj,0.0000353785,0.05000,1.018
10,mlp.gate_proj,0.0004070449,0.05000,2.320
10,mlp.up_proj,0.0004118055,0.05000,2.346
10,mlp.down_proj,0.0000657525,0.05000,2.923
11,self_attn.qkv_proj,0.0008194585,0.05000,1.053
11,self_attn.o_proj,0.0000269038,0.05000,1.002
11,mlp.gate_proj,0.0004062071,0.05000,2.399
11,mlp.up_proj,0.0004268940,0.05000,2.419
11,mlp.down_proj,0.0000666463,0.05000,2.858
12,self_attn.qkv_proj,0.0008770282,0.05000,0.997
12,self_attn.o_proj,0.0000251990,0.05000,0.993
12,mlp.up_proj,0.0004276355,0.05000,2.300
12,mlp.gate_proj,0.0003912912,0.05000,2.328
12,mlp.down_proj,0.0000774838,0.05000,2.917
13,self_attn.qkv_proj,0.0009794771,0.05000,1.004
13,self_attn.o_proj,0.0000277290,0.05000,0.988
13,mlp.gate_proj,0.0004115693,0.05000,2.315
13,mlp.up_proj,0.0004629706,0.05000,2.340
13,mlp.down_proj,0.0000860639,0.05000,2.901
14,self_attn.qkv_proj,0.0009111086,0.05000,1.044
14,self_attn.o_proj,0.0000270905,0.05000,1.004
14,mlp.gate_proj,0.0004456694,0.05000,2.327
14,mlp.up_proj,0.0004985755,0.05000,2.338
14,mlp.down_proj,0.0000911287,0.05000,2.874
15,self_attn.qkv_proj,0.0010071384,0.05000,1.075
15,self_attn.o_proj,0.0000243394,0.05000,0.988
15,mlp.up_proj,0.0005489160,0.05000,2.215
15,mlp.gate_proj,0.0004908784,0.05000,2.236
15,mlp.down_proj,0.0001038040,0.05000,2.908
16,self_attn.qkv_proj,0.0009476236,0.05000,0.991
16,self_attn.o_proj,0.0000485368,0.05000,0.992
16,mlp.up_proj,0.0005693908,0.05000,2.308
16,mlp.gate_proj,0.0005057035,0.05000,2.330
16,mlp.down_proj,0.0001301657,0.05000,2.891
17,self_attn.qkv_proj,0.0009925160,0.05000,0.998
17,self_attn.o_proj,0.0000390900,0.05000,0.973
17,mlp.up_proj,0.0006069203,0.05000,2.314
17,mlp.gate_proj,0.0005327590,0.05000,2.330
17,mlp.down_proj,0.0001544745,0.05000,2.872
18,self_attn.qkv_proj,0.0009654888,0.05000,1.009
18,self_attn.o_proj,0.0000608897,0.05000,1.001
18,mlp.gate_proj,0.0005690133,0.05000,2.385
18,mlp.up_proj,0.0006410199,0.05000,2.407
18,mlp.down_proj,0.0002298194,0.05000,2.914
19,self_attn.qkv_proj,0.0010355139,0.05000,1.041
19,self_attn.o_proj,0.0000674389,0.05000,1.006
19,mlp.gate_proj,0.0006108685,0.05000,2.337
19,mlp.up_proj,0.0006793319,0.05000,2.365
19,mlp.down_proj,0.0002456510,0.05000,2.942
20,self_attn.qkv_proj,0.0009955477,0.05000,1.016
20,self_attn.o_proj,0.0000853179,0.05000,1.034
20,mlp.gate_proj,0.0007368962,0.05000,2.192
20,mlp.up_proj,0.0008203884,0.05000,2.213
20,mlp.down_proj,0.0003082218,0.05000,2.854
21,self_attn.qkv_proj,0.0011595939,0.05000,1.044
21,self_attn.o_proj,0.0000631391,0.05000,0.988
21,mlp.gate_proj,0.0007788413,0.05000,2.444
21,mlp.up_proj,0.0008753389,0.05000,2.463
21,mlp.down_proj,0.0003915850,0.05000,2.931
22,self_attn.qkv_proj,0.0011074981,0.05000,0.991
22,self_attn.o_proj,0.0000896787,0.05000,1.015
22,mlp.gate_proj,0.0008228205,0.05000,2.343
22,mlp.up_proj,0.0009325047,0.05000,2.386
22,mlp.down_proj,0.0004434848,0.05000,2.865
23,self_attn.qkv_proj,0.0012805010,0.05000,1.000
23,self_attn.o_proj,0.0000562911,0.05000,0.999
23,mlp.up_proj,0.0010011470,0.05000,2.290
23,mlp.gate_proj,0.0008901170,0.05000,2.314
23,mlp.down_proj,0.0004554649,0.05000,2.926
24,self_attn.qkv_proj,0.0013814587,0.05000,1.040
24,self_attn.o_proj,0.0000568903,0.05000,0.987
24,mlp.up_proj,0.0010863662,0.05000,2.384
24,mlp.gate_proj,0.0009593617,0.05000,2.422
24,mlp.down_proj,0.0005254694,0.05000,2.875
25,self_attn.qkv_proj,0.0014469156,0.05000,0.980
25,self_attn.o_proj,0.0000781728,0.05000,1.000
25,mlp.gate_proj,0.0010634154,0.05000,2.338
25,mlp.up_proj,0.0012082151,0.05000,2.360
25,mlp.down_proj,0.0006043160,0.05000,3.007
26,self_attn.qkv_proj,0.0012781918,0.05000,1.039
26,self_attn.o_proj,0.0001430641,0.05000,1.003
26,mlp.up_proj,0.0012724487,0.05000,2.332
26,mlp.gate_proj,0.0011216506,0.05000,2.359
26,mlp.down_proj,0.0007345894,0.05000,2.880
27,self_attn.qkv_proj,0.0013309020,0.05000,1.018
27,self_attn.o_proj,0.0001508330,0.05000,0.996
27,mlp.up_proj,0.0013503263,0.05000,2.279
27,mlp.gate_proj,0.0012045613,0.05000,2.307
27,mlp.down_proj,0.0008768519,0.05000,2.940
28,self_attn.qkv_proj,0.0015792458,0.05000,1.007
28,self_attn.o_proj,0.0001596175,0.05000,1.028
28,mlp.up_proj,0.0014309376,0.05000,2.394
28,mlp.gate_proj,0.0013091725,0.05000,2.401
28,mlp.down_proj,0.0011007471,0.05000,2.875
29,self_attn.qkv_proj,0.0014297700,0.05000,1.039
29,self_attn.o_proj,0.0002247341,0.05000,0.988
29,mlp.gate_proj,0.0014194082,0.05000,2.382
29,mlp.up_proj,0.0014341137,0.05000,2.406
29,mlp.down_proj,0.0018299969,0.05000,2.897
30,self_attn.qkv_proj,0.0009961152,0.05000,1.045
30,self_attn.o_proj,0.0002220271,0.05000,1.001
30,mlp.up_proj,0.0013122857,0.05000,2.346
30,mlp.gate_proj,0.0014473631,0.05000,2.370
30,mlp.down_proj,0.0182979599,0.05000,2.924
31,self_attn.qkv_proj,0.0000219487,0.05000,1.020
31,self_attn.o_proj,0.0000321238,0.05000,0.988
31,mlp.gate_proj,0.0006197570,0.05000,2.283
31,mlp.up_proj,0.0003814784,0.05000,2.303
31,mlp.down_proj,0.0030642595,0.05000,2.861
|