File size: 7,379 Bytes
6a102df | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 | layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000033337,0.05000,1.970
0,self_attn.o_proj,0.0000001568,0.05000,1.193
0,mlp.gate_proj,0.0000094541,0.05000,2.477
0,mlp.up_proj,0.0000090174,0.05000,2.527
0,mlp.down_proj,0.0000005734,0.05000,2.784
1,self_attn.qkv_proj,0.0000253673,0.05000,1.153
1,self_attn.o_proj,0.0000003501,0.05000,1.191
1,mlp.up_proj,0.0000115117,0.05000,2.958
1,mlp.gate_proj,0.0000125914,0.05000,2.991
1,mlp.down_proj,0.0000009363,0.05000,3.015
2,self_attn.qkv_proj,0.0000545575,0.05000,1.052
2,self_attn.o_proj,0.0000003618,0.05000,1.068
2,mlp.up_proj,0.0000162658,0.05000,3.042
2,mlp.gate_proj,0.0000179054,0.05000,3.061
2,mlp.down_proj,0.0000010033,0.05000,2.914
3,self_attn.qkv_proj,0.0000754067,0.05000,1.075
3,self_attn.o_proj,0.0000005250,0.05000,0.998
3,mlp.up_proj,0.0000187377,0.05000,2.269
3,mlp.gate_proj,0.0000214041,0.05000,2.297
3,mlp.down_proj,0.0002351547,0.05000,2.890
4,self_attn.qkv_proj,0.0000709153,0.05000,1.011
4,self_attn.o_proj,0.0000009426,0.05000,1.000
4,mlp.up_proj,0.0000266585,0.05000,2.434
4,mlp.gate_proj,0.0000322079,0.05000,2.466
4,mlp.down_proj,0.0000028561,0.05000,2.926
5,self_attn.qkv_proj,0.0000920992,0.05000,1.010
5,self_attn.o_proj,0.0000015057,0.05000,1.010
5,mlp.up_proj,0.0000311401,0.05000,2.282
5,mlp.gate_proj,0.0000387061,0.05000,2.308
5,mlp.down_proj,0.0000040372,0.05000,2.975
6,self_attn.qkv_proj,0.0000751325,0.05000,1.011
6,self_attn.o_proj,0.0000017975,0.05000,1.018
6,mlp.gate_proj,0.0000391059,0.05000,2.604
6,mlp.up_proj,0.0000332029,0.05000,2.646
6,mlp.down_proj,0.0000049817,0.05000,2.970
7,self_attn.qkv_proj,0.0001157685,0.05000,1.043
7,self_attn.o_proj,0.0000020251,0.05000,1.062
7,mlp.up_proj,0.0000352015,0.05000,2.432
7,mlp.gate_proj,0.0000395090,0.05000,2.451
7,mlp.down_proj,0.0000058283,0.05000,2.930
8,self_attn.qkv_proj,0.0001045483,0.05000,1.025
8,self_attn.o_proj,0.0000020512,0.05000,1.005
8,mlp.gate_proj,0.0000368261,0.05000,2.249
8,mlp.up_proj,0.0000355081,0.05000,2.276
8,mlp.down_proj,0.0000057011,0.05000,2.933
9,self_attn.qkv_proj,0.0000903360,0.05000,1.021
9,self_attn.o_proj,0.0000025147,0.05000,1.024
9,mlp.gate_proj,0.0000381440,0.05000,2.258
9,mlp.up_proj,0.0000379692,0.05000,2.287
9,mlp.down_proj,0.0000054069,0.05000,2.922
10,self_attn.qkv_proj,0.0000977697,0.05000,1.010
10,self_attn.o_proj,0.0000037061,0.05000,1.050
10,mlp.up_proj,0.0000417211,0.05000,2.357
10,mlp.gate_proj,0.0000421710,0.05000,2.380
10,mlp.down_proj,0.0000064649,0.05000,2.948
11,self_attn.qkv_proj,0.0001041781,0.05000,1.010
11,self_attn.o_proj,0.0000043695,0.05000,1.035
11,mlp.gate_proj,0.0000435187,0.05000,2.366
11,mlp.up_proj,0.0000454773,0.05000,2.381
11,mlp.down_proj,0.0000071585,0.05000,2.931
12,self_attn.qkv_proj,0.0001108157,0.05000,1.013
12,self_attn.o_proj,0.0000038909,0.05000,1.009
12,mlp.gate_proj,0.0000440640,0.05000,2.264
12,mlp.up_proj,0.0000483411,0.05000,2.282
12,mlp.down_proj,0.0000083439,0.05000,2.919
13,self_attn.qkv_proj,0.0001360751,0.05000,1.019
13,self_attn.o_proj,0.0000052360,0.05000,0.993
13,mlp.gate_proj,0.0000448895,0.05000,2.295
13,mlp.up_proj,0.0000516026,0.05000,2.308
13,mlp.down_proj,0.0000088433,0.05000,2.981
14,self_attn.qkv_proj,0.0001205465,0.05000,1.058
14,self_attn.o_proj,0.0000045024,0.05000,1.012
14,mlp.gate_proj,0.0000490126,0.05000,2.358
14,mlp.up_proj,0.0000558636,0.05000,2.385
14,mlp.down_proj,0.0000094944,0.05000,2.907
15,self_attn.qkv_proj,0.0001328261,0.05000,1.018
15,self_attn.o_proj,0.0000043096,0.05000,1.019
15,mlp.gate_proj,0.0000536100,0.05000,2.319
15,mlp.up_proj,0.0000610305,0.05000,2.339
15,mlp.down_proj,0.0000106724,0.05000,2.888
16,self_attn.qkv_proj,0.0001251596,0.05000,1.025
16,self_attn.o_proj,0.0000077229,0.05000,1.004
16,mlp.up_proj,0.0000627541,0.05000,2.347
16,mlp.gate_proj,0.0000547321,0.05000,2.372
16,mlp.down_proj,0.0000136088,0.05000,2.974
17,self_attn.qkv_proj,0.0001212124,0.05000,1.015
17,self_attn.o_proj,0.0000051576,0.05000,1.019
17,mlp.gate_proj,0.0000581634,0.05000,2.241
17,mlp.up_proj,0.0000677224,0.05000,2.266
17,mlp.down_proj,0.0000170442,0.05000,2.977
18,self_attn.qkv_proj,0.0001200134,0.05000,0.988
18,self_attn.o_proj,0.0000090346,0.05000,1.000
18,mlp.gate_proj,0.0000653781,0.05000,2.245
18,mlp.up_proj,0.0000751556,0.05000,2.282
18,mlp.down_proj,0.0000247040,0.05000,2.888
19,self_attn.qkv_proj,0.0001405187,0.05000,1.018
19,self_attn.o_proj,0.0000128052,0.05000,1.005
19,mlp.up_proj,0.0000819399,0.05000,2.238
19,mlp.gate_proj,0.0000723034,0.05000,2.255
19,mlp.down_proj,0.0000287014,0.05000,2.892
20,self_attn.qkv_proj,0.0001370618,0.05000,1.049
20,self_attn.o_proj,0.0000141441,0.05000,0.995
20,mlp.gate_proj,0.0000871970,0.05000,2.277
20,mlp.up_proj,0.0000987938,0.05000,2.300
20,mlp.down_proj,0.0000353455,0.05000,2.886
21,self_attn.qkv_proj,0.0001576805,0.05000,1.020
21,self_attn.o_proj,0.0000103696,0.05000,0.997
21,mlp.gate_proj,0.0000898126,0.05000,2.334
21,mlp.up_proj,0.0001034518,0.05000,2.360
21,mlp.down_proj,0.0000406898,0.05000,2.901
22,self_attn.qkv_proj,0.0001496053,0.05000,1.007
22,self_attn.o_proj,0.0000179317,0.05000,1.007
22,mlp.up_proj,0.0001094033,0.05000,2.271
22,mlp.gate_proj,0.0000937537,0.05000,2.296
22,mlp.down_proj,0.0000450660,0.05000,2.890
23,self_attn.qkv_proj,0.0001562641,0.05000,1.000
23,self_attn.o_proj,0.0000076899,0.05000,1.000
23,mlp.up_proj,0.0001155189,0.05000,2.287
23,mlp.gate_proj,0.0000998504,0.05000,2.312
23,mlp.down_proj,0.0000445921,0.05000,2.932
24,self_attn.qkv_proj,0.0001635886,0.05000,1.013
24,self_attn.o_proj,0.0000070508,0.05000,1.015
24,mlp.up_proj,0.0001205805,0.05000,2.324
24,mlp.gate_proj,0.0001030940,0.05000,2.348
24,mlp.down_proj,0.0000522420,0.05000,2.951
25,self_attn.qkv_proj,0.0001784758,0.05000,1.019
25,self_attn.o_proj,0.0000145658,0.05000,0.995
25,mlp.up_proj,0.0001376533,0.05000,2.229
25,mlp.gate_proj,0.0001171439,0.05000,2.260
25,mlp.down_proj,0.0000661028,0.05000,2.879
26,self_attn.qkv_proj,0.0001639939,0.05000,1.066
26,self_attn.o_proj,0.0000326306,0.05000,1.007
26,mlp.gate_proj,0.0001198269,0.05000,2.302
26,mlp.up_proj,0.0001404009,0.05000,2.325
26,mlp.down_proj,0.0000833422,0.05000,2.896
27,self_attn.qkv_proj,0.0001548430,0.05000,1.001
27,self_attn.o_proj,0.0000179886,0.05000,1.018
27,mlp.gate_proj,0.0001427162,0.05000,2.394
27,mlp.up_proj,0.0001644143,0.05000,2.412
27,mlp.down_proj,0.0001287594,0.05000,2.911
28,self_attn.qkv_proj,0.0002212718,0.05000,1.007
28,self_attn.o_proj,0.0000247850,0.05000,1.008
28,mlp.up_proj,0.0001861897,0.05000,2.333
28,mlp.gate_proj,0.0001679264,0.05000,2.360
28,mlp.down_proj,0.0001937283,0.05000,2.891
29,self_attn.qkv_proj,0.0002001585,0.05000,1.004
29,self_attn.o_proj,0.0000316542,0.05000,0.983
29,mlp.up_proj,0.0001901275,0.05000,2.192
29,mlp.gate_proj,0.0001900747,0.05000,2.212
29,mlp.down_proj,0.0003015468,0.05000,2.929
30,self_attn.qkv_proj,0.0001382461,0.05000,1.006
30,self_attn.o_proj,0.0000314998,0.05000,1.010
30,mlp.gate_proj,0.0002096816,0.05000,2.345
30,mlp.up_proj,0.0001791842,0.05000,2.372
30,mlp.down_proj,0.0031376772,0.05000,2.968
31,self_attn.qkv_proj,0.0000025484,0.05000,1.065
31,self_attn.o_proj,0.0000041746,0.05000,1.192
31,mlp.gate_proj,0.0000727343,0.05000,2.339
31,mlp.up_proj,0.0000396456,0.05000,2.364
31,mlp.down_proj,0.0004075643,0.05000,2.979
|