File size: 7,379 Bytes
414df82
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
layer,module,loss,samples,damp,time
0,self_attn.qkv_proj,0.0000037035,0.05000,1.695
0,self_attn.o_proj,0.0000001912,0.05000,0.993
0,mlp.up_proj,0.0000102369,0.05000,2.424
0,mlp.gate_proj,0.0000107023,0.05000,2.453
0,mlp.down_proj,0.0000007776,0.05000,2.854
1,self_attn.qkv_proj,0.0000286602,0.05000,1.281
1,self_attn.o_proj,0.0000004302,0.05000,1.073
1,mlp.gate_proj,0.0000156239,0.05000,2.984
1,mlp.up_proj,0.0000145528,0.05000,3.031
1,mlp.down_proj,0.0000015817,0.05000,3.079
2,self_attn.qkv_proj,0.0000670091,0.05000,1.059
2,self_attn.o_proj,0.0000003938,0.05000,1.070
2,mlp.up_proj,0.0000224096,0.05000,2.395
2,mlp.gate_proj,0.0000242441,0.05000,2.416
2,mlp.down_proj,0.0000015780,0.05000,2.917
3,self_attn.qkv_proj,0.0000974988,0.05000,1.073
3,self_attn.o_proj,0.0000007507,0.05000,1.034
3,mlp.up_proj,0.0000273527,0.05000,2.420
3,mlp.gate_proj,0.0000303579,0.05000,2.439
3,mlp.down_proj,0.0002998998,0.05000,2.971
4,self_attn.qkv_proj,0.0000910987,0.05000,1.059
4,self_attn.o_proj,0.0000010523,0.05000,1.028
4,mlp.up_proj,0.0000352418,0.05000,2.337
4,mlp.gate_proj,0.0000410384,0.05000,2.362
4,mlp.down_proj,0.0000039988,0.05000,2.978
5,self_attn.qkv_proj,0.0001155192,0.05000,1.047
5,self_attn.o_proj,0.0000016719,0.05000,1.026
5,mlp.gate_proj,0.0000496211,0.05000,2.362
5,mlp.up_proj,0.0000416632,0.05000,2.390
5,mlp.down_proj,0.0000057624,0.05000,3.039
6,self_attn.qkv_proj,0.0000936164,0.05000,1.020
6,self_attn.o_proj,0.0000023169,0.05000,1.018
6,mlp.gate_proj,0.0000478458,0.05000,2.404
6,mlp.up_proj,0.0000420634,0.05000,2.419
6,mlp.down_proj,0.0000064274,0.05000,3.008
7,self_attn.qkv_proj,0.0001384777,0.05000,1.049
7,self_attn.o_proj,0.0000026701,0.05000,1.038
7,mlp.gate_proj,0.0000488039,0.05000,2.357
7,mlp.up_proj,0.0000447177,0.05000,2.384
7,mlp.down_proj,0.0000080068,0.05000,2.957
8,self_attn.qkv_proj,0.0001268911,0.05000,1.066
8,self_attn.o_proj,0.0000035567,0.05000,1.000
8,mlp.gate_proj,0.0000463068,0.05000,2.386
8,mlp.up_proj,0.0000451744,0.05000,2.408
8,mlp.down_proj,0.0000082719,0.05000,2.994
9,self_attn.qkv_proj,0.0001118555,0.05000,1.019
9,self_attn.o_proj,0.0000036070,0.05000,1.045
9,mlp.up_proj,0.0000490196,0.05000,2.307
9,mlp.gate_proj,0.0000489556,0.05000,2.306
9,mlp.down_proj,0.0000078682,0.05000,2.932
10,self_attn.qkv_proj,0.0001195859,0.05000,1.039
10,self_attn.o_proj,0.0000053637,0.05000,1.004
10,mlp.gate_proj,0.0000508104,0.05000,2.384
10,mlp.up_proj,0.0000506414,0.05000,2.403
10,mlp.down_proj,0.0000088444,0.05000,2.987
11,self_attn.qkv_proj,0.0001189149,0.05000,1.026
11,self_attn.o_proj,0.0000047267,0.05000,1.049
11,mlp.up_proj,0.0000525891,0.05000,2.311
11,mlp.gate_proj,0.0000505481,0.05000,2.330
11,mlp.down_proj,0.0000090989,0.05000,3.007
12,self_attn.qkv_proj,0.0001222839,0.05000,1.036
12,self_attn.o_proj,0.0000046178,0.05000,1.048
12,mlp.up_proj,0.0000535870,0.05000,2.276
12,mlp.gate_proj,0.0000492890,0.05000,2.301
12,mlp.down_proj,0.0000108105,0.05000,2.947
13,self_attn.qkv_proj,0.0001456172,0.05000,1.026
13,self_attn.o_proj,0.0000059778,0.05000,1.031
13,mlp.gate_proj,0.0000507735,0.05000,2.282
13,mlp.up_proj,0.0000571203,0.05000,2.302
13,mlp.down_proj,0.0000114501,0.05000,2.939
14,self_attn.qkv_proj,0.0001290736,0.05000,1.052
14,self_attn.o_proj,0.0000053882,0.05000,1.012
14,mlp.gate_proj,0.0000560465,0.05000,2.260
14,mlp.up_proj,0.0000626098,0.05000,2.263
14,mlp.down_proj,0.0000130744,0.05000,2.974
15,self_attn.qkv_proj,0.0001434816,0.05000,1.038
15,self_attn.o_proj,0.0000051712,0.05000,1.004
15,mlp.up_proj,0.0000692544,0.05000,2.446
15,mlp.gate_proj,0.0000621178,0.05000,2.473
15,mlp.down_proj,0.0000150576,0.05000,2.920
16,self_attn.qkv_proj,0.0001369979,0.05000,1.019
16,self_attn.o_proj,0.0000090328,0.05000,1.007
16,mlp.gate_proj,0.0000653503,0.05000,2.323
16,mlp.up_proj,0.0000734144,0.05000,2.352
16,mlp.down_proj,0.0000200746,0.05000,2.964
17,self_attn.qkv_proj,0.0001395030,0.05000,1.015
17,self_attn.o_proj,0.0000068804,0.05000,1.013
17,mlp.gate_proj,0.0000694652,0.05000,2.324
17,mlp.up_proj,0.0000789464,0.05000,2.343
17,mlp.down_proj,0.0000242481,0.05000,2.968
18,self_attn.qkv_proj,0.0001378879,0.05000,1.040
18,self_attn.o_proj,0.0000118515,0.05000,1.062
18,mlp.up_proj,0.0000885018,0.05000,2.303
18,mlp.gate_proj,0.0000787926,0.05000,2.330
18,mlp.down_proj,0.0000361241,0.05000,2.967
19,self_attn.qkv_proj,0.0001587094,0.05000,1.029
19,self_attn.o_proj,0.0000144369,0.05000,1.015
19,mlp.gate_proj,0.0000868370,0.05000,2.312
19,mlp.up_proj,0.0000961948,0.05000,2.332
19,mlp.down_proj,0.0000418560,0.05000,2.953
20,self_attn.qkv_proj,0.0001532980,0.05000,1.032
20,self_attn.o_proj,0.0000176382,0.05000,1.009
20,mlp.gate_proj,0.0001063069,0.05000,2.306
20,mlp.up_proj,0.0001176227,0.05000,2.338
20,mlp.down_proj,0.0000541321,0.05000,2.950
21,self_attn.qkv_proj,0.0001821614,0.05000,1.026
21,self_attn.o_proj,0.0000128516,0.05000,1.015
21,mlp.up_proj,0.0001266831,0.05000,2.502
21,mlp.gate_proj,0.0001130891,0.05000,2.516
21,mlp.down_proj,0.0000670870,0.05000,3.011
22,self_attn.qkv_proj,0.0001746809,0.05000,1.028
22,self_attn.o_proj,0.0000238040,0.05000,1.043
22,mlp.up_proj,0.0001363046,0.05000,2.250
22,mlp.gate_proj,0.0001202949,0.05000,2.275
22,mlp.down_proj,0.0000788939,0.05000,2.992
23,self_attn.qkv_proj,0.0001925415,0.05000,1.013
23,self_attn.o_proj,0.0000102084,0.05000,1.015
23,mlp.gate_proj,0.0001299220,0.05000,2.277
23,mlp.up_proj,0.0001462273,0.05000,2.299
23,mlp.down_proj,0.0000795165,0.05000,2.962
24,self_attn.qkv_proj,0.0002069782,0.05000,1.031
24,self_attn.o_proj,0.0000115072,0.05000,1.051
24,mlp.gate_proj,0.0001396862,0.05000,2.344
24,mlp.up_proj,0.0001586309,0.05000,2.348
24,mlp.down_proj,0.0000930914,0.05000,2.952
25,self_attn.qkv_proj,0.0002230113,0.05000,1.052
25,self_attn.o_proj,0.0000204678,0.05000,0.996
25,mlp.gate_proj,0.0001546881,0.05000,2.336
25,mlp.up_proj,0.0001761131,0.05000,2.359
25,mlp.down_proj,0.0001077607,0.05000,2.968
26,self_attn.qkv_proj,0.0001977103,0.05000,1.014
26,self_attn.o_proj,0.0000338197,0.05000,1.015
26,mlp.up_proj,0.0001833882,0.05000,2.316
26,mlp.gate_proj,0.0001614466,0.05000,2.336
26,mlp.down_proj,0.0001312572,0.05000,2.941
27,self_attn.qkv_proj,0.0001965278,0.05000,1.011
27,self_attn.o_proj,0.0000231340,0.05000,1.005
27,mlp.gate_proj,0.0001804944,0.05000,2.462
27,mlp.up_proj,0.0002018597,0.05000,2.477
27,mlp.down_proj,0.0001707861,0.05000,2.984
28,self_attn.qkv_proj,0.0002510537,0.05000,1.017
28,self_attn.o_proj,0.0000287529,0.05000,1.024
28,mlp.up_proj,0.0002194517,0.05000,2.276
28,mlp.gate_proj,0.0002030963,0.05000,2.300
28,mlp.down_proj,0.0002290906,0.05000,2.962
29,self_attn.qkv_proj,0.0002273341,0.05000,1.045
29,self_attn.o_proj,0.0000351872,0.05000,1.027
29,mlp.gate_proj,0.0002264227,0.05000,2.352
29,mlp.up_proj,0.0002236534,0.05000,2.373
29,mlp.down_proj,0.0003785557,0.05000,2.977
30,self_attn.qkv_proj,0.0001608474,0.05000,1.024
30,self_attn.o_proj,0.0000363605,0.05000,1.023
30,mlp.gate_proj,0.0002430771,0.05000,2.505
30,mlp.up_proj,0.0002131529,0.05000,2.513
30,mlp.down_proj,0.0014835209,0.05000,2.926
31,self_attn.qkv_proj,0.0000034551,0.05000,1.074
31,self_attn.o_proj,0.0000042867,0.05000,1.011
31,mlp.gate_proj,0.0001017404,0.05000,2.333
31,mlp.up_proj,0.0000593105,0.05000,2.351
31,mlp.down_proj,0.0004770287,0.05000,2.931