File size: 7,379 Bytes
a2d6e86
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
layer,module,loss,damp,time
0,self_attn.qkv_proj,0.0000234433,0.05000,1.515
0,self_attn.o_proj,0.0000012551,0.05000,0.936
0,mlp.up_proj,0.0000740401,0.05000,2.474
0,mlp.gate_proj,0.0000768478,0.05000,2.490
0,mlp.down_proj,0.0000051061,0.05000,2.818
1,self_attn.qkv_proj,0.0001699547,0.05000,1.280
1,self_attn.o_proj,0.0000034763,0.05000,1.143
1,mlp.up_proj,0.0001173471,0.05000,2.850
1,mlp.gate_proj,0.0001244575,0.05000,2.885
1,mlp.down_proj,0.0000244783,0.05000,2.984
2,self_attn.qkv_proj,0.0004539477,0.05000,1.043
2,self_attn.o_proj,0.0000030893,0.05000,1.040
2,mlp.gate_proj,0.0001873295,0.05000,2.737
2,mlp.up_proj,0.0001750478,0.05000,2.793
2,mlp.down_proj,0.0000109788,0.05000,2.954
3,self_attn.qkv_proj,0.0006435827,0.05000,1.123
3,self_attn.o_proj,0.0000069274,0.05000,1.466
3,mlp.gate_proj,0.0002680054,0.05000,2.202
3,mlp.up_proj,0.0002448218,0.05000,2.228
3,mlp.down_proj,0.0319495132,0.05000,2.865
4,self_attn.qkv_proj,0.0006558018,0.05000,1.006
4,self_attn.o_proj,0.0000090045,0.05000,1.075
4,mlp.gate_proj,0.0003298683,0.05000,2.266
4,mlp.up_proj,0.0002895112,0.05000,2.286
4,mlp.down_proj,0.0000298855,0.05000,2.908
5,self_attn.qkv_proj,0.0007604120,0.05000,1.000
5,self_attn.o_proj,0.0000106954,0.05000,0.994
5,mlp.gate_proj,0.0003911948,0.05000,2.291
5,mlp.up_proj,0.0003372076,0.05000,2.310
5,mlp.down_proj,0.0000409930,0.05000,2.908
6,self_attn.qkv_proj,0.0006467403,0.05000,1.010
6,self_attn.o_proj,0.0000139023,0.05000,1.011
6,mlp.up_proj,0.0003379441,0.05000,2.350
6,mlp.gate_proj,0.0003750805,0.05000,2.376
6,mlp.down_proj,0.0000462578,0.05000,2.866
7,self_attn.qkv_proj,0.0009227887,0.05000,1.002
7,self_attn.o_proj,0.0000164297,0.05000,1.034
7,mlp.up_proj,0.0003586256,0.05000,2.228
7,mlp.gate_proj,0.0003832810,0.05000,2.231
7,mlp.down_proj,0.0000597295,0.05000,2.858
8,self_attn.qkv_proj,0.0008569787,0.05000,1.008
8,self_attn.o_proj,0.0000230205,0.05000,0.988
8,mlp.gate_proj,0.0003839790,0.05000,2.448
8,mlp.up_proj,0.0003800165,0.05000,2.468
8,mlp.down_proj,0.0000743382,0.05000,2.908
9,self_attn.qkv_proj,0.0007942334,0.05000,1.002
9,self_attn.o_proj,0.0000246915,0.05000,0.993
9,mlp.up_proj,0.0004031824,0.05000,2.326
9,mlp.gate_proj,0.0003977984,0.05000,2.348
9,mlp.down_proj,0.0000619588,0.05000,2.897
10,self_attn.qkv_proj,0.0008438398,0.05000,1.008
10,self_attn.o_proj,0.0000353785,0.05000,1.018
10,mlp.gate_proj,0.0004070449,0.05000,2.320
10,mlp.up_proj,0.0004118055,0.05000,2.346
10,mlp.down_proj,0.0000657525,0.05000,2.923
11,self_attn.qkv_proj,0.0008194585,0.05000,1.053
11,self_attn.o_proj,0.0000269038,0.05000,1.002
11,mlp.gate_proj,0.0004062071,0.05000,2.399
11,mlp.up_proj,0.0004268940,0.05000,2.419
11,mlp.down_proj,0.0000666463,0.05000,2.858
12,self_attn.qkv_proj,0.0008770282,0.05000,0.997
12,self_attn.o_proj,0.0000251990,0.05000,0.993
12,mlp.up_proj,0.0004276355,0.05000,2.300
12,mlp.gate_proj,0.0003912912,0.05000,2.328
12,mlp.down_proj,0.0000774838,0.05000,2.917
13,self_attn.qkv_proj,0.0009794771,0.05000,1.004
13,self_attn.o_proj,0.0000277290,0.05000,0.988
13,mlp.gate_proj,0.0004115693,0.05000,2.315
13,mlp.up_proj,0.0004629706,0.05000,2.340
13,mlp.down_proj,0.0000860639,0.05000,2.901
14,self_attn.qkv_proj,0.0009111086,0.05000,1.044
14,self_attn.o_proj,0.0000270905,0.05000,1.004
14,mlp.gate_proj,0.0004456694,0.05000,2.327
14,mlp.up_proj,0.0004985755,0.05000,2.338
14,mlp.down_proj,0.0000911287,0.05000,2.874
15,self_attn.qkv_proj,0.0010071384,0.05000,1.075
15,self_attn.o_proj,0.0000243394,0.05000,0.988
15,mlp.up_proj,0.0005489160,0.05000,2.215
15,mlp.gate_proj,0.0004908784,0.05000,2.236
15,mlp.down_proj,0.0001038040,0.05000,2.908
16,self_attn.qkv_proj,0.0009476236,0.05000,0.991
16,self_attn.o_proj,0.0000485368,0.05000,0.992
16,mlp.up_proj,0.0005693908,0.05000,2.308
16,mlp.gate_proj,0.0005057035,0.05000,2.330
16,mlp.down_proj,0.0001301657,0.05000,2.891
17,self_attn.qkv_proj,0.0009925160,0.05000,0.998
17,self_attn.o_proj,0.0000390900,0.05000,0.973
17,mlp.up_proj,0.0006069203,0.05000,2.314
17,mlp.gate_proj,0.0005327590,0.05000,2.330
17,mlp.down_proj,0.0001544745,0.05000,2.872
18,self_attn.qkv_proj,0.0009654888,0.05000,1.009
18,self_attn.o_proj,0.0000608897,0.05000,1.001
18,mlp.gate_proj,0.0005690133,0.05000,2.385
18,mlp.up_proj,0.0006410199,0.05000,2.407
18,mlp.down_proj,0.0002298194,0.05000,2.914
19,self_attn.qkv_proj,0.0010355139,0.05000,1.041
19,self_attn.o_proj,0.0000674389,0.05000,1.006
19,mlp.gate_proj,0.0006108685,0.05000,2.337
19,mlp.up_proj,0.0006793319,0.05000,2.365
19,mlp.down_proj,0.0002456510,0.05000,2.942
20,self_attn.qkv_proj,0.0009955477,0.05000,1.016
20,self_attn.o_proj,0.0000853179,0.05000,1.034
20,mlp.gate_proj,0.0007368962,0.05000,2.192
20,mlp.up_proj,0.0008203884,0.05000,2.213
20,mlp.down_proj,0.0003082218,0.05000,2.854
21,self_attn.qkv_proj,0.0011595939,0.05000,1.044
21,self_attn.o_proj,0.0000631391,0.05000,0.988
21,mlp.gate_proj,0.0007788413,0.05000,2.444
21,mlp.up_proj,0.0008753389,0.05000,2.463
21,mlp.down_proj,0.0003915850,0.05000,2.931
22,self_attn.qkv_proj,0.0011074981,0.05000,0.991
22,self_attn.o_proj,0.0000896787,0.05000,1.015
22,mlp.gate_proj,0.0008228205,0.05000,2.343
22,mlp.up_proj,0.0009325047,0.05000,2.386
22,mlp.down_proj,0.0004434848,0.05000,2.865
23,self_attn.qkv_proj,0.0012805010,0.05000,1.000
23,self_attn.o_proj,0.0000562911,0.05000,0.999
23,mlp.up_proj,0.0010011470,0.05000,2.290
23,mlp.gate_proj,0.0008901170,0.05000,2.314
23,mlp.down_proj,0.0004554649,0.05000,2.926
24,self_attn.qkv_proj,0.0013814587,0.05000,1.040
24,self_attn.o_proj,0.0000568903,0.05000,0.987
24,mlp.up_proj,0.0010863662,0.05000,2.384
24,mlp.gate_proj,0.0009593617,0.05000,2.422
24,mlp.down_proj,0.0005254694,0.05000,2.875
25,self_attn.qkv_proj,0.0014469156,0.05000,0.980
25,self_attn.o_proj,0.0000781728,0.05000,1.000
25,mlp.gate_proj,0.0010634154,0.05000,2.338
25,mlp.up_proj,0.0012082151,0.05000,2.360
25,mlp.down_proj,0.0006043160,0.05000,3.007
26,self_attn.qkv_proj,0.0012781918,0.05000,1.039
26,self_attn.o_proj,0.0001430641,0.05000,1.003
26,mlp.up_proj,0.0012724487,0.05000,2.332
26,mlp.gate_proj,0.0011216506,0.05000,2.359
26,mlp.down_proj,0.0007345894,0.05000,2.880
27,self_attn.qkv_proj,0.0013309020,0.05000,1.018
27,self_attn.o_proj,0.0001508330,0.05000,0.996
27,mlp.up_proj,0.0013503263,0.05000,2.279
27,mlp.gate_proj,0.0012045613,0.05000,2.307
27,mlp.down_proj,0.0008768519,0.05000,2.940
28,self_attn.qkv_proj,0.0015792458,0.05000,1.007
28,self_attn.o_proj,0.0001596175,0.05000,1.028
28,mlp.up_proj,0.0014309376,0.05000,2.394
28,mlp.gate_proj,0.0013091725,0.05000,2.401
28,mlp.down_proj,0.0011007471,0.05000,2.875
29,self_attn.qkv_proj,0.0014297700,0.05000,1.039
29,self_attn.o_proj,0.0002247341,0.05000,0.988
29,mlp.gate_proj,0.0014194082,0.05000,2.382
29,mlp.up_proj,0.0014341137,0.05000,2.406
29,mlp.down_proj,0.0018299969,0.05000,2.897
30,self_attn.qkv_proj,0.0009961152,0.05000,1.045
30,self_attn.o_proj,0.0002220271,0.05000,1.001
30,mlp.up_proj,0.0013122857,0.05000,2.346
30,mlp.gate_proj,0.0014473631,0.05000,2.370
30,mlp.down_proj,0.0182979599,0.05000,2.924
31,self_attn.qkv_proj,0.0000219487,0.05000,1.020
31,self_attn.o_proj,0.0000321238,0.05000,0.988
31,mlp.gate_proj,0.0006197570,0.05000,2.283
31,mlp.up_proj,0.0003814784,0.05000,2.303
31,mlp.down_proj,0.0030642595,0.05000,2.861