ryanmarten commited on
Commit
3fd46aa
·
verified ·
1 Parent(s): 5baba45

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae5105c793eceefa873b7db60adb69fc3099387bc094c3e79ac607ab866ca2da
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eea52015812e86b05fa3eab9c8175f374dd1c9a7c9abe5b416bda24bd337536
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c3757f38d9a56b05240b69f1c260a136528f15daa959448b8f4111bae15a88f3
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14d7ec9d2d6a38c3ce622b1d88baf76ae943103fa21ce885661fc3a05a397daf
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:104d44e1ab9ba72bebb32cd77a75061fd8483e0ec6bb4e60008022ccd3e2c5b9
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fae6868e43a8f628f1ac0fef4471c8f4a1322439dcc88cbc836708efe6e795da
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cc577704a1f6be90b9306b7f80ea08808b505d1c73d6da70ac1244ea9bac7436
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8a820121c3c9f5e9fc539d76dfb4fe9dcb734be8f5e608c96e08d762b6d95404
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -156,3 +156,158 @@
156
  {"current_steps": 156, "total_steps": 775, "loss": 0.5427, "lr": 3.877666473835899e-05, "epoch": 1.0032154340836013, "percentage": 20.13, "elapsed_time": "1:53:34", "remaining_time": "7:30:40"}
157
  {"current_steps": 157, "total_steps": 775, "loss": 0.5225, "lr": 3.874543029856609e-05, "epoch": 1.0096463022508038, "percentage": 20.26, "elapsed_time": "1:54:18", "remaining_time": "7:29:58"}
158
  {"current_steps": 158, "total_steps": 775, "loss": 0.5165, "lr": 3.871381503077668e-05, "epoch": 1.0160771704180065, "percentage": 20.39, "elapsed_time": "1:55:03", "remaining_time": "7:29:19"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
156
  {"current_steps": 156, "total_steps": 775, "loss": 0.5427, "lr": 3.877666473835899e-05, "epoch": 1.0032154340836013, "percentage": 20.13, "elapsed_time": "1:53:34", "remaining_time": "7:30:40"}
157
  {"current_steps": 157, "total_steps": 775, "loss": 0.5225, "lr": 3.874543029856609e-05, "epoch": 1.0096463022508038, "percentage": 20.26, "elapsed_time": "1:54:18", "remaining_time": "7:29:58"}
158
  {"current_steps": 158, "total_steps": 775, "loss": 0.5165, "lr": 3.871381503077668e-05, "epoch": 1.0160771704180065, "percentage": 20.39, "elapsed_time": "1:55:03", "remaining_time": "7:29:19"}
159
+ {"current_steps": 159, "total_steps": 775, "loss": 0.498, "lr": 3.8681819577279515e-05, "epoch": 1.022508038585209, "percentage": 20.52, "elapsed_time": "1:55:48", "remaining_time": "7:28:39"}
160
+ {"current_steps": 160, "total_steps": 775, "loss": 0.5176, "lr": 3.864944458808712e-05, "epoch": 1.0289389067524115, "percentage": 20.65, "elapsed_time": "1:56:25", "remaining_time": "7:27:32"}
161
+ {"current_steps": 161, "total_steps": 775, "loss": 0.5121, "lr": 3.861669072092258e-05, "epoch": 1.0353697749196142, "percentage": 20.77, "elapsed_time": "1:57:09", "remaining_time": "7:26:48"}
162
+ {"current_steps": 162, "total_steps": 775, "loss": 0.5092, "lr": 3.8583558641206183e-05, "epoch": 1.0418006430868167, "percentage": 20.9, "elapsed_time": "1:57:55", "remaining_time": "7:26:12"}
163
+ {"current_steps": 163, "total_steps": 775, "loss": 0.5106, "lr": 3.85500490220419e-05, "epoch": 1.0482315112540193, "percentage": 21.03, "elapsed_time": "1:58:46", "remaining_time": "7:25:57"}
164
+ {"current_steps": 164, "total_steps": 775, "loss": 0.5009, "lr": 3.85161625442037e-05, "epoch": 1.0546623794212218, "percentage": 21.16, "elapsed_time": "1:59:40", "remaining_time": "7:25:53"}
165
+ {"current_steps": 165, "total_steps": 775, "loss": 0.5056, "lr": 3.8481899896121744e-05, "epoch": 1.0610932475884245, "percentage": 21.29, "elapsed_time": "2:00:32", "remaining_time": "7:25:36"}
166
+ {"current_steps": 166, "total_steps": 775, "loss": 0.5035, "lr": 3.8447261773868376e-05, "epoch": 1.067524115755627, "percentage": 21.42, "elapsed_time": "2:01:17", "remaining_time": "7:24:58"}
167
+ {"current_steps": 167, "total_steps": 775, "loss": 0.5102, "lr": 3.8412248881144e-05, "epoch": 1.0739549839228295, "percentage": 21.55, "elapsed_time": "2:02:02", "remaining_time": "7:24:17"}
168
+ {"current_steps": 168, "total_steps": 775, "loss": 0.5114, "lr": 3.837686192926274e-05, "epoch": 1.0803858520900322, "percentage": 21.68, "elapsed_time": "2:02:49", "remaining_time": "7:23:46"}
169
+ {"current_steps": 169, "total_steps": 775, "loss": 0.5141, "lr": 3.834110163713806e-05, "epoch": 1.0868167202572347, "percentage": 21.81, "elapsed_time": "2:03:35", "remaining_time": "7:23:10"}
170
+ {"current_steps": 170, "total_steps": 775, "loss": 0.5043, "lr": 3.830496873126812e-05, "epoch": 1.0932475884244373, "percentage": 21.94, "elapsed_time": "2:04:13", "remaining_time": "7:22:05"}
171
+ {"current_steps": 171, "total_steps": 775, "loss": 0.5126, "lr": 3.826846394572099e-05, "epoch": 1.09967845659164, "percentage": 22.06, "elapsed_time": "2:04:58", "remaining_time": "7:21:27"}
172
+ {"current_steps": 172, "total_steps": 775, "loss": 0.5042, "lr": 3.823158802211979e-05, "epoch": 1.1061093247588425, "percentage": 22.19, "elapsed_time": "2:05:40", "remaining_time": "7:20:34"}
173
+ {"current_steps": 173, "total_steps": 775, "loss": 0.5199, "lr": 3.8194341709627595e-05, "epoch": 1.112540192926045, "percentage": 22.32, "elapsed_time": "2:06:22", "remaining_time": "7:19:44"}
174
+ {"current_steps": 174, "total_steps": 775, "loss": 0.5221, "lr": 3.81567257649322e-05, "epoch": 1.1189710610932475, "percentage": 22.45, "elapsed_time": "2:07:06", "remaining_time": "7:19:01"}
175
+ {"current_steps": 175, "total_steps": 775, "loss": 0.5202, "lr": 3.811874095223078e-05, "epoch": 1.1254019292604502, "percentage": 22.58, "elapsed_time": "2:07:49", "remaining_time": "7:18:16"}
176
+ {"current_steps": 176, "total_steps": 775, "loss": 0.5207, "lr": 3.808038804321436e-05, "epoch": 1.1318327974276527, "percentage": 22.71, "elapsed_time": "2:08:31", "remaining_time": "7:17:26"}
177
+ {"current_steps": 177, "total_steps": 775, "loss": 0.5037, "lr": 3.804166781705211e-05, "epoch": 1.1382636655948553, "percentage": 22.84, "elapsed_time": "2:09:11", "remaining_time": "7:16:28"}
178
+ {"current_steps": 178, "total_steps": 775, "loss": 0.5036, "lr": 3.8002581060375535e-05, "epoch": 1.144694533762058, "percentage": 22.97, "elapsed_time": "2:09:46", "remaining_time": "7:15:16"}
179
+ {"current_steps": 179, "total_steps": 775, "loss": 0.5163, "lr": 3.796312856726252e-05, "epoch": 1.1511254019292605, "percentage": 23.1, "elapsed_time": "2:10:29", "remaining_time": "7:14:29"}
180
+ {"current_steps": 180, "total_steps": 775, "loss": 0.5172, "lr": 3.7923311139221114e-05, "epoch": 1.157556270096463, "percentage": 23.23, "elapsed_time": "2:11:16", "remaining_time": "7:13:56"}
181
+ {"current_steps": 181, "total_steps": 775, "loss": 0.5053, "lr": 3.7883129585173365e-05, "epoch": 1.1639871382636655, "percentage": 23.35, "elapsed_time": "2:11:54", "remaining_time": "7:12:52"}
182
+ {"current_steps": 182, "total_steps": 775, "loss": 0.5112, "lr": 3.784258472143878e-05, "epoch": 1.1704180064308682, "percentage": 23.48, "elapsed_time": "2:12:38", "remaining_time": "7:12:10"}
183
+ {"current_steps": 183, "total_steps": 775, "loss": 0.5292, "lr": 3.7801677371717825e-05, "epoch": 1.1768488745980707, "percentage": 23.61, "elapsed_time": "2:13:24", "remaining_time": "7:11:34"}
184
+ {"current_steps": 184, "total_steps": 775, "loss": 0.5095, "lr": 3.77604083670751e-05, "epoch": 1.1832797427652733, "percentage": 23.74, "elapsed_time": "2:14:05", "remaining_time": "7:10:40"}
185
+ {"current_steps": 185, "total_steps": 775, "loss": 0.5263, "lr": 3.771877854592254e-05, "epoch": 1.189710610932476, "percentage": 23.87, "elapsed_time": "2:14:48", "remaining_time": "7:09:56"}
186
+ {"current_steps": 186, "total_steps": 775, "loss": 0.5109, "lr": 3.767678875400235e-05, "epoch": 1.1961414790996785, "percentage": 24.0, "elapsed_time": "2:15:29", "remaining_time": "7:09:02"}
187
+ {"current_steps": 187, "total_steps": 775, "loss": 0.522, "lr": 3.76344398443698e-05, "epoch": 1.202572347266881, "percentage": 24.13, "elapsed_time": "2:16:15", "remaining_time": "7:08:26"}
188
+ {"current_steps": 188, "total_steps": 775, "loss": 0.4934, "lr": 3.7591732677375936e-05, "epoch": 1.2090032154340835, "percentage": 24.26, "elapsed_time": "2:16:54", "remaining_time": "7:07:29"}
189
+ {"current_steps": 189, "total_steps": 775, "loss": 0.5076, "lr": 3.754866812065008e-05, "epoch": 1.2154340836012862, "percentage": 24.39, "elapsed_time": "2:17:35", "remaining_time": "7:06:36"}
190
+ {"current_steps": 190, "total_steps": 775, "loss": 0.4922, "lr": 3.750524704908218e-05, "epoch": 1.2218649517684887, "percentage": 24.52, "elapsed_time": "2:18:17", "remaining_time": "7:05:48"}
191
+ {"current_steps": 191, "total_steps": 775, "loss": 0.5071, "lr": 3.746147034480508e-05, "epoch": 1.2282958199356913, "percentage": 24.65, "elapsed_time": "2:19:04", "remaining_time": "7:05:15"}
192
+ {"current_steps": 192, "total_steps": 775, "loss": 0.501, "lr": 3.741733889717659e-05, "epoch": 1.234726688102894, "percentage": 24.77, "elapsed_time": "2:19:48", "remaining_time": "7:04:30"}
193
+ {"current_steps": 193, "total_steps": 775, "loss": 0.5211, "lr": 3.737285360276138e-05, "epoch": 1.2411575562700965, "percentage": 24.9, "elapsed_time": "2:20:34", "remaining_time": "7:03:53"}
194
+ {"current_steps": 194, "total_steps": 775, "loss": 0.5143, "lr": 3.7328015365312815e-05, "epoch": 1.247588424437299, "percentage": 25.03, "elapsed_time": "2:21:16", "remaining_time": "7:03:04"}
195
+ {"current_steps": 195, "total_steps": 775, "loss": 0.5162, "lr": 3.728282509575456e-05, "epoch": 1.2540192926045015, "percentage": 25.16, "elapsed_time": "2:21:56", "remaining_time": "7:02:11"}
196
+ {"current_steps": 196, "total_steps": 775, "loss": 0.5113, "lr": 3.7237283712162083e-05, "epoch": 1.2604501607717042, "percentage": 25.29, "elapsed_time": "2:22:41", "remaining_time": "7:01:32"}
197
+ {"current_steps": 197, "total_steps": 775, "loss": 0.4998, "lr": 3.719139213974403e-05, "epoch": 1.2668810289389068, "percentage": 25.42, "elapsed_time": "2:23:19", "remaining_time": "7:00:31"}
198
+ {"current_steps": 198, "total_steps": 775, "loss": 0.5148, "lr": 3.7145151310823365e-05, "epoch": 1.2733118971061093, "percentage": 25.55, "elapsed_time": "2:24:02", "remaining_time": "6:59:44"}
199
+ {"current_steps": 199, "total_steps": 775, "loss": 0.5039, "lr": 3.709856216481852e-05, "epoch": 1.279742765273312, "percentage": 25.68, "elapsed_time": "2:24:46", "remaining_time": "6:59:01"}
200
+ {"current_steps": 200, "total_steps": 775, "loss": 0.512, "lr": 3.705162564822421e-05, "epoch": 1.2861736334405145, "percentage": 25.81, "elapsed_time": "2:25:32", "remaining_time": "6:58:24"}
201
+ {"current_steps": 201, "total_steps": 775, "loss": 0.4976, "lr": 3.700434271459229e-05, "epoch": 1.292604501607717, "percentage": 25.94, "elapsed_time": "2:26:18", "remaining_time": "6:57:50"}
202
+ {"current_steps": 202, "total_steps": 775, "loss": 0.5096, "lr": 3.6956714324512325e-05, "epoch": 1.2990353697749195, "percentage": 26.06, "elapsed_time": "2:27:02", "remaining_time": "6:57:05"}
203
+ {"current_steps": 203, "total_steps": 775, "loss": 0.4857, "lr": 3.6908741445592104e-05, "epoch": 1.3054662379421222, "percentage": 26.19, "elapsed_time": "2:27:51", "remaining_time": "6:56:36"}
204
+ {"current_steps": 204, "total_steps": 775, "loss": 0.508, "lr": 3.6860425052437986e-05, "epoch": 1.3118971061093248, "percentage": 26.32, "elapsed_time": "2:28:26", "remaining_time": "6:55:30"}
205
+ {"current_steps": 205, "total_steps": 775, "loss": 0.5209, "lr": 3.6811766126635064e-05, "epoch": 1.3183279742765273, "percentage": 26.45, "elapsed_time": "2:29:08", "remaining_time": "6:54:40"}
206
+ {"current_steps": 206, "total_steps": 775, "loss": 0.5183, "lr": 3.6762765656727274e-05, "epoch": 1.32475884244373, "percentage": 26.58, "elapsed_time": "2:29:56", "remaining_time": "6:54:09"}
207
+ {"current_steps": 207, "total_steps": 775, "loss": 0.5046, "lr": 3.6713424638197264e-05, "epoch": 1.3311897106109325, "percentage": 26.71, "elapsed_time": "2:30:43", "remaining_time": "6:53:34"}
208
+ {"current_steps": 208, "total_steps": 775, "loss": 0.5097, "lr": 3.6663744073446206e-05, "epoch": 1.337620578778135, "percentage": 26.84, "elapsed_time": "2:31:26", "remaining_time": "6:52:50"}
209
+ {"current_steps": 209, "total_steps": 775, "loss": 0.5264, "lr": 3.6613724971773426e-05, "epoch": 1.3440514469453375, "percentage": 26.97, "elapsed_time": "2:32:09", "remaining_time": "6:52:03"}
210
+ {"current_steps": 210, "total_steps": 775, "loss": 0.5418, "lr": 3.6563368349355855e-05, "epoch": 1.3504823151125402, "percentage": 27.1, "elapsed_time": "2:32:55", "remaining_time": "6:51:26"}
211
+ {"current_steps": 211, "total_steps": 775, "loss": 0.4984, "lr": 3.651267522922746e-05, "epoch": 1.3569131832797428, "percentage": 27.23, "elapsed_time": "2:33:41", "remaining_time": "6:50:48"}
212
+ {"current_steps": 212, "total_steps": 775, "loss": 0.5195, "lr": 3.646164664125841e-05, "epoch": 1.3633440514469453, "percentage": 27.35, "elapsed_time": "2:34:23", "remaining_time": "6:50:00"}
213
+ {"current_steps": 213, "total_steps": 775, "loss": 0.5015, "lr": 3.6410283622134146e-05, "epoch": 1.369774919614148, "percentage": 27.48, "elapsed_time": "2:35:00", "remaining_time": "6:48:58"}
214
+ {"current_steps": 214, "total_steps": 775, "loss": 0.5101, "lr": 3.6358587215334355e-05, "epoch": 1.3762057877813505, "percentage": 27.61, "elapsed_time": "2:35:46", "remaining_time": "6:48:21"}
215
+ {"current_steps": 215, "total_steps": 775, "loss": 0.5184, "lr": 3.630655847111175e-05, "epoch": 1.382636655948553, "percentage": 27.74, "elapsed_time": "2:36:31", "remaining_time": "6:47:40"}
216
+ {"current_steps": 216, "total_steps": 775, "loss": 0.5134, "lr": 3.6254198446470745e-05, "epoch": 1.3890675241157555, "percentage": 27.87, "elapsed_time": "2:37:11", "remaining_time": "6:46:48"}
217
+ {"current_steps": 217, "total_steps": 775, "loss": 0.5217, "lr": 3.6201508205145956e-05, "epoch": 1.3954983922829582, "percentage": 28.0, "elapsed_time": "2:37:55", "remaining_time": "6:46:05"}
218
+ {"current_steps": 218, "total_steps": 775, "loss": 0.5198, "lr": 3.614848881758062e-05, "epoch": 1.4019292604501608, "percentage": 28.13, "elapsed_time": "2:38:39", "remaining_time": "6:45:22"}
219
+ {"current_steps": 219, "total_steps": 775, "loss": 0.4967, "lr": 3.609514136090483e-05, "epoch": 1.4083601286173635, "percentage": 28.26, "elapsed_time": "2:39:17", "remaining_time": "6:44:24"}
220
+ {"current_steps": 220, "total_steps": 775, "loss": 0.529, "lr": 3.604146691891367e-05, "epoch": 1.414790996784566, "percentage": 28.39, "elapsed_time": "2:40:05", "remaining_time": "6:43:52"}
221
+ {"current_steps": 221, "total_steps": 775, "loss": 0.4997, "lr": 3.598746658204517e-05, "epoch": 1.4212218649517685, "percentage": 28.52, "elapsed_time": "2:40:45", "remaining_time": "6:42:58"}
222
+ {"current_steps": 222, "total_steps": 775, "loss": 0.5109, "lr": 3.5933141447358176e-05, "epoch": 1.427652733118971, "percentage": 28.65, "elapsed_time": "2:41:30", "remaining_time": "6:42:19"}
223
+ {"current_steps": 223, "total_steps": 775, "loss": 0.5058, "lr": 3.5878492618510055e-05, "epoch": 1.4340836012861735, "percentage": 28.77, "elapsed_time": "2:42:15", "remaining_time": "6:41:39"}
224
+ {"current_steps": 224, "total_steps": 775, "loss": 0.5178, "lr": 3.582352120573427e-05, "epoch": 1.4405144694533762, "percentage": 28.9, "elapsed_time": "2:42:55", "remaining_time": "6:40:46"}
225
+ {"current_steps": 225, "total_steps": 775, "loss": 0.5221, "lr": 3.576822832581783e-05, "epoch": 1.4469453376205788, "percentage": 29.03, "elapsed_time": "2:43:38", "remaining_time": "6:40:01"}
226
+ {"current_steps": 226, "total_steps": 775, "loss": 0.5026, "lr": 3.571261510207858e-05, "epoch": 1.4533762057877815, "percentage": 29.16, "elapsed_time": "2:44:20", "remaining_time": "6:39:13"}
227
+ {"current_steps": 227, "total_steps": 775, "loss": 0.5076, "lr": 3.565668266434243e-05, "epoch": 1.459807073954984, "percentage": 29.29, "elapsed_time": "2:45:05", "remaining_time": "6:38:33"}
228
+ {"current_steps": 228, "total_steps": 775, "loss": 0.4994, "lr": 3.5600432148920366e-05, "epoch": 1.4662379421221865, "percentage": 29.42, "elapsed_time": "2:45:48", "remaining_time": "6:37:46"}
229
+ {"current_steps": 229, "total_steps": 775, "loss": 0.5122, "lr": 3.554386469858534e-05, "epoch": 1.472668810289389, "percentage": 29.55, "elapsed_time": "2:46:29", "remaining_time": "6:36:58"}
230
+ {"current_steps": 230, "total_steps": 775, "loss": 0.5239, "lr": 3.548698146254911e-05, "epoch": 1.4790996784565915, "percentage": 29.68, "elapsed_time": "2:47:14", "remaining_time": "6:36:17"}
231
+ {"current_steps": 231, "total_steps": 775, "loss": 0.4992, "lr": 3.5429783596438864e-05, "epoch": 1.4855305466237942, "percentage": 29.81, "elapsed_time": "2:48:05", "remaining_time": "6:35:52"}
232
+ {"current_steps": 232, "total_steps": 775, "loss": 0.515, "lr": 3.5372272262273734e-05, "epoch": 1.4919614147909968, "percentage": 29.94, "elapsed_time": "2:48:45", "remaining_time": "6:35:00"}
233
+ {"current_steps": 233, "total_steps": 775, "loss": 0.5225, "lr": 3.531444862844121e-05, "epoch": 1.4983922829581995, "percentage": 30.06, "elapsed_time": "2:49:35", "remaining_time": "6:34:30"}
234
+ {"current_steps": 234, "total_steps": 775, "loss": 0.5108, "lr": 3.5256313869673385e-05, "epoch": 1.504823151125402, "percentage": 30.19, "elapsed_time": "2:50:16", "remaining_time": "6:33:40"}
235
+ {"current_steps": 235, "total_steps": 775, "loss": 0.5075, "lr": 3.51978691670231e-05, "epoch": 1.5112540192926045, "percentage": 30.32, "elapsed_time": "2:51:00", "remaining_time": "6:32:56"}
236
+ {"current_steps": 236, "total_steps": 775, "loss": 0.509, "lr": 3.5139115707839947e-05, "epoch": 1.517684887459807, "percentage": 30.45, "elapsed_time": "2:51:42", "remaining_time": "6:32:09"}
237
+ {"current_steps": 237, "total_steps": 775, "loss": 0.504, "lr": 3.5080054685746155e-05, "epoch": 1.5241157556270095, "percentage": 30.58, "elapsed_time": "2:52:23", "remaining_time": "6:31:19"}
238
+ {"current_steps": 238, "total_steps": 775, "loss": 0.5211, "lr": 3.502068730061231e-05, "epoch": 1.5305466237942122, "percentage": 30.71, "elapsed_time": "2:53:01", "remaining_time": "6:30:23"}
239
+ {"current_steps": 239, "total_steps": 775, "loss": 0.5021, "lr": 3.4961014758533025e-05, "epoch": 1.5369774919614148, "percentage": 30.84, "elapsed_time": "2:53:45", "remaining_time": "6:29:40"}
240
+ {"current_steps": 240, "total_steps": 775, "loss": 0.5184, "lr": 3.4901038271802404e-05, "epoch": 1.5434083601286175, "percentage": 30.97, "elapsed_time": "2:54:27", "remaining_time": "6:28:53"}
241
+ {"current_steps": 241, "total_steps": 775, "loss": 0.5261, "lr": 3.4840759058889425e-05, "epoch": 1.54983922829582, "percentage": 31.1, "elapsed_time": "2:55:14", "remaining_time": "6:28:18"}
242
+ {"current_steps": 242, "total_steps": 775, "loss": 0.5076, "lr": 3.478017834441319e-05, "epoch": 1.5562700964630225, "percentage": 31.23, "elapsed_time": "2:56:03", "remaining_time": "6:27:45"}
243
+ {"current_steps": 243, "total_steps": 775, "loss": 0.5059, "lr": 3.471929735911801e-05, "epoch": 1.562700964630225, "percentage": 31.35, "elapsed_time": "2:56:46", "remaining_time": "6:27:00"}
244
+ {"current_steps": 244, "total_steps": 775, "loss": 0.5175, "lr": 3.4658117339848476e-05, "epoch": 1.5691318327974275, "percentage": 31.48, "elapsed_time": "2:57:30", "remaining_time": "6:26:17"}
245
+ {"current_steps": 245, "total_steps": 775, "loss": 0.4996, "lr": 3.459663952952425e-05, "epoch": 1.5755627009646302, "percentage": 31.61, "elapsed_time": "2:58:16", "remaining_time": "6:25:38"}
246
+ {"current_steps": 246, "total_steps": 775, "loss": 0.525, "lr": 3.453486517711489e-05, "epoch": 1.5819935691318328, "percentage": 31.74, "elapsed_time": "2:59:03", "remaining_time": "6:25:03"}
247
+ {"current_steps": 247, "total_steps": 775, "loss": 0.5067, "lr": 3.447279553761438e-05, "epoch": 1.5884244372990355, "percentage": 31.87, "elapsed_time": "2:59:56", "remaining_time": "6:24:39"}
248
+ {"current_steps": 248, "total_steps": 775, "loss": 0.4938, "lr": 3.441043187201574e-05, "epoch": 1.594855305466238, "percentage": 32.0, "elapsed_time": "3:00:46", "remaining_time": "6:24:09"}
249
+ {"current_steps": 249, "total_steps": 775, "loss": 0.5073, "lr": 3.434777544728535e-05, "epoch": 1.6012861736334405, "percentage": 32.13, "elapsed_time": "3:01:29", "remaining_time": "6:23:22"}
250
+ {"current_steps": 250, "total_steps": 775, "loss": 0.5015, "lr": 3.428482753633719e-05, "epoch": 1.607717041800643, "percentage": 32.26, "elapsed_time": "3:02:11", "remaining_time": "6:22:35"}
251
+ {"current_steps": 251, "total_steps": 775, "loss": 0.5063, "lr": 3.422158941800706e-05, "epoch": 1.6141479099678455, "percentage": 32.39, "elapsed_time": "3:02:50", "remaining_time": "6:21:43"}
252
+ {"current_steps": 252, "total_steps": 775, "loss": 0.514, "lr": 3.415806237702649e-05, "epoch": 1.6205787781350482, "percentage": 32.52, "elapsed_time": "3:03:32", "remaining_time": "6:20:56"}
253
+ {"current_steps": 253, "total_steps": 775, "loss": 0.4948, "lr": 3.409424770399675e-05, "epoch": 1.6270096463022508, "percentage": 32.65, "elapsed_time": "3:04:20", "remaining_time": "6:20:20"}
254
+ {"current_steps": 254, "total_steps": 775, "loss": 0.5018, "lr": 3.403014669536254e-05, "epoch": 1.6334405144694535, "percentage": 32.77, "elapsed_time": "3:05:04", "remaining_time": "6:19:36"}
255
+ {"current_steps": 255, "total_steps": 775, "loss": 0.5091, "lr": 3.396576065338572e-05, "epoch": 1.639871382636656, "percentage": 32.9, "elapsed_time": "3:05:45", "remaining_time": "6:18:48"}
256
+ {"current_steps": 256, "total_steps": 775, "loss": 0.507, "lr": 3.3901090886118814e-05, "epoch": 1.6463022508038585, "percentage": 33.03, "elapsed_time": "3:06:29", "remaining_time": "6:18:03"}
257
+ {"current_steps": 257, "total_steps": 775, "loss": 0.5049, "lr": 3.3836138707378434e-05, "epoch": 1.652733118971061, "percentage": 33.16, "elapsed_time": "3:07:16", "remaining_time": "6:17:27"}
258
+ {"current_steps": 258, "total_steps": 775, "loss": 0.5194, "lr": 3.377090543671861e-05, "epoch": 1.6591639871382635, "percentage": 33.29, "elapsed_time": "3:07:59", "remaining_time": "6:16:42"}
259
+ {"current_steps": 259, "total_steps": 775, "loss": 0.5039, "lr": 3.370539239940398e-05, "epoch": 1.6655948553054662, "percentage": 33.42, "elapsed_time": "3:08:43", "remaining_time": "6:15:58"}
260
+ {"current_steps": 260, "total_steps": 775, "loss": 0.5107, "lr": 3.3639600926382854e-05, "epoch": 1.6720257234726688, "percentage": 33.55, "elapsed_time": "3:09:28", "remaining_time": "6:15:19"}
261
+ {"current_steps": 261, "total_steps": 775, "loss": 0.5022, "lr": 3.357353235426017e-05, "epoch": 1.6784565916398715, "percentage": 33.68, "elapsed_time": "3:10:12", "remaining_time": "6:14:34"}
262
+ {"current_steps": 262, "total_steps": 775, "loss": 0.5269, "lr": 3.350718802527036e-05, "epoch": 1.684887459807074, "percentage": 33.81, "elapsed_time": "3:10:56", "remaining_time": "6:13:52"}
263
+ {"current_steps": 263, "total_steps": 775, "loss": 0.5153, "lr": 3.344056928725007e-05, "epoch": 1.6913183279742765, "percentage": 33.94, "elapsed_time": "3:11:33", "remaining_time": "6:12:55"}
264
+ {"current_steps": 264, "total_steps": 775, "loss": 0.5016, "lr": 3.337367749361079e-05, "epoch": 1.697749196141479, "percentage": 34.06, "elapsed_time": "3:12:17", "remaining_time": "6:12:11"}
265
+ {"current_steps": 265, "total_steps": 775, "loss": 0.5242, "lr": 3.3306514003311305e-05, "epoch": 1.7041800643086815, "percentage": 34.19, "elapsed_time": "3:13:01", "remaining_time": "6:11:29"}
266
+ {"current_steps": 266, "total_steps": 775, "loss": 0.5132, "lr": 3.3239080180830194e-05, "epoch": 1.7106109324758842, "percentage": 34.32, "elapsed_time": "3:13:49", "remaining_time": "6:10:52"}
267
+ {"current_steps": 267, "total_steps": 775, "loss": 0.5022, "lr": 3.317137739613799e-05, "epoch": 1.717041800643087, "percentage": 34.45, "elapsed_time": "3:14:29", "remaining_time": "6:10:01"}
268
+ {"current_steps": 268, "total_steps": 775, "loss": 0.519, "lr": 3.310340702466943e-05, "epoch": 1.7234726688102895, "percentage": 34.58, "elapsed_time": "3:15:13", "remaining_time": "6:09:20"}
269
+ {"current_steps": 269, "total_steps": 775, "loss": 0.5199, "lr": 3.3035170447295477e-05, "epoch": 1.729903536977492, "percentage": 34.71, "elapsed_time": "3:15:59", "remaining_time": "6:08:40"}
270
+ {"current_steps": 270, "total_steps": 775, "loss": 0.5009, "lr": 3.296666905029527e-05, "epoch": 1.7363344051446945, "percentage": 34.84, "elapsed_time": "3:16:41", "remaining_time": "6:07:52"}
271
+ {"current_steps": 271, "total_steps": 775, "loss": 0.5126, "lr": 3.289790422532797e-05, "epoch": 1.742765273311897, "percentage": 34.97, "elapsed_time": "3:17:26", "remaining_time": "6:07:11"}
272
+ {"current_steps": 272, "total_steps": 775, "loss": 0.5147, "lr": 3.282887736940448e-05, "epoch": 1.7491961414790995, "percentage": 35.1, "elapsed_time": "3:18:07", "remaining_time": "6:06:23"}
273
+ {"current_steps": 273, "total_steps": 775, "loss": 0.5117, "lr": 3.275958988485907e-05, "epoch": 1.7556270096463023, "percentage": 35.23, "elapsed_time": "3:18:49", "remaining_time": "6:05:36"}
274
+ {"current_steps": 274, "total_steps": 775, "loss": 0.5102, "lr": 3.269004317932088e-05, "epoch": 1.762057877813505, "percentage": 35.35, "elapsed_time": "3:19:33", "remaining_time": "6:04:53"}
275
+ {"current_steps": 275, "total_steps": 775, "loss": 0.5064, "lr": 3.262023866568531e-05, "epoch": 1.7684887459807075, "percentage": 35.48, "elapsed_time": "3:20:15", "remaining_time": "6:04:05"}
276
+ {"current_steps": 276, "total_steps": 775, "loss": 0.519, "lr": 3.255017776208537e-05, "epoch": 1.77491961414791, "percentage": 35.61, "elapsed_time": "3:20:57", "remaining_time": "6:03:19"}
277
+ {"current_steps": 277, "total_steps": 775, "loss": 0.526, "lr": 3.2479861891862803e-05, "epoch": 1.7813504823151125, "percentage": 35.74, "elapsed_time": "3:21:42", "remaining_time": "6:02:37"}
278
+ {"current_steps": 278, "total_steps": 775, "loss": 0.4995, "lr": 3.24092924835392e-05, "epoch": 1.787781350482315, "percentage": 35.87, "elapsed_time": "3:22:25", "remaining_time": "6:01:53"}
279
+ {"current_steps": 279, "total_steps": 775, "loss": 0.5043, "lr": 3.2338470970786975e-05, "epoch": 1.7942122186495175, "percentage": 36.0, "elapsed_time": "3:23:10", "remaining_time": "6:01:12"}
280
+ {"current_steps": 280, "total_steps": 775, "loss": 0.5157, "lr": 3.2267398792400254e-05, "epoch": 1.8006430868167203, "percentage": 36.13, "elapsed_time": "3:23:52", "remaining_time": "6:00:25"}
281
+ {"current_steps": 281, "total_steps": 775, "loss": 0.5093, "lr": 3.219607739226561e-05, "epoch": 1.807073954983923, "percentage": 36.26, "elapsed_time": "3:24:34", "remaining_time": "5:59:39"}
282
+ {"current_steps": 282, "total_steps": 775, "loss": 0.502, "lr": 3.212450821933277e-05, "epoch": 1.8135048231511255, "percentage": 36.39, "elapsed_time": "3:25:20", "remaining_time": "5:58:58"}
283
+ {"current_steps": 283, "total_steps": 775, "loss": 0.5039, "lr": 3.205269272758513e-05, "epoch": 1.819935691318328, "percentage": 36.52, "elapsed_time": "3:26:04", "remaining_time": "5:58:16"}
284
+ {"current_steps": 284, "total_steps": 775, "loss": 0.5306, "lr": 3.198063237601028e-05, "epoch": 1.8263665594855305, "percentage": 36.65, "elapsed_time": "3:26:46", "remaining_time": "5:57:30"}
285
+ {"current_steps": 285, "total_steps": 775, "loss": 0.5137, "lr": 3.1908328628570306e-05, "epoch": 1.832797427652733, "percentage": 36.77, "elapsed_time": "3:27:30", "remaining_time": "5:56:46"}
286
+ {"current_steps": 286, "total_steps": 775, "loss": 0.5116, "lr": 3.183578295417208e-05, "epoch": 1.8392282958199357, "percentage": 36.9, "elapsed_time": "3:28:16", "remaining_time": "5:56:06"}
287
+ {"current_steps": 287, "total_steps": 775, "loss": 0.5046, "lr": 3.1762996826637386e-05, "epoch": 1.8456591639871383, "percentage": 37.03, "elapsed_time": "3:28:54", "remaining_time": "5:55:13"}
288
+ {"current_steps": 288, "total_steps": 775, "loss": 0.5143, "lr": 3.168997172467303e-05, "epoch": 1.852090032154341, "percentage": 37.16, "elapsed_time": "3:29:40", "remaining_time": "5:54:32"}
289
+ {"current_steps": 289, "total_steps": 775, "loss": 0.5202, "lr": 3.161670913184075e-05, "epoch": 1.8585209003215435, "percentage": 37.29, "elapsed_time": "3:30:20", "remaining_time": "5:53:44"}
290
+ {"current_steps": 290, "total_steps": 775, "loss": 0.5093, "lr": 3.15432105365271e-05, "epoch": 1.864951768488746, "percentage": 37.42, "elapsed_time": "3:31:05", "remaining_time": "5:53:01"}
291
+ {"current_steps": 291, "total_steps": 775, "loss": 0.5083, "lr": 3.146947743191323e-05, "epoch": 1.8713826366559485, "percentage": 37.55, "elapsed_time": "3:31:46", "remaining_time": "5:52:13"}
292
+ {"current_steps": 292, "total_steps": 775, "loss": 0.4984, "lr": 3.139551131594449e-05, "epoch": 1.877813504823151, "percentage": 37.68, "elapsed_time": "3:32:30", "remaining_time": "5:51:30"}
293
+ {"current_steps": 293, "total_steps": 775, "loss": 0.5035, "lr": 3.1321313691300055e-05, "epoch": 1.8842443729903537, "percentage": 37.81, "elapsed_time": "3:33:11", "remaining_time": "5:50:43"}
294
+ {"current_steps": 294, "total_steps": 775, "loss": 0.5156, "lr": 3.1246886065362384e-05, "epoch": 1.8906752411575563, "percentage": 37.94, "elapsed_time": "3:33:55", "remaining_time": "5:49:59"}
295
+ {"current_steps": 295, "total_steps": 775, "loss": 0.5055, "lr": 3.117222995018659e-05, "epoch": 1.897106109324759, "percentage": 38.06, "elapsed_time": "3:34:37", "remaining_time": "5:49:13"}
296
+ {"current_steps": 296, "total_steps": 775, "loss": 0.5026, "lr": 3.109734686246972e-05, "epoch": 1.9035369774919615, "percentage": 38.19, "elapsed_time": "3:35:20", "remaining_time": "5:48:28"}
297
+ {"current_steps": 297, "total_steps": 775, "loss": 0.5009, "lr": 3.1022238323519945e-05, "epoch": 1.909967845659164, "percentage": 38.32, "elapsed_time": "3:36:03", "remaining_time": "5:47:44"}
298
+ {"current_steps": 298, "total_steps": 775, "loss": 0.5136, "lr": 3.094690585922564e-05, "epoch": 1.9163987138263665, "percentage": 38.45, "elapsed_time": "3:36:42", "remaining_time": "5:46:52"}
299
+ {"current_steps": 299, "total_steps": 775, "loss": 0.5237, "lr": 3.0871351000024425e-05, "epoch": 1.922829581993569, "percentage": 38.58, "elapsed_time": "3:37:27", "remaining_time": "5:46:11"}
300
+ {"current_steps": 300, "total_steps": 775, "loss": 0.5038, "lr": 3.0795575280872024e-05, "epoch": 1.9292604501607717, "percentage": 38.71, "elapsed_time": "3:38:10", "remaining_time": "5:45:26"}
301
+ {"current_steps": 301, "total_steps": 775, "loss": 0.5417, "lr": 3.071958024121111e-05, "epoch": 1.9356913183279743, "percentage": 38.84, "elapsed_time": "3:38:49", "remaining_time": "5:44:35"}
302
+ {"current_steps": 302, "total_steps": 775, "loss": 0.4988, "lr": 3.0643367424940026e-05, "epoch": 1.942122186495177, "percentage": 38.97, "elapsed_time": "3:39:34", "remaining_time": "5:43:54"}
303
+ {"current_steps": 303, "total_steps": 775, "loss": 0.5177, "lr": 3.05669383803814e-05, "epoch": 1.9485530546623795, "percentage": 39.1, "elapsed_time": "3:40:20", "remaining_time": "5:43:14"}
304
+ {"current_steps": 304, "total_steps": 775, "loss": 0.515, "lr": 3.049029466025073e-05, "epoch": 1.954983922829582, "percentage": 39.23, "elapsed_time": "3:41:00", "remaining_time": "5:42:24"}
305
+ {"current_steps": 305, "total_steps": 775, "loss": 0.5148, "lr": 3.0413437821624795e-05, "epoch": 1.9614147909967845, "percentage": 39.35, "elapsed_time": "3:41:42", "remaining_time": "5:41:38"}
306
+ {"current_steps": 306, "total_steps": 775, "loss": 0.5071, "lr": 3.0336369425910058e-05, "epoch": 1.967845659163987, "percentage": 39.48, "elapsed_time": "3:42:24", "remaining_time": "5:40:53"}
307
+ {"current_steps": 307, "total_steps": 775, "loss": 0.5082, "lr": 3.0259091038810916e-05, "epoch": 1.9742765273311897, "percentage": 39.61, "elapsed_time": "3:43:01", "remaining_time": "5:39:59"}
308
+ {"current_steps": 308, "total_steps": 775, "loss": 0.5229, "lr": 3.018160423029791e-05, "epoch": 1.9807073954983923, "percentage": 39.74, "elapsed_time": "3:43:40", "remaining_time": "5:39:09"}
309
+ {"current_steps": 309, "total_steps": 775, "loss": 0.5145, "lr": 3.010391057457582e-05, "epoch": 1.987138263665595, "percentage": 39.87, "elapsed_time": "3:44:27", "remaining_time": "5:38:30"}
310
+ {"current_steps": 310, "total_steps": 775, "loss": 0.4858, "lr": 3.0026011650051695e-05, "epoch": 1.9935691318327975, "percentage": 40.0, "elapsed_time": "3:45:07", "remaining_time": "5:37:40"}
311
+ {"current_steps": 311, "total_steps": 775, "loss": 0.5149, "lr": 2.994790903930278e-05, "epoch": 2.0, "percentage": 40.13, "elapsed_time": "3:45:48", "remaining_time": "5:36:53"}
312
+ {"current_steps": 312, "total_steps": 775, "loss": 0.4287, "lr": 2.9869604329044345e-05, "epoch": 2.0064308681672025, "percentage": 40.26, "elapsed_time": "3:47:20", "remaining_time": "5:37:21"}
313
+ {"current_steps": 313, "total_steps": 775, "loss": 0.4263, "lr": 2.9791099110097502e-05, "epoch": 2.012861736334405, "percentage": 40.39, "elapsed_time": "3:48:07", "remaining_time": "5:36:43"}