ryanmarten commited on
Commit
d517317
·
verified ·
1 Parent(s): 3fd46aa

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8eea52015812e86b05fa3eab9c8175f374dd1c9a7c9abe5b416bda24bd337536
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:813e141444b3adbcddacbd5a0c9a43e5007ac0922bbd15d85f47216ab3e1f342
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:14d7ec9d2d6a38c3ce622b1d88baf76ae943103fa21ce885661fc3a05a397daf
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b12e1b493bfe2fa72ec24f6dc498b7e5d44a29a1d15a63e4f6777909cae20ec0
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fae6868e43a8f628f1ac0fef4471c8f4a1322439dcc88cbc836708efe6e795da
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94493130bf78a0825b5e2288b4a594017c1cadc497eeeb729755d94d4a9b74ea
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a820121c3c9f5e9fc539d76dfb4fe9dcb734be8f5e608c96e08d762b6d95404
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a8bd49002c50a0aed27a0976dd085c84e1be1b980ff952e7174f89c7e35b73d
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -311,3 +311,159 @@
311
  {"current_steps": 311, "total_steps": 775, "loss": 0.5149, "lr": 2.994790903930278e-05, "epoch": 2.0, "percentage": 40.13, "elapsed_time": "3:45:48", "remaining_time": "5:36:53"}
312
  {"current_steps": 312, "total_steps": 775, "loss": 0.4287, "lr": 2.9869604329044345e-05, "epoch": 2.0064308681672025, "percentage": 40.26, "elapsed_time": "3:47:20", "remaining_time": "5:37:21"}
313
  {"current_steps": 313, "total_steps": 775, "loss": 0.4263, "lr": 2.9791099110097502e-05, "epoch": 2.012861736334405, "percentage": 40.39, "elapsed_time": "3:48:07", "remaining_time": "5:36:43"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
311
  {"current_steps": 311, "total_steps": 775, "loss": 0.5149, "lr": 2.994790903930278e-05, "epoch": 2.0, "percentage": 40.13, "elapsed_time": "3:45:48", "remaining_time": "5:36:53"}
312
  {"current_steps": 312, "total_steps": 775, "loss": 0.4287, "lr": 2.9869604329044345e-05, "epoch": 2.0064308681672025, "percentage": 40.26, "elapsed_time": "3:47:20", "remaining_time": "5:37:21"}
313
  {"current_steps": 313, "total_steps": 775, "loss": 0.4263, "lr": 2.9791099110097502e-05, "epoch": 2.012861736334405, "percentage": 40.39, "elapsed_time": "3:48:07", "remaining_time": "5:36:43"}
314
+ {"current_steps": 314, "total_steps": 775, "loss": 0.4118, "lr": 2.9712394977356824e-05, "epoch": 2.0192926045016075, "percentage": 40.52, "elapsed_time": "3:48:54", "remaining_time": "5:36:04"}
315
+ {"current_steps": 315, "total_steps": 775, "loss": 0.4089, "lr": 2.9633493529757988e-05, "epoch": 2.0257234726688105, "percentage": 40.65, "elapsed_time": "3:49:33", "remaining_time": "5:35:14"}
316
+ {"current_steps": 316, "total_steps": 775, "loss": 0.4197, "lr": 2.955439637024526e-05, "epoch": 2.032154340836013, "percentage": 40.77, "elapsed_time": "3:50:19", "remaining_time": "5:34:33"}
317
+ {"current_steps": 317, "total_steps": 775, "loss": 0.4191, "lr": 2.947510510573897e-05, "epoch": 2.0385852090032155, "percentage": 40.9, "elapsed_time": "3:51:03", "remaining_time": "5:33:50"}
318
+ {"current_steps": 318, "total_steps": 775, "loss": 0.4368, "lr": 2.9395621347102817e-05, "epoch": 2.045016077170418, "percentage": 41.03, "elapsed_time": "3:51:48", "remaining_time": "5:33:07"}
319
+ {"current_steps": 319, "total_steps": 775, "loss": 0.403, "lr": 2.931594670911119e-05, "epoch": 2.0514469453376205, "percentage": 41.16, "elapsed_time": "3:52:30", "remaining_time": "5:32:21"}
320
+ {"current_steps": 320, "total_steps": 775, "loss": 0.4228, "lr": 2.9236082810416316e-05, "epoch": 2.057877813504823, "percentage": 41.29, "elapsed_time": "3:53:11", "remaining_time": "5:31:34"}
321
+ {"current_steps": 321, "total_steps": 775, "loss": 0.4436, "lr": 2.9156031273515427e-05, "epoch": 2.0643086816720255, "percentage": 41.42, "elapsed_time": "3:53:57", "remaining_time": "5:30:53"}
322
+ {"current_steps": 322, "total_steps": 775, "loss": 0.4002, "lr": 2.9075793724717755e-05, "epoch": 2.0707395498392285, "percentage": 41.55, "elapsed_time": "3:54:34", "remaining_time": "5:30:01"}
323
+ {"current_steps": 323, "total_steps": 775, "loss": 0.4135, "lr": 2.8995371794111515e-05, "epoch": 2.077170418006431, "percentage": 41.68, "elapsed_time": "3:55:17", "remaining_time": "5:29:15"}
324
+ {"current_steps": 324, "total_steps": 775, "loss": 0.3909, "lr": 2.891476711553077e-05, "epoch": 2.0836012861736335, "percentage": 41.81, "elapsed_time": "3:56:00", "remaining_time": "5:28:31"}
325
+ {"current_steps": 325, "total_steps": 775, "loss": 0.4316, "lr": 2.883398132652226e-05, "epoch": 2.090032154340836, "percentage": 41.94, "elapsed_time": "3:56:42", "remaining_time": "5:27:45"}
326
+ {"current_steps": 326, "total_steps": 775, "loss": 0.4275, "lr": 2.8753016068312124e-05, "epoch": 2.0964630225080385, "percentage": 42.06, "elapsed_time": "3:57:33", "remaining_time": "5:27:10"}
327
+ {"current_steps": 327, "total_steps": 775, "loss": 0.4106, "lr": 2.867187298577257e-05, "epoch": 2.102893890675241, "percentage": 42.19, "elapsed_time": "3:58:20", "remaining_time": "5:26:31"}
328
+ {"current_steps": 328, "total_steps": 775, "loss": 0.4031, "lr": 2.859055372738841e-05, "epoch": 2.1093247588424435, "percentage": 42.32, "elapsed_time": "3:59:08", "remaining_time": "5:25:54"}
329
+ {"current_steps": 329, "total_steps": 775, "loss": 0.4116, "lr": 2.850905994522364e-05, "epoch": 2.1157556270096465, "percentage": 42.45, "elapsed_time": "3:59:53", "remaining_time": "5:25:12"}
330
+ {"current_steps": 330, "total_steps": 775, "loss": 0.4349, "lr": 2.842739329488783e-05, "epoch": 2.122186495176849, "percentage": 42.58, "elapsed_time": "4:00:40", "remaining_time": "5:24:33"}
331
+ {"current_steps": 331, "total_steps": 775, "loss": 0.4226, "lr": 2.83455554355025e-05, "epoch": 2.1286173633440515, "percentage": 42.71, "elapsed_time": "4:01:27", "remaining_time": "5:23:53"}
332
+ {"current_steps": 332, "total_steps": 775, "loss": 0.4311, "lr": 2.8263548029667413e-05, "epoch": 2.135048231511254, "percentage": 42.84, "elapsed_time": "4:02:09", "remaining_time": "5:23:07"}
333
+ {"current_steps": 333, "total_steps": 775, "loss": 0.4004, "lr": 2.8181372743426805e-05, "epoch": 2.1414790996784565, "percentage": 42.97, "elapsed_time": "4:02:51", "remaining_time": "5:22:21"}
334
+ {"current_steps": 334, "total_steps": 775, "loss": 0.411, "lr": 2.8099031246235518e-05, "epoch": 2.147909967845659, "percentage": 43.1, "elapsed_time": "4:03:35", "remaining_time": "5:21:37"}
335
+ {"current_steps": 335, "total_steps": 775, "loss": 0.4275, "lr": 2.8016525210925146e-05, "epoch": 2.154340836012862, "percentage": 43.23, "elapsed_time": "4:04:24", "remaining_time": "5:21:00"}
336
+ {"current_steps": 336, "total_steps": 775, "loss": 0.4158, "lr": 2.793385631366993e-05, "epoch": 2.1607717041800645, "percentage": 43.35, "elapsed_time": "4:05:11", "remaining_time": "5:20:20"}
337
+ {"current_steps": 337, "total_steps": 775, "loss": 0.4229, "lr": 2.7851026233952844e-05, "epoch": 2.167202572347267, "percentage": 43.48, "elapsed_time": "4:05:52", "remaining_time": "5:19:33"}
338
+ {"current_steps": 338, "total_steps": 775, "loss": 0.4361, "lr": 2.7768036654531365e-05, "epoch": 2.1736334405144695, "percentage": 43.61, "elapsed_time": "4:06:33", "remaining_time": "5:18:46"}
339
+ {"current_steps": 339, "total_steps": 775, "loss": 0.432, "lr": 2.768488926140336e-05, "epoch": 2.180064308681672, "percentage": 43.74, "elapsed_time": "4:07:18", "remaining_time": "5:18:03"}
340
+ {"current_steps": 340, "total_steps": 775, "loss": 0.4247, "lr": 2.760158574377278e-05, "epoch": 2.1864951768488745, "percentage": 43.87, "elapsed_time": "4:08:02", "remaining_time": "5:17:20"}
341
+ {"current_steps": 341, "total_steps": 775, "loss": 0.4179, "lr": 2.7518127794015384e-05, "epoch": 2.192926045016077, "percentage": 44.0, "elapsed_time": "4:08:41", "remaining_time": "5:16:31"}
342
+ {"current_steps": 342, "total_steps": 775, "loss": 0.4368, "lr": 2.743451710764433e-05, "epoch": 2.19935691318328, "percentage": 44.13, "elapsed_time": "4:09:25", "remaining_time": "5:15:47"}
343
+ {"current_steps": 343, "total_steps": 775, "loss": 0.3995, "lr": 2.7350755383275757e-05, "epoch": 2.2057877813504825, "percentage": 44.26, "elapsed_time": "4:10:07", "remaining_time": "5:15:00"}
344
+ {"current_steps": 344, "total_steps": 775, "loss": 0.4115, "lr": 2.7266844322594228e-05, "epoch": 2.212218649517685, "percentage": 44.39, "elapsed_time": "4:10:51", "remaining_time": "5:14:18"}
345
+ {"current_steps": 345, "total_steps": 775, "loss": 0.435, "lr": 2.718278563031821e-05, "epoch": 2.2186495176848875, "percentage": 44.52, "elapsed_time": "4:11:34", "remaining_time": "5:13:33"}
346
+ {"current_steps": 346, "total_steps": 775, "loss": 0.4362, "lr": 2.7098581014165426e-05, "epoch": 2.22508038585209, "percentage": 44.65, "elapsed_time": "4:12:20", "remaining_time": "5:12:52"}
347
+ {"current_steps": 347, "total_steps": 775, "loss": 0.4102, "lr": 2.7014232184818134e-05, "epoch": 2.2315112540192925, "percentage": 44.77, "elapsed_time": "4:13:04", "remaining_time": "5:12:09"}
348
+ {"current_steps": 348, "total_steps": 775, "loss": 0.414, "lr": 2.6929740855888416e-05, "epoch": 2.237942122186495, "percentage": 44.9, "elapsed_time": "4:13:44", "remaining_time": "5:11:20"}
349
+ {"current_steps": 349, "total_steps": 775, "loss": 0.4191, "lr": 2.684510874388333e-05, "epoch": 2.244372990353698, "percentage": 45.03, "elapsed_time": "4:14:31", "remaining_time": "5:10:40"}
350
+ {"current_steps": 350, "total_steps": 775, "loss": 0.4158, "lr": 2.6760337568170056e-05, "epoch": 2.2508038585209005, "percentage": 45.16, "elapsed_time": "4:15:14", "remaining_time": "5:09:55"}
351
+ {"current_steps": 351, "total_steps": 775, "loss": 0.4218, "lr": 2.6675429050940976e-05, "epoch": 2.257234726688103, "percentage": 45.29, "elapsed_time": "4:15:53", "remaining_time": "5:09:07"}
352
+ {"current_steps": 352, "total_steps": 775, "loss": 0.4095, "lr": 2.659038491717864e-05, "epoch": 2.2636655948553055, "percentage": 45.42, "elapsed_time": "4:16:38", "remaining_time": "5:08:24"}
353
+ {"current_steps": 353, "total_steps": 775, "loss": 0.4384, "lr": 2.650520689462079e-05, "epoch": 2.270096463022508, "percentage": 45.55, "elapsed_time": "4:17:24", "remaining_time": "5:07:43"}
354
+ {"current_steps": 354, "total_steps": 775, "loss": 0.4252, "lr": 2.6419896713725194e-05, "epoch": 2.2765273311897105, "percentage": 45.68, "elapsed_time": "4:18:08", "remaining_time": "5:07:00"}
355
+ {"current_steps": 355, "total_steps": 775, "loss": 0.4066, "lr": 2.6334456107634526e-05, "epoch": 2.282958199356913, "percentage": 45.81, "elapsed_time": "4:18:51", "remaining_time": "5:06:14"}
356
+ {"current_steps": 356, "total_steps": 775, "loss": 0.4063, "lr": 2.6248886812141164e-05, "epoch": 2.289389067524116, "percentage": 45.94, "elapsed_time": "4:19:35", "remaining_time": "5:05:31"}
357
+ {"current_steps": 357, "total_steps": 775, "loss": 0.4064, "lr": 2.6163190565651895e-05, "epoch": 2.2958199356913185, "percentage": 46.06, "elapsed_time": "4:20:13", "remaining_time": "5:04:41"}
358
+ {"current_steps": 358, "total_steps": 775, "loss": 0.4271, "lr": 2.6077369109152617e-05, "epoch": 2.302250803858521, "percentage": 46.19, "elapsed_time": "4:21:03", "remaining_time": "5:04:05"}
359
+ {"current_steps": 359, "total_steps": 775, "loss": 0.4337, "lr": 2.599142418617299e-05, "epoch": 2.3086816720257235, "percentage": 46.32, "elapsed_time": "4:21:46", "remaining_time": "5:03:20"}
360
+ {"current_steps": 360, "total_steps": 775, "loss": 0.3997, "lr": 2.5905357542750937e-05, "epoch": 2.315112540192926, "percentage": 46.45, "elapsed_time": "4:22:25", "remaining_time": "5:02:30"}
361
+ {"current_steps": 361, "total_steps": 775, "loss": 0.4048, "lr": 2.5819170927397288e-05, "epoch": 2.3215434083601285, "percentage": 46.58, "elapsed_time": "4:23:08", "remaining_time": "5:01:46"}
362
+ {"current_steps": 362, "total_steps": 775, "loss": 0.4302, "lr": 2.573286609106016e-05, "epoch": 2.327974276527331, "percentage": 46.71, "elapsed_time": "4:23:52", "remaining_time": "5:01:02"}
363
+ {"current_steps": 363, "total_steps": 775, "loss": 0.437, "lr": 2.5646444787089435e-05, "epoch": 2.334405144694534, "percentage": 46.84, "elapsed_time": "4:24:36", "remaining_time": "5:00:19"}
364
+ {"current_steps": 364, "total_steps": 775, "loss": 0.4192, "lr": 2.555990877120111e-05, "epoch": 2.3408360128617365, "percentage": 46.97, "elapsed_time": "4:25:15", "remaining_time": "4:59:30"}
365
+ {"current_steps": 365, "total_steps": 775, "loss": 0.4191, "lr": 2.5473259801441663e-05, "epoch": 2.347266881028939, "percentage": 47.1, "elapsed_time": "4:25:57", "remaining_time": "4:58:45"}
366
+ {"current_steps": 366, "total_steps": 775, "loss": 0.4142, "lr": 2.53864996381523e-05, "epoch": 2.3536977491961415, "percentage": 47.23, "elapsed_time": "4:26:40", "remaining_time": "4:58:00"}
367
+ {"current_steps": 367, "total_steps": 775, "loss": 0.4187, "lr": 2.529963004393324e-05, "epoch": 2.360128617363344, "percentage": 47.35, "elapsed_time": "4:27:20", "remaining_time": "4:57:11"}
368
+ {"current_steps": 368, "total_steps": 775, "loss": 0.414, "lr": 2.521265278360783e-05, "epoch": 2.3665594855305465, "percentage": 47.48, "elapsed_time": "4:28:03", "remaining_time": "4:56:28"}
369
+ {"current_steps": 369, "total_steps": 775, "loss": 0.4247, "lr": 2.5125569624186782e-05, "epoch": 2.372990353697749, "percentage": 47.61, "elapsed_time": "4:28:47", "remaining_time": "4:55:44"}
370
+ {"current_steps": 370, "total_steps": 775, "loss": 0.3911, "lr": 2.5038382334832207e-05, "epoch": 2.379421221864952, "percentage": 47.74, "elapsed_time": "4:29:28", "remaining_time": "4:54:58"}
371
+ {"current_steps": 371, "total_steps": 775, "loss": 0.39, "lr": 2.4951092686821697e-05, "epoch": 2.3858520900321545, "percentage": 47.87, "elapsed_time": "4:30:08", "remaining_time": "4:54:09"}
372
+ {"current_steps": 372, "total_steps": 775, "loss": 0.4198, "lr": 2.486370245351235e-05, "epoch": 2.392282958199357, "percentage": 48.0, "elapsed_time": "4:30:48", "remaining_time": "4:53:22"}
373
+ {"current_steps": 373, "total_steps": 775, "loss": 0.424, "lr": 2.4776213410304722e-05, "epoch": 2.3987138263665595, "percentage": 48.13, "elapsed_time": "4:31:28", "remaining_time": "4:52:35"}
374
+ {"current_steps": 374, "total_steps": 775, "loss": 0.398, "lr": 2.4688627334606773e-05, "epoch": 2.405144694533762, "percentage": 48.26, "elapsed_time": "4:32:10", "remaining_time": "4:51:49"}
375
+ {"current_steps": 375, "total_steps": 775, "loss": 0.4317, "lr": 2.460094600579777e-05, "epoch": 2.4115755627009645, "percentage": 48.39, "elapsed_time": "4:32:57", "remaining_time": "4:51:09"}
376
+ {"current_steps": 376, "total_steps": 775, "loss": 0.4295, "lr": 2.4513171205192076e-05, "epoch": 2.418006430868167, "percentage": 48.52, "elapsed_time": "4:33:41", "remaining_time": "4:50:26"}
377
+ {"current_steps": 377, "total_steps": 775, "loss": 0.4293, "lr": 2.4425304716003065e-05, "epoch": 2.42443729903537, "percentage": 48.65, "elapsed_time": "4:34:27", "remaining_time": "4:49:44"}
378
+ {"current_steps": 378, "total_steps": 775, "loss": 0.4183, "lr": 2.433734832330679e-05, "epoch": 2.4308681672025725, "percentage": 48.77, "elapsed_time": "4:35:05", "remaining_time": "4:48:55"}
379
+ {"current_steps": 379, "total_steps": 775, "loss": 0.4348, "lr": 2.4249303814005787e-05, "epoch": 2.437299035369775, "percentage": 48.9, "elapsed_time": "4:35:48", "remaining_time": "4:48:11"}
380
+ {"current_steps": 380, "total_steps": 775, "loss": 0.418, "lr": 2.416117297679274e-05, "epoch": 2.4437299035369775, "percentage": 49.03, "elapsed_time": "4:36:30", "remaining_time": "4:47:25"}
381
+ {"current_steps": 381, "total_steps": 775, "loss": 0.4314, "lr": 2.407295760211415e-05, "epoch": 2.45016077170418, "percentage": 49.16, "elapsed_time": "4:37:10", "remaining_time": "4:46:37"}
382
+ {"current_steps": 382, "total_steps": 775, "loss": 0.4139, "lr": 2.3984659482133964e-05, "epoch": 2.4565916398713825, "percentage": 49.29, "elapsed_time": "4:37:53", "remaining_time": "4:45:53"}
383
+ {"current_steps": 383, "total_steps": 775, "loss": 0.3907, "lr": 2.3896280410697184e-05, "epoch": 2.463022508038585, "percentage": 49.42, "elapsed_time": "4:38:29", "remaining_time": "4:45:02"}
384
+ {"current_steps": 384, "total_steps": 775, "loss": 0.4013, "lr": 2.380782218329337e-05, "epoch": 2.469453376205788, "percentage": 49.55, "elapsed_time": "4:39:15", "remaining_time": "4:44:21"}
385
+ {"current_steps": 385, "total_steps": 775, "loss": 0.4318, "lr": 2.3719286597020223e-05, "epoch": 2.4758842443729905, "percentage": 49.68, "elapsed_time": "4:39:55", "remaining_time": "4:43:33"}
386
+ {"current_steps": 386, "total_steps": 775, "loss": 0.3992, "lr": 2.3630675450547035e-05, "epoch": 2.482315112540193, "percentage": 49.81, "elapsed_time": "4:40:34", "remaining_time": "4:42:45"}
387
+ {"current_steps": 387, "total_steps": 775, "loss": 0.4151, "lr": 2.354199054407817e-05, "epoch": 2.4887459807073955, "percentage": 49.94, "elapsed_time": "4:41:16", "remaining_time": "4:42:00"}
388
+ {"current_steps": 388, "total_steps": 775, "loss": 0.4062, "lr": 2.3453233679316474e-05, "epoch": 2.495176848874598, "percentage": 50.06, "elapsed_time": "4:42:03", "remaining_time": "4:41:19"}
389
+ {"current_steps": 389, "total_steps": 775, "loss": 0.4272, "lr": 2.33644066594267e-05, "epoch": 2.5016077170418005, "percentage": 50.19, "elapsed_time": "4:42:52", "remaining_time": "4:40:41"}
390
+ {"current_steps": 390, "total_steps": 775, "loss": 0.4225, "lr": 2.327551128899884e-05, "epoch": 2.508038585209003, "percentage": 50.32, "elapsed_time": "4:43:38", "remaining_time": "4:40:00"}
391
+ {"current_steps": 391, "total_steps": 775, "loss": 0.4074, "lr": 2.3186549374011484e-05, "epoch": 2.514469453376206, "percentage": 50.45, "elapsed_time": "4:44:16", "remaining_time": "4:39:10"}
392
+ {"current_steps": 392, "total_steps": 775, "loss": 0.4138, "lr": 2.3097522721795135e-05, "epoch": 2.5209003215434085, "percentage": 50.58, "elapsed_time": "4:44:55", "remaining_time": "4:38:23"}
393
+ {"current_steps": 393, "total_steps": 775, "loss": 0.4273, "lr": 2.3008433140995473e-05, "epoch": 2.527331189710611, "percentage": 50.71, "elapsed_time": "4:45:41", "remaining_time": "4:37:42"}
394
+ {"current_steps": 394, "total_steps": 775, "loss": 0.4282, "lr": 2.2919282441536622e-05, "epoch": 2.5337620578778135, "percentage": 50.84, "elapsed_time": "4:46:30", "remaining_time": "4:37:03"}
395
+ {"current_steps": 395, "total_steps": 775, "loss": 0.4103, "lr": 2.283007243458438e-05, "epoch": 2.540192926045016, "percentage": 50.97, "elapsed_time": "4:47:27", "remaining_time": "4:36:32"}
396
+ {"current_steps": 396, "total_steps": 775, "loss": 0.4155, "lr": 2.2740804932509443e-05, "epoch": 2.5466237942122185, "percentage": 51.1, "elapsed_time": "4:48:11", "remaining_time": "4:35:48"}
397
+ {"current_steps": 397, "total_steps": 775, "loss": 0.4062, "lr": 2.2651481748850522e-05, "epoch": 2.553054662379421, "percentage": 51.23, "elapsed_time": "4:48:52", "remaining_time": "4:35:03"}
398
+ {"current_steps": 398, "total_steps": 775, "loss": 0.4054, "lr": 2.2562104698277587e-05, "epoch": 2.559485530546624, "percentage": 51.35, "elapsed_time": "4:49:34", "remaining_time": "4:34:17"}
399
+ {"current_steps": 399, "total_steps": 775, "loss": 0.4068, "lr": 2.247267559655492e-05, "epoch": 2.5659163987138265, "percentage": 51.48, "elapsed_time": "4:50:17", "remaining_time": "4:33:33"}
400
+ {"current_steps": 400, "total_steps": 775, "loss": 0.4289, "lr": 2.2383196260504297e-05, "epoch": 2.572347266881029, "percentage": 51.61, "elapsed_time": "4:51:01", "remaining_time": "4:32:49"}
401
+ {"current_steps": 401, "total_steps": 775, "loss": 0.4027, "lr": 2.2293668507968015e-05, "epoch": 2.5787781350482315, "percentage": 51.74, "elapsed_time": "4:51:47", "remaining_time": "4:32:08"}
402
+ {"current_steps": 402, "total_steps": 775, "loss": 0.4435, "lr": 2.2204094157772e-05, "epoch": 2.585209003215434, "percentage": 51.87, "elapsed_time": "4:52:32", "remaining_time": "4:31:26"}
403
+ {"current_steps": 403, "total_steps": 775, "loss": 0.4186, "lr": 2.2114475029688845e-05, "epoch": 2.5916398713826365, "percentage": 52.0, "elapsed_time": "4:53:13", "remaining_time": "4:30:39"}
404
+ {"current_steps": 404, "total_steps": 775, "loss": 0.4194, "lr": 2.202481294440086e-05, "epoch": 2.598070739549839, "percentage": 52.13, "elapsed_time": "4:53:56", "remaining_time": "4:29:56"}
405
+ {"current_steps": 405, "total_steps": 775, "loss": 0.4222, "lr": 2.1935109723463018e-05, "epoch": 2.604501607717042, "percentage": 52.26, "elapsed_time": "4:54:38", "remaining_time": "4:29:10"}
406
+ {"current_steps": 406, "total_steps": 775, "loss": 0.4213, "lr": 2.184536718926604e-05, "epoch": 2.6109324758842445, "percentage": 52.39, "elapsed_time": "4:55:21", "remaining_time": "4:28:26"}
407
+ {"current_steps": 407, "total_steps": 775, "loss": 0.4379, "lr": 2.1755587164999308e-05, "epoch": 2.617363344051447, "percentage": 52.52, "elapsed_time": "4:56:08", "remaining_time": "4:27:45"}
408
+ {"current_steps": 408, "total_steps": 775, "loss": 0.4108, "lr": 2.1665771474613844e-05, "epoch": 2.6237942122186495, "percentage": 52.65, "elapsed_time": "4:56:55", "remaining_time": "4:27:04"}
409
+ {"current_steps": 409, "total_steps": 775, "loss": 0.4414, "lr": 2.1575921942785247e-05, "epoch": 2.630225080385852, "percentage": 52.77, "elapsed_time": "4:57:44", "remaining_time": "4:26:26"}
410
+ {"current_steps": 410, "total_steps": 775, "loss": 0.4185, "lr": 2.1486040394876653e-05, "epoch": 2.6366559485530545, "percentage": 52.9, "elapsed_time": "4:58:27", "remaining_time": "4:25:41"}
411
+ {"current_steps": 411, "total_steps": 775, "loss": 0.4324, "lr": 2.1396128656901613e-05, "epoch": 2.643086816720257, "percentage": 53.03, "elapsed_time": "4:59:19", "remaining_time": "4:25:05"}
412
+ {"current_steps": 412, "total_steps": 775, "loss": 0.4065, "lr": 2.1306188555487012e-05, "epoch": 2.64951768488746, "percentage": 53.16, "elapsed_time": "5:00:12", "remaining_time": "4:24:30"}
413
+ {"current_steps": 413, "total_steps": 775, "loss": 0.4428, "lr": 2.1216221917835963e-05, "epoch": 2.6559485530546625, "percentage": 53.29, "elapsed_time": "5:00:59", "remaining_time": "4:23:49"}
414
+ {"current_steps": 414, "total_steps": 775, "loss": 0.4406, "lr": 2.1126230571690688e-05, "epoch": 2.662379421221865, "percentage": 53.42, "elapsed_time": "5:01:41", "remaining_time": "4:23:04"}
415
+ {"current_steps": 415, "total_steps": 775, "loss": 0.4056, "lr": 2.1036216345295384e-05, "epoch": 2.6688102893890675, "percentage": 53.55, "elapsed_time": "5:02:27", "remaining_time": "4:22:22"}
416
+ {"current_steps": 416, "total_steps": 775, "loss": 0.4223, "lr": 2.0946181067359066e-05, "epoch": 2.67524115755627, "percentage": 53.68, "elapsed_time": "5:03:14", "remaining_time": "4:21:41"}
417
+ {"current_steps": 417, "total_steps": 775, "loss": 0.4129, "lr": 2.085612656701843e-05, "epoch": 2.6816720257234725, "percentage": 53.81, "elapsed_time": "5:03:54", "remaining_time": "4:20:54"}
418
+ {"current_steps": 418, "total_steps": 775, "loss": 0.4211, "lr": 2.076605467380071e-05, "epoch": 2.688102893890675, "percentage": 53.94, "elapsed_time": "5:04:37", "remaining_time": "4:20:10"}
419
+ {"current_steps": 419, "total_steps": 775, "loss": 0.4097, "lr": 2.0675967217586453e-05, "epoch": 2.694533762057878, "percentage": 54.06, "elapsed_time": "5:05:19", "remaining_time": "4:19:25"}
420
+ {"current_steps": 420, "total_steps": 775, "loss": 0.4232, "lr": 2.058586602857242e-05, "epoch": 2.7009646302250805, "percentage": 54.19, "elapsed_time": "5:06:00", "remaining_time": "4:18:38"}
421
+ {"current_steps": 421, "total_steps": 775, "loss": 0.4226, "lr": 2.049575293723433e-05, "epoch": 2.707395498392283, "percentage": 54.32, "elapsed_time": "5:06:43", "remaining_time": "4:17:54"}
422
+ {"current_steps": 422, "total_steps": 775, "loss": 0.4179, "lr": 2.0405629774289726e-05, "epoch": 2.7138263665594855, "percentage": 54.45, "elapsed_time": "5:07:23", "remaining_time": "4:17:07"}
423
+ {"current_steps": 423, "total_steps": 775, "loss": 0.4186, "lr": 2.0315498370660767e-05, "epoch": 2.720257234726688, "percentage": 54.58, "elapsed_time": "5:08:03", "remaining_time": "4:16:21"}
424
+ {"current_steps": 424, "total_steps": 775, "loss": 0.4294, "lr": 2.022536055743702e-05, "epoch": 2.7266881028938905, "percentage": 54.71, "elapsed_time": "5:08:50", "remaining_time": "4:15:40"}
425
+ {"current_steps": 425, "total_steps": 775, "loss": 0.4203, "lr": 2.0135218165838256e-05, "epoch": 2.733118971061093, "percentage": 54.84, "elapsed_time": "5:09:33", "remaining_time": "4:14:55"}
426
+ {"current_steps": 426, "total_steps": 775, "loss": 0.4045, "lr": 2.004507302717729e-05, "epoch": 2.739549839228296, "percentage": 54.97, "elapsed_time": "5:10:13", "remaining_time": "4:14:08"}
427
+ {"current_steps": 427, "total_steps": 775, "loss": 0.4185, "lr": 1.9954926972822716e-05, "epoch": 2.7459807073954985, "percentage": 55.1, "elapsed_time": "5:10:56", "remaining_time": "4:13:24"}
428
+ {"current_steps": 428, "total_steps": 775, "loss": 0.401, "lr": 1.9864781834161748e-05, "epoch": 2.752411575562701, "percentage": 55.23, "elapsed_time": "5:11:37", "remaining_time": "4:12:38"}
429
+ {"current_steps": 429, "total_steps": 775, "loss": 0.4296, "lr": 1.9774639442562994e-05, "epoch": 2.7588424437299035, "percentage": 55.35, "elapsed_time": "5:12:15", "remaining_time": "4:11:51"}
430
+ {"current_steps": 430, "total_steps": 775, "loss": 0.4191, "lr": 1.968450162933924e-05, "epoch": 2.765273311897106, "percentage": 55.48, "elapsed_time": "5:12:58", "remaining_time": "4:11:06"}
431
+ {"current_steps": 431, "total_steps": 775, "loss": 0.4096, "lr": 1.959437022571028e-05, "epoch": 2.7717041800643085, "percentage": 55.61, "elapsed_time": "5:13:41", "remaining_time": "4:10:22"}
432
+ {"current_steps": 432, "total_steps": 775, "loss": 0.4313, "lr": 1.9504247062765674e-05, "epoch": 2.778135048231511, "percentage": 55.74, "elapsed_time": "5:14:23", "remaining_time": "4:09:37"}
433
+ {"current_steps": 433, "total_steps": 775, "loss": 0.4348, "lr": 1.941413397142759e-05, "epoch": 2.784565916398714, "percentage": 55.87, "elapsed_time": "5:15:12", "remaining_time": "4:08:57"}
434
+ {"current_steps": 434, "total_steps": 775, "loss": 0.4071, "lr": 1.932403278241355e-05, "epoch": 2.7909967845659165, "percentage": 56.0, "elapsed_time": "5:15:55", "remaining_time": "4:08:13"}
435
+ {"current_steps": 435, "total_steps": 775, "loss": 0.4139, "lr": 1.9233945326199295e-05, "epoch": 2.797427652733119, "percentage": 56.13, "elapsed_time": "5:16:38", "remaining_time": "4:07:29"}
436
+ {"current_steps": 436, "total_steps": 775, "loss": 0.439, "lr": 1.9143873432981566e-05, "epoch": 2.8038585209003215, "percentage": 56.26, "elapsed_time": "5:17:22", "remaining_time": "4:06:46"}
437
+ {"current_steps": 437, "total_steps": 775, "loss": 0.4174, "lr": 1.905381893264094e-05, "epoch": 2.810289389067524, "percentage": 56.39, "elapsed_time": "5:18:04", "remaining_time": "4:06:01"}
438
+ {"current_steps": 438, "total_steps": 775, "loss": 0.424, "lr": 1.896378365470462e-05, "epoch": 2.816720257234727, "percentage": 56.52, "elapsed_time": "5:18:45", "remaining_time": "4:05:15"}
439
+ {"current_steps": 439, "total_steps": 775, "loss": 0.4487, "lr": 1.8873769428309315e-05, "epoch": 2.823151125401929, "percentage": 56.65, "elapsed_time": "5:19:31", "remaining_time": "4:04:33"}
440
+ {"current_steps": 440, "total_steps": 775, "loss": 0.3996, "lr": 1.878377808216404e-05, "epoch": 2.829581993569132, "percentage": 56.77, "elapsed_time": "5:20:11", "remaining_time": "4:03:46"}
441
+ {"current_steps": 441, "total_steps": 775, "loss": 0.4038, "lr": 1.8693811444512998e-05, "epoch": 2.8360128617363345, "percentage": 56.9, "elapsed_time": "5:20:51", "remaining_time": "4:03:00"}
442
+ {"current_steps": 442, "total_steps": 775, "loss": 0.4244, "lr": 1.8603871343098397e-05, "epoch": 2.842443729903537, "percentage": 57.03, "elapsed_time": "5:21:36", "remaining_time": "4:02:18"}
443
+ {"current_steps": 443, "total_steps": 775, "loss": 0.4076, "lr": 1.851395960512335e-05, "epoch": 2.8488745980707395, "percentage": 57.16, "elapsed_time": "5:22:19", "remaining_time": "4:01:34"}
444
+ {"current_steps": 444, "total_steps": 775, "loss": 0.43, "lr": 1.8424078057214753e-05, "epoch": 2.855305466237942, "percentage": 57.29, "elapsed_time": "5:23:02", "remaining_time": "4:00:49"}
445
+ {"current_steps": 445, "total_steps": 775, "loss": 0.4023, "lr": 1.8334228525386166e-05, "epoch": 2.861736334405145, "percentage": 57.42, "elapsed_time": "5:23:43", "remaining_time": "4:00:04"}
446
+ {"current_steps": 446, "total_steps": 775, "loss": 0.4376, "lr": 1.8244412835000696e-05, "epoch": 2.868167202572347, "percentage": 57.55, "elapsed_time": "5:24:24", "remaining_time": "3:59:18"}
447
+ {"current_steps": 447, "total_steps": 775, "loss": 0.4045, "lr": 1.815463281073396e-05, "epoch": 2.87459807073955, "percentage": 57.68, "elapsed_time": "5:25:03", "remaining_time": "3:58:31"}
448
+ {"current_steps": 448, "total_steps": 775, "loss": 0.4099, "lr": 1.8064890276536985e-05, "epoch": 2.8810289389067525, "percentage": 57.81, "elapsed_time": "5:25:47", "remaining_time": "3:57:47"}
449
+ {"current_steps": 449, "total_steps": 775, "loss": 0.4433, "lr": 1.7975187055599153e-05, "epoch": 2.887459807073955, "percentage": 57.94, "elapsed_time": "5:26:26", "remaining_time": "3:57:01"}
450
+ {"current_steps": 450, "total_steps": 775, "loss": 0.4248, "lr": 1.7885524970311158e-05, "epoch": 2.8938906752411575, "percentage": 58.06, "elapsed_time": "5:27:07", "remaining_time": "3:56:15"}
451
+ {"current_steps": 451, "total_steps": 775, "loss": 0.388, "lr": 1.7795905842228008e-05, "epoch": 2.90032154340836, "percentage": 58.19, "elapsed_time": "5:27:51", "remaining_time": "3:55:32"}
452
+ {"current_steps": 452, "total_steps": 775, "loss": 0.4115, "lr": 1.7706331492031995e-05, "epoch": 2.906752411575563, "percentage": 58.32, "elapsed_time": "5:28:36", "remaining_time": "3:54:49"}
453
+ {"current_steps": 453, "total_steps": 775, "loss": 0.4138, "lr": 1.7616803739495716e-05, "epoch": 2.913183279742765, "percentage": 58.45, "elapsed_time": "5:29:19", "remaining_time": "3:54:05"}
454
+ {"current_steps": 454, "total_steps": 775, "loss": 0.4033, "lr": 1.7527324403445086e-05, "epoch": 2.919614147909968, "percentage": 58.58, "elapsed_time": "5:30:02", "remaining_time": "3:53:21"}
455
+ {"current_steps": 455, "total_steps": 775, "loss": 0.4277, "lr": 1.7437895301722424e-05, "epoch": 2.9260450160771705, "percentage": 58.71, "elapsed_time": "5:30:47", "remaining_time": "3:52:38"}
456
+ {"current_steps": 456, "total_steps": 775, "loss": 0.4169, "lr": 1.734851825114948e-05, "epoch": 2.932475884244373, "percentage": 58.84, "elapsed_time": "5:31:34", "remaining_time": "3:51:57"}
457
+ {"current_steps": 457, "total_steps": 775, "loss": 0.4285, "lr": 1.7259195067490567e-05, "epoch": 2.9389067524115755, "percentage": 58.97, "elapsed_time": "5:32:19", "remaining_time": "3:51:14"}
458
+ {"current_steps": 458, "total_steps": 775, "loss": 0.4139, "lr": 1.7169927565415624e-05, "epoch": 2.945337620578778, "percentage": 59.1, "elapsed_time": "5:33:03", "remaining_time": "3:50:31"}
459
+ {"current_steps": 459, "total_steps": 775, "loss": 0.4199, "lr": 1.708071755846338e-05, "epoch": 2.951768488745981, "percentage": 59.23, "elapsed_time": "5:33:46", "remaining_time": "3:49:47"}
460
+ {"current_steps": 460, "total_steps": 775, "loss": 0.4165, "lr": 1.6991566859004534e-05, "epoch": 2.958199356913183, "percentage": 59.35, "elapsed_time": "5:34:25", "remaining_time": "3:49:00"}
461
+ {"current_steps": 461, "total_steps": 775, "loss": 0.434, "lr": 1.6902477278204875e-05, "epoch": 2.964630225080386, "percentage": 59.48, "elapsed_time": "5:35:12", "remaining_time": "3:48:18"}
462
+ {"current_steps": 462, "total_steps": 775, "loss": 0.4111, "lr": 1.681345062598852e-05, "epoch": 2.9710610932475885, "percentage": 59.61, "elapsed_time": "5:35:51", "remaining_time": "3:47:32"}
463
+ {"current_steps": 463, "total_steps": 775, "loss": 0.4467, "lr": 1.6724488711001166e-05, "epoch": 2.977491961414791, "percentage": 59.74, "elapsed_time": "5:36:29", "remaining_time": "3:46:44"}
464
+ {"current_steps": 464, "total_steps": 775, "loss": 0.4209, "lr": 1.66355933405733e-05, "epoch": 2.9839228295819935, "percentage": 59.87, "elapsed_time": "5:37:05", "remaining_time": "3:45:56"}
465
+ {"current_steps": 465, "total_steps": 775, "loss": 0.4199, "lr": 1.6546766320683532e-05, "epoch": 2.990353697749196, "percentage": 60.0, "elapsed_time": "5:37:46", "remaining_time": "3:45:11"}
466
+ {"current_steps": 466, "total_steps": 775, "loss": 0.3981, "lr": 1.6458009455921842e-05, "epoch": 2.996784565916399, "percentage": 60.13, "elapsed_time": "5:38:24", "remaining_time": "3:44:23"}
467
+ {"current_steps": 467, "total_steps": 775, "loss": 0.3891, "lr": 1.636932454945297e-05, "epoch": 3.0032154340836015, "percentage": 60.26, "elapsed_time": "5:39:59", "remaining_time": "3:44:14"}
468
+ {"current_steps": 468, "total_steps": 775, "loss": 0.3477, "lr": 1.6280713402979784e-05, "epoch": 3.009646302250804, "percentage": 60.39, "elapsed_time": "5:40:46", "remaining_time": "3:43:32"}
469
+ {"current_steps": 469, "total_steps": 775, "loss": 0.3435, "lr": 1.619217781670663e-05, "epoch": 3.0160771704180065, "percentage": 60.52, "elapsed_time": "5:41:31", "remaining_time": "3:42:49"}