| { |
| "best_metric": 98.29925818708159, |
| "best_model_checkpoint": "./whisper-bangla-dialect/checkpoint-1620", |
| "epoch": 4.992295839753467, |
| "eval_steps": 500, |
| "global_step": 1620, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.15408320493066255, |
| "grad_norm": 4.895554065704346, |
| "learning_rate": 4.9000000000000005e-06, |
| "loss": 1.7624, |
| "step": 50 |
| }, |
| { |
| "epoch": 0.3081664098613251, |
| "grad_norm": 3.634995460510254, |
| "learning_rate": 9.9e-06, |
| "loss": 1.5119, |
| "step": 100 |
| }, |
| { |
| "epoch": 0.4622496147919877, |
| "grad_norm": 2.232389211654663, |
| "learning_rate": 1.4900000000000001e-05, |
| "loss": 1.4947, |
| "step": 150 |
| }, |
| { |
| "epoch": 0.6163328197226502, |
| "grad_norm": 2.1193408966064453, |
| "learning_rate": 1.9900000000000003e-05, |
| "loss": 1.473, |
| "step": 200 |
| }, |
| { |
| "epoch": 0.7704160246533128, |
| "grad_norm": 1.3372803926467896, |
| "learning_rate": 1.9941297059390586e-05, |
| "loss": 1.4826, |
| "step": 250 |
| }, |
| { |
| "epoch": 0.9244992295839753, |
| "grad_norm": 3.3661787509918213, |
| "learning_rate": 1.97610942687054e-05, |
| "loss": 1.4619, |
| "step": 300 |
| }, |
| { |
| "epoch": 0.9984591679506933, |
| "eval_loss": 1.4470419883728027, |
| "eval_norm_levenshtein_similarity": 95.46770399855255, |
| "eval_runtime": 351.6357, |
| "eval_samples_per_second": 1.641, |
| "eval_steps_per_second": 0.412, |
| "eval_wer": 5.913978494623656, |
| "step": 324 |
| }, |
| { |
| "epoch": 1.078582434514638, |
| "grad_norm": 1.7728036642074585, |
| "learning_rate": 1.946156998812636e-05, |
| "loss": 1.457, |
| "step": 350 |
| }, |
| { |
| "epoch": 1.2326656394453004, |
| "grad_norm": 2.1206459999084473, |
| "learning_rate": 1.9046385659950213e-05, |
| "loss": 1.4547, |
| "step": 400 |
| }, |
| { |
| "epoch": 1.386748844375963, |
| "grad_norm": 1.305923342704773, |
| "learning_rate": 1.8520616577095447e-05, |
| "loss": 1.4502, |
| "step": 450 |
| }, |
| { |
| "epoch": 1.5408320493066254, |
| "grad_norm": 3.612596035003662, |
| "learning_rate": 1.7890689841747463e-05, |
| "loss": 1.4495, |
| "step": 500 |
| }, |
| { |
| "epoch": 1.694915254237288, |
| "grad_norm": 1.3930879831314087, |
| "learning_rate": 1.716430579922786e-05, |
| "loss": 1.442, |
| "step": 550 |
| }, |
| { |
| "epoch": 1.8489984591679507, |
| "grad_norm": 1.770542025566101, |
| "learning_rate": 1.6350343907495195e-05, |
| "loss": 1.4445, |
| "step": 600 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_loss": 1.434973120689392, |
| "eval_norm_levenshtein_similarity": 96.86991134430976, |
| "eval_runtime": 348.1264, |
| "eval_samples_per_second": 1.657, |
| "eval_steps_per_second": 0.417, |
| "eval_wer": 4.69208211143695, |
| "step": 649 |
| }, |
| { |
| "epoch": 2.0030816640986133, |
| "grad_norm": 1.691462755203247, |
| "learning_rate": 1.54587541929466e-05, |
| "loss": 1.4416, |
| "step": 650 |
| }, |
| { |
| "epoch": 2.157164869029276, |
| "grad_norm": 1.5759495496749878, |
| "learning_rate": 1.4500435619385243e-05, |
| "loss": 1.4332, |
| "step": 700 |
| }, |
| { |
| "epoch": 2.3112480739599386, |
| "grad_norm": 1.881423830986023, |
| "learning_rate": 1.348710285699486e-05, |
| "loss": 1.4319, |
| "step": 750 |
| }, |
| { |
| "epoch": 2.4653312788906008, |
| "grad_norm": 1.305807113647461, |
| "learning_rate": 1.2431143079962917e-05, |
| "loss": 1.4324, |
| "step": 800 |
| }, |
| { |
| "epoch": 2.6194144838212634, |
| "grad_norm": 1.3964393138885498, |
| "learning_rate": 1.1345464543285721e-05, |
| "loss": 1.4343, |
| "step": 850 |
| }, |
| { |
| "epoch": 2.773497688751926, |
| "grad_norm": 1.2005863189697266, |
| "learning_rate": 1.0243338789781722e-05, |
| "loss": 1.431, |
| "step": 900 |
| }, |
| { |
| "epoch": 2.9275808936825887, |
| "grad_norm": 0.7941581606864929, |
| "learning_rate": 9.13823841620477e-06, |
| "loss": 1.432, |
| "step": 950 |
| }, |
| { |
| "epoch": 2.9984591679506933, |
| "eval_loss": 1.427686095237732, |
| "eval_norm_levenshtein_similarity": 97.37651528858332, |
| "eval_runtime": 346.2984, |
| "eval_samples_per_second": 1.666, |
| "eval_steps_per_second": 0.419, |
| "eval_wer": 3.5679374389051812, |
| "step": 973 |
| }, |
| { |
| "epoch": 3.0816640986132513, |
| "grad_norm": 0.9101853966712952, |
| "learning_rate": 8.043672381635423e-06, |
| "loss": 1.4277, |
| "step": 1000 |
| }, |
| { |
| "epoch": 3.2357473035439135, |
| "grad_norm": 0.7756341695785522, |
| "learning_rate": 6.9730208713722456e-06, |
| "loss": 1.425, |
| "step": 1050 |
| }, |
| { |
| "epoch": 3.389830508474576, |
| "grad_norm": 1.314003586769104, |
| "learning_rate": 5.9393717349785064e-06, |
| "loss": 1.4231, |
| "step": 1100 |
| }, |
| { |
| "epoch": 3.5439137134052388, |
| "grad_norm": 2.220507860183716, |
| "learning_rate": 4.955360497897032e-06, |
| "loss": 1.4263, |
| "step": 1150 |
| }, |
| { |
| "epoch": 3.6979969183359014, |
| "grad_norm": 0.39077863097190857, |
| "learning_rate": 4.033015902361899e-06, |
| "loss": 1.423, |
| "step": 1200 |
| }, |
| { |
| "epoch": 3.852080123266564, |
| "grad_norm": 0.3764391839504242, |
| "learning_rate": 3.183612865744584e-06, |
| "loss": 1.4232, |
| "step": 1250 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_loss": 1.4236760139465332, |
| "eval_norm_levenshtein_similarity": 98.16356070200833, |
| "eval_runtime": 346.601, |
| "eval_samples_per_second": 1.665, |
| "eval_steps_per_second": 0.418, |
| "eval_wer": 2.3949169110459434, |
| "step": 1298 |
| }, |
| { |
| "epoch": 4.006163328197227, |
| "grad_norm": 0.7122958898544312, |
| "learning_rate": 2.4175346537998824e-06, |
| "loss": 1.4221, |
| "step": 1300 |
| }, |
| { |
| "epoch": 4.160246533127889, |
| "grad_norm": 0.48986372351646423, |
| "learning_rate": 1.744145953632339e-06, |
| "loss": 1.4217, |
| "step": 1350 |
| }, |
| { |
| "epoch": 4.314329738058552, |
| "grad_norm": 1.2581398487091064, |
| "learning_rate": 1.1716783979636393e-06, |
| "loss": 1.4206, |
| "step": 1400 |
| }, |
| { |
| "epoch": 4.4684129429892145, |
| "grad_norm": 0.4906635880470276, |
| "learning_rate": 7.071299400742126e-07, |
| "loss": 1.4204, |
| "step": 1450 |
| }, |
| { |
| "epoch": 4.622496147919877, |
| "grad_norm": 0.4289968013763428, |
| "learning_rate": 3.56179309479151e-07, |
| "loss": 1.4199, |
| "step": 1500 |
| }, |
| { |
| "epoch": 4.776579352850539, |
| "grad_norm": 0.8411958813667297, |
| "learning_rate": 1.231165940486234e-07, |
| "loss": 1.4201, |
| "step": 1550 |
| }, |
| { |
| "epoch": 4.9306625577812015, |
| "grad_norm": 0.30201002955436707, |
| "learning_rate": 1.079079715032183e-08, |
| "loss": 1.422, |
| "step": 1600 |
| }, |
| { |
| "epoch": 4.992295839753467, |
| "eval_loss": 1.4230467081069946, |
| "eval_norm_levenshtein_similarity": 98.29925818708159, |
| "eval_runtime": 350.1125, |
| "eval_samples_per_second": 1.648, |
| "eval_steps_per_second": 0.414, |
| "eval_wer": 2.297165200391007, |
| "step": 1620 |
| } |
| ], |
| "logging_steps": 50, |
| "max_steps": 1620, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 5, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 7.47782489309184e+18, |
| "train_batch_size": 4, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|