| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 20.337552742616033, | |
| "global_step": 2400, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 3.39, | |
| "learning_rate": 0.00023999999999999998, | |
| "loss": 6.3317, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 3.39, | |
| "eval_loss": 3.161163806915283, | |
| "eval_runtime": 205.0119, | |
| "eval_samples_per_second": 8.687, | |
| "eval_wer": 1.0, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 6.78, | |
| "learning_rate": 0.0002703947368421052, | |
| "loss": 1.6739, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 6.78, | |
| "eval_loss": 0.6274727582931519, | |
| "eval_runtime": 205.8605, | |
| "eval_samples_per_second": 8.651, | |
| "eval_wer": 1.008992553042012, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 10.17, | |
| "learning_rate": 0.00023092105263157893, | |
| "loss": 0.3726, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 10.17, | |
| "eval_loss": 0.6007506847381592, | |
| "eval_runtime": 208.514, | |
| "eval_samples_per_second": 8.541, | |
| "eval_wer": 0.9197695658282984, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 13.56, | |
| "learning_rate": 0.00019144736842105262, | |
| "loss": 0.2323, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 13.56, | |
| "eval_loss": 0.62809157371521, | |
| "eval_runtime": 207.5386, | |
| "eval_samples_per_second": 8.582, | |
| "eval_wer": 0.9513840101166222, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 16.95, | |
| "learning_rate": 0.00015197368421052628, | |
| "loss": 0.1598, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 16.95, | |
| "eval_loss": 0.679410994052887, | |
| "eval_runtime": 213.3742, | |
| "eval_samples_per_second": 8.347, | |
| "eval_wer": 0.8642686525221301, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 20.34, | |
| "learning_rate": 0.0001125, | |
| "loss": 0.1258, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 20.34, | |
| "eval_loss": 0.7365503311157227, | |
| "eval_runtime": 210.0426, | |
| "eval_samples_per_second": 8.479, | |
| "eval_wer": 0.8294225094843333, | |
| "step": 2400 | |
| } | |
| ], | |
| "max_steps": 3540, | |
| "num_train_epochs": 30, | |
| "total_flos": 1.022364819420586e+19, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |