{ "best_metric": null, "best_model_checkpoint": null, "epoch": 26.395939086294415, "global_step": 5200, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 2.03, "learning_rate": 0.0002, "loss": 0.2479, "step": 400 }, { "epoch": 2.03, "eval_loss": 0.47397056221961975, "eval_runtime": 121.9231, "eval_samples_per_second": 17.47, "eval_steps_per_second": 2.19, "eval_wer": 0.5506920619898261, "step": 400 }, { "epoch": 4.06, "learning_rate": 0.00018605221657613458, "loss": 0.2306, "step": 800 }, { "epoch": 4.06, "eval_loss": 0.4647212624549866, "eval_runtime": 123.4969, "eval_samples_per_second": 17.247, "eval_steps_per_second": 2.162, "eval_wer": 0.5497456524310895, "step": 800 }, { "epoch": 6.09, "learning_rate": 0.00017206938847029964, "loss": 0.201, "step": 1200 }, { "epoch": 6.09, "eval_loss": 0.43976637721061707, "eval_runtime": 125.3202, "eval_samples_per_second": 16.996, "eval_steps_per_second": 2.131, "eval_wer": 0.5441854962735123, "step": 1200 }, { "epoch": 8.12, "learning_rate": 0.0001580515156824952, "loss": 0.2676, "step": 1600 }, { "epoch": 8.12, "eval_loss": 0.46590062975883484, "eval_runtime": 127.6886, "eval_samples_per_second": 16.681, "eval_steps_per_second": 2.091, "eval_wer": 0.5331834851532, "step": 1600 }, { "epoch": 10.15, "learning_rate": 0.00014403364289469075, "loss": 0.2295, "step": 2000 }, { "epoch": 10.15, "eval_loss": 0.433741956949234, "eval_runtime": 126.2574, "eval_samples_per_second": 16.87, "eval_steps_per_second": 2.115, "eval_wer": 0.5302259552821483, "step": 2000 }, { "epoch": 12.18, "learning_rate": 0.00013001577010688628, "loss": 0.2011, "step": 2400 }, { "epoch": 12.18, "eval_loss": 0.43763187527656555, "eval_runtime": 127.2021, "eval_samples_per_second": 16.745, "eval_steps_per_second": 2.099, "eval_wer": 0.5218265704483616, "step": 2400 }, { "epoch": 14.21, "learning_rate": 0.00011599789731908184, "loss": 0.1883, "step": 2800 }, { "epoch": 14.21, "eval_loss": 0.4427320659160614, "eval_runtime": 133.553, "eval_samples_per_second": 15.949, "eval_steps_per_second": 1.999, "eval_wer": 0.5275050278007808, "step": 2800 }, { "epoch": 16.24, "learning_rate": 0.00010198002453127737, "loss": 0.1599, "step": 3200 }, { "epoch": 16.24, "eval_loss": 0.4528989791870117, "eval_runtime": 130.4751, "eval_samples_per_second": 16.325, "eval_steps_per_second": 2.046, "eval_wer": 0.5167396190701526, "step": 3200 }, { "epoch": 18.27, "learning_rate": 8.796215174347293e-05, "loss": 0.1473, "step": 3600 }, { "epoch": 18.27, "eval_loss": 0.46878582239151, "eval_runtime": 130.7961, "eval_samples_per_second": 16.285, "eval_steps_per_second": 2.041, "eval_wer": 0.5125990772506802, "step": 3600 }, { "epoch": 20.3, "learning_rate": 7.394427895566848e-05, "loss": 0.1306, "step": 4000 }, { "epoch": 20.3, "eval_loss": 0.46525096893310547, "eval_runtime": 130.9702, "eval_samples_per_second": 16.263, "eval_steps_per_second": 2.039, "eval_wer": 0.5118892700816279, "step": 4000 }, { "epoch": 22.34, "learning_rate": 5.9926406167864026e-05, "loss": 0.1222, "step": 4400 }, { "epoch": 22.34, "eval_loss": 0.4552956223487854, "eval_runtime": 132.9038, "eval_samples_per_second": 16.027, "eval_steps_per_second": 2.009, "eval_wer": 0.5014787649355259, "step": 4400 }, { "epoch": 24.37, "learning_rate": 4.5908533380059577e-05, "loss": 0.1097, "step": 4800 }, { "epoch": 24.37, "eval_loss": 0.4868864417076111, "eval_runtime": 128.1956, "eval_samples_per_second": 16.615, "eval_steps_per_second": 2.083, "eval_wer": 0.5012421625458418, "step": 4800 }, { "epoch": 26.4, "learning_rate": 3.189066059225513e-05, "loss": 0.0988, "step": 5200 }, { "epoch": 26.4, "eval_loss": 0.45241138339042664, "eval_runtime": 127.9868, "eval_samples_per_second": 16.642, "eval_steps_per_second": 2.086, "eval_wer": 0.4968650183366852, "step": 5200 } ], "max_steps": 6107, "num_train_epochs": 31, "total_flos": 1.2361810216998281e+19, "trial_name": null, "trial_params": null }