| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 15.0, | |
| "global_step": 1635, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.92, | |
| "eval_loss": 3.585611343383789, | |
| "eval_runtime": 69.1996, | |
| "eval_samples_per_second": 23.801, | |
| "eval_steps_per_second": 2.977, | |
| "eval_wer": 1.0, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 1.83, | |
| "eval_loss": 3.0358903408050537, | |
| "eval_runtime": 70.0289, | |
| "eval_samples_per_second": 23.519, | |
| "eval_steps_per_second": 2.942, | |
| "eval_wer": 0.9998978653865795, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 2.75, | |
| "eval_loss": 0.9341107606887817, | |
| "eval_runtime": 69.5975, | |
| "eval_samples_per_second": 23.665, | |
| "eval_steps_per_second": 2.96, | |
| "eval_wer": 0.7737718312736186, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 3.67, | |
| "eval_loss": 0.5874470472335815, | |
| "eval_runtime": 69.8546, | |
| "eval_samples_per_second": 23.578, | |
| "eval_steps_per_second": 2.949, | |
| "eval_wer": 0.6386477377183127, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 4.59, | |
| "learning_rate": 0.0002988, | |
| "loss": 3.214, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 4.59, | |
| "eval_loss": 0.5316070914268494, | |
| "eval_runtime": 69.5825, | |
| "eval_samples_per_second": 23.67, | |
| "eval_steps_per_second": 2.961, | |
| "eval_wer": 0.5525482586048411, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 5.5, | |
| "eval_loss": 0.45860984921455383, | |
| "eval_runtime": 68.7814, | |
| "eval_samples_per_second": 23.945, | |
| "eval_steps_per_second": 2.995, | |
| "eval_wer": 0.519252374629762, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 6.42, | |
| "eval_loss": 0.45034125447273254, | |
| "eval_runtime": 67.077, | |
| "eval_samples_per_second": 24.554, | |
| "eval_steps_per_second": 3.071, | |
| "eval_wer": 0.4605249719129813, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 7.34, | |
| "eval_loss": 0.41716983914375305, | |
| "eval_runtime": 68.1176, | |
| "eval_samples_per_second": 24.179, | |
| "eval_steps_per_second": 3.024, | |
| "eval_wer": 0.4390767030946788, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 8.26, | |
| "eval_loss": 0.4093872606754303, | |
| "eval_runtime": 69.7848, | |
| "eval_samples_per_second": 23.601, | |
| "eval_steps_per_second": 2.952, | |
| "eval_wer": 0.41854764579716064, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 9.17, | |
| "learning_rate": 0.00016837004405286342, | |
| "loss": 0.2284, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 9.17, | |
| "eval_loss": 0.4091317355632782, | |
| "eval_runtime": 70.1477, | |
| "eval_samples_per_second": 23.479, | |
| "eval_steps_per_second": 2.937, | |
| "eval_wer": 0.39985701154121134, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 10.09, | |
| "eval_loss": 0.39890098571777344, | |
| "eval_runtime": 69.3262, | |
| "eval_samples_per_second": 23.757, | |
| "eval_steps_per_second": 2.971, | |
| "eval_wer": 0.40404453069145135, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 11.01, | |
| "eval_loss": 0.4066716432571411, | |
| "eval_runtime": 69.7662, | |
| "eval_samples_per_second": 23.607, | |
| "eval_steps_per_second": 2.953, | |
| "eval_wer": 0.3930139924420386, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 11.93, | |
| "eval_loss": 0.40022560954093933, | |
| "eval_runtime": 67.6908, | |
| "eval_samples_per_second": 24.331, | |
| "eval_steps_per_second": 3.043, | |
| "eval_wer": 0.3775916658155449, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 12.84, | |
| "eval_loss": 0.3982270061969757, | |
| "eval_runtime": 66.5115, | |
| "eval_samples_per_second": 24.763, | |
| "eval_steps_per_second": 3.097, | |
| "eval_wer": 0.36492697375140437, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 13.76, | |
| "learning_rate": 3.621145374449339e-05, | |
| "loss": 0.1029, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 13.76, | |
| "eval_loss": 0.38969308137893677, | |
| "eval_runtime": 65.75, | |
| "eval_samples_per_second": 25.049, | |
| "eval_steps_per_second": 3.133, | |
| "eval_wer": 0.3703401082626902, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 14.68, | |
| "eval_loss": 0.3836365342140198, | |
| "eval_runtime": 65.8183, | |
| "eval_samples_per_second": 25.023, | |
| "eval_steps_per_second": 3.13, | |
| "eval_wer": 0.3566540700643448, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 15.0, | |
| "step": 1635, | |
| "total_flos": 6.429866751096261e+18, | |
| "train_loss": 1.0907053682053125, | |
| "train_runtime": 3864.236, | |
| "train_samples_per_second": 13.501, | |
| "train_steps_per_second": 0.423 | |
| } | |
| ], | |
| "max_steps": 1635, | |
| "num_train_epochs": 15, | |
| "total_flos": 6.429866751096261e+18, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |