{ "best_metric": 15.23105066412153, "best_model_checkpoint": "./whisper-small-dv-syn/checkpoint-4000", "epoch": 2.7416038382453736, "global_step": 4000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.03, "learning_rate": 9.4e-06, "loss": 4.2925, "step": 50 }, { "epoch": 0.07, "learning_rate": 1e-05, "loss": 1.5599, "step": 100 }, { "epoch": 0.1, "learning_rate": 1e-05, "loss": 0.7325, "step": 150 }, { "epoch": 0.14, "learning_rate": 1e-05, "loss": 0.1344, "step": 200 }, { "epoch": 0.17, "learning_rate": 1e-05, "loss": 0.0581, "step": 250 }, { "epoch": 0.21, "learning_rate": 1e-05, "loss": 0.0471, "step": 300 }, { "epoch": 0.24, "learning_rate": 1e-05, "loss": 0.0406, "step": 350 }, { "epoch": 0.27, "learning_rate": 1e-05, "loss": 0.0377, "step": 400 }, { "epoch": 0.31, "learning_rate": 1e-05, "loss": 0.034, "step": 450 }, { "epoch": 0.34, "learning_rate": 1e-05, "loss": 0.0327, "step": 500 }, { "epoch": 0.38, "learning_rate": 1e-05, "loss": 0.0304, "step": 550 }, { "epoch": 0.41, "learning_rate": 1e-05, "loss": 0.0294, "step": 600 }, { "epoch": 0.45, "learning_rate": 1e-05, "loss": 0.0275, "step": 650 }, { "epoch": 0.48, "learning_rate": 1e-05, "loss": 0.0268, "step": 700 }, { "epoch": 0.51, "learning_rate": 1e-05, "loss": 0.0261, "step": 750 }, { "epoch": 0.55, "learning_rate": 1e-05, "loss": 0.0246, "step": 800 }, { "epoch": 0.58, "learning_rate": 1e-05, "loss": 0.0242, "step": 850 }, { "epoch": 0.62, "learning_rate": 1e-05, "loss": 0.0243, "step": 900 }, { "epoch": 0.65, "learning_rate": 1e-05, "loss": 0.0228, "step": 950 }, { "epoch": 0.69, "learning_rate": 1e-05, "loss": 0.0233, "step": 1000 }, { "epoch": 0.69, "eval_loss": 0.23616750538349152, "eval_runtime": 227.0219, "eval_samples_per_second": 2.202, "eval_steps_per_second": 0.07, "eval_wer": 18.86582359023304, "eval_wer_ortho": 75.35455404979514, "step": 1000 }, { "epoch": 0.72, "learning_rate": 1e-05, "loss": 0.0219, "step": 1050 }, { "epoch": 0.75, "learning_rate": 1e-05, "loss": 0.0218, "step": 1100 }, { "epoch": 0.79, "learning_rate": 1e-05, "loss": 0.0213, "step": 1150 }, { "epoch": 0.82, "learning_rate": 1e-05, "loss": 0.0207, "step": 1200 }, { "epoch": 0.86, "learning_rate": 1e-05, "loss": 0.021, "step": 1250 }, { "epoch": 0.89, "learning_rate": 1e-05, "loss": 0.0201, "step": 1300 }, { "epoch": 0.93, "learning_rate": 1e-05, "loss": 0.0206, "step": 1350 }, { "epoch": 0.96, "learning_rate": 1e-05, "loss": 0.0194, "step": 1400 }, { "epoch": 0.99, "learning_rate": 1e-05, "loss": 0.0193, "step": 1450 }, { "epoch": 1.03, "learning_rate": 1e-05, "loss": 0.0169, "step": 1500 }, { "epoch": 1.06, "learning_rate": 1e-05, "loss": 0.0157, "step": 1550 }, { "epoch": 1.1, "learning_rate": 1e-05, "loss": 0.0154, "step": 1600 }, { "epoch": 1.13, "learning_rate": 1e-05, "loss": 0.0159, "step": 1650 }, { "epoch": 1.17, "learning_rate": 1e-05, "loss": 0.0153, "step": 1700 }, { "epoch": 1.2, "learning_rate": 1e-05, "loss": 0.0156, "step": 1750 }, { "epoch": 1.23, "learning_rate": 1e-05, "loss": 0.0151, "step": 1800 }, { "epoch": 1.27, "learning_rate": 1e-05, "loss": 0.0151, "step": 1850 }, { "epoch": 1.3, "learning_rate": 1e-05, "loss": 0.0152, "step": 1900 }, { "epoch": 1.34, "learning_rate": 1e-05, "loss": 0.015, "step": 1950 }, { "epoch": 1.37, "learning_rate": 1e-05, "loss": 0.0147, "step": 2000 }, { "epoch": 1.37, "eval_loss": 0.21357361972332, "eval_runtime": 225.8202, "eval_samples_per_second": 2.214, "eval_steps_per_second": 0.071, "eval_wer": 16.734271852382086, "eval_wer_ortho": 70.94232587456666, "step": 2000 }, { "epoch": 1.41, "learning_rate": 1e-05, "loss": 0.0149, "step": 2050 }, { "epoch": 1.44, "learning_rate": 1e-05, "loss": 0.0148, "step": 2100 }, { "epoch": 1.47, "learning_rate": 1e-05, "loss": 0.0152, "step": 2150 }, { "epoch": 1.51, "learning_rate": 1e-05, "loss": 0.0146, "step": 2200 }, { "epoch": 1.54, "learning_rate": 1e-05, "loss": 0.0146, "step": 2250 }, { "epoch": 1.58, "learning_rate": 1e-05, "loss": 0.0141, "step": 2300 }, { "epoch": 1.61, "learning_rate": 1e-05, "loss": 0.0143, "step": 2350 }, { "epoch": 1.64, "learning_rate": 1e-05, "loss": 0.0144, "step": 2400 }, { "epoch": 1.68, "learning_rate": 1e-05, "loss": 0.0142, "step": 2450 }, { "epoch": 1.71, "learning_rate": 1e-05, "loss": 0.0145, "step": 2500 }, { "epoch": 1.75, "learning_rate": 1e-05, "loss": 0.014, "step": 2550 }, { "epoch": 1.78, "learning_rate": 1e-05, "loss": 0.0141, "step": 2600 }, { "epoch": 1.82, "learning_rate": 1e-05, "loss": 0.0142, "step": 2650 }, { "epoch": 1.85, "learning_rate": 1e-05, "loss": 0.0143, "step": 2700 }, { "epoch": 1.88, "learning_rate": 1e-05, "loss": 0.0137, "step": 2750 }, { "epoch": 1.92, "learning_rate": 1e-05, "loss": 0.0137, "step": 2800 }, { "epoch": 1.95, "learning_rate": 1e-05, "loss": 0.0144, "step": 2850 }, { "epoch": 1.99, "learning_rate": 1e-05, "loss": 0.0138, "step": 2900 }, { "epoch": 2.02, "learning_rate": 1e-05, "loss": 0.0113, "step": 2950 }, { "epoch": 2.06, "learning_rate": 1e-05, "loss": 0.0102, "step": 3000 }, { "epoch": 2.06, "eval_loss": 0.20163850486278534, "eval_runtime": 226.4401, "eval_samples_per_second": 2.208, "eval_steps_per_second": 0.071, "eval_wer": 15.57305336832896, "eval_wer_ortho": 65.64765206429247, "step": 3000 }, { "epoch": 2.09, "learning_rate": 1e-05, "loss": 0.0099, "step": 3050 }, { "epoch": 2.12, "learning_rate": 1e-05, "loss": 0.01, "step": 3100 }, { "epoch": 2.16, "learning_rate": 1e-05, "loss": 0.0099, "step": 3150 }, { "epoch": 2.19, "learning_rate": 1e-05, "loss": 0.0098, "step": 3200 }, { "epoch": 2.23, "learning_rate": 1e-05, "loss": 0.0107, "step": 3250 }, { "epoch": 2.26, "learning_rate": 1e-05, "loss": 0.0098, "step": 3300 }, { "epoch": 2.3, "learning_rate": 1e-05, "loss": 0.01, "step": 3350 }, { "epoch": 2.33, "learning_rate": 1e-05, "loss": 0.0103, "step": 3400 }, { "epoch": 2.36, "learning_rate": 1e-05, "loss": 0.0106, "step": 3450 }, { "epoch": 2.4, "learning_rate": 1e-05, "loss": 0.0102, "step": 3500 }, { "epoch": 2.43, "learning_rate": 1e-05, "loss": 0.0103, "step": 3550 }, { "epoch": 2.47, "learning_rate": 1e-05, "loss": 0.0099, "step": 3600 }, { "epoch": 2.5, "learning_rate": 1e-05, "loss": 0.0103, "step": 3650 }, { "epoch": 2.54, "learning_rate": 1e-05, "loss": 0.0102, "step": 3700 }, { "epoch": 2.57, "learning_rate": 1e-05, "loss": 0.0105, "step": 3750 }, { "epoch": 2.6, "learning_rate": 1e-05, "loss": 0.0104, "step": 3800 }, { "epoch": 2.64, "learning_rate": 1e-05, "loss": 0.0101, "step": 3850 }, { "epoch": 2.67, "learning_rate": 1e-05, "loss": 0.01, "step": 3900 }, { "epoch": 2.71, "learning_rate": 1e-05, "loss": 0.0101, "step": 3950 }, { "epoch": 2.74, "learning_rate": 1e-05, "loss": 0.01, "step": 4000 }, { "epoch": 2.74, "eval_loss": 0.20110772550106049, "eval_runtime": 225.7624, "eval_samples_per_second": 2.215, "eval_steps_per_second": 0.071, "eval_wer": 15.23105066412153, "eval_wer_ortho": 66.34100220611408, "step": 4000 } ], "max_steps": 4000, "num_train_epochs": 3, "total_flos": 1.4770435676258304e+20, "trial_name": null, "trial_params": null }