{ "best_metric": 0.17176076769828796, "best_model_checkpoint": "wavlm-korean-phoneme-v3/checkpoint-7500", "epoch": 11.980047885075818, "global_step": 7500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.16, "learning_rate": 2.9999999999999997e-05, "loss": 5.4024, "step": 100 }, { "epoch": 0.32, "learning_rate": 5.9999999999999995e-05, "loss": 2.7142, "step": 200 }, { "epoch": 0.48, "learning_rate": 8.999999999999999e-05, "loss": 2.6325, "step": 300 }, { "epoch": 0.64, "learning_rate": 0.00011999999999999999, "loss": 2.4302, "step": 400 }, { "epoch": 0.8, "learning_rate": 0.00015, "loss": 1.5708, "step": 500 }, { "epoch": 0.8, "eval_cer": 0.5738695561575328, "eval_loss": 1.0533815622329712, "eval_runtime": 257.0727, "eval_samples_per_second": 8.663, "eval_steps_per_second": 1.085, "step": 500 }, { "epoch": 0.96, "learning_rate": 0.00017999999999999998, "loss": 0.9274, "step": 600 }, { "epoch": 1.12, "learning_rate": 0.00020999999999999998, "loss": 0.7045, "step": 700 }, { "epoch": 1.28, "learning_rate": 0.00023999999999999998, "loss": 0.5879, "step": 800 }, { "epoch": 1.44, "learning_rate": 0.00027, "loss": 0.5315, "step": 900 }, { "epoch": 1.6, "learning_rate": 0.0003, "loss": 0.4842, "step": 1000 }, { "epoch": 1.6, "eval_cer": 0.2984314260873314, "eval_loss": 0.4019908010959625, "eval_runtime": 213.6605, "eval_samples_per_second": 10.423, "eval_steps_per_second": 1.306, "step": 1000 }, { "epoch": 1.76, "learning_rate": 0.00029900990099009897, "loss": 0.4486, "step": 1100 }, { "epoch": 1.92, "learning_rate": 0.000298019801980198, "loss": 0.4091, "step": 1200 }, { "epoch": 2.08, "learning_rate": 0.000297029702970297, "loss": 0.3663, "step": 1300 }, { "epoch": 2.24, "learning_rate": 0.000296039603960396, "loss": 0.3333, "step": 1400 }, { "epoch": 2.4, "learning_rate": 0.000295049504950495, "loss": 0.3181, "step": 1500 }, { "epoch": 2.4, "eval_cer": 0.20734923223947518, "eval_loss": 0.2830340266227722, "eval_runtime": 213.9837, "eval_samples_per_second": 10.407, "eval_steps_per_second": 1.304, "step": 1500 }, { "epoch": 2.56, "learning_rate": 0.000294059405940594, "loss": 0.3238, "step": 1600 }, { "epoch": 2.72, "learning_rate": 0.00029306930693069307, "loss": 0.3005, "step": 1700 }, { "epoch": 2.87, "learning_rate": 0.00029207920792079207, "loss": 0.3013, "step": 1800 }, { "epoch": 3.04, "learning_rate": 0.00029108910891089107, "loss": 0.2795, "step": 1900 }, { "epoch": 3.19, "learning_rate": 0.00029009900990099006, "loss": 0.2421, "step": 2000 }, { "epoch": 3.19, "eval_cer": 0.17599212479611415, "eval_loss": 0.2522282004356384, "eval_runtime": 210.0211, "eval_samples_per_second": 10.604, "eval_steps_per_second": 1.328, "step": 2000 }, { "epoch": 3.35, "learning_rate": 0.00028910891089108906, "loss": 0.2436, "step": 2100 }, { "epoch": 3.51, "learning_rate": 0.00028811881188118806, "loss": 0.234, "step": 2200 }, { "epoch": 3.67, "learning_rate": 0.0002871287128712871, "loss": 0.2347, "step": 2300 }, { "epoch": 3.83, "learning_rate": 0.0002861386138613861, "loss": 0.2356, "step": 2400 }, { "epoch": 3.99, "learning_rate": 0.0002851485148514851, "loss": 0.2255, "step": 2500 }, { "epoch": 3.99, "eval_cer": 0.1599614862291713, "eval_loss": 0.22431106865406036, "eval_runtime": 203.7474, "eval_samples_per_second": 10.93, "eval_steps_per_second": 1.369, "step": 2500 }, { "epoch": 4.15, "learning_rate": 0.00028415841584158416, "loss": 0.1892, "step": 2600 }, { "epoch": 4.31, "learning_rate": 0.00028316831683168316, "loss": 0.1927, "step": 2700 }, { "epoch": 4.47, "learning_rate": 0.00028217821782178216, "loss": 0.1832, "step": 2800 }, { "epoch": 4.63, "learning_rate": 0.00028118811881188116, "loss": 0.1914, "step": 2900 }, { "epoch": 4.79, "learning_rate": 0.00028019801980198015, "loss": 0.1879, "step": 3000 }, { "epoch": 4.79, "eval_cer": 0.14389492063720172, "eval_loss": 0.21251684427261353, "eval_runtime": 199.7095, "eval_samples_per_second": 11.151, "eval_steps_per_second": 1.397, "step": 3000 }, { "epoch": 4.95, "learning_rate": 0.0002792079207920792, "loss": 0.186, "step": 3100 }, { "epoch": 5.11, "learning_rate": 0.0002782178217821782, "loss": 0.1716, "step": 3200 }, { "epoch": 5.27, "learning_rate": 0.0002772277227722772, "loss": 0.1588, "step": 3300 }, { "epoch": 5.43, "learning_rate": 0.0002762376237623762, "loss": 0.1555, "step": 3400 }, { "epoch": 5.59, "learning_rate": 0.0002752475247524752, "loss": 0.1604, "step": 3500 }, { "epoch": 5.59, "eval_cer": 0.13375631417464845, "eval_loss": 0.2036324292421341, "eval_runtime": 200.1074, "eval_samples_per_second": 11.129, "eval_steps_per_second": 1.394, "step": 3500 }, { "epoch": 5.75, "learning_rate": 0.0002742574257425742, "loss": 0.158, "step": 3600 }, { "epoch": 5.91, "learning_rate": 0.00027326732673267325, "loss": 0.1619, "step": 3700 }, { "epoch": 6.07, "learning_rate": 0.00027227722772277225, "loss": 0.1497, "step": 3800 }, { "epoch": 6.23, "learning_rate": 0.00027128712871287125, "loss": 0.1397, "step": 3900 }, { "epoch": 6.39, "learning_rate": 0.0002702970297029703, "loss": 0.1382, "step": 4000 }, { "epoch": 6.39, "eval_cer": 0.127418786959927, "eval_loss": 0.189874529838562, "eval_runtime": 198.5164, "eval_samples_per_second": 11.218, "eval_steps_per_second": 1.405, "step": 4000 }, { "epoch": 6.55, "learning_rate": 0.0002693069306930693, "loss": 0.1371, "step": 4100 }, { "epoch": 6.71, "learning_rate": 0.0002683168316831683, "loss": 0.1385, "step": 4200 }, { "epoch": 6.87, "learning_rate": 0.0002673267326732673, "loss": 0.1382, "step": 4300 }, { "epoch": 7.03, "learning_rate": 0.0002663366336633663, "loss": 0.138, "step": 4400 }, { "epoch": 7.19, "learning_rate": 0.00026534653465346534, "loss": 0.1228, "step": 4500 }, { "epoch": 7.19, "eval_cer": 0.12003937601942934, "eval_loss": 0.1979004442691803, "eval_runtime": 201.8805, "eval_samples_per_second": 11.031, "eval_steps_per_second": 1.382, "step": 4500 }, { "epoch": 7.35, "learning_rate": 0.00026435643564356434, "loss": 0.128, "step": 4600 }, { "epoch": 7.51, "learning_rate": 0.00026336633663366334, "loss": 0.1248, "step": 4700 }, { "epoch": 7.67, "learning_rate": 0.00026237623762376234, "loss": 0.1191, "step": 4800 }, { "epoch": 7.83, "learning_rate": 0.00026138613861386134, "loss": 0.1241, "step": 4900 }, { "epoch": 7.99, "learning_rate": 0.00026039603960396033, "loss": 0.1275, "step": 5000 }, { "epoch": 7.99, "eval_cer": 0.11670534809694548, "eval_loss": 0.18830785155296326, "eval_runtime": 215.0184, "eval_samples_per_second": 10.357, "eval_steps_per_second": 1.298, "step": 5000 }, { "epoch": 8.15, "learning_rate": 0.0002594059405940594, "loss": 0.1133, "step": 5100 }, { "epoch": 8.31, "learning_rate": 0.0002584158415841584, "loss": 0.1121, "step": 5200 }, { "epoch": 8.47, "learning_rate": 0.0002574257425742574, "loss": 0.112, "step": 5300 }, { "epoch": 8.63, "learning_rate": 0.00025643564356435644, "loss": 0.108, "step": 5400 }, { "epoch": 8.79, "learning_rate": 0.00025544554455445543, "loss": 0.1093, "step": 5500 }, { "epoch": 8.79, "eval_cer": 0.11560598113112645, "eval_loss": 0.1854041963815689, "eval_runtime": 221.0978, "eval_samples_per_second": 10.072, "eval_steps_per_second": 1.262, "step": 5500 }, { "epoch": 8.94, "learning_rate": 0.00025445544554455443, "loss": 0.1094, "step": 5600 }, { "epoch": 9.11, "learning_rate": 0.00025346534653465343, "loss": 0.1139, "step": 5700 }, { "epoch": 9.26, "learning_rate": 0.00025247524752475243, "loss": 0.1015, "step": 5800 }, { "epoch": 9.42, "learning_rate": 0.0002514851485148515, "loss": 0.1062, "step": 5900 }, { "epoch": 9.58, "learning_rate": 0.0002504950495049505, "loss": 0.1089, "step": 6000 }, { "epoch": 9.58, "eval_cer": 0.1084421323407894, "eval_loss": 0.1830228716135025, "eval_runtime": 220.3658, "eval_samples_per_second": 10.106, "eval_steps_per_second": 1.266, "step": 6000 }, { "epoch": 9.74, "learning_rate": 0.0002495148514851485, "loss": 0.1076, "step": 6100 }, { "epoch": 9.9, "learning_rate": 0.0002485247524752475, "loss": 0.1063, "step": 6200 }, { "epoch": 10.06, "learning_rate": 0.0002475346534653465, "loss": 0.1009, "step": 6300 }, { "epoch": 10.22, "learning_rate": 0.0002465445544554455, "loss": 0.0987, "step": 6400 }, { "epoch": 10.38, "learning_rate": 0.0002455643564356435, "loss": 0.0968, "step": 6500 }, { "epoch": 10.38, "eval_cer": 0.10436082229774882, "eval_loss": 0.17644909024238586, "eval_runtime": 220.8492, "eval_samples_per_second": 10.084, "eval_steps_per_second": 1.263, "step": 6500 }, { "epoch": 10.54, "learning_rate": 0.0002445742574257425, "loss": 0.0937, "step": 6600 }, { "epoch": 10.7, "learning_rate": 0.00024358415841584157, "loss": 0.0964, "step": 6700 }, { "epoch": 10.86, "learning_rate": 0.00024259405940594056, "loss": 0.0956, "step": 6800 }, { "epoch": 11.02, "learning_rate": 0.0002416039603960396, "loss": 0.0971, "step": 6900 }, { "epoch": 11.18, "learning_rate": 0.0002406138613861386, "loss": 0.0862, "step": 7000 }, { "epoch": 11.18, "eval_cer": 0.10214771755610005, "eval_loss": 0.19613920152187347, "eval_runtime": 296.3031, "eval_samples_per_second": 7.516, "eval_steps_per_second": 0.942, "step": 7000 }, { "epoch": 11.34, "learning_rate": 0.00023962376237623759, "loss": 0.0901, "step": 7100 }, { "epoch": 11.5, "learning_rate": 0.00023863366336633664, "loss": 0.0957, "step": 7200 }, { "epoch": 11.66, "learning_rate": 0.00023764356435643564, "loss": 0.0929, "step": 7300 }, { "epoch": 11.82, "learning_rate": 0.00023665346534653463, "loss": 0.0918, "step": 7400 }, { "epoch": 11.98, "learning_rate": 0.00023566336633663366, "loss": 0.0933, "step": 7500 }, { "epoch": 11.98, "eval_cer": 0.10178126190082704, "eval_loss": 0.17176076769828796, "eval_runtime": 220.1598, "eval_samples_per_second": 10.115, "eval_steps_per_second": 1.267, "step": 7500 } ], "max_steps": 31300, "num_train_epochs": 50, "total_flos": 6.187118202284854e+19, "trial_name": null, "trial_params": null }