| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 5.0, | |
| "global_step": 11395, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.04, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 762.0088, | |
| "eval_samples_per_second": 19.376, | |
| "eval_steps_per_second": 2.423, | |
| "eval_wer": 1.0, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.09, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 760.7665, | |
| "eval_samples_per_second": 19.408, | |
| "eval_steps_per_second": 2.427, | |
| "eval_wer": 0.9983381717130623, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.13, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 758.492, | |
| "eval_samples_per_second": 19.466, | |
| "eval_steps_per_second": 2.434, | |
| "eval_wer": 0.7671578598961529, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.18, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 763.9298, | |
| "eval_samples_per_second": 19.328, | |
| "eval_steps_per_second": 2.416, | |
| "eval_wer": 0.6919342715882527, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "learning_rate": 0.000996, | |
| "loss": 2.9929, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.22, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 771.5199, | |
| "eval_samples_per_second": 19.138, | |
| "eval_steps_per_second": 2.393, | |
| "eval_wer": 0.6265920108122272, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.26, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 768.8673, | |
| "eval_samples_per_second": 19.204, | |
| "eval_steps_per_second": 2.401, | |
| "eval_wer": 0.5512649892084595, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.31, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 774.562, | |
| "eval_samples_per_second": 19.062, | |
| "eval_steps_per_second": 2.383, | |
| "eval_wer": 0.508133304831714, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 0.35, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 770.4155, | |
| "eval_samples_per_second": 19.165, | |
| "eval_steps_per_second": 2.396, | |
| "eval_wer": 0.4944870053302625, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.39, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 769.5888, | |
| "eval_samples_per_second": 19.186, | |
| "eval_steps_per_second": 2.399, | |
| "eval_wer": 0.4720419801270161, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "learning_rate": 0.0009542909591555759, | |
| "loss": 0.5311, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.44, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 772.8626, | |
| "eval_samples_per_second": 19.104, | |
| "eval_steps_per_second": 2.389, | |
| "eval_wer": 0.4387433544107405, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.48, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 769.5289, | |
| "eval_samples_per_second": 19.187, | |
| "eval_steps_per_second": 2.399, | |
| "eval_wer": 0.4410533646851146, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 0.53, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 780.8054, | |
| "eval_samples_per_second": 18.91, | |
| "eval_steps_per_second": 2.364, | |
| "eval_wer": 0.44290826845767167, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 0.57, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 774.2302, | |
| "eval_samples_per_second": 19.071, | |
| "eval_steps_per_second": 2.384, | |
| "eval_wer": 0.43216499679356785, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 0.61, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 768.9729, | |
| "eval_samples_per_second": 19.201, | |
| "eval_steps_per_second": 2.401, | |
| "eval_wer": 0.4531826425138428, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "learning_rate": 0.0009083983478659936, | |
| "loss": 0.4654, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.66, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.4905, | |
| "eval_samples_per_second": 18.991, | |
| "eval_steps_per_second": 2.374, | |
| "eval_wer": 0.44915563952806836, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 0.7, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 773.9985, | |
| "eval_samples_per_second": 19.076, | |
| "eval_steps_per_second": 2.385, | |
| "eval_wer": 0.3878817550561643, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 0.75, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 773.8841, | |
| "eval_samples_per_second": 19.079, | |
| "eval_steps_per_second": 2.385, | |
| "eval_wer": 0.3835927210541922, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 0.79, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 773.515, | |
| "eval_samples_per_second": 19.088, | |
| "eval_steps_per_second": 2.387, | |
| "eval_wer": 0.37425614221388626, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 774.3742, | |
| "eval_samples_per_second": 19.067, | |
| "eval_steps_per_second": 2.384, | |
| "eval_wer": 0.36867074423704155, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "learning_rate": 0.0008625975217989904, | |
| "loss": 0.4254, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.88, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 774.0591, | |
| "eval_samples_per_second": 19.075, | |
| "eval_steps_per_second": 2.385, | |
| "eval_wer": 0.3792830003930465, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.92, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 768.0215, | |
| "eval_samples_per_second": 19.225, | |
| "eval_steps_per_second": 2.404, | |
| "eval_wer": 0.3766006302535495, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 772.2372, | |
| "eval_samples_per_second": 19.12, | |
| "eval_steps_per_second": 2.39, | |
| "eval_wer": 0.3705256480095986, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 1.01, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 767.2028, | |
| "eval_samples_per_second": 19.245, | |
| "eval_steps_per_second": 2.406, | |
| "eval_wer": 0.3271802014880604, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 1.05, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 768.4281, | |
| "eval_samples_per_second": 19.215, | |
| "eval_steps_per_second": 2.402, | |
| "eval_wer": 0.31850559574130644, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "learning_rate": 0.000816704910509408, | |
| "loss": 0.3997, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 1.1, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 767.2666, | |
| "eval_samples_per_second": 19.244, | |
| "eval_steps_per_second": 2.406, | |
| "eval_wer": 0.3244426669241006, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 1.14, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 767.2447, | |
| "eval_samples_per_second": 19.244, | |
| "eval_steps_per_second": 2.406, | |
| "eval_wer": 0.30816916170761477, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 1.18, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 771.1785, | |
| "eval_samples_per_second": 19.146, | |
| "eval_steps_per_second": 2.394, | |
| "eval_wer": 0.30403872542597277, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 1.23, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 761.2544, | |
| "eval_samples_per_second": 19.396, | |
| "eval_steps_per_second": 2.425, | |
| "eval_wer": 0.30282510808779417, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 1.27, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 770.9042, | |
| "eval_samples_per_second": 19.153, | |
| "eval_steps_per_second": 2.395, | |
| "eval_wer": 0.3112101006061191, | |
| "step": 2900 | |
| }, | |
| { | |
| "epoch": 1.32, | |
| "learning_rate": 0.0007709040844424048, | |
| "loss": 0.3668, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 1.32, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 763.6174, | |
| "eval_samples_per_second": 19.336, | |
| "eval_steps_per_second": 2.417, | |
| "eval_wer": 0.31098944290826847, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 1.36, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 765.7415, | |
| "eval_samples_per_second": 19.282, | |
| "eval_steps_per_second": 2.411, | |
| "eval_wer": 0.3066521400348915, | |
| "step": 3100 | |
| }, | |
| { | |
| "epoch": 1.4, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 762.1465, | |
| "eval_samples_per_second": 19.373, | |
| "eval_steps_per_second": 2.422, | |
| "eval_wer": 0.29612952606863835, | |
| "step": 3200 | |
| }, | |
| { | |
| "epoch": 1.45, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 764.1293, | |
| "eval_samples_per_second": 19.323, | |
| "eval_steps_per_second": 2.416, | |
| "eval_wer": 0.3080933106239786, | |
| "step": 3300 | |
| }, | |
| { | |
| "epoch": 1.49, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 764.6533, | |
| "eval_samples_per_second": 19.309, | |
| "eval_steps_per_second": 2.414, | |
| "eval_wer": 0.2936195447555871, | |
| "step": 3400 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "learning_rate": 0.0007250114731528225, | |
| "loss": 0.3645, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 1.54, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 762.2683, | |
| "eval_samples_per_second": 19.37, | |
| "eval_steps_per_second": 2.422, | |
| "eval_wer": 0.30368015666696546, | |
| "step": 3500 | |
| }, | |
| { | |
| "epoch": 1.58, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 760.0026, | |
| "eval_samples_per_second": 19.428, | |
| "eval_steps_per_second": 2.429, | |
| "eval_wer": 0.2973914122782218, | |
| "step": 3600 | |
| }, | |
| { | |
| "epoch": 1.62, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 760.5942, | |
| "eval_samples_per_second": 19.412, | |
| "eval_steps_per_second": 2.427, | |
| "eval_wer": 0.30096330876217925, | |
| "step": 3700 | |
| }, | |
| { | |
| "epoch": 1.67, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 761.2356, | |
| "eval_samples_per_second": 19.396, | |
| "eval_steps_per_second": 2.425, | |
| "eval_wer": 0.2985498651919377, | |
| "step": 3800 | |
| }, | |
| { | |
| "epoch": 1.71, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 767.0946, | |
| "eval_samples_per_second": 19.248, | |
| "eval_steps_per_second": 2.406, | |
| "eval_wer": 0.2975775922107833, | |
| "step": 3900 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "learning_rate": 0.00067911886186324, | |
| "loss": 0.3624, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 1.76, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 764.3373, | |
| "eval_samples_per_second": 19.317, | |
| "eval_steps_per_second": 2.415, | |
| "eval_wer": 0.292757600623358, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.1044, | |
| "eval_samples_per_second": 18.976, | |
| "eval_steps_per_second": 2.372, | |
| "eval_wer": 0.2859516897552768, | |
| "step": 4100 | |
| }, | |
| { | |
| "epoch": 1.84, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 780.7174, | |
| "eval_samples_per_second": 18.912, | |
| "eval_steps_per_second": 2.364, | |
| "eval_wer": 0.29222664303790485, | |
| "step": 4200 | |
| }, | |
| { | |
| "epoch": 1.89, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.463, | |
| "eval_samples_per_second": 18.967, | |
| "eval_steps_per_second": 2.371, | |
| "eval_wer": 0.2865929761896553, | |
| "step": 4300 | |
| }, | |
| { | |
| "epoch": 1.93, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.1309, | |
| "eval_samples_per_second": 18.999, | |
| "eval_steps_per_second": 2.375, | |
| "eval_wer": 0.2775529061308362, | |
| "step": 4400 | |
| }, | |
| { | |
| "epoch": 1.97, | |
| "learning_rate": 0.0006332262505736577, | |
| "loss": 0.3527, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 1.97, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 776.0915, | |
| "eval_samples_per_second": 19.025, | |
| "eval_steps_per_second": 2.379, | |
| "eval_wer": 0.27924921218306314, | |
| "step": 4500 | |
| }, | |
| { | |
| "epoch": 2.02, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.8615, | |
| "eval_samples_per_second": 18.982, | |
| "eval_steps_per_second": 2.373, | |
| "eval_wer": 0.2857655098227153, | |
| "step": 4600 | |
| }, | |
| { | |
| "epoch": 2.06, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 779.7088, | |
| "eval_samples_per_second": 18.937, | |
| "eval_steps_per_second": 2.368, | |
| "eval_wer": 0.27665648423331796, | |
| "step": 4700 | |
| }, | |
| { | |
| "epoch": 2.11, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 780.5896, | |
| "eval_samples_per_second": 18.915, | |
| "eval_steps_per_second": 2.365, | |
| "eval_wer": 0.28240047993049283, | |
| "step": 4800 | |
| }, | |
| { | |
| "epoch": 2.15, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 781.7435, | |
| "eval_samples_per_second": 18.887, | |
| "eval_steps_per_second": 2.361, | |
| "eval_wer": 0.27986291640521027, | |
| "step": 4900 | |
| }, | |
| { | |
| "epoch": 2.19, | |
| "learning_rate": 0.0005873336392840752, | |
| "loss": 0.3162, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 2.19, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 785.7508, | |
| "eval_samples_per_second": 18.791, | |
| "eval_steps_per_second": 2.349, | |
| "eval_wer": 0.26727853207466507, | |
| "step": 5000 | |
| }, | |
| { | |
| "epoch": 2.24, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 789.097, | |
| "eval_samples_per_second": 18.711, | |
| "eval_steps_per_second": 2.339, | |
| "eval_wer": 0.2961915860461588, | |
| "step": 5100 | |
| }, | |
| { | |
| "epoch": 2.28, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 782.4986, | |
| "eval_samples_per_second": 18.869, | |
| "eval_steps_per_second": 2.359, | |
| "eval_wer": 0.2735948586756401, | |
| "step": 5200 | |
| }, | |
| { | |
| "epoch": 2.33, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 780.5596, | |
| "eval_samples_per_second": 18.916, | |
| "eval_steps_per_second": 2.365, | |
| "eval_wer": 0.2651547017328525, | |
| "step": 5300 | |
| }, | |
| { | |
| "epoch": 2.37, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 782.8773, | |
| "eval_samples_per_second": 18.86, | |
| "eval_steps_per_second": 2.358, | |
| "eval_wer": 0.2550527165031271, | |
| "step": 5400 | |
| }, | |
| { | |
| "epoch": 2.41, | |
| "learning_rate": 0.0005414410279944929, | |
| "loss": 0.3063, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 2.41, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 779.9742, | |
| "eval_samples_per_second": 18.93, | |
| "eval_steps_per_second": 2.367, | |
| "eval_wer": 0.26804393846408453, | |
| "step": 5500 | |
| }, | |
| { | |
| "epoch": 2.46, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 783.4711, | |
| "eval_samples_per_second": 18.846, | |
| "eval_steps_per_second": 2.356, | |
| "eval_wer": 0.2557767495741996, | |
| "step": 5600 | |
| }, | |
| { | |
| "epoch": 2.5, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 792.9653, | |
| "eval_samples_per_second": 18.62, | |
| "eval_steps_per_second": 2.328, | |
| "eval_wer": 0.2597830659008006, | |
| "step": 5700 | |
| }, | |
| { | |
| "epoch": 2.54, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 788.5494, | |
| "eval_samples_per_second": 18.724, | |
| "eval_steps_per_second": 2.341, | |
| "eval_wer": 0.25175664214148297, | |
| "step": 5800 | |
| }, | |
| { | |
| "epoch": 2.59, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.5477, | |
| "eval_samples_per_second": 18.989, | |
| "eval_steps_per_second": 2.374, | |
| "eval_wer": 0.254149399052551, | |
| "step": 5900 | |
| }, | |
| { | |
| "epoch": 2.63, | |
| "learning_rate": 0.0004955484167049105, | |
| "loss": 0.2913, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 2.63, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 785.1255, | |
| "eval_samples_per_second": 18.806, | |
| "eval_steps_per_second": 2.351, | |
| "eval_wer": 0.2507361002889237, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 2.68, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 785.3479, | |
| "eval_samples_per_second": 18.801, | |
| "eval_steps_per_second": 2.351, | |
| "eval_wer": 0.24998448500561987, | |
| "step": 6100 | |
| }, | |
| { | |
| "epoch": 2.72, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 781.3987, | |
| "eval_samples_per_second": 18.896, | |
| "eval_steps_per_second": 2.362, | |
| "eval_wer": 0.24352335179043036, | |
| "step": 6200 | |
| }, | |
| { | |
| "epoch": 2.76, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 781.4686, | |
| "eval_samples_per_second": 18.894, | |
| "eval_steps_per_second": 2.362, | |
| "eval_wer": 0.23755180284234698, | |
| "step": 6300 | |
| }, | |
| { | |
| "epoch": 2.81, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 775.7634, | |
| "eval_samples_per_second": 19.033, | |
| "eval_steps_per_second": 2.38, | |
| "eval_wer": 0.23476599940698245, | |
| "step": 6400 | |
| }, | |
| { | |
| "epoch": 2.85, | |
| "learning_rate": 0.0004497475906379073, | |
| "loss": 0.2797, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 2.85, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 772.9219, | |
| "eval_samples_per_second": 19.103, | |
| "eval_steps_per_second": 2.388, | |
| "eval_wer": 0.2512049978968563, | |
| "step": 6500 | |
| }, | |
| { | |
| "epoch": 2.9, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 771.2336, | |
| "eval_samples_per_second": 19.145, | |
| "eval_steps_per_second": 2.394, | |
| "eval_wer": 0.23818619372366762, | |
| "step": 6600 | |
| }, | |
| { | |
| "epoch": 2.94, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.0185, | |
| "eval_samples_per_second": 19.002, | |
| "eval_steps_per_second": 2.376, | |
| "eval_wer": 0.2523082863861096, | |
| "step": 6700 | |
| }, | |
| { | |
| "epoch": 2.98, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 773.6017, | |
| "eval_samples_per_second": 19.086, | |
| "eval_steps_per_second": 2.386, | |
| "eval_wer": 0.25221864419635776, | |
| "step": 6800 | |
| }, | |
| { | |
| "epoch": 3.03, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 780.1394, | |
| "eval_samples_per_second": 18.926, | |
| "eval_steps_per_second": 2.366, | |
| "eval_wer": 0.24091683273456949, | |
| "step": 6900 | |
| }, | |
| { | |
| "epoch": 3.07, | |
| "learning_rate": 0.0004038549793483249, | |
| "loss": 0.2766, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 3.07, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 783.1904, | |
| "eval_samples_per_second": 18.852, | |
| "eval_steps_per_second": 2.357, | |
| "eval_wer": 0.24534377779769825, | |
| "step": 7000 | |
| }, | |
| { | |
| "epoch": 3.12, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.1186, | |
| "eval_samples_per_second": 19.0, | |
| "eval_steps_per_second": 2.375, | |
| "eval_wer": 0.2326076912998807, | |
| "step": 7100 | |
| }, | |
| { | |
| "epoch": 3.16, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 781.1613, | |
| "eval_samples_per_second": 18.901, | |
| "eval_steps_per_second": 2.363, | |
| "eval_wer": 0.22860137497327973, | |
| "step": 7200 | |
| }, | |
| { | |
| "epoch": 3.2, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 786.2675, | |
| "eval_samples_per_second": 18.779, | |
| "eval_steps_per_second": 2.348, | |
| "eval_wer": 0.23420745960929795, | |
| "step": 7300 | |
| }, | |
| { | |
| "epoch": 3.25, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 781.7233, | |
| "eval_samples_per_second": 18.888, | |
| "eval_steps_per_second": 2.361, | |
| "eval_wer": 0.23047006985195248, | |
| "step": 7400 | |
| }, | |
| { | |
| "epoch": 3.29, | |
| "learning_rate": 0.0003579623680587425, | |
| "loss": 0.2468, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 3.29, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.7207, | |
| "eval_samples_per_second": 18.985, | |
| "eval_steps_per_second": 2.374, | |
| "eval_wer": 0.2238089655980858, | |
| "step": 7500 | |
| }, | |
| { | |
| "epoch": 3.33, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 786.7846, | |
| "eval_samples_per_second": 18.766, | |
| "eval_steps_per_second": 2.346, | |
| "eval_wer": 0.23211121147971672, | |
| "step": 7600 | |
| }, | |
| { | |
| "epoch": 3.38, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 784.5553, | |
| "eval_samples_per_second": 18.82, | |
| "eval_steps_per_second": 2.353, | |
| "eval_wer": 0.23048386095806814, | |
| "step": 7700 | |
| }, | |
| { | |
| "epoch": 3.42, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 776.8796, | |
| "eval_samples_per_second": 19.006, | |
| "eval_steps_per_second": 2.376, | |
| "eval_wer": 0.21740989236041677, | |
| "step": 7800 | |
| }, | |
| { | |
| "epoch": 3.47, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.8968, | |
| "eval_samples_per_second": 18.956, | |
| "eval_steps_per_second": 2.37, | |
| "eval_wer": 0.22008536694685596, | |
| "step": 7900 | |
| }, | |
| { | |
| "epoch": 3.51, | |
| "learning_rate": 0.00031206975676916014, | |
| "loss": 0.2439, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 3.51, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 785.8625, | |
| "eval_samples_per_second": 18.788, | |
| "eval_steps_per_second": 2.349, | |
| "eval_wer": 0.21332772495017963, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 3.55, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.9388, | |
| "eval_samples_per_second": 18.955, | |
| "eval_steps_per_second": 2.37, | |
| "eval_wer": 0.22168513525627323, | |
| "step": 8100 | |
| }, | |
| { | |
| "epoch": 3.6, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 779.3965, | |
| "eval_samples_per_second": 18.944, | |
| "eval_steps_per_second": 2.368, | |
| "eval_wer": 0.21885106294950388, | |
| "step": 8200 | |
| }, | |
| { | |
| "epoch": 3.64, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 786.4104, | |
| "eval_samples_per_second": 18.775, | |
| "eval_steps_per_second": 2.347, | |
| "eval_wer": 0.2105212348556416, | |
| "step": 8300 | |
| }, | |
| { | |
| "epoch": 3.69, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 784.1132, | |
| "eval_samples_per_second": 18.83, | |
| "eval_steps_per_second": 2.354, | |
| "eval_wer": 0.21176932995910938, | |
| "step": 8400 | |
| }, | |
| { | |
| "epoch": 3.73, | |
| "learning_rate": 0.0002661771454795778, | |
| "loss": 0.2357, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 3.73, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 776.0702, | |
| "eval_samples_per_second": 19.025, | |
| "eval_steps_per_second": 2.379, | |
| "eval_wer": 0.20932830417663648, | |
| "step": 8500 | |
| }, | |
| { | |
| "epoch": 3.77, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.6609, | |
| "eval_samples_per_second": 18.986, | |
| "eval_steps_per_second": 2.374, | |
| "eval_wer": 0.21030747271084876, | |
| "step": 8600 | |
| }, | |
| { | |
| "epoch": 3.82, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 773.9787, | |
| "eval_samples_per_second": 19.077, | |
| "eval_steps_per_second": 2.385, | |
| "eval_wer": 0.20353603960805677, | |
| "step": 8700 | |
| }, | |
| { | |
| "epoch": 3.86, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 780.5659, | |
| "eval_samples_per_second": 18.916, | |
| "eval_steps_per_second": 2.365, | |
| "eval_wer": 0.2019362712986395, | |
| "step": 8800 | |
| }, | |
| { | |
| "epoch": 3.91, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 779.996, | |
| "eval_samples_per_second": 18.93, | |
| "eval_steps_per_second": 2.367, | |
| "eval_wer": 0.20323953082656995, | |
| "step": 8900 | |
| }, | |
| { | |
| "epoch": 3.95, | |
| "learning_rate": 0.0002203763194125746, | |
| "loss": 0.2217, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 3.95, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.6538, | |
| "eval_samples_per_second": 18.962, | |
| "eval_steps_per_second": 2.371, | |
| "eval_wer": 0.20561849663152232, | |
| "step": 9000 | |
| }, | |
| { | |
| "epoch": 3.99, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.3405, | |
| "eval_samples_per_second": 18.97, | |
| "eval_steps_per_second": 2.372, | |
| "eval_wer": 0.20215003344343233, | |
| "step": 9100 | |
| }, | |
| { | |
| "epoch": 4.04, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 787.2038, | |
| "eval_samples_per_second": 18.756, | |
| "eval_steps_per_second": 2.345, | |
| "eval_wer": 0.19324787444576993, | |
| "step": 9200 | |
| }, | |
| { | |
| "epoch": 4.08, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 775.7143, | |
| "eval_samples_per_second": 19.034, | |
| "eval_steps_per_second": 2.38, | |
| "eval_wer": 0.19350300990890976, | |
| "step": 9300 | |
| }, | |
| { | |
| "epoch": 4.12, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 773.9153, | |
| "eval_samples_per_second": 19.078, | |
| "eval_steps_per_second": 2.385, | |
| "eval_wer": 0.1905655043062729, | |
| "step": 9400 | |
| }, | |
| { | |
| "epoch": 4.17, | |
| "learning_rate": 0.0001744837081229922, | |
| "loss": 0.2025, | |
| "step": 9500 | |
| }, | |
| { | |
| "epoch": 4.17, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 779.0392, | |
| "eval_samples_per_second": 18.953, | |
| "eval_steps_per_second": 2.37, | |
| "eval_wer": 0.18794519414429633, | |
| "step": 9500 | |
| }, | |
| { | |
| "epoch": 4.21, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 779.0747, | |
| "eval_samples_per_second": 18.952, | |
| "eval_steps_per_second": 2.369, | |
| "eval_wer": 0.18824859847884098, | |
| "step": 9600 | |
| }, | |
| { | |
| "epoch": 4.26, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.6573, | |
| "eval_samples_per_second": 18.987, | |
| "eval_steps_per_second": 2.374, | |
| "eval_wer": 0.18538004840678246, | |
| "step": 9700 | |
| }, | |
| { | |
| "epoch": 4.3, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 772.7615, | |
| "eval_samples_per_second": 19.107, | |
| "eval_steps_per_second": 2.389, | |
| "eval_wer": 0.18654539687355626, | |
| "step": 9800 | |
| }, | |
| { | |
| "epoch": 4.34, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.0179, | |
| "eval_samples_per_second": 18.978, | |
| "eval_steps_per_second": 2.373, | |
| "eval_wer": 0.18438708876645452, | |
| "step": 9900 | |
| }, | |
| { | |
| "epoch": 4.39, | |
| "learning_rate": 0.00012859109683340984, | |
| "loss": 0.1869, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 4.39, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 778.8028, | |
| "eval_samples_per_second": 18.959, | |
| "eval_steps_per_second": 2.37, | |
| "eval_wer": 0.1821667206818323, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 4.43, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 777.366, | |
| "eval_samples_per_second": 18.994, | |
| "eval_steps_per_second": 2.375, | |
| "eval_wer": 0.1815461209066273, | |
| "step": 10100 | |
| }, | |
| { | |
| "epoch": 4.48, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 781.9611, | |
| "eval_samples_per_second": 18.882, | |
| "eval_steps_per_second": 2.361, | |
| "eval_wer": 0.18118755214762, | |
| "step": 10200 | |
| }, | |
| { | |
| "epoch": 4.52, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 760.9314, | |
| "eval_samples_per_second": 19.404, | |
| "eval_steps_per_second": 2.426, | |
| "eval_wer": 0.17923611063225325, | |
| "step": 10300 | |
| }, | |
| { | |
| "epoch": 4.56, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 761.9088, | |
| "eval_samples_per_second": 19.379, | |
| "eval_steps_per_second": 2.423, | |
| "eval_wer": 0.17967742602795458, | |
| "step": 10400 | |
| }, | |
| { | |
| "epoch": 4.61, | |
| "learning_rate": 8.269848554382745e-05, | |
| "loss": 0.1863, | |
| "step": 10500 | |
| }, | |
| { | |
| "epoch": 4.61, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 760.7934, | |
| "eval_samples_per_second": 19.407, | |
| "eval_steps_per_second": 2.426, | |
| "eval_wer": 0.1773812068596962, | |
| "step": 10500 | |
| }, | |
| { | |
| "epoch": 4.65, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 755.7192, | |
| "eval_samples_per_second": 19.538, | |
| "eval_steps_per_second": 2.443, | |
| "eval_wer": 0.1767330248722599, | |
| "step": 10600 | |
| }, | |
| { | |
| "epoch": 4.7, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 756.3189, | |
| "eval_samples_per_second": 19.522, | |
| "eval_steps_per_second": 2.441, | |
| "eval_wer": 0.17650547162135138, | |
| "step": 10700 | |
| }, | |
| { | |
| "epoch": 4.74, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 761.0501, | |
| "eval_samples_per_second": 19.401, | |
| "eval_steps_per_second": 2.426, | |
| "eval_wer": 0.1752918542831728, | |
| "step": 10800 | |
| }, | |
| { | |
| "epoch": 4.78, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 756.3701, | |
| "eval_samples_per_second": 19.521, | |
| "eval_steps_per_second": 2.441, | |
| "eval_wer": 0.17308527730466622, | |
| "step": 10900 | |
| }, | |
| { | |
| "epoch": 4.83, | |
| "learning_rate": 3.6805874254245066e-05, | |
| "loss": 0.178, | |
| "step": 11000 | |
| }, | |
| { | |
| "epoch": 4.83, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 758.6147, | |
| "eval_samples_per_second": 19.463, | |
| "eval_steps_per_second": 2.433, | |
| "eval_wer": 0.17265775301508057, | |
| "step": 11000 | |
| }, | |
| { | |
| "epoch": 4.87, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 759.5074, | |
| "eval_samples_per_second": 19.44, | |
| "eval_steps_per_second": 2.431, | |
| "eval_wer": 0.17243709531722992, | |
| "step": 11100 | |
| }, | |
| { | |
| "epoch": 4.91, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 757.3653, | |
| "eval_samples_per_second": 19.495, | |
| "eval_steps_per_second": 2.437, | |
| "eval_wer": 0.17223022872549493, | |
| "step": 11200 | |
| }, | |
| { | |
| "epoch": 4.96, | |
| "eval_loss": Infinity, | |
| "eval_runtime": 756.4761, | |
| "eval_samples_per_second": 19.518, | |
| "eval_steps_per_second": 2.44, | |
| "eval_wer": 0.17115452244847298, | |
| "step": 11300 | |
| }, | |
| { | |
| "epoch": 5.0, | |
| "step": 11395, | |
| "total_flos": 1.0194681891264653e+20, | |
| "train_loss": 0.4200820018974194, | |
| "train_runtime": 124144.1421, | |
| "train_samples_per_second": 5.872, | |
| "train_steps_per_second": 0.092 | |
| } | |
| ], | |
| "max_steps": 11395, | |
| "num_train_epochs": 5, | |
| "total_flos": 1.0194681891264653e+20, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |