zhenting's picture
Upload folder using huggingface_hub
ad58461 verified
{"current_steps": 10, "total_steps": 781, "loss": 2.0492, "lr": 1.2658227848101267e-06, "epoch": 0.0128, "percentage": 1.28, "elapsed_time": "0:00:57", "remaining_time": "1:13:30"}
{"current_steps": 20, "total_steps": 781, "loss": 1.8655, "lr": 2.5316455696202535e-06, "epoch": 0.0256, "percentage": 2.56, "elapsed_time": "0:01:44", "remaining_time": "1:06:19"}
{"current_steps": 30, "total_steps": 781, "loss": 1.4331, "lr": 3.7974683544303802e-06, "epoch": 0.0384, "percentage": 3.84, "elapsed_time": "0:02:30", "remaining_time": "1:02:35"}
{"current_steps": 40, "total_steps": 781, "loss": 1.0761, "lr": 5.063291139240507e-06, "epoch": 0.0512, "percentage": 5.12, "elapsed_time": "0:03:19", "remaining_time": "1:01:26"}
{"current_steps": 50, "total_steps": 781, "loss": 0.8806, "lr": 6.329113924050634e-06, "epoch": 0.064, "percentage": 6.4, "elapsed_time": "0:04:04", "remaining_time": "0:59:31"}
{"current_steps": 60, "total_steps": 781, "loss": 0.7862, "lr": 7.5949367088607605e-06, "epoch": 0.0768, "percentage": 7.68, "elapsed_time": "0:04:48", "remaining_time": "0:57:48"}
{"current_steps": 70, "total_steps": 781, "loss": 0.7079, "lr": 8.860759493670886e-06, "epoch": 0.0896, "percentage": 8.96, "elapsed_time": "0:05:36", "remaining_time": "0:56:58"}
{"current_steps": 80, "total_steps": 781, "loss": 0.6374, "lr": 9.99994993147413e-06, "epoch": 0.1024, "percentage": 10.24, "elapsed_time": "0:06:20", "remaining_time": "0:55:31"}
{"current_steps": 90, "total_steps": 781, "loss": 0.6237, "lr": 9.993942921593858e-06, "epoch": 0.1152, "percentage": 11.52, "elapsed_time": "0:07:06", "remaining_time": "0:54:38"}
{"current_steps": 100, "total_steps": 781, "loss": 0.5959, "lr": 9.977935989714594e-06, "epoch": 0.128, "percentage": 12.8, "elapsed_time": "0:07:51", "remaining_time": "0:53:30"}
{"current_steps": 110, "total_steps": 781, "loss": 0.5679, "lr": 9.951961188279216e-06, "epoch": 0.1408, "percentage": 14.08, "elapsed_time": "0:08:35", "remaining_time": "0:52:24"}
{"current_steps": 120, "total_steps": 781, "loss": 0.5446, "lr": 9.916070529493785e-06, "epoch": 0.1536, "percentage": 15.36, "elapsed_time": "0:09:20", "remaining_time": "0:51:27"}
{"current_steps": 130, "total_steps": 781, "loss": 0.5291, "lr": 9.870335881177774e-06, "epoch": 0.1664, "percentage": 16.65, "elapsed_time": "0:10:05", "remaining_time": "0:50:29"}
{"current_steps": 140, "total_steps": 781, "loss": 0.5222, "lr": 9.814848822855216e-06, "epoch": 0.1792, "percentage": 17.93, "elapsed_time": "0:10:47", "remaining_time": "0:49:24"}
{"current_steps": 150, "total_steps": 781, "loss": 0.5171, "lr": 9.749720462374939e-06, "epoch": 0.192, "percentage": 19.21, "elapsed_time": "0:11:33", "remaining_time": "0:48:38"}
{"current_steps": 160, "total_steps": 781, "loss": 0.501, "lr": 9.675081213427076e-06, "epoch": 0.2048, "percentage": 20.49, "elapsed_time": "0:12:19", "remaining_time": "0:47:50"}
{"current_steps": 170, "total_steps": 781, "loss": 0.4905, "lr": 9.591080534401371e-06, "epoch": 0.2176, "percentage": 21.77, "elapsed_time": "0:13:06", "remaining_time": "0:47:05"}
{"current_steps": 180, "total_steps": 781, "loss": 0.4887, "lr": 9.497886629110187e-06, "epoch": 0.2304, "percentage": 23.05, "elapsed_time": "0:13:50", "remaining_time": "0:46:12"}
{"current_steps": 190, "total_steps": 781, "loss": 0.4754, "lr": 9.395686109975475e-06, "epoch": 0.2432, "percentage": 24.33, "elapsed_time": "0:14:35", "remaining_time": "0:45:22"}
{"current_steps": 200, "total_steps": 781, "loss": 0.4681, "lr": 9.284683624354172e-06, "epoch": 0.256, "percentage": 25.61, "elapsed_time": "0:15:21", "remaining_time": "0:44:38"}
{"current_steps": 210, "total_steps": 781, "loss": 0.4503, "lr": 9.165101444750259e-06, "epoch": 0.2688, "percentage": 26.89, "elapsed_time": "0:16:05", "remaining_time": "0:43:45"}
{"current_steps": 220, "total_steps": 781, "loss": 0.4505, "lr": 9.037179023734036e-06, "epoch": 0.2816, "percentage": 28.17, "elapsed_time": "0:16:50", "remaining_time": "0:42:56"}
{"current_steps": 230, "total_steps": 781, "loss": 0.4492, "lr": 8.901172514459864e-06, "epoch": 0.2944, "percentage": 29.45, "elapsed_time": "0:17:38", "remaining_time": "0:42:14"}
{"current_steps": 240, "total_steps": 781, "loss": 0.4428, "lr": 8.757354257742501e-06, "epoch": 0.3072, "percentage": 30.73, "elapsed_time": "0:18:24", "remaining_time": "0:41:28"}
{"current_steps": 250, "total_steps": 781, "loss": 0.4357, "lr": 8.606012236719073e-06, "epoch": 0.32, "percentage": 32.01, "elapsed_time": "0:19:06", "remaining_time": "0:40:35"}
{"current_steps": 260, "total_steps": 781, "loss": 0.4335, "lr": 8.447449500188731e-06, "epoch": 0.3328, "percentage": 33.29, "elapsed_time": "0:19:54", "remaining_time": "0:39:52"}
{"current_steps": 270, "total_steps": 781, "loss": 0.4249, "lr": 8.28198355578465e-06, "epoch": 0.3456, "percentage": 34.57, "elapsed_time": "0:20:37", "remaining_time": "0:39:01"}
{"current_steps": 280, "total_steps": 781, "loss": 0.417, "lr": 8.10994573419352e-06, "epoch": 0.3584, "percentage": 35.85, "elapsed_time": "0:21:21", "remaining_time": "0:38:12"}
{"current_steps": 290, "total_steps": 781, "loss": 0.4101, "lr": 7.931680525695634e-06, "epoch": 0.3712, "percentage": 37.13, "elapsed_time": "0:22:04", "remaining_time": "0:37:23"}
{"current_steps": 300, "total_steps": 781, "loss": 0.4102, "lr": 7.747544890354031e-06, "epoch": 0.384, "percentage": 38.41, "elapsed_time": "0:22:49", "remaining_time": "0:36:36"}
{"current_steps": 310, "total_steps": 781, "loss": 0.4005, "lr": 7.557907543234051e-06, "epoch": 0.3968, "percentage": 39.69, "elapsed_time": "0:23:31", "remaining_time": "0:35:45"}
{"current_steps": 320, "total_steps": 781, "loss": 0.3938, "lr": 7.363148216084548e-06, "epoch": 0.4096, "percentage": 40.97, "elapsed_time": "0:24:15", "remaining_time": "0:34:57"}
{"current_steps": 330, "total_steps": 781, "loss": 0.4025, "lr": 7.163656896959181e-06, "epoch": 0.4224, "percentage": 42.25, "elapsed_time": "0:25:03", "remaining_time": "0:34:14"}
{"current_steps": 340, "total_steps": 781, "loss": 0.3917, "lr": 6.959833049300376e-06, "epoch": 0.4352, "percentage": 43.53, "elapsed_time": "0:25:48", "remaining_time": "0:33:28"}
{"current_steps": 350, "total_steps": 781, "loss": 0.3956, "lr": 6.75208481204967e-06, "epoch": 0.448, "percentage": 44.81, "elapsed_time": "0:26:32", "remaining_time": "0:32:40"}
{"current_steps": 360, "total_steps": 781, "loss": 0.3863, "lr": 6.540828182386154e-06, "epoch": 0.4608, "percentage": 46.09, "elapsed_time": "0:27:16", "remaining_time": "0:31:53"}
{"current_steps": 370, "total_steps": 781, "loss": 0.386, "lr": 6.326486182729504e-06, "epoch": 0.4736, "percentage": 47.38, "elapsed_time": "0:28:00", "remaining_time": "0:31:06"}
{"current_steps": 380, "total_steps": 781, "loss": 0.3876, "lr": 6.1094880136755886e-06, "epoch": 0.4864, "percentage": 48.66, "elapsed_time": "0:28:47", "remaining_time": "0:30:22"}
{"current_steps": 390, "total_steps": 781, "loss": 0.3751, "lr": 5.890268194560834e-06, "epoch": 0.4992, "percentage": 49.94, "elapsed_time": "0:29:33", "remaining_time": "0:29:37"}
{"current_steps": 400, "total_steps": 781, "loss": 0.3773, "lr": 5.669265693376309e-06, "epoch": 0.512, "percentage": 51.22, "elapsed_time": "0:30:15", "remaining_time": "0:28:49"}
{"current_steps": 410, "total_steps": 781, "loss": 0.3785, "lr": 5.4469230477737466e-06, "epoch": 0.5248, "percentage": 52.5, "elapsed_time": "0:31:04", "remaining_time": "0:28:06"}
{"current_steps": 420, "total_steps": 781, "loss": 0.3641, "lr": 5.223685478923671e-06, "epoch": 0.5376, "percentage": 53.78, "elapsed_time": "0:31:46", "remaining_time": "0:27:18"}
{"current_steps": 430, "total_steps": 781, "loss": 0.3769, "lr": 5e-06, "epoch": 0.5504, "percentage": 55.06, "elapsed_time": "0:32:32", "remaining_time": "0:26:34"}
{"current_steps": 440, "total_steps": 781, "loss": 0.3747, "lr": 4.77631452107633e-06, "epoch": 0.5632, "percentage": 56.34, "elapsed_time": "0:33:17", "remaining_time": "0:25:47"}
{"current_steps": 450, "total_steps": 781, "loss": 0.3539, "lr": 4.553076952226255e-06, "epoch": 0.576, "percentage": 57.62, "elapsed_time": "0:33:59", "remaining_time": "0:24:59"}
{"current_steps": 460, "total_steps": 781, "loss": 0.3702, "lr": 4.330734306623694e-06, "epoch": 0.5888, "percentage": 58.9, "elapsed_time": "0:34:45", "remaining_time": "0:24:15"}
{"current_steps": 470, "total_steps": 781, "loss": 0.36, "lr": 4.109731805439168e-06, "epoch": 0.6016, "percentage": 60.18, "elapsed_time": "0:35:32", "remaining_time": "0:23:31"}
{"current_steps": 480, "total_steps": 781, "loss": 0.3655, "lr": 3.890511986324413e-06, "epoch": 0.6144, "percentage": 61.46, "elapsed_time": "0:36:17", "remaining_time": "0:22:45"}
{"current_steps": 490, "total_steps": 781, "loss": 0.355, "lr": 3.6735138172704967e-06, "epoch": 0.6272, "percentage": 62.74, "elapsed_time": "0:37:02", "remaining_time": "0:22:00"}
{"current_steps": 500, "total_steps": 781, "loss": 0.3593, "lr": 3.459171817613847e-06, "epoch": 0.64, "percentage": 64.02, "elapsed_time": "0:37:47", "remaining_time": "0:21:14"}
{"current_steps": 510, "total_steps": 781, "loss": 0.3547, "lr": 3.2479151879503324e-06, "epoch": 0.6528, "percentage": 65.3, "elapsed_time": "0:38:32", "remaining_time": "0:20:28"}
{"current_steps": 520, "total_steps": 781, "loss": 0.3564, "lr": 3.040166950699626e-06, "epoch": 0.6656, "percentage": 66.58, "elapsed_time": "0:39:15", "remaining_time": "0:19:42"}
{"current_steps": 530, "total_steps": 781, "loss": 0.3455, "lr": 2.836343103040819e-06, "epoch": 0.6784, "percentage": 67.86, "elapsed_time": "0:40:01", "remaining_time": "0:18:57"}
{"current_steps": 540, "total_steps": 781, "loss": 0.3574, "lr": 2.636851783915454e-06, "epoch": 0.6912, "percentage": 69.14, "elapsed_time": "0:40:47", "remaining_time": "0:18:12"}
{"current_steps": 550, "total_steps": 781, "loss": 0.3563, "lr": 2.4420924567659508e-06, "epoch": 0.704, "percentage": 70.42, "elapsed_time": "0:41:33", "remaining_time": "0:17:27"}
{"current_steps": 560, "total_steps": 781, "loss": 0.3442, "lr": 2.2524551096459703e-06, "epoch": 0.7168, "percentage": 71.7, "elapsed_time": "0:42:18", "remaining_time": "0:16:41"}
{"current_steps": 570, "total_steps": 781, "loss": 0.3513, "lr": 2.068319474304365e-06, "epoch": 0.7296, "percentage": 72.98, "elapsed_time": "0:43:03", "remaining_time": "0:15:56"}
{"current_steps": 580, "total_steps": 781, "loss": 0.3505, "lr": 1.8900542658064807e-06, "epoch": 0.7424, "percentage": 74.26, "elapsed_time": "0:43:46", "remaining_time": "0:15:10"}
{"current_steps": 590, "total_steps": 781, "loss": 0.3436, "lr": 1.7180164442153529e-06, "epoch": 0.7552, "percentage": 75.54, "elapsed_time": "0:44:28", "remaining_time": "0:14:23"}
{"current_steps": 600, "total_steps": 781, "loss": 0.3492, "lr": 1.5525504998112717e-06, "epoch": 0.768, "percentage": 76.82, "elapsed_time": "0:45:15", "remaining_time": "0:13:39"}
{"current_steps": 610, "total_steps": 781, "loss": 0.3376, "lr": 1.3939877632809279e-06, "epoch": 0.7808, "percentage": 78.1, "elapsed_time": "0:45:58", "remaining_time": "0:12:53"}
{"current_steps": 620, "total_steps": 781, "loss": 0.3509, "lr": 1.2426457422575e-06, "epoch": 0.7936, "percentage": 79.39, "elapsed_time": "0:46:46", "remaining_time": "0:12:08"}
{"current_steps": 630, "total_steps": 781, "loss": 0.3427, "lr": 1.0988274855401377e-06, "epoch": 0.8064, "percentage": 80.67, "elapsed_time": "0:47:31", "remaining_time": "0:11:23"}
{"current_steps": 640, "total_steps": 781, "loss": 0.352, "lr": 9.628209762659658e-07, "epoch": 0.8192, "percentage": 81.95, "elapsed_time": "0:48:17", "remaining_time": "0:10:38"}
{"current_steps": 650, "total_steps": 781, "loss": 0.3512, "lr": 8.348985552497424e-07, "epoch": 0.832, "percentage": 83.23, "elapsed_time": "0:49:03", "remaining_time": "0:09:53"}
{"current_steps": 660, "total_steps": 781, "loss": 0.3418, "lr": 7.153163756458287e-07, "epoch": 0.8448, "percentage": 84.51, "elapsed_time": "0:49:47", "remaining_time": "0:09:07"}
{"current_steps": 670, "total_steps": 781, "loss": 0.3415, "lr": 6.043138900245277e-07, "epoch": 0.8576, "percentage": 85.79, "elapsed_time": "0:50:30", "remaining_time": "0:08:22"}
{"current_steps": 680, "total_steps": 781, "loss": 0.3498, "lr": 5.021133708898146e-07, "epoch": 0.8704, "percentage": 87.07, "elapsed_time": "0:51:18", "remaining_time": "0:07:37"}
{"current_steps": 690, "total_steps": 781, "loss": 0.3418, "lr": 4.089194655986306e-07, "epoch": 0.8832, "percentage": 88.35, "elapsed_time": "0:52:03", "remaining_time": "0:06:51"}
{"current_steps": 700, "total_steps": 781, "loss": 0.3417, "lr": 3.2491878657292643e-07, "epoch": 0.896, "percentage": 89.63, "elapsed_time": "0:52:49", "remaining_time": "0:06:06"}
{"current_steps": 710, "total_steps": 781, "loss": 0.3414, "lr": 2.502795376250622e-07, "epoch": 0.9088, "percentage": 90.91, "elapsed_time": "0:53:33", "remaining_time": "0:05:21"}
{"current_steps": 720, "total_steps": 781, "loss": 0.3303, "lr": 1.8515117714478447e-07, "epoch": 0.9216, "percentage": 92.19, "elapsed_time": "0:54:18", "remaining_time": "0:04:36"}
{"current_steps": 730, "total_steps": 781, "loss": 0.3516, "lr": 1.2966411882222695e-07, "epoch": 0.9344, "percentage": 93.47, "elapsed_time": "0:55:05", "remaining_time": "0:03:50"}
{"current_steps": 740, "total_steps": 781, "loss": 0.3459, "lr": 8.392947050621603e-08, "epoch": 0.9472, "percentage": 94.75, "elapsed_time": "0:55:50", "remaining_time": "0:03:05"}
{"current_steps": 750, "total_steps": 781, "loss": 0.3381, "lr": 4.803881172078473e-08, "epoch": 0.96, "percentage": 96.03, "elapsed_time": "0:56:35", "remaining_time": "0:02:20"}
{"current_steps": 760, "total_steps": 781, "loss": 0.3435, "lr": 2.206401028540639e-08, "epoch": 0.9728, "percentage": 97.31, "elapsed_time": "0:57:19", "remaining_time": "0:01:35"}
{"current_steps": 770, "total_steps": 781, "loss": 0.3533, "lr": 6.057078406142003e-09, "epoch": 0.9856, "percentage": 98.59, "elapsed_time": "0:58:06", "remaining_time": "0:00:49"}
{"current_steps": 780, "total_steps": 781, "loss": 0.3355, "lr": 5.0068525870305974e-11, "epoch": 0.9984, "percentage": 99.87, "elapsed_time": "0:58:49", "remaining_time": "0:00:04"}
{"current_steps": 781, "total_steps": 781, "epoch": 0.99968, "percentage": 100.0, "elapsed_time": "0:59:19", "remaining_time": "0:00:00"}