| {"current_steps": 1, "total_steps": 220, "loss": 2.6726, "learning_rate": 2.0000000000000002e-07, "epoch": 0.045454545454545456, "percentage": 0.45, "elapsed_time": "0:00:16", "remaining_time": "1:01:40", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 2, "total_steps": 220, "loss": 2.623, "learning_rate": 4.0000000000000003e-07, "epoch": 0.09090909090909091, "percentage": 0.91, "elapsed_time": "0:00:25", "remaining_time": "0:46:04", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 3, "total_steps": 220, "loss": 2.5421, "learning_rate": 6.000000000000001e-07, "epoch": 0.13636363636363635, "percentage": 1.36, "elapsed_time": "0:00:33", "remaining_time": "0:40:40", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 4, "total_steps": 220, "loss": 2.577, "learning_rate": 8.000000000000001e-07, "epoch": 0.18181818181818182, "percentage": 1.82, "elapsed_time": "0:00:42", "remaining_time": "0:38:01", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 5, "total_steps": 220, "loss": 2.6671, "learning_rate": 1.0000000000000002e-06, "epoch": 0.22727272727272727, "percentage": 2.27, "elapsed_time": "0:00:50", "remaining_time": "0:36:28", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 6, "total_steps": 220, "loss": 2.5147, "learning_rate": 1.2000000000000002e-06, "epoch": 0.2727272727272727, "percentage": 2.73, "elapsed_time": "0:01:00", "remaining_time": "0:35:43", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 7, "total_steps": 220, "loss": 2.5655, "learning_rate": 1.4000000000000001e-06, "epoch": 0.3181818181818182, "percentage": 3.18, "elapsed_time": "0:01:08", "remaining_time": "0:34:47", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 8, "total_steps": 220, "loss": 2.4802, "learning_rate": 1.6000000000000001e-06, "epoch": 0.36363636363636365, "percentage": 3.64, "elapsed_time": "0:01:17", "remaining_time": "0:34:05", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 9, "total_steps": 220, "loss": 2.579, "learning_rate": 1.8000000000000001e-06, "epoch": 0.4090909090909091, "percentage": 4.09, "elapsed_time": "0:01:25", "remaining_time": "0:33:31", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 10, "total_steps": 220, "loss": 2.5608, "learning_rate": 2.0000000000000003e-06, "epoch": 0.45454545454545453, "percentage": 4.55, "elapsed_time": "0:01:34", "remaining_time": "0:33:01", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 11, "total_steps": 220, "loss": 2.433, "learning_rate": 2.2e-06, "epoch": 0.5, "percentage": 5.0, "elapsed_time": "0:01:42", "remaining_time": "0:32:33", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 12, "total_steps": 220, "loss": 2.5093, "learning_rate": 2.4000000000000003e-06, "epoch": 0.5454545454545454, "percentage": 5.45, "elapsed_time": "0:01:51", "remaining_time": "0:32:05", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 13, "total_steps": 220, "loss": 2.5413, "learning_rate": 2.6e-06, "epoch": 0.5909090909090909, "percentage": 5.91, "elapsed_time": "0:01:59", "remaining_time": "0:31:50", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 14, "total_steps": 220, "loss": 2.3515, "learning_rate": 2.8000000000000003e-06, "epoch": 0.6363636363636364, "percentage": 6.36, "elapsed_time": "0:02:08", "remaining_time": "0:31:31", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 15, "total_steps": 220, "loss": 2.3429, "learning_rate": 3e-06, "epoch": 0.6818181818181818, "percentage": 6.82, "elapsed_time": "0:02:18", "remaining_time": "0:31:36", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 16, "total_steps": 220, "loss": 2.1881, "learning_rate": 3.2000000000000003e-06, "epoch": 0.7272727272727273, "percentage": 7.27, "elapsed_time": "0:02:27", "remaining_time": "0:31:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 17, "total_steps": 220, "loss": 2.2334, "learning_rate": 3.4000000000000005e-06, "epoch": 0.7727272727272727, "percentage": 7.73, "elapsed_time": "0:02:35", "remaining_time": "0:30:57", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 18, "total_steps": 220, "loss": 2.2575, "learning_rate": 3.6000000000000003e-06, "epoch": 0.8181818181818182, "percentage": 8.18, "elapsed_time": "0:02:44", "remaining_time": "0:30:41", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 19, "total_steps": 220, "loss": 2.1451, "learning_rate": 3.8000000000000005e-06, "epoch": 0.8636363636363636, "percentage": 8.64, "elapsed_time": "0:02:52", "remaining_time": "0:30:26", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 20, "total_steps": 220, "loss": 2.1156, "learning_rate": 4.000000000000001e-06, "epoch": 0.9090909090909091, "percentage": 9.09, "elapsed_time": "0:03:01", "remaining_time": "0:30:10", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 21, "total_steps": 220, "loss": 2.1072, "learning_rate": 4.2000000000000004e-06, "epoch": 0.9545454545454546, "percentage": 9.55, "elapsed_time": "0:03:09", "remaining_time": "0:29:56", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 22, "total_steps": 220, "loss": 2.1694, "learning_rate": 4.4e-06, "epoch": 1.0, "percentage": 10.0, "elapsed_time": "0:03:17", "remaining_time": "0:29:41", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 23, "total_steps": 220, "loss": 2.0194, "learning_rate": 4.600000000000001e-06, "epoch": 1.0454545454545454, "percentage": 10.45, "elapsed_time": "0:03:26", "remaining_time": "0:29:27", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 24, "total_steps": 220, "loss": 2.0222, "learning_rate": 4.800000000000001e-06, "epoch": 1.0909090909090908, "percentage": 10.91, "elapsed_time": "0:03:34", "remaining_time": "0:29:12", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 25, "total_steps": 220, "loss": 2.1193, "learning_rate": 5e-06, "epoch": 1.1363636363636362, "percentage": 11.36, "elapsed_time": "0:03:43", "remaining_time": "0:29:00", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 26, "total_steps": 220, "loss": 1.998, "learning_rate": 5.2e-06, "epoch": 1.1818181818181819, "percentage": 11.82, "elapsed_time": "0:03:51", "remaining_time": "0:28:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 27, "total_steps": 220, "loss": 2.0051, "learning_rate": 5.400000000000001e-06, "epoch": 1.2272727272727273, "percentage": 12.27, "elapsed_time": "0:03:59", "remaining_time": "0:28:34", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 28, "total_steps": 220, "loss": 1.9324, "learning_rate": 5.600000000000001e-06, "epoch": 1.2727272727272727, "percentage": 12.73, "elapsed_time": "0:04:08", "remaining_time": "0:28:24", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 29, "total_steps": 220, "loss": 2.0088, "learning_rate": 5.8e-06, "epoch": 1.3181818181818181, "percentage": 13.18, "elapsed_time": "0:04:17", "remaining_time": "0:28:14", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 30, "total_steps": 220, "loss": 2.0523, "learning_rate": 6e-06, "epoch": 1.3636363636363638, "percentage": 13.64, "elapsed_time": "0:04:25", "remaining_time": "0:28:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 31, "total_steps": 220, "loss": 1.9473, "learning_rate": 6.200000000000001e-06, "epoch": 1.4090909090909092, "percentage": 14.09, "elapsed_time": "0:04:34", "remaining_time": "0:27:53", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 32, "total_steps": 220, "loss": 1.8585, "learning_rate": 6.4000000000000006e-06, "epoch": 1.4545454545454546, "percentage": 14.55, "elapsed_time": "0:04:43", "remaining_time": "0:27:43", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 33, "total_steps": 220, "loss": 1.9325, "learning_rate": 6.600000000000001e-06, "epoch": 1.5, "percentage": 15.0, "elapsed_time": "0:04:51", "remaining_time": "0:27:31", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 34, "total_steps": 220, "loss": 1.8983, "learning_rate": 6.800000000000001e-06, "epoch": 1.5454545454545454, "percentage": 15.45, "elapsed_time": "0:04:59", "remaining_time": "0:27:19", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 35, "total_steps": 220, "loss": 1.7547, "learning_rate": 7e-06, "epoch": 1.5909090909090908, "percentage": 15.91, "elapsed_time": "0:05:08", "remaining_time": "0:27:10", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 36, "total_steps": 220, "loss": 1.8169, "learning_rate": 7.2000000000000005e-06, "epoch": 1.6363636363636362, "percentage": 16.36, "elapsed_time": "0:05:16", "remaining_time": "0:26:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 37, "total_steps": 220, "loss": 1.8036, "learning_rate": 7.4e-06, "epoch": 1.6818181818181817, "percentage": 16.82, "elapsed_time": "0:05:25", "remaining_time": "0:26:47", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 38, "total_steps": 220, "loss": 1.7398, "learning_rate": 7.600000000000001e-06, "epoch": 1.7272727272727273, "percentage": 17.27, "elapsed_time": "0:05:33", "remaining_time": "0:26:38", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 39, "total_steps": 220, "loss": 1.8263, "learning_rate": 7.800000000000002e-06, "epoch": 1.7727272727272727, "percentage": 17.73, "elapsed_time": "0:05:42", "remaining_time": "0:26:28", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 40, "total_steps": 220, "loss": 1.7271, "learning_rate": 8.000000000000001e-06, "epoch": 1.8181818181818183, "percentage": 18.18, "elapsed_time": "0:05:50", "remaining_time": "0:26:18", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 41, "total_steps": 220, "loss": 1.7655, "learning_rate": 8.2e-06, "epoch": 1.8636363636363638, "percentage": 18.64, "elapsed_time": "0:05:58", "remaining_time": "0:26:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 42, "total_steps": 220, "loss": 1.8138, "learning_rate": 8.400000000000001e-06, "epoch": 1.9090909090909092, "percentage": 19.09, "elapsed_time": "0:06:07", "remaining_time": "0:25:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 43, "total_steps": 220, "loss": 1.7645, "learning_rate": 8.6e-06, "epoch": 1.9545454545454546, "percentage": 19.55, "elapsed_time": "0:06:15", "remaining_time": "0:25:47", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 44, "total_steps": 220, "loss": 1.7034, "learning_rate": 8.8e-06, "epoch": 2.0, "percentage": 20.0, "elapsed_time": "0:06:23", "remaining_time": "0:25:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 45, "total_steps": 220, "loss": 1.6356, "learning_rate": 9e-06, "epoch": 2.0454545454545454, "percentage": 20.45, "elapsed_time": "0:06:32", "remaining_time": "0:25:26", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 46, "total_steps": 220, "loss": 1.6274, "learning_rate": 9.200000000000002e-06, "epoch": 2.090909090909091, "percentage": 20.91, "elapsed_time": "0:06:40", "remaining_time": "0:25:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 47, "total_steps": 220, "loss": 1.6118, "learning_rate": 9.4e-06, "epoch": 2.1363636363636362, "percentage": 21.36, "elapsed_time": "0:06:49", "remaining_time": "0:25:06", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 48, "total_steps": 220, "loss": 1.6379, "learning_rate": 9.600000000000001e-06, "epoch": 2.1818181818181817, "percentage": 21.82, "elapsed_time": "0:06:57", "remaining_time": "0:24:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 49, "total_steps": 220, "loss": 1.6267, "learning_rate": 9.800000000000001e-06, "epoch": 2.227272727272727, "percentage": 22.27, "elapsed_time": "0:07:05", "remaining_time": "0:24:45", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 50, "total_steps": 220, "loss": 1.5023, "learning_rate": 1e-05, "epoch": 2.2727272727272725, "percentage": 22.73, "elapsed_time": "0:07:14", "remaining_time": "0:24:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 51, "total_steps": 220, "loss": 1.4344, "learning_rate": 9.999146252290264e-06, "epoch": 2.3181818181818183, "percentage": 23.18, "elapsed_time": "0:07:22", "remaining_time": "0:24:25", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 52, "total_steps": 220, "loss": 1.5547, "learning_rate": 9.996585300715117e-06, "epoch": 2.3636363636363638, "percentage": 23.64, "elapsed_time": "0:07:30", "remaining_time": "0:24:15", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 53, "total_steps": 220, "loss": 1.5188, "learning_rate": 9.992318019837171e-06, "epoch": 2.409090909090909, "percentage": 24.09, "elapsed_time": "0:07:38", "remaining_time": "0:24:05", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 54, "total_steps": 220, "loss": 1.4996, "learning_rate": 9.98634586692894e-06, "epoch": 2.4545454545454546, "percentage": 24.55, "elapsed_time": "0:07:47", "remaining_time": "0:23:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 55, "total_steps": 220, "loss": 1.4596, "learning_rate": 9.978670881475173e-06, "epoch": 2.5, "percentage": 25.0, "elapsed_time": "0:07:55", "remaining_time": "0:23:45", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 56, "total_steps": 220, "loss": 1.5426, "learning_rate": 9.96929568447637e-06, "epoch": 2.5454545454545454, "percentage": 25.45, "elapsed_time": "0:08:03", "remaining_time": "0:23:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 57, "total_steps": 220, "loss": 1.545, "learning_rate": 9.958223477553715e-06, "epoch": 2.590909090909091, "percentage": 25.91, "elapsed_time": "0:08:11", "remaining_time": "0:23:26", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 58, "total_steps": 220, "loss": 1.4553, "learning_rate": 9.945458041855732e-06, "epoch": 2.6363636363636362, "percentage": 26.36, "elapsed_time": "0:08:20", "remaining_time": "0:23:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 59, "total_steps": 220, "loss": 1.4848, "learning_rate": 9.931003736767013e-06, "epoch": 2.6818181818181817, "percentage": 26.82, "elapsed_time": "0:08:28", "remaining_time": "0:23:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 60, "total_steps": 220, "loss": 1.5095, "learning_rate": 9.91486549841951e-06, "epoch": 2.7272727272727275, "percentage": 27.27, "elapsed_time": "0:08:36", "remaining_time": "0:22:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 61, "total_steps": 220, "loss": 1.5803, "learning_rate": 9.89704883800683e-06, "epoch": 2.7727272727272725, "percentage": 27.73, "elapsed_time": "0:08:45", "remaining_time": "0:22:48", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 62, "total_steps": 220, "loss": 1.507, "learning_rate": 9.877559839902185e-06, "epoch": 2.8181818181818183, "percentage": 28.18, "elapsed_time": "0:08:53", "remaining_time": "0:22:38", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 63, "total_steps": 220, "loss": 1.5185, "learning_rate": 9.85640515958057e-06, "epoch": 2.8636363636363638, "percentage": 28.64, "elapsed_time": "0:09:01", "remaining_time": "0:22:29", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 64, "total_steps": 220, "loss": 1.4085, "learning_rate": 9.833592021345938e-06, "epoch": 2.909090909090909, "percentage": 29.09, "elapsed_time": "0:09:10", "remaining_time": "0:22:20", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 65, "total_steps": 220, "loss": 1.4969, "learning_rate": 9.809128215864096e-06, "epoch": 2.9545454545454546, "percentage": 29.55, "elapsed_time": "0:09:18", "remaining_time": "0:22:11", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 66, "total_steps": 220, "loss": 1.4385, "learning_rate": 9.783022097502204e-06, "epoch": 3.0, "percentage": 30.0, "elapsed_time": "0:09:26", "remaining_time": "0:22:01", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 67, "total_steps": 220, "loss": 1.2442, "learning_rate": 9.755282581475769e-06, "epoch": 3.0454545454545454, "percentage": 30.45, "elapsed_time": "0:09:35", "remaining_time": "0:21:53", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 68, "total_steps": 220, "loss": 1.2198, "learning_rate": 9.7259191408041e-06, "epoch": 3.090909090909091, "percentage": 30.91, "elapsed_time": "0:09:43", "remaining_time": "0:21:44", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 69, "total_steps": 220, "loss": 1.2244, "learning_rate": 9.694941803075285e-06, "epoch": 3.1363636363636362, "percentage": 31.36, "elapsed_time": "0:09:51", "remaining_time": "0:21:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 70, "total_steps": 220, "loss": 1.1815, "learning_rate": 9.66236114702178e-06, "epoch": 3.1818181818181817, "percentage": 31.82, "elapsed_time": "0:10:00", "remaining_time": "0:21:25", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 71, "total_steps": 220, "loss": 1.218, "learning_rate": 9.628188298907782e-06, "epoch": 3.227272727272727, "percentage": 32.27, "elapsed_time": "0:10:08", "remaining_time": "0:21:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 72, "total_steps": 220, "loss": 1.1746, "learning_rate": 9.592434928729617e-06, "epoch": 3.2727272727272725, "percentage": 32.73, "elapsed_time": "0:10:16", "remaining_time": "0:21:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 73, "total_steps": 220, "loss": 1.1944, "learning_rate": 9.555113246230443e-06, "epoch": 3.3181818181818183, "percentage": 33.18, "elapsed_time": "0:10:25", "remaining_time": "0:20:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 74, "total_steps": 220, "loss": 1.2331, "learning_rate": 9.516235996730645e-06, "epoch": 3.3636363636363638, "percentage": 33.64, "elapsed_time": "0:10:33", "remaining_time": "0:20:49", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 75, "total_steps": 220, "loss": 1.1874, "learning_rate": 9.475816456775313e-06, "epoch": 3.409090909090909, "percentage": 34.09, "elapsed_time": "0:10:42", "remaining_time": "0:20:42", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 76, "total_steps": 220, "loss": 1.1734, "learning_rate": 9.43386842960031e-06, "epoch": 3.4545454545454546, "percentage": 34.55, "elapsed_time": "0:10:51", "remaining_time": "0:20:34", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 77, "total_steps": 220, "loss": 1.1196, "learning_rate": 9.39040624041849e-06, "epoch": 3.5, "percentage": 35.0, "elapsed_time": "0:11:00", "remaining_time": "0:20:26", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 78, "total_steps": 220, "loss": 1.1794, "learning_rate": 9.345444731527642e-06, "epoch": 3.5454545454545454, "percentage": 35.45, "elapsed_time": "0:11:08", "remaining_time": "0:20:17", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 79, "total_steps": 220, "loss": 1.1617, "learning_rate": 9.298999257241862e-06, "epoch": 3.590909090909091, "percentage": 35.91, "elapsed_time": "0:11:16", "remaining_time": "0:20:08", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 80, "total_steps": 220, "loss": 1.1825, "learning_rate": 9.251085678648072e-06, "epoch": 3.6363636363636362, "percentage": 36.36, "elapsed_time": "0:11:24", "remaining_time": "0:19:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 81, "total_steps": 220, "loss": 1.1648, "learning_rate": 9.201720358189464e-06, "epoch": 3.6818181818181817, "percentage": 36.82, "elapsed_time": "0:11:33", "remaining_time": "0:19:49", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 82, "total_steps": 220, "loss": 1.1517, "learning_rate": 9.150920154077753e-06, "epoch": 3.7272727272727275, "percentage": 37.27, "elapsed_time": "0:11:41", "remaining_time": "0:19:41", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 83, "total_steps": 220, "loss": 1.1556, "learning_rate": 9.098702414536107e-06, "epoch": 3.7727272727272725, "percentage": 37.73, "elapsed_time": "0:11:50", "remaining_time": "0:19:32", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 84, "total_steps": 220, "loss": 1.1113, "learning_rate": 9.045084971874738e-06, "epoch": 3.8181818181818183, "percentage": 38.18, "elapsed_time": "0:11:58", "remaining_time": "0:19:23", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 85, "total_steps": 220, "loss": 1.1526, "learning_rate": 8.990086136401199e-06, "epoch": 3.8636363636363638, "percentage": 38.64, "elapsed_time": "0:12:06", "remaining_time": "0:19:14", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 86, "total_steps": 220, "loss": 1.1591, "learning_rate": 8.933724690167417e-06, "epoch": 3.909090909090909, "percentage": 39.09, "elapsed_time": "0:12:14", "remaining_time": "0:19:05", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 87, "total_steps": 220, "loss": 1.1127, "learning_rate": 8.87601988055565e-06, "epoch": 3.9545454545454546, "percentage": 39.55, "elapsed_time": "0:12:23", "remaining_time": "0:18:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 88, "total_steps": 220, "loss": 1.1371, "learning_rate": 8.816991413705515e-06, "epoch": 4.0, "percentage": 40.0, "elapsed_time": "0:12:30", "remaining_time": "0:18:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 89, "total_steps": 220, "loss": 0.966, "learning_rate": 8.756659447784367e-06, "epoch": 4.045454545454546, "percentage": 40.45, "elapsed_time": "0:12:39", "remaining_time": "0:18:37", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 90, "total_steps": 220, "loss": 0.9361, "learning_rate": 8.695044586103297e-06, "epoch": 4.090909090909091, "percentage": 40.91, "elapsed_time": "0:12:47", "remaining_time": "0:18:28", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 91, "total_steps": 220, "loss": 0.8836, "learning_rate": 8.632167870081122e-06, "epoch": 4.136363636363637, "percentage": 41.36, "elapsed_time": "0:12:55", "remaining_time": "0:18:19", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 92, "total_steps": 220, "loss": 0.8812, "learning_rate": 8.568050772058763e-06, "epoch": 4.181818181818182, "percentage": 41.82, "elapsed_time": "0:13:04", "remaining_time": "0:18:10", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 93, "total_steps": 220, "loss": 0.8142, "learning_rate": 8.502715187966455e-06, "epoch": 4.2272727272727275, "percentage": 42.27, "elapsed_time": "0:13:12", "remaining_time": "0:18:01", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 94, "total_steps": 220, "loss": 0.8877, "learning_rate": 8.436183429846314e-06, "epoch": 4.2727272727272725, "percentage": 42.73, "elapsed_time": "0:13:20", "remaining_time": "0:17:53", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 95, "total_steps": 220, "loss": 0.8551, "learning_rate": 8.368478218232787e-06, "epoch": 4.318181818181818, "percentage": 43.18, "elapsed_time": "0:13:29", "remaining_time": "0:17:45", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 96, "total_steps": 220, "loss": 0.8286, "learning_rate": 8.299622674393615e-06, "epoch": 4.363636363636363, "percentage": 43.64, "elapsed_time": "0:13:37", "remaining_time": "0:17:36", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 97, "total_steps": 220, "loss": 0.8311, "learning_rate": 8.229640312433938e-06, "epoch": 4.409090909090909, "percentage": 44.09, "elapsed_time": "0:13:46", "remaining_time": "0:17:28", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 98, "total_steps": 220, "loss": 0.8179, "learning_rate": 8.158555031266255e-06, "epoch": 4.454545454545454, "percentage": 44.55, "elapsed_time": "0:13:55", "remaining_time": "0:17:19", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 99, "total_steps": 220, "loss": 0.8209, "learning_rate": 8.086391106448965e-06, "epoch": 4.5, "percentage": 45.0, "elapsed_time": "0:14:06", "remaining_time": "0:17:14", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 100, "total_steps": 220, "loss": 0.8364, "learning_rate": 8.013173181896283e-06, "epoch": 4.545454545454545, "percentage": 45.45, "elapsed_time": "0:14:15", "remaining_time": "0:17:06", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 101, "total_steps": 220, "loss": 0.7655, "learning_rate": 7.938926261462366e-06, "epoch": 4.590909090909091, "percentage": 45.91, "elapsed_time": "0:14:43", "remaining_time": "0:17:20", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 102, "total_steps": 220, "loss": 0.8741, "learning_rate": 7.863675700402527e-06, "epoch": 4.636363636363637, "percentage": 46.36, "elapsed_time": "0:14:53", "remaining_time": "0:17:13", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 103, "total_steps": 220, "loss": 0.7883, "learning_rate": 7.787447196714428e-06, "epoch": 4.681818181818182, "percentage": 46.82, "elapsed_time": "0:15:01", "remaining_time": "0:17:04", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 104, "total_steps": 220, "loss": 0.8025, "learning_rate": 7.710266782362248e-06, "epoch": 4.7272727272727275, "percentage": 47.27, "elapsed_time": "0:15:10", "remaining_time": "0:16:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 105, "total_steps": 220, "loss": 0.8299, "learning_rate": 7.63216081438678e-06, "epoch": 4.7727272727272725, "percentage": 47.73, "elapsed_time": "0:15:18", "remaining_time": "0:16:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 106, "total_steps": 220, "loss": 0.8515, "learning_rate": 7.553155965904535e-06, "epoch": 4.818181818181818, "percentage": 48.18, "elapsed_time": "0:15:27", "remaining_time": "0:16:37", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 107, "total_steps": 220, "loss": 0.791, "learning_rate": 7.473279216998896e-06, "epoch": 4.863636363636363, "percentage": 48.64, "elapsed_time": "0:15:35", "remaining_time": "0:16:27", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 108, "total_steps": 220, "loss": 0.7944, "learning_rate": 7.392557845506433e-06, "epoch": 4.909090909090909, "percentage": 49.09, "elapsed_time": "0:15:43", "remaining_time": "0:16:18", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 109, "total_steps": 220, "loss": 0.8151, "learning_rate": 7.311019417701567e-06, "epoch": 4.954545454545455, "percentage": 49.55, "elapsed_time": "0:15:51", "remaining_time": "0:16:09", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 110, "total_steps": 220, "loss": 0.794, "learning_rate": 7.2286917788826926e-06, "epoch": 5.0, "percentage": 50.0, "elapsed_time": "0:16:00", "remaining_time": "0:16:00", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 111, "total_steps": 220, "loss": 0.5533, "learning_rate": 7.145603043863045e-06, "epoch": 5.045454545454546, "percentage": 50.45, "elapsed_time": "0:16:09", "remaining_time": "0:15:52", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 112, "total_steps": 220, "loss": 0.6281, "learning_rate": 7.061781587369518e-06, "epoch": 5.090909090909091, "percentage": 50.91, "elapsed_time": "0:16:18", "remaining_time": "0:15:43", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 113, "total_steps": 220, "loss": 0.5547, "learning_rate": 6.977256034352713e-06, "epoch": 5.136363636363637, "percentage": 51.36, "elapsed_time": "0:16:26", "remaining_time": "0:15:34", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 114, "total_steps": 220, "loss": 0.6596, "learning_rate": 6.892055250211552e-06, "epoch": 5.181818181818182, "percentage": 51.82, "elapsed_time": "0:16:35", "remaining_time": "0:15:25", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 115, "total_steps": 220, "loss": 0.5801, "learning_rate": 6.806208330935766e-06, "epoch": 5.2272727272727275, "percentage": 52.27, "elapsed_time": "0:16:43", "remaining_time": "0:15:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 116, "total_steps": 220, "loss": 0.6149, "learning_rate": 6.719744593169642e-06, "epoch": 5.2727272727272725, "percentage": 52.73, "elapsed_time": "0:16:52", "remaining_time": "0:15:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 117, "total_steps": 220, "loss": 0.5546, "learning_rate": 6.6326935642004165e-06, "epoch": 5.318181818181818, "percentage": 53.18, "elapsed_time": "0:17:01", "remaining_time": "0:14:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 118, "total_steps": 220, "loss": 0.5663, "learning_rate": 6.545084971874738e-06, "epoch": 5.363636363636363, "percentage": 53.64, "elapsed_time": "0:17:09", "remaining_time": "0:14:50", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 119, "total_steps": 220, "loss": 0.5264, "learning_rate": 6.456948734446624e-06, "epoch": 5.409090909090909, "percentage": 54.09, "elapsed_time": "0:17:17", "remaining_time": "0:14:40", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 120, "total_steps": 220, "loss": 0.546, "learning_rate": 6.368314950360416e-06, "epoch": 5.454545454545454, "percentage": 54.55, "elapsed_time": "0:17:26", "remaining_time": "0:14:31", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 121, "total_steps": 220, "loss": 0.5353, "learning_rate": 6.279213887972179e-06, "epoch": 5.5, "percentage": 55.0, "elapsed_time": "0:17:34", "remaining_time": "0:14:23", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 122, "total_steps": 220, "loss": 0.5532, "learning_rate": 6.189675975213094e-06, "epoch": 5.545454545454545, "percentage": 55.45, "elapsed_time": "0:17:43", "remaining_time": "0:14:13", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 123, "total_steps": 220, "loss": 0.5811, "learning_rate": 6.099731789198344e-06, "epoch": 5.590909090909091, "percentage": 55.91, "elapsed_time": "0:17:51", "remaining_time": "0:14:04", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 124, "total_steps": 220, "loss": 0.5323, "learning_rate": 6.009412045785051e-06, "epoch": 5.636363636363637, "percentage": 56.36, "elapsed_time": "0:17:59", "remaining_time": "0:13:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 125, "total_steps": 220, "loss": 0.4695, "learning_rate": 5.918747589082853e-06, "epoch": 5.681818181818182, "percentage": 56.82, "elapsed_time": "0:18:08", "remaining_time": "0:13:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 126, "total_steps": 220, "loss": 0.513, "learning_rate": 5.82776938092065e-06, "epoch": 5.7272727272727275, "percentage": 57.27, "elapsed_time": "0:18:16", "remaining_time": "0:13:38", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 127, "total_steps": 220, "loss": 0.5675, "learning_rate": 5.736508490273189e-06, "epoch": 5.7727272727272725, "percentage": 57.73, "elapsed_time": "0:18:24", "remaining_time": "0:13:29", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 128, "total_steps": 220, "loss": 0.4782, "learning_rate": 5.644996082651018e-06, "epoch": 5.818181818181818, "percentage": 58.18, "elapsed_time": "0:18:33", "remaining_time": "0:13:20", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 129, "total_steps": 220, "loss": 0.5491, "learning_rate": 5.553263409457504e-06, "epoch": 5.863636363636363, "percentage": 58.64, "elapsed_time": "0:18:41", "remaining_time": "0:13:11", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 130, "total_steps": 220, "loss": 0.5364, "learning_rate": 5.46134179731651e-06, "epoch": 5.909090909090909, "percentage": 59.09, "elapsed_time": "0:18:50", "remaining_time": "0:13:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 131, "total_steps": 220, "loss": 0.5165, "learning_rate": 5.36926263737437e-06, "epoch": 5.954545454545455, "percentage": 59.55, "elapsed_time": "0:18:58", "remaining_time": "0:12:53", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 132, "total_steps": 220, "loss": 0.4634, "learning_rate": 5.27705737457985e-06, "epoch": 6.0, "percentage": 60.0, "elapsed_time": "0:19:06", "remaining_time": "0:12:44", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 133, "total_steps": 220, "loss": 0.3672, "learning_rate": 5.184757496945726e-06, "epoch": 6.045454545454546, "percentage": 60.45, "elapsed_time": "0:19:15", "remaining_time": "0:12:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 134, "total_steps": 220, "loss": 0.3422, "learning_rate": 5.09239452479565e-06, "epoch": 6.090909090909091, "percentage": 60.91, "elapsed_time": "0:19:24", "remaining_time": "0:12:27", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 135, "total_steps": 220, "loss": 0.3537, "learning_rate": 5e-06, "epoch": 6.136363636363637, "percentage": 61.36, "elapsed_time": "0:19:33", "remaining_time": "0:12:18", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 136, "total_steps": 220, "loss": 0.3177, "learning_rate": 4.907605475204352e-06, "epoch": 6.181818181818182, "percentage": 61.82, "elapsed_time": "0:19:41", "remaining_time": "0:12:09", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 137, "total_steps": 220, "loss": 0.3183, "learning_rate": 4.815242503054277e-06, "epoch": 6.2272727272727275, "percentage": 62.27, "elapsed_time": "0:19:50", "remaining_time": "0:12:01", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 138, "total_steps": 220, "loss": 0.3546, "learning_rate": 4.7229426254201504e-06, "epoch": 6.2727272727272725, "percentage": 62.73, "elapsed_time": "0:19:59", "remaining_time": "0:11:52", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 139, "total_steps": 220, "loss": 0.3567, "learning_rate": 4.630737362625631e-06, "epoch": 6.318181818181818, "percentage": 63.18, "elapsed_time": "0:20:08", "remaining_time": "0:11:44", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 140, "total_steps": 220, "loss": 0.3418, "learning_rate": 4.53865820268349e-06, "epoch": 6.363636363636363, "percentage": 63.64, "elapsed_time": "0:20:17", "remaining_time": "0:11:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 141, "total_steps": 220, "loss": 0.3212, "learning_rate": 4.446736590542497e-06, "epoch": 6.409090909090909, "percentage": 64.09, "elapsed_time": "0:20:25", "remaining_time": "0:11:26", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 142, "total_steps": 220, "loss": 0.3619, "learning_rate": 4.355003917348985e-06, "epoch": 6.454545454545454, "percentage": 64.55, "elapsed_time": "0:20:33", "remaining_time": "0:11:17", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 143, "total_steps": 220, "loss": 0.3412, "learning_rate": 4.263491509726812e-06, "epoch": 6.5, "percentage": 65.0, "elapsed_time": "0:20:42", "remaining_time": "0:11:08", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 144, "total_steps": 220, "loss": 0.3194, "learning_rate": 4.17223061907935e-06, "epoch": 6.545454545454545, "percentage": 65.45, "elapsed_time": "0:20:50", "remaining_time": "0:10:59", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 145, "total_steps": 220, "loss": 0.3543, "learning_rate": 4.081252410917148e-06, "epoch": 6.590909090909091, "percentage": 65.91, "elapsed_time": "0:20:58", "remaining_time": "0:10:51", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 146, "total_steps": 220, "loss": 0.3825, "learning_rate": 3.99058795421495e-06, "epoch": 6.636363636363637, "percentage": 66.36, "elapsed_time": "0:21:07", "remaining_time": "0:10:42", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 147, "total_steps": 220, "loss": 0.3209, "learning_rate": 3.9002682108016585e-06, "epoch": 6.681818181818182, "percentage": 66.82, "elapsed_time": "0:21:15", "remaining_time": "0:10:33", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 148, "total_steps": 220, "loss": 0.3234, "learning_rate": 3.8103240247869077e-06, "epoch": 6.7272727272727275, "percentage": 67.27, "elapsed_time": "0:21:24", "remaining_time": "0:10:25", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 149, "total_steps": 220, "loss": 0.3375, "learning_rate": 3.720786112027822e-06, "epoch": 6.7727272727272725, "percentage": 67.73, "elapsed_time": "0:21:33", "remaining_time": "0:10:16", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 150, "total_steps": 220, "loss": 0.3617, "learning_rate": 3.6316850496395863e-06, "epoch": 6.818181818181818, "percentage": 68.18, "elapsed_time": "0:21:41", "remaining_time": "0:10:07", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 151, "total_steps": 220, "loss": 0.3353, "learning_rate": 3.5430512655533774e-06, "epoch": 6.863636363636363, "percentage": 68.64, "elapsed_time": "0:21:50", "remaining_time": "0:09:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 152, "total_steps": 220, "loss": 0.4345, "learning_rate": 3.4549150281252635e-06, "epoch": 6.909090909090909, "percentage": 69.09, "elapsed_time": "0:21:59", "remaining_time": "0:09:50", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 153, "total_steps": 220, "loss": 0.3405, "learning_rate": 3.3673064357995844e-06, "epoch": 6.954545454545455, "percentage": 69.55, "elapsed_time": "0:22:08", "remaining_time": "0:09:41", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 154, "total_steps": 220, "loss": 0.3275, "learning_rate": 3.2802554068303595e-06, "epoch": 7.0, "percentage": 70.0, "elapsed_time": "0:22:17", "remaining_time": "0:09:33", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 155, "total_steps": 220, "loss": 0.2393, "learning_rate": 3.1937916690642356e-06, "epoch": 7.045454545454546, "percentage": 70.45, "elapsed_time": "0:22:26", "remaining_time": "0:09:24", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 156, "total_steps": 220, "loss": 0.2316, "learning_rate": 3.107944749788449e-06, "epoch": 7.090909090909091, "percentage": 70.91, "elapsed_time": "0:22:34", "remaining_time": "0:09:15", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 157, "total_steps": 220, "loss": 0.2322, "learning_rate": 3.0227439656472878e-06, "epoch": 7.136363636363637, "percentage": 71.36, "elapsed_time": "0:22:42", "remaining_time": "0:09:06", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 158, "total_steps": 220, "loss": 0.276, "learning_rate": 2.9382184126304834e-06, "epoch": 7.181818181818182, "percentage": 71.82, "elapsed_time": "0:22:51", "remaining_time": "0:08:58", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 159, "total_steps": 220, "loss": 0.2282, "learning_rate": 2.8543969561369556e-06, "epoch": 7.2272727272727275, "percentage": 72.27, "elapsed_time": "0:22:59", "remaining_time": "0:08:49", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 160, "total_steps": 220, "loss": 0.1981, "learning_rate": 2.771308221117309e-06, "epoch": 7.2727272727272725, "percentage": 72.73, "elapsed_time": "0:23:07", "remaining_time": "0:08:40", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 161, "total_steps": 220, "loss": 0.2062, "learning_rate": 2.6889805822984348e-06, "epoch": 7.318181818181818, "percentage": 73.18, "elapsed_time": "0:23:16", "remaining_time": "0:08:31", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 162, "total_steps": 220, "loss": 0.201, "learning_rate": 2.607442154493568e-06, "epoch": 7.363636363636363, "percentage": 73.64, "elapsed_time": "0:23:24", "remaining_time": "0:08:22", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 163, "total_steps": 220, "loss": 0.1979, "learning_rate": 2.526720783001107e-06, "epoch": 7.409090909090909, "percentage": 74.09, "elapsed_time": "0:23:32", "remaining_time": "0:08:14", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 164, "total_steps": 220, "loss": 0.2385, "learning_rate": 2.4468440340954664e-06, "epoch": 7.454545454545454, "percentage": 74.55, "elapsed_time": "0:23:41", "remaining_time": "0:08:05", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 165, "total_steps": 220, "loss": 0.2452, "learning_rate": 2.3678391856132203e-06, "epoch": 7.5, "percentage": 75.0, "elapsed_time": "0:23:50", "remaining_time": "0:07:56", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 166, "total_steps": 220, "loss": 0.2498, "learning_rate": 2.289733217637753e-06, "epoch": 7.545454545454545, "percentage": 75.45, "elapsed_time": "0:23:58", "remaining_time": "0:07:48", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 167, "total_steps": 220, "loss": 0.2384, "learning_rate": 2.2125528032855727e-06, "epoch": 7.590909090909091, "percentage": 75.91, "elapsed_time": "0:24:07", "remaining_time": "0:07:39", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 168, "total_steps": 220, "loss": 0.2382, "learning_rate": 2.136324299597474e-06, "epoch": 7.636363636363637, "percentage": 76.36, "elapsed_time": "0:24:15", "remaining_time": "0:07:30", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 169, "total_steps": 220, "loss": 0.2097, "learning_rate": 2.061073738537635e-06, "epoch": 7.681818181818182, "percentage": 76.82, "elapsed_time": "0:24:24", "remaining_time": "0:07:21", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 170, "total_steps": 220, "loss": 0.259, "learning_rate": 1.9868268181037186e-06, "epoch": 7.7272727272727275, "percentage": 77.27, "elapsed_time": "0:24:32", "remaining_time": "0:07:13", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 171, "total_steps": 220, "loss": 0.2007, "learning_rate": 1.913608893551036e-06, "epoch": 7.7727272727272725, "percentage": 77.73, "elapsed_time": "0:24:41", "remaining_time": "0:07:04", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 172, "total_steps": 220, "loss": 0.2187, "learning_rate": 1.8414449687337467e-06, "epoch": 7.818181818181818, "percentage": 78.18, "elapsed_time": "0:24:52", "remaining_time": "0:06:56", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 173, "total_steps": 220, "loss": 0.2684, "learning_rate": 1.7703596875660645e-06, "epoch": 7.863636363636363, "percentage": 78.64, "elapsed_time": "0:25:01", "remaining_time": "0:06:47", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 174, "total_steps": 220, "loss": 0.2529, "learning_rate": 1.7003773256063882e-06, "epoch": 7.909090909090909, "percentage": 79.09, "elapsed_time": "0:25:09", "remaining_time": "0:06:39", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 175, "total_steps": 220, "loss": 0.2058, "learning_rate": 1.6315217817672142e-06, "epoch": 7.954545454545455, "percentage": 79.55, "elapsed_time": "0:25:17", "remaining_time": "0:06:30", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 176, "total_steps": 220, "loss": 0.2102, "learning_rate": 1.5638165701536866e-06, "epoch": 8.0, "percentage": 80.0, "elapsed_time": "0:25:25", "remaining_time": "0:06:21", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 177, "total_steps": 220, "loss": 0.1886, "learning_rate": 1.4972848120335453e-06, "epoch": 8.045454545454545, "percentage": 80.45, "elapsed_time": "0:25:35", "remaining_time": "0:06:12", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 178, "total_steps": 220, "loss": 0.1575, "learning_rate": 1.4319492279412388e-06, "epoch": 8.090909090909092, "percentage": 80.91, "elapsed_time": "0:25:43", "remaining_time": "0:06:04", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 179, "total_steps": 220, "loss": 0.2066, "learning_rate": 1.3678321299188802e-06, "epoch": 8.136363636363637, "percentage": 81.36, "elapsed_time": "0:25:51", "remaining_time": "0:05:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 180, "total_steps": 220, "loss": 0.1811, "learning_rate": 1.3049554138967052e-06, "epoch": 8.181818181818182, "percentage": 81.82, "elapsed_time": "0:26:00", "remaining_time": "0:05:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 181, "total_steps": 220, "loss": 0.2073, "learning_rate": 1.2433405522156334e-06, "epoch": 8.227272727272727, "percentage": 82.27, "elapsed_time": "0:26:09", "remaining_time": "0:05:38", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 182, "total_steps": 220, "loss": 0.1446, "learning_rate": 1.1830085862944851e-06, "epoch": 8.272727272727273, "percentage": 82.73, "elapsed_time": "0:26:18", "remaining_time": "0:05:29", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 183, "total_steps": 220, "loss": 0.1691, "learning_rate": 1.1239801194443507e-06, "epoch": 8.318181818181818, "percentage": 83.18, "elapsed_time": "0:26:27", "remaining_time": "0:05:20", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 184, "total_steps": 220, "loss": 0.1721, "learning_rate": 1.066275309832584e-06, "epoch": 8.363636363636363, "percentage": 83.64, "elapsed_time": "0:26:37", "remaining_time": "0:05:12", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 185, "total_steps": 220, "loss": 0.1443, "learning_rate": 1.0099138635988026e-06, "epoch": 8.409090909090908, "percentage": 84.09, "elapsed_time": "0:26:45", "remaining_time": "0:05:03", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 186, "total_steps": 220, "loss": 0.1836, "learning_rate": 9.549150281252633e-07, "epoch": 8.454545454545455, "percentage": 84.55, "elapsed_time": "0:26:54", "remaining_time": "0:04:55", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 187, "total_steps": 220, "loss": 0.1453, "learning_rate": 9.01297585463895e-07, "epoch": 8.5, "percentage": 85.0, "elapsed_time": "0:27:02", "remaining_time": "0:04:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 188, "total_steps": 220, "loss": 0.1163, "learning_rate": 8.490798459222477e-07, "epoch": 8.545454545454545, "percentage": 85.45, "elapsed_time": "0:27:12", "remaining_time": "0:04:37", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 189, "total_steps": 220, "loss": 0.1794, "learning_rate": 7.98279641810537e-07, "epoch": 8.590909090909092, "percentage": 85.91, "elapsed_time": "0:27:20", "remaining_time": "0:04:29", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 190, "total_steps": 220, "loss": 0.1675, "learning_rate": 7.489143213519301e-07, "epoch": 8.636363636363637, "percentage": 86.36, "elapsed_time": "0:27:30", "remaining_time": "0:04:20", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 191, "total_steps": 220, "loss": 0.1805, "learning_rate": 7.010007427581378e-07, "epoch": 8.681818181818182, "percentage": 86.82, "elapsed_time": "0:27:38", "remaining_time": "0:04:11", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 192, "total_steps": 220, "loss": 0.1715, "learning_rate": 6.545552684723583e-07, "epoch": 8.727272727272727, "percentage": 87.27, "elapsed_time": "0:27:46", "remaining_time": "0:04:03", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 193, "total_steps": 220, "loss": 0.1899, "learning_rate": 6.095937595815104e-07, "epoch": 8.772727272727273, "percentage": 87.73, "elapsed_time": "0:27:55", "remaining_time": "0:03:54", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 194, "total_steps": 220, "loss": 0.1388, "learning_rate": 5.661315703996905e-07, "epoch": 8.818181818181818, "percentage": 88.18, "elapsed_time": "0:28:03", "remaining_time": "0:03:45", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 195, "total_steps": 220, "loss": 0.185, "learning_rate": 5.241835432246888e-07, "epoch": 8.863636363636363, "percentage": 88.64, "elapsed_time": "0:28:11", "remaining_time": "0:03:36", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 196, "total_steps": 220, "loss": 0.153, "learning_rate": 4.837640032693558e-07, "epoch": 8.909090909090908, "percentage": 89.09, "elapsed_time": "0:28:20", "remaining_time": "0:03:28", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 197, "total_steps": 220, "loss": 0.1593, "learning_rate": 4.448867537695578e-07, "epoch": 8.954545454545455, "percentage": 89.55, "elapsed_time": "0:28:28", "remaining_time": "0:03:19", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 198, "total_steps": 220, "loss": 0.1616, "learning_rate": 4.0756507127038494e-07, "epoch": 9.0, "percentage": 90.0, "elapsed_time": "0:28:36", "remaining_time": "0:03:10", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 199, "total_steps": 220, "loss": 0.144, "learning_rate": 3.71811701092219e-07, "epoch": 9.045454545454545, "percentage": 90.45, "elapsed_time": "0:28:44", "remaining_time": "0:03:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 200, "total_steps": 220, "loss": 0.1366, "learning_rate": 3.3763885297822153e-07, "epoch": 9.090909090909092, "percentage": 90.91, "elapsed_time": "0:28:53", "remaining_time": "0:02:53", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 201, "total_steps": 220, "loss": 0.1551, "learning_rate": 3.0505819692471797e-07, "epoch": 9.136363636363637, "percentage": 91.36, "elapsed_time": "0:29:20", "remaining_time": "0:02:46", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 202, "total_steps": 220, "loss": 0.1379, "learning_rate": 2.7408085919590265e-07, "epoch": 9.181818181818182, "percentage": 91.82, "elapsed_time": "0:29:30", "remaining_time": "0:02:37", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 203, "total_steps": 220, "loss": 0.1698, "learning_rate": 2.447174185242324e-07, "epoch": 9.227272727272727, "percentage": 92.27, "elapsed_time": "0:29:40", "remaining_time": "0:02:29", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 204, "total_steps": 220, "loss": 0.1525, "learning_rate": 2.1697790249779638e-07, "epoch": 9.272727272727273, "percentage": 92.73, "elapsed_time": "0:29:49", "remaining_time": "0:02:20", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 205, "total_steps": 220, "loss": 0.164, "learning_rate": 1.908717841359048e-07, "epoch": 9.318181818181818, "percentage": 93.18, "elapsed_time": "0:29:57", "remaining_time": "0:02:11", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 206, "total_steps": 220, "loss": 0.1904, "learning_rate": 1.664079786540629e-07, "epoch": 9.363636363636363, "percentage": 93.64, "elapsed_time": "0:30:06", "remaining_time": "0:02:02", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 207, "total_steps": 220, "loss": 0.1215, "learning_rate": 1.435948404194304e-07, "epoch": 9.409090909090908, "percentage": 94.09, "elapsed_time": "0:30:14", "remaining_time": "0:01:53", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 208, "total_steps": 220, "loss": 0.1679, "learning_rate": 1.22440160097817e-07, "epoch": 9.454545454545455, "percentage": 94.55, "elapsed_time": "0:30:23", "remaining_time": "0:01:45", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 209, "total_steps": 220, "loss": 0.1378, "learning_rate": 1.0295116199317057e-07, "epoch": 9.5, "percentage": 95.0, "elapsed_time": "0:30:32", "remaining_time": "0:01:36", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 210, "total_steps": 220, "loss": 0.1411, "learning_rate": 8.513450158049109e-08, "epoch": 9.545454545454545, "percentage": 95.45, "elapsed_time": "0:30:40", "remaining_time": "0:01:27", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 211, "total_steps": 220, "loss": 0.1329, "learning_rate": 6.899626323298714e-08, "epoch": 9.590909090909092, "percentage": 95.91, "elapsed_time": "0:30:48", "remaining_time": "0:01:18", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 212, "total_steps": 220, "loss": 0.1097, "learning_rate": 5.454195814427021e-08, "epoch": 9.636363636363637, "percentage": 96.36, "elapsed_time": "0:30:57", "remaining_time": "0:01:10", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 213, "total_steps": 220, "loss": 0.1913, "learning_rate": 4.177652244628627e-08, "epoch": 9.681818181818182, "percentage": 96.82, "elapsed_time": "0:31:05", "remaining_time": "0:01:01", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 214, "total_steps": 220, "loss": 0.1388, "learning_rate": 3.0704315523631956e-08, "epoch": 9.727272727272727, "percentage": 97.27, "elapsed_time": "0:31:14", "remaining_time": "0:00:52", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 215, "total_steps": 220, "loss": 0.1091, "learning_rate": 2.1329118524827662e-08, "epoch": 9.772727272727273, "percentage": 97.73, "elapsed_time": "0:31:23", "remaining_time": "0:00:43", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 216, "total_steps": 220, "loss": 0.1112, "learning_rate": 1.3654133071059894e-08, "epoch": 9.818181818181818, "percentage": 98.18, "elapsed_time": "0:31:31", "remaining_time": "0:00:35", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 217, "total_steps": 220, "loss": 0.1306, "learning_rate": 7.681980162830283e-09, "epoch": 9.863636363636363, "percentage": 98.64, "elapsed_time": "0:31:42", "remaining_time": "0:00:26", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 218, "total_steps": 220, "loss": 0.1584, "learning_rate": 3.41469928488547e-09, "epoch": 9.909090909090908, "percentage": 99.09, "elapsed_time": "0:31:52", "remaining_time": "0:00:17", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 219, "total_steps": 220, "loss": 0.1243, "learning_rate": 8.537477097364522e-10, "epoch": 9.954545454545455, "percentage": 99.55, "elapsed_time": "0:32:01", "remaining_time": "0:00:08", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 220, "total_steps": 220, "loss": 0.1587, "learning_rate": 0.0, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "0:32:11", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} | |
| {"current_steps": 220, "total_steps": 220, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "0:32:11", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0} | |