Jeckmu's picture
Upload folder using huggingface_hub
fea19af verified
{"current_steps": 5, "total_steps": 105, "loss": 0.4843, "lr": 4.972077065562821e-05, "epoch": 0.1413427561837456, "percentage": 4.76, "elapsed_time": "0:03:26", "remaining_time": "1:08:55", "throughput": 432.13, "total_tokens": 89360}
{"current_steps": 10, "total_steps": 105, "loss": 0.271, "lr": 4.888932014465352e-05, "epoch": 0.2826855123674912, "percentage": 9.52, "elapsed_time": "0:06:35", "remaining_time": "1:02:40", "throughput": 438.72, "total_tokens": 173680}
{"current_steps": 15, "total_steps": 105, "loss": 0.3194, "lr": 4.752422169756048e-05, "epoch": 0.42402826855123676, "percentage": 14.29, "elapsed_time": "0:09:40", "remaining_time": "0:58:02", "throughput": 441.57, "total_tokens": 256320}
{"current_steps": 20, "total_steps": 105, "loss": 0.2881, "lr": 4.5655969357899874e-05, "epoch": 0.5653710247349824, "percentage": 19.05, "elapsed_time": "0:13:21", "remaining_time": "0:56:44", "throughput": 441.98, "total_tokens": 354080}
{"current_steps": 25, "total_steps": 105, "loss": 0.2433, "lr": 4.332629679574566e-05, "epoch": 0.7067137809187279, "percentage": 23.81, "elapsed_time": "0:16:45", "remaining_time": "0:53:36", "throughput": 442.81, "total_tokens": 445120}
{"current_steps": 30, "total_steps": 105, "loss": 0.1921, "lr": 4.058724504646834e-05, "epoch": 0.8480565371024735, "percentage": 28.57, "elapsed_time": "0:20:09", "remaining_time": "0:50:23", "throughput": 443.39, "total_tokens": 536160}
{"current_steps": 35, "total_steps": 105, "loss": 0.1475, "lr": 3.7500000000000003e-05, "epoch": 0.9893992932862191, "percentage": 33.33, "elapsed_time": "0:23:25", "remaining_time": "0:46:50", "throughput": 442.72, "total_tokens": 622160}
{"current_steps": 40, "total_steps": 105, "loss": 0.1183, "lr": 3.413352560915988e-05, "epoch": 1.1130742049469964, "percentage": 38.1, "elapsed_time": "0:26:26", "remaining_time": "0:42:58", "throughput": 443.07, "total_tokens": 702992}
{"current_steps": 45, "total_steps": 105, "loss": 0.0833, "lr": 3.056302334890786e-05, "epoch": 1.254416961130742, "percentage": 42.86, "elapsed_time": "0:29:54", "remaining_time": "0:39:52", "throughput": 443.43, "total_tokens": 795712}
{"current_steps": 50, "total_steps": 105, "loss": 0.1549, "lr": 2.686825233966061e-05, "epoch": 1.3957597173144876, "percentage": 47.62, "elapsed_time": "0:33:10", "remaining_time": "0:36:29", "throughput": 442.2, "total_tokens": 880032}
{"current_steps": 55, "total_steps": 105, "loss": 0.1048, "lr": 2.3131747660339394e-05, "epoch": 1.5371024734982333, "percentage": 52.38, "elapsed_time": "0:36:32", "remaining_time": "0:33:13", "throughput": 442.17, "total_tokens": 969392}
{"current_steps": 60, "total_steps": 105, "loss": 0.1268, "lr": 1.9436976651092144e-05, "epoch": 1.6784452296819787, "percentage": 57.14, "elapsed_time": "0:40:00", "remaining_time": "0:30:00", "throughput": 441.09, "total_tokens": 1058752}
{"current_steps": 65, "total_steps": 105, "loss": 0.0301, "lr": 1.5866474390840125e-05, "epoch": 1.8197879858657244, "percentage": 61.9, "elapsed_time": "0:43:08", "remaining_time": "0:26:32", "throughput": 441.67, "total_tokens": 1143072}
{"current_steps": 70, "total_steps": 105, "loss": 0.0827, "lr": 1.2500000000000006e-05, "epoch": 1.96113074204947, "percentage": 66.67, "elapsed_time": "0:46:31", "remaining_time": "0:23:15", "throughput": 442.04, "total_tokens": 1234112}
{"current_steps": 75, "total_steps": 105, "loss": 0.0773, "lr": 9.412754953531663e-06, "epoch": 2.0848056537102475, "percentage": 71.43, "elapsed_time": "0:49:05", "remaining_time": "0:19:38", "throughput": 442.46, "total_tokens": 1303184}
{"current_steps": 80, "total_steps": 105, "loss": 0.0324, "lr": 6.673703204254347e-06, "epoch": 2.2261484098939928, "percentage": 76.19, "elapsed_time": "0:52:10", "remaining_time": "0:16:18", "throughput": 442.66, "total_tokens": 1385824}
{"current_steps": 85, "total_steps": 105, "loss": 0.0619, "lr": 4.344030642100133e-06, "epoch": 2.3674911660777385, "percentage": 80.95, "elapsed_time": "0:55:35", "remaining_time": "0:13:04", "throughput": 442.78, "total_tokens": 1476864}
{"current_steps": 90, "total_steps": 105, "loss": 0.0218, "lr": 2.475778302439524e-06, "epoch": 2.508833922261484, "percentage": 85.71, "elapsed_time": "0:59:11", "remaining_time": "0:09:51", "throughput": 441.97, "total_tokens": 1569584}
{"current_steps": 95, "total_steps": 105, "loss": 0.0275, "lr": 1.1106798553464804e-06, "epoch": 2.65017667844523, "percentage": 90.48, "elapsed_time": "1:02:27", "remaining_time": "0:06:34", "throughput": 442.21, "total_tokens": 1657264}
{"current_steps": 100, "total_steps": 105, "loss": 0.113, "lr": 2.7922934437178695e-07, "epoch": 2.791519434628975, "percentage": 95.24, "elapsed_time": "1:05:51", "remaining_time": "0:03:17", "throughput": 441.99, "total_tokens": 1746624}
{"current_steps": 105, "total_steps": 105, "loss": 0.0585, "lr": 0.0, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "1:09:28", "remaining_time": "0:00:00", "throughput": 441.6, "total_tokens": 1841024}
{"current_steps": 105, "total_steps": 105, "epoch": 2.932862190812721, "percentage": 100.0, "elapsed_time": "1:09:30", "remaining_time": "0:00:00", "throughput": 441.44, "total_tokens": 1841024}