| { | |
| "before_init_mem_cpu": 699817984, | |
| "before_init_mem_gpu": 0, | |
| "epoch": 5.98, | |
| "eval_accuracy": 0.544073054441718, | |
| "eval_loss": 1.9982993602752686, | |
| "eval_mem_cpu_alloc_delta": 9977856, | |
| "eval_mem_cpu_peaked_delta": 60305408, | |
| "eval_mem_gpu_alloc_delta": 0, | |
| "eval_mem_gpu_peaked_delta": 2357757952, | |
| "eval_runtime": 481.5484, | |
| "eval_samples": 588, | |
| "eval_samples_per_second": 1.221, | |
| "eval_steps_per_second": 0.305, | |
| "init_mem_cpu_alloc_delta": -283938816, | |
| "init_mem_cpu_peaked_delta": 332918784, | |
| "init_mem_gpu_alloc_delta": 334744576, | |
| "init_mem_gpu_peaked_delta": 0, | |
| "perplexity": 7.376500655769286, | |
| "train_loss": 2.0183091745143984, | |
| "train_mem_cpu_alloc_delta": 1155149824, | |
| "train_mem_cpu_peaked_delta": 308719616, | |
| "train_mem_gpu_alloc_delta": 988995584, | |
| "train_mem_gpu_peaked_delta": 4500811776, | |
| "train_runtime": 35067.5673, | |
| "train_samples": 5325, | |
| "train_samples_per_second": 0.911, | |
| "train_steps_per_second": 0.007 | |
| } |