{ "best_metric": null, "best_model_checkpoint": null, "epoch": 3.0, "eval_steps": 500, "global_step": 243, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_B-Claim": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 295.0 }, "eval_B-MajorClaim": { "f1-score": 0.0, "precision": 0.0, "recall": 0.0, "support": 156.0 }, "eval_B-Premise": { "f1-score": 0.6820276497695853, "precision": 0.6540404040404041, "recall": 0.7125171939477304, "support": 727.0 }, "eval_I-Claim": { "f1-score": 0.43557936284183824, "precision": 0.5235513385293121, "recall": 0.3729181752353367, "support": 4143.0 }, "eval_I-MajorClaim": { "f1-score": 0.5835814547001276, "precision": 0.5468314069350338, "recall": 0.6256269949840402, "support": 2193.0 }, "eval_I-Premise": { "f1-score": 0.8638885700072705, "precision": 0.8318349299926308, "recall": 0.8985115020297699, "support": 12563.0 }, "eval_O": { "f1-score": 0.8838224593742419, "precision": 0.8730234786775275, "recall": 0.8948919449901768, "support": 10180.0 }, "eval_accuracy": 0.7876854942657897, "eval_loss": 0.5461820363998413, "eval_macro avg": { "f1-score": 0.4926999280990091, "precision": 0.4898973654535584, "recall": 0.500637973026722, "support": 30257.0 }, "eval_runtime": 5.0655, "eval_samples_per_second": 15.991, "eval_steps_per_second": 2.172, "eval_weighted avg": { "f1-score": 0.7743853744001297, "precision": 0.7661527277359783, "recall": 0.7876854942657897, "support": 30257.0 }, "step": 81 }, { "epoch": 2.0, "eval_B-Claim": { "f1-score": 0.46397188049209137, "precision": 0.48175182481751827, "recall": 0.44745762711864406, "support": 295.0 }, "eval_B-MajorClaim": { "f1-score": 0.6402439024390244, "precision": 0.6104651162790697, "recall": 0.6730769230769231, "support": 156.0 }, "eval_B-Premise": { "f1-score": 0.7515299877600979, "precision": 0.6769570011025359, "recall": 0.844566712517194, "support": 727.0 }, "eval_I-Claim": { "f1-score": 0.5573419078242231, "precision": 0.5500705218617772, "recall": 0.5648081100651702, "support": 4143.0 }, "eval_I-MajorClaim": { "f1-score": 0.7704582651391162, "precision": 0.6987012987012987, "recall": 0.8586411308709531, "support": 2193.0 }, "eval_I-Premise": { "f1-score": 0.8736837792436597, "precision": 0.9002026342451874, "recall": 0.8486826394969355, "support": 12563.0 }, "eval_O": { "f1-score": 0.9114385688236163, "precision": 0.9145485115221046, "recall": 0.9083497053045186, "support": 10180.0 }, "eval_accuracy": 0.8256932280133523, "eval_loss": 0.4454804062843323, "eval_macro avg": { "f1-score": 0.7098097559602613, "precision": 0.6903852726470703, "recall": 0.7350832640643341, "support": 30257.0 }, "eval_runtime": 5.0817, "eval_samples_per_second": 15.94, "eval_steps_per_second": 2.165, "eval_weighted avg": { "f1-score": 0.8274557458920446, "precision": 0.8315444607100787, "recall": 0.8256932280133523, "support": 30257.0 }, "step": 162 }, { "epoch": 3.0, "eval_B-Claim": { "f1-score": 0.5551724137931033, "precision": 0.5649122807017544, "recall": 0.5457627118644067, "support": 295.0 }, "eval_B-MajorClaim": { "f1-score": 0.7108433734939757, "precision": 0.6704545454545454, "recall": 0.7564102564102564, "support": 156.0 }, "eval_B-Premise": { "f1-score": 0.7860892388451444, "precision": 0.7515683814303639, "recall": 0.8239339752407153, "support": 727.0 }, "eval_I-Claim": { "f1-score": 0.5878616796047988, "precision": 0.573296627666896, "recall": 0.6031860970311369, "support": 4143.0 }, "eval_I-MajorClaim": { "f1-score": 0.7989093387866394, "precision": 0.7961956521739131, "recall": 0.801641586867305, "support": 2193.0 }, "eval_I-Premise": { "f1-score": 0.8824656529006482, "precision": 0.9044793581815143, "recall": 0.8614980498288626, "support": 12563.0 }, "eval_O": { "f1-score": 0.9169814976266588, "precision": 0.9044525128989107, "recall": 0.9298624754420433, "support": 10180.0 }, "eval_accuracy": 0.8402683676504611, "eval_loss": 0.41143855452537537, "eval_macro avg": { "f1-score": 0.7483318850072812, "precision": 0.7379084797868425, "recall": 0.7603278789549609, "support": 30257.0 }, "eval_runtime": 5.0654, "eval_samples_per_second": 15.991, "eval_steps_per_second": 2.172, "eval_weighted avg": { "f1-score": 0.8412916372002002, "precision": 0.8430827906594975, "recall": 0.8402683676504611, "support": 30257.0 }, "step": 243 } ], "logging_steps": 500, "max_steps": 4050, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "total_flos": 430032772197000.0, "train_batch_size": 4, "trial_name": null, "trial_params": null }