Theoreticallyhugo committed on
Commit
eebae89
·
verified ·
1 Parent(s): b314f36

Training in progress, epoch 1, checkpoint

Browse files
checkpoint-41/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:138942c8f4356011d76a3a29cef1fcfe36ed60d9640d9cc91ca5f0c3d61957cf
3
  size 592330980
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cd33ff53c0edd4d359980f27f4afa194ec5b807febef7f4cbaefde162b633c4b
3
  size 592330980
checkpoint-41/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9a4408a3ce9f54e3b82993c0eeca8d47b25ea144ed63e3793861dbd04f8f2088
3
  size 1014670074
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ab3510262bc219de46e870072b2a617000c0c57c3d0baaaf87394856c91f5477
3
  size 1014670074
checkpoint-41/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a939982f711c8a91f0893b4f281f0db4fd89d7ca52de2aed82098ef9ff76ea2
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b75d0f85c6e5f43bda08f24453a869f5d0b5d0d33d936ef1b542f406f081347
3
  size 14244
checkpoint-41/trainer_state.json CHANGED
@@ -14,60 +14,60 @@
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
- "support": 317.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
- "support": 155.0
24
  },
25
  "eval_B-Premise": {
26
- "f1-score": 0.030989272943980926,
27
- "precision": 0.8125,
28
- "recall": 0.015795868772782502,
29
- "support": 823.0
30
  },
31
  "eval_I-Claim": {
32
- "f1-score": 0.4085060273601517,
33
- "precision": 0.4962158604804212,
34
- "recall": 0.34714548802946593,
35
- "support": 4344.0
36
  },
37
  "eval_I-MajorClaim": {
38
- "f1-score": 0.4814916369618864,
39
- "precision": 0.5727332028701891,
40
- "recall": 0.4153263954588458,
41
- "support": 2114.0
42
  },
43
  "eval_I-Premise": {
44
- "f1-score": 0.8524337025847599,
45
- "precision": 0.7845887659890008,
46
- "recall": 0.9331226574557213,
47
- "support": 13607.0
48
  },
49
  "eval_O": {
50
- "f1-score": 0.8266195658367045,
51
- "precision": 0.7997794928335171,
52
- "recall": 0.855323664662186,
53
- "support": 8481.0
54
  },
55
- "eval_accuracy": 0.748969538554338,
56
- "eval_loss": 0.6934605836868286,
57
  "eval_macro avg": {
58
- "f1-score": 0.3714343150982119,
59
- "precision": 0.49511676031044694,
60
- "recall": 0.36667343919700024,
61
- "support": 29841.0
62
  },
63
- "eval_runtime": 1.4147,
64
- "eval_samples_per_second": 56.549,
65
- "eval_steps_per_second": 7.069,
66
  "eval_weighted avg": {
67
- "f1-score": 0.7180574915034598,
68
- "precision": 0.7202786906044678,
69
- "recall": 0.748969538554338,
70
- "support": 29841.0
71
  },
72
  "step": 41
73
  }
@@ -77,7 +77,7 @@
77
  "num_input_tokens_seen": 0,
78
  "num_train_epochs": 16,
79
  "save_steps": 500,
80
- "total_flos": 143790812718000.0,
81
  "train_batch_size": 8,
82
  "trial_name": null,
83
  "trial_params": null
 
14
  "f1-score": 0.0,
15
  "precision": 0.0,
16
  "recall": 0.0,
17
+ "support": 339.0
18
  },
19
  "eval_B-MajorClaim": {
20
  "f1-score": 0.0,
21
  "precision": 0.0,
22
  "recall": 0.0,
23
+ "support": 160.0
24
  },
25
  "eval_B-Premise": {
26
+ "f1-score": 0.22426470588235295,
27
+ "precision": 0.8299319727891157,
28
+ "recall": 0.12964930924548354,
29
+ "support": 941.0
30
  },
31
  "eval_I-Claim": {
32
+ "f1-score": 0.38247663551401867,
33
+ "precision": 0.423873640600725,
34
+ "recall": 0.348446147296722,
35
+ "support": 4698.0
36
  },
37
  "eval_I-MajorClaim": {
38
+ "f1-score": 0.3634627625716104,
39
+ "precision": 0.5125673249551167,
40
+ "recall": 0.28155818540433925,
41
+ "support": 2028.0
42
  },
43
  "eval_I-Premise": {
44
+ "f1-score": 0.8298935191271198,
45
+ "precision": 0.8110747093209996,
46
+ "recall": 0.8496063521970257,
47
+ "support": 14861.0
48
  },
49
  "eval_O": {
50
+ "f1-score": 0.8121805609242796,
51
+ "precision": 0.7380952380952381,
52
+ "recall": 0.9027976701995608,
53
+ "support": 10473.0
54
  },
55
+ "eval_accuracy": 0.7286865671641791,
56
+ "eval_loss": 0.763540506362915,
57
  "eval_macro avg": {
58
+ "f1-score": 0.3731825977170545,
59
+ "precision": 0.47364898368017067,
60
+ "recall": 0.3588653806204473,
61
+ "support": 33500.0
62
  },
63
+ "eval_runtime": 1.4539,
64
+ "eval_samples_per_second": 55.714,
65
+ "eval_steps_per_second": 7.566,
66
  "eval_weighted avg": {
67
+ "f1-score": 0.7040007584084623,
68
+ "precision": 0.7043362259324342,
69
+ "recall": 0.7286865671641791,
70
+ "support": 33500.0
71
  },
72
  "step": 41
73
  }
 
77
  "num_input_tokens_seen": 0,
78
  "num_train_epochs": 16,
79
  "save_steps": 500,
80
+ "total_flos": 143344257399000.0,
81
  "train_batch_size": 8,
82
  "trial_name": null,
83
  "trial_params": null
checkpoint-41/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5626137ff44175bb256e7d272052a295ab9ae4c6895813ac192564aaad939cff
3
  size 4664
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:920ab155975bf66f694757fefb246b73b0d1489bdf4f03eda383fa028f5d083a
3
  size 4664