Commit
·
86104c8
1
Parent(s):
b081990
Training in progress, step 8500
Browse files
- {checkpoint-7000 → checkpoint-8000}/config.json +0 -0
- {checkpoint-7000 → checkpoint-8000}/optimizer.pt +1 -1
- {checkpoint-7500 → checkpoint-8000}/pytorch_model.bin +1 -1
- {checkpoint-7500 → checkpoint-8000}/rng_state.pth +1 -1
- {checkpoint-7500 → checkpoint-8000}/scaler.pt +1 -1
- {checkpoint-7000 → checkpoint-8000}/scheduler.pt +1 -1
- {checkpoint-7000 → checkpoint-8000}/special_tokens_map.json +0 -0
- {checkpoint-7000 → checkpoint-8000}/tokenizer.json +0 -0
- {checkpoint-7000 → checkpoint-8000}/tokenizer_config.json +0 -0
- {checkpoint-7500 → checkpoint-8000}/trainer_state.json +21 -3
- {checkpoint-7000 → checkpoint-8000}/training_args.bin +0 -0
- {checkpoint-7500 → checkpoint-8500}/config.json +0 -0
- {checkpoint-7500 → checkpoint-8500}/optimizer.pt +1 -1
- {checkpoint-7000 → checkpoint-8500}/pytorch_model.bin +1 -1
- {checkpoint-7000 → checkpoint-8500}/rng_state.pth +1 -1
- {checkpoint-7000 → checkpoint-8500}/scaler.pt +1 -1
- {checkpoint-7500 → checkpoint-8500}/scheduler.pt +1 -1
- {checkpoint-7500 → checkpoint-8500}/special_tokens_map.json +0 -0
- {checkpoint-7500 → checkpoint-8500}/tokenizer.json +0 -0
- {checkpoint-7500 → checkpoint-8500}/tokenizer_config.json +0 -0
- {checkpoint-7000 → checkpoint-8500}/trainer_state.json +59 -5
- {checkpoint-7500 → checkpoint-8500}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0 +2 -2
{checkpoint-7000 → checkpoint-8000}/config.json
RENAMED
|
File without changes
|
{checkpoint-7000 → checkpoint-8000}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2265828101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b39cb815a920edaf287fed25e2a19b016671ea73dd16f75036bf2bcfaf1b767a
|
| 3 |
size 2265828101
|
{checkpoint-7500 → checkpoint-8000}/pytorch_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1134425553
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:27b504e227955abd271e8dfb3a65060b57aab9124c9a51342289b2487370d857
|
| 3 |
size 1134425553
|
{checkpoint-7500 → checkpoint-8000}/rng_state.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14575
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:960a0ff8566f0b77c05a97c9fc1c687f7ca7734da4222daf4902d9e243e0137d
|
| 3 |
size 14575
|
{checkpoint-7500 → checkpoint-8000}/scaler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 557
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:05c943ac5112ace01757b5472903bea87985b301a9f82c01afb7df322762c49c
|
| 3 |
size 557
|
{checkpoint-7000 → checkpoint-8000}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 627
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c82aba72db92b65d16e163361936c8fce2a4ed55ab1b817ceacaf38e10c5cade
|
| 3 |
size 627
|
{checkpoint-7000 → checkpoint-8000}/special_tokens_map.json
RENAMED
|
File without changes
|
{checkpoint-7000 → checkpoint-8000}/tokenizer.json
RENAMED
|
File without changes
|
{checkpoint-7000 → checkpoint-8000}/tokenizer_config.json
RENAMED
|
File without changes
|
{checkpoint-7500 → checkpoint-8000}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.8573209374145502,
|
| 3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
|
| 4 |
-
"epoch": 3.
|
| 5 |
-
"global_step": 7500,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -276,11 +276,29 @@
|
|
| 276 |
"eval_samples_per_second": 61.609,
|
| 277 |
"eval_steps_per_second": 3.873,
|
| 278 |
"step": 7500
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 279 |
}
|
| 280 |
],
|
| 281 |
"max_steps": 12035,
|
| 282 |
"num_train_epochs": 5,
|
| 283 |
-
"total_flos": 1.
|
| 284 |
"trial_name": null,
|
| 285 |
"trial_params": null
|
| 286 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_metric": 0.8573209374145502,
|
| 3 |
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-6000",
|
| 4 |
+
"epoch": 3.3236393851267136,
|
| 5 |
+
"global_step": 8000,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 276 |
"eval_samples_per_second": 61.609,
|
| 277 |
"eval_steps_per_second": 3.873,
|
| 278 |
"step": 7500
|
| 279 |
+
},
|
| 280 |
+
{
|
| 281 |
+
"epoch": 3.32,
|
| 282 |
+
"learning_rate": 1.6792687993352722e-05,
|
| 283 |
+
"loss": 0.0788,
|
| 284 |
+
"step": 8000
|
| 285 |
+
},
|
| 286 |
+
{
|
| 287 |
+
"epoch": 3.32,
|
| 288 |
+
"eval_accuracy": 0.8364993324862074,
|
| 289 |
+
"eval_f1": 0.8364993324862076,
|
| 290 |
+
"eval_loss": 1.028805136680603,
|
| 291 |
+
"eval_precision": 0.8364993324862074,
|
| 292 |
+
"eval_recall": 0.8364993324862074,
|
| 293 |
+
"eval_runtime": 38.2117,
|
| 294 |
+
"eval_samples_per_second": 53.701,
|
| 295 |
+
"eval_steps_per_second": 3.376,
|
| 296 |
+
"step": 8000
|
| 297 |
}
|
| 298 |
],
|
| 299 |
"max_steps": 12035,
|
| 300 |
"num_train_epochs": 5,
|
| 301 |
+
"total_flos": 1.3347886251942144e+16,
|
| 302 |
"trial_name": null,
|
| 303 |
"trial_params": null
|
| 304 |
}
|
{checkpoint-7000 → checkpoint-8000}/training_args.bin
RENAMED
|
File without changes
|
{checkpoint-7500 → checkpoint-8500}/config.json
RENAMED
|
File without changes
|
{checkpoint-7500 → checkpoint-8500}/optimizer.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2265828101
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea130ecc564ac6fe490d67f54147e9dc00bf72e39d0688a66ba68802757a9e2b
|
| 3 |
size 2265828101
|
{checkpoint-7000 → checkpoint-8500}/pytorch_model.bin
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1134425553
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e39c7d7515bc3fd9710bfa20bd4d1d7c408894096e55b518c4e64c07ac0ff33b
|
| 3 |
size 1134425553
|
{checkpoint-7000 → checkpoint-8500}/rng_state.pth
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14575
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c16ad00f12a6b00ebecd82041529c62f714ed6d5992e9f831161d0979641cda
|
| 3 |
size 14575
|
{checkpoint-7000 → checkpoint-8500}/scaler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 557
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4c06e32f681823ca88423b1784605ca44bf8a960abc7518ae6b79b079157ccc
|
| 3 |
size 557
|
{checkpoint-7500 → checkpoint-8500}/scheduler.pt
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 627
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53b7ca82f31c9b2520ad7f958578cfcb752be5bbfebe85216932fd844130a1eb
|
| 3 |
size 627
|
{checkpoint-7500 → checkpoint-8500}/special_tokens_map.json
RENAMED
|
File without changes
|
{checkpoint-7500 → checkpoint-8500}/tokenizer.json
RENAMED
|
File without changes
|
{checkpoint-7500 → checkpoint-8500}/tokenizer_config.json
RENAMED
|
File without changes
|
{checkpoint-7000 → checkpoint-8500}/trainer_state.json
RENAMED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
{
|
| 2 |
-
"best_metric": 0.
|
| 3 |
-
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-
|
| 4 |
-
"epoch":
|
| 5 |
-
"global_step": 7000,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
@@ -258,11 +258,65 @@
|
|
| 258 |
"eval_samples_per_second": 51.982,
|
| 259 |
"eval_steps_per_second": 3.268,
|
| 260 |
"step": 7000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 261 |
}
|
| 262 |
],
|
| 263 |
"max_steps": 12035,
|
| 264 |
"num_train_epochs": 5,
|
| 265 |
-
"total_flos": 1.
|
| 266 |
"trial_name": null,
|
| 267 |
"trial_params": null
|
| 268 |
}
|
|
|
|
| 1 |
{
|
| 2 |
+
"best_metric": 0.8849383152916955,
|
| 3 |
+
"best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_ml384-v2/checkpoint-8500",
|
| 4 |
+
"epoch": 3.5313668466971335,
|
| 5 |
+
"global_step": 8500,
|
| 6 |
"is_hyper_param_search": false,
|
| 7 |
"is_local_process_zero": true,
|
| 8 |
"is_world_process_zero": true,
|
|
|
|
| 258 |
"eval_samples_per_second": 51.982,
|
| 259 |
"eval_steps_per_second": 3.268,
|
| 260 |
"step": 7000
|
| 261 |
+
},
|
| 262 |
+
{
|
| 263 |
+
"epoch": 3.12,
|
| 264 |
+
"learning_rate": 1.886996260905692e-05,
|
| 265 |
+
"loss": 0.1012,
|
| 266 |
+
"step": 7500
|
| 267 |
+
},
|
| 268 |
+
{
|
| 269 |
+
"epoch": 3.12,
|
| 270 |
+
"eval_accuracy": 0.8385581702079747,
|
| 271 |
+
"eval_f1": 0.8385581702079747,
|
| 272 |
+
"eval_loss": 0.8271787166595459,
|
| 273 |
+
"eval_precision": 0.8385581702079747,
|
| 274 |
+
"eval_recall": 0.8385581702079747,
|
| 275 |
+
"eval_runtime": 33.307,
|
| 276 |
+
"eval_samples_per_second": 61.609,
|
| 277 |
+
"eval_steps_per_second": 3.873,
|
| 278 |
+
"step": 7500
|
| 279 |
+
},
|
| 280 |
+
{
|
| 281 |
+
"epoch": 3.32,
|
| 282 |
+
"learning_rate": 1.6792687993352722e-05,
|
| 283 |
+
"loss": 0.0788,
|
| 284 |
+
"step": 8000
|
| 285 |
+
},
|
| 286 |
+
{
|
| 287 |
+
"epoch": 3.32,
|
| 288 |
+
"eval_accuracy": 0.8364993324862074,
|
| 289 |
+
"eval_f1": 0.8364993324862076,
|
| 290 |
+
"eval_loss": 1.028805136680603,
|
| 291 |
+
"eval_precision": 0.8364993324862074,
|
| 292 |
+
"eval_recall": 0.8364993324862074,
|
| 293 |
+
"eval_runtime": 38.2117,
|
| 294 |
+
"eval_samples_per_second": 53.701,
|
| 295 |
+
"eval_steps_per_second": 3.376,
|
| 296 |
+
"step": 8000
|
| 297 |
+
},
|
| 298 |
+
{
|
| 299 |
+
"epoch": 3.53,
|
| 300 |
+
"learning_rate": 1.4715413377648527e-05,
|
| 301 |
+
"loss": 0.0802,
|
| 302 |
+
"step": 8500
|
| 303 |
+
},
|
| 304 |
+
{
|
| 305 |
+
"epoch": 3.53,
|
| 306 |
+
"eval_accuracy": 0.8849383152916955,
|
| 307 |
+
"eval_f1": 0.8849383152916955,
|
| 308 |
+
"eval_loss": 0.719699501991272,
|
| 309 |
+
"eval_precision": 0.8849383152916955,
|
| 310 |
+
"eval_recall": 0.8849383152916955,
|
| 311 |
+
"eval_runtime": 34.4056,
|
| 312 |
+
"eval_samples_per_second": 59.641,
|
| 313 |
+
"eval_steps_per_second": 3.749,
|
| 314 |
+
"step": 8500
|
| 315 |
}
|
| 316 |
],
|
| 317 |
"max_steps": 12035,
|
| 318 |
"num_train_epochs": 5,
|
| 319 |
+
"total_flos": 1.4182402968486144e+16,
|
| 320 |
"trial_name": null,
|
| 321 |
"trial_params": null
|
| 322 |
}
|
{checkpoint-7500 → checkpoint-8500}/training_args.bin
RENAMED
|
File without changes
|
pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1134425553
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e39c7d7515bc3fd9710bfa20bd4d1d7c408894096e55b518c4e64c07ac0ff33b
|
| 3 |
size 1134425553
|
runs/Feb09_15-43-15_f1c8d3a96fe7/events.out.tfevents.1675957409.f1c8d3a96fe7.143.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4f7c4c7428bf319a3138119ab5d1663f67efa67393e048e30432a37e3bf8e016
|
| 3 |
+
size 15322
|