Commit 
							
							·
						
						0a6fb58
	
1
								Parent(s):
							
							27433f3
								
Training in progress, step 1300
Browse files- {checkpoint-700 → checkpoint-1200}/config.json +0 -0
- {checkpoint-700 → checkpoint-1200}/optimizer.pt +1 -1
- {checkpoint-800 → checkpoint-1200}/pytorch_model.bin +1 -1
- {checkpoint-800 → checkpoint-1200}/rng_state.pth +1 -1
- {checkpoint-800 → checkpoint-1200}/scaler.pt +1 -1
- {checkpoint-700 → checkpoint-1200}/scheduler.pt +1 -1
- {checkpoint-700 → checkpoint-1200}/special_tokens_map.json +0 -0
- {checkpoint-700 → checkpoint-1200}/tokenizer.json +0 -0
- {checkpoint-700 → checkpoint-1200}/tokenizer_config.json +0 -0
- {checkpoint-800 → checkpoint-1200}/trainer_state.json +57 -3
- {checkpoint-700 → checkpoint-1200}/training_args.bin +0 -0
- {checkpoint-800 → checkpoint-1300}/config.json +0 -0
- {checkpoint-800 → checkpoint-1300}/optimizer.pt +1 -1
- {checkpoint-700 → checkpoint-1300}/pytorch_model.bin +1 -1
- {checkpoint-700 → checkpoint-1300}/rng_state.pth +1 -1
- {checkpoint-700 → checkpoint-1300}/scaler.pt +1 -1
- {checkpoint-800 → checkpoint-1300}/scheduler.pt +1 -1
- {checkpoint-800 → checkpoint-1300}/special_tokens_map.json +0 -0
- {checkpoint-800 → checkpoint-1300}/tokenizer.json +0 -0
- {checkpoint-800 → checkpoint-1300}/tokenizer_config.json +0 -0
- {checkpoint-700 → checkpoint-1300}/trainer_state.json +81 -3
- {checkpoint-800 → checkpoint-1300}/training_args.bin +0 -0
- pytorch_model.bin +1 -1
- runs/Feb15_07-53-26_e220f522c880/events.out.tfevents.1676447621.e220f522c880.495.0 +2 -2
    	
        {checkpoint-700 → checkpoint-1200}/config.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-700 → checkpoint-1200}/optimizer.pt
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 2265828101
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:280a221cc64b57effe5c7a796f38b48321fed8fcb3ff1e239c462a69ff81116c
         | 
| 3 | 
             
            size 2265828101
         | 
    	
        {checkpoint-800 → checkpoint-1200}/pytorch_model.bin
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 1134425553
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:129796804ce986931f94bfed0dab6f25dddc2e97c3a332294d4f52bf3528c96a
         | 
| 3 | 
             
            size 1134425553
         | 
    	
        {checkpoint-800 → checkpoint-1200}/rng_state.pth
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 14575
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:cd6ffa5eb17c8d65486aa60854f05719c6a9abb0d32d2839b3ba42058bd6991d
         | 
| 3 | 
             
            size 14575
         | 
    	
        {checkpoint-800 → checkpoint-1200}/scaler.pt
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 557
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:6b74d76706ac346849ec903aa334b83db05c630c620b87dcbe1a7b129aecd1c1
         | 
| 3 | 
             
            size 557
         | 
    	
        {checkpoint-700 → checkpoint-1200}/scheduler.pt
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 627
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:29a2c927b05979c18fd3e62e50ba927b4a9c741248dda26234d8cd08f20d64a8
         | 
| 3 | 
             
            size 627
         | 
    	
        {checkpoint-700 → checkpoint-1200}/special_tokens_map.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-700 → checkpoint-1200}/tokenizer.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-700 → checkpoint-1200}/tokenizer_config.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-800 → checkpoint-1200}/trainer_state.json
    RENAMED
    
    | @@ -1,8 +1,8 @@ | |
| 1 | 
             
            {
         | 
| 2 | 
             
              "best_metric": 0.885723696687195,
         | 
| 3 | 
             
              "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
         | 
| 4 | 
            -
              "epoch": 0. | 
| 5 | 
            -
              "global_step":  | 
| 6 | 
             
              "is_hyper_param_search": false,
         | 
| 7 | 
             
              "is_local_process_zero": true,
         | 
| 8 | 
             
              "is_world_process_zero": true,
         | 
| @@ -108,11 +108,65 @@ | |
| 108 | 
             
                  "eval_samples_per_second": 35.233,
         | 
| 109 | 
             
                  "eval_steps_per_second": 2.214,
         | 
| 110 | 
             
                  "step": 800
         | 
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
| 111 | 
             
                }
         | 
| 112 | 
             
              ],
         | 
| 113 | 
             
              "max_steps": 1876,
         | 
| 114 | 
             
              "num_train_epochs": 1,
         | 
| 115 | 
            -
              "total_flos":  | 
| 116 | 
             
              "trial_name": null,
         | 
| 117 | 
             
              "trial_params": null
         | 
| 118 | 
             
            }
         | 
|  | |
| 1 | 
             
            {
         | 
| 2 | 
             
              "best_metric": 0.885723696687195,
         | 
| 3 | 
             
              "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
         | 
| 4 | 
            +
              "epoch": 0.6396588486140725,
         | 
| 5 | 
            +
              "global_step": 1200,
         | 
| 6 | 
             
              "is_hyper_param_search": false,
         | 
| 7 | 
             
              "is_local_process_zero": true,
         | 
| 8 | 
             
              "is_world_process_zero": true,
         | 
|  | |
| 108 | 
             
                  "eval_samples_per_second": 35.233,
         | 
| 109 | 
             
                  "eval_steps_per_second": 2.214,
         | 
| 110 | 
             
                  "step": 800
         | 
| 111 | 
            +
                },
         | 
| 112 | 
            +
                {
         | 
| 113 | 
            +
                  "epoch": 0.48,
         | 
| 114 | 
            +
                  "eval_accuracy": 0.8833980456546259,
         | 
| 115 | 
            +
                  "eval_f1": 0.8833980456546259,
         | 
| 116 | 
            +
                  "eval_loss": 0.38389313220977783,
         | 
| 117 | 
            +
                  "eval_precision": 0.8833980456546259,
         | 
| 118 | 
            +
                  "eval_recall": 0.8833980456546259,
         | 
| 119 | 
            +
                  "eval_runtime": 47.6493,
         | 
| 120 | 
            +
                  "eval_samples_per_second": 33.726,
         | 
| 121 | 
            +
                  "eval_steps_per_second": 2.12,
         | 
| 122 | 
            +
                  "step": 900
         | 
| 123 | 
            +
                },
         | 
| 124 | 
            +
                {
         | 
| 125 | 
            +
                  "epoch": 0.53,
         | 
| 126 | 
            +
                  "learning_rate": 9.381663113006397e-06,
         | 
| 127 | 
            +
                  "loss": 0.4464,
         | 
| 128 | 
            +
                  "step": 1000
         | 
| 129 | 
            +
                },
         | 
| 130 | 
            +
                {
         | 
| 131 | 
            +
                  "epoch": 0.53,
         | 
| 132 | 
            +
                  "eval_accuracy": 0.8498407977082855,
         | 
| 133 | 
            +
                  "eval_f1": 0.8498407977082856,
         | 
| 134 | 
            +
                  "eval_loss": 0.4365050792694092,
         | 
| 135 | 
            +
                  "eval_precision": 0.8498407977082855,
         | 
| 136 | 
            +
                  "eval_recall": 0.8498407977082855,
         | 
| 137 | 
            +
                  "eval_runtime": 47.0078,
         | 
| 138 | 
            +
                  "eval_samples_per_second": 34.186,
         | 
| 139 | 
            +
                  "eval_steps_per_second": 2.149,
         | 
| 140 | 
            +
                  "step": 1000
         | 
| 141 | 
            +
                },
         | 
| 142 | 
            +
                {
         | 
| 143 | 
            +
                  "epoch": 0.59,
         | 
| 144 | 
            +
                  "eval_accuracy": 0.8811622266361904,
         | 
| 145 | 
            +
                  "eval_f1": 0.8811622266361904,
         | 
| 146 | 
            +
                  "eval_loss": 0.36158204078674316,
         | 
| 147 | 
            +
                  "eval_precision": 0.8811622266361904,
         | 
| 148 | 
            +
                  "eval_recall": 0.8811622266361904,
         | 
| 149 | 
            +
                  "eval_runtime": 44.8724,
         | 
| 150 | 
            +
                  "eval_samples_per_second": 35.813,
         | 
| 151 | 
            +
                  "eval_steps_per_second": 2.251,
         | 
| 152 | 
            +
                  "step": 1100
         | 
| 153 | 
            +
                },
         | 
| 154 | 
            +
                {
         | 
| 155 | 
            +
                  "epoch": 0.64,
         | 
| 156 | 
            +
                  "eval_accuracy": 0.8795751943864972,
         | 
| 157 | 
            +
                  "eval_f1": 0.8795751943864972,
         | 
| 158 | 
            +
                  "eval_loss": 0.3948919177055359,
         | 
| 159 | 
            +
                  "eval_precision": 0.8795751943864972,
         | 
| 160 | 
            +
                  "eval_recall": 0.8795751943864972,
         | 
| 161 | 
            +
                  "eval_runtime": 45.1224,
         | 
| 162 | 
            +
                  "eval_samples_per_second": 35.614,
         | 
| 163 | 
            +
                  "eval_steps_per_second": 2.238,
         | 
| 164 | 
            +
                  "step": 1200
         | 
| 165 | 
             
                }
         | 
| 166 | 
             
              ],
         | 
| 167 | 
             
              "max_steps": 1876,
         | 
| 168 | 
             
              "num_train_epochs": 1,
         | 
| 169 | 
            +
              "total_flos": 2670453492940800.0,
         | 
| 170 | 
             
              "trial_name": null,
         | 
| 171 | 
             
              "trial_params": null
         | 
| 172 | 
             
            }
         | 
    	
        {checkpoint-700 → checkpoint-1200}/training_args.bin
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-800 → checkpoint-1300}/config.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-800 → checkpoint-1300}/optimizer.pt
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 2265828101
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:2c08cf141a111f37d0566da69d0c30d72707ecd26196f04456a9b2121b4d97d3
         | 
| 3 | 
             
            size 2265828101
         | 
    	
        {checkpoint-700 → checkpoint-1300}/pytorch_model.bin
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 1134425553
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:7d4698a9bcd9f4d1b85cd29935ce42f4264d331bc9713045308140215396cd2e
         | 
| 3 | 
             
            size 1134425553
         | 
    	
        {checkpoint-700 → checkpoint-1300}/rng_state.pth
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 14575
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:55d131675f12693ae085c3c3a36adf556143b9deea694fe5308eef74c5dc9628
         | 
| 3 | 
             
            size 14575
         | 
    	
        {checkpoint-700 → checkpoint-1300}/scaler.pt
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 557
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:af7a31e9f5bbee16af877be66fd13ae4491e1f0e57f209ceef7ac824ca84139d
         | 
| 3 | 
             
            size 557
         | 
    	
        {checkpoint-800 → checkpoint-1300}/scheduler.pt
    RENAMED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 627
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:893ff4c60fcbf7662c0d4334e0bfce704fb88be1f6c471b5adc0626650efe85d
         | 
| 3 | 
             
            size 627
         | 
    	
        {checkpoint-800 → checkpoint-1300}/special_tokens_map.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-800 → checkpoint-1300}/tokenizer.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-800 → checkpoint-1300}/tokenizer_config.json
    RENAMED
    
    | 
            File without changes
         | 
    	
        {checkpoint-700 → checkpoint-1300}/trainer_state.json
    RENAMED
    
    | @@ -1,8 +1,8 @@ | |
| 1 | 
             
            {
         | 
| 2 | 
             
              "best_metric": 0.885723696687195,
         | 
| 3 | 
             
              "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
         | 
| 4 | 
            -
              "epoch": 0. | 
| 5 | 
            -
              "global_step":  | 
| 6 | 
             
              "is_hyper_param_search": false,
         | 
| 7 | 
             
              "is_local_process_zero": true,
         | 
| 8 | 
             
              "is_world_process_zero": true,
         | 
| @@ -96,11 +96,89 @@ | |
| 96 | 
             
                  "eval_samples_per_second": 35.056,
         | 
| 97 | 
             
                  "eval_steps_per_second": 2.203,
         | 
| 98 | 
             
                  "step": 700
         | 
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
| 99 | 
             
                }
         | 
| 100 | 
             
              ],
         | 
| 101 | 
             
              "max_steps": 1876,
         | 
| 102 | 
             
              "num_train_epochs": 1,
         | 
| 103 | 
            -
              "total_flos":  | 
| 104 | 
             
              "trial_name": null,
         | 
| 105 | 
             
              "trial_params": null
         | 
| 106 | 
             
            }
         | 
|  | |
| 1 | 
             
            {
         | 
| 2 | 
             
              "best_metric": 0.885723696687195,
         | 
| 3 | 
             
              "best_model_checkpoint": "DocLayNet/lilt-xlm-roberta-base-finetuned-DocLayNet-base_paragraphs_ml512-v5/checkpoint-600",
         | 
| 4 | 
            +
              "epoch": 0.6929637526652452,
         | 
| 5 | 
            +
              "global_step": 1300,
         | 
| 6 | 
             
              "is_hyper_param_search": false,
         | 
| 7 | 
             
              "is_local_process_zero": true,
         | 
| 8 | 
             
              "is_world_process_zero": true,
         | 
|  | |
| 96 | 
             
                  "eval_samples_per_second": 35.056,
         | 
| 97 | 
             
                  "eval_steps_per_second": 2.203,
         | 
| 98 | 
             
                  "step": 700
         | 
| 99 | 
            +
                },
         | 
| 100 | 
            +
                {
         | 
| 101 | 
            +
                  "epoch": 0.43,
         | 
| 102 | 
            +
                  "eval_accuracy": 0.8528252168445007,
         | 
| 103 | 
            +
                  "eval_f1": 0.8528252168445007,
         | 
| 104 | 
            +
                  "eval_loss": 0.44917240738868713,
         | 
| 105 | 
            +
                  "eval_precision": 0.8528252168445007,
         | 
| 106 | 
            +
                  "eval_recall": 0.8528252168445007,
         | 
| 107 | 
            +
                  "eval_runtime": 45.6102,
         | 
| 108 | 
            +
                  "eval_samples_per_second": 35.233,
         | 
| 109 | 
            +
                  "eval_steps_per_second": 2.214,
         | 
| 110 | 
            +
                  "step": 800
         | 
| 111 | 
            +
                },
         | 
| 112 | 
            +
                {
         | 
| 113 | 
            +
                  "epoch": 0.48,
         | 
| 114 | 
            +
                  "eval_accuracy": 0.8833980456546259,
         | 
| 115 | 
            +
                  "eval_f1": 0.8833980456546259,
         | 
| 116 | 
            +
                  "eval_loss": 0.38389313220977783,
         | 
| 117 | 
            +
                  "eval_precision": 0.8833980456546259,
         | 
| 118 | 
            +
                  "eval_recall": 0.8833980456546259,
         | 
| 119 | 
            +
                  "eval_runtime": 47.6493,
         | 
| 120 | 
            +
                  "eval_samples_per_second": 33.726,
         | 
| 121 | 
            +
                  "eval_steps_per_second": 2.12,
         | 
| 122 | 
            +
                  "step": 900
         | 
| 123 | 
            +
                },
         | 
| 124 | 
            +
                {
         | 
| 125 | 
            +
                  "epoch": 0.53,
         | 
| 126 | 
            +
                  "learning_rate": 9.381663113006397e-06,
         | 
| 127 | 
            +
                  "loss": 0.4464,
         | 
| 128 | 
            +
                  "step": 1000
         | 
| 129 | 
            +
                },
         | 
| 130 | 
            +
                {
         | 
| 131 | 
            +
                  "epoch": 0.53,
         | 
| 132 | 
            +
                  "eval_accuracy": 0.8498407977082855,
         | 
| 133 | 
            +
                  "eval_f1": 0.8498407977082856,
         | 
| 134 | 
            +
                  "eval_loss": 0.4365050792694092,
         | 
| 135 | 
            +
                  "eval_precision": 0.8498407977082855,
         | 
| 136 | 
            +
                  "eval_recall": 0.8498407977082855,
         | 
| 137 | 
            +
                  "eval_runtime": 47.0078,
         | 
| 138 | 
            +
                  "eval_samples_per_second": 34.186,
         | 
| 139 | 
            +
                  "eval_steps_per_second": 2.149,
         | 
| 140 | 
            +
                  "step": 1000
         | 
| 141 | 
            +
                },
         | 
| 142 | 
            +
                {
         | 
| 143 | 
            +
                  "epoch": 0.59,
         | 
| 144 | 
            +
                  "eval_accuracy": 0.8811622266361904,
         | 
| 145 | 
            +
                  "eval_f1": 0.8811622266361904,
         | 
| 146 | 
            +
                  "eval_loss": 0.36158204078674316,
         | 
| 147 | 
            +
                  "eval_precision": 0.8811622266361904,
         | 
| 148 | 
            +
                  "eval_recall": 0.8811622266361904,
         | 
| 149 | 
            +
                  "eval_runtime": 44.8724,
         | 
| 150 | 
            +
                  "eval_samples_per_second": 35.813,
         | 
| 151 | 
            +
                  "eval_steps_per_second": 2.251,
         | 
| 152 | 
            +
                  "step": 1100
         | 
| 153 | 
            +
                },
         | 
| 154 | 
            +
                {
         | 
| 155 | 
            +
                  "epoch": 0.64,
         | 
| 156 | 
            +
                  "eval_accuracy": 0.8795751943864972,
         | 
| 157 | 
            +
                  "eval_f1": 0.8795751943864972,
         | 
| 158 | 
            +
                  "eval_loss": 0.3948919177055359,
         | 
| 159 | 
            +
                  "eval_precision": 0.8795751943864972,
         | 
| 160 | 
            +
                  "eval_recall": 0.8795751943864972,
         | 
| 161 | 
            +
                  "eval_runtime": 45.1224,
         | 
| 162 | 
            +
                  "eval_samples_per_second": 35.614,
         | 
| 163 | 
            +
                  "eval_steps_per_second": 2.238,
         | 
| 164 | 
            +
                  "step": 1200
         | 
| 165 | 
            +
                },
         | 
| 166 | 
            +
                {
         | 
| 167 | 
            +
                  "epoch": 0.69,
         | 
| 168 | 
            +
                  "eval_accuracy": 0.8612794075079601,
         | 
| 169 | 
            +
                  "eval_f1": 0.8612794075079601,
         | 
| 170 | 
            +
                  "eval_loss": 0.41840043663978577,
         | 
| 171 | 
            +
                  "eval_precision": 0.8612794075079601,
         | 
| 172 | 
            +
                  "eval_recall": 0.8612794075079601,
         | 
| 173 | 
            +
                  "eval_runtime": 39.7377,
         | 
| 174 | 
            +
                  "eval_samples_per_second": 40.44,
         | 
| 175 | 
            +
                  "eval_steps_per_second": 2.542,
         | 
| 176 | 
            +
                  "step": 1300
         | 
| 177 | 
             
                }
         | 
| 178 | 
             
              ],
         | 
| 179 | 
             
              "max_steps": 1876,
         | 
| 180 | 
             
              "num_train_epochs": 1,
         | 
| 181 | 
            +
              "total_flos": 2892991284019200.0,
         | 
| 182 | 
             
              "trial_name": null,
         | 
| 183 | 
             
              "trial_params": null
         | 
| 184 | 
             
            }
         | 
    	
        {checkpoint-800 → checkpoint-1300}/training_args.bin
    RENAMED
    
    | 
            File without changes
         | 
    	
        pytorch_model.bin
    CHANGED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
             
            size 1134425553
         | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:7d4698a9bcd9f4d1b85cd29935ce42f4264d331bc9713045308140215396cd2e
         | 
| 3 | 
             
            size 1134425553
         | 
    	
        runs/Feb15_07-53-26_e220f522c880/events.out.tfevents.1676447621.e220f522c880.495.0
    CHANGED
    
    | @@ -1,3 +1,3 @@ | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256: | 
| 3 | 
            -
            size  | 
|  | |
| 1 | 
             
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:aec79be76242a342cf813e35be39731a4cf8ff91fe61776b977f2529b2fa0e92
         | 
| 3 | 
            +
            size 11114
         | 
