nguyenkhoa committed on
Commit
c6a2dab
·
verified ·
1 Parent(s): 59d1419

End of training

Browse files
Files changed (3) hide show
  1. all_results.json +8 -0
  2. train_results.json +8 -0
  3. trainer_state.json +194 -0
all_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "total_flos": 2.0799754853313946e+18,
4
+ "train_loss": 0.021147532474010362,
5
+ "train_runtime": 5927.6048,
6
+ "train_samples_per_second": 70.453,
7
+ "train_steps_per_second": 0.092
8
+ }
train_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 5.0,
3
+ "total_flos": 2.0799754853313946e+18,
4
+ "train_loss": 0.021147532474010362,
5
+ "train_runtime": 5927.6048,
6
+ "train_samples_per_second": 70.453,
7
+ "train_steps_per_second": 0.092
8
+ }
trainer_state.json ADDED
@@ -0,0 +1,194 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.022426238283514977,
3
+ "best_model_checkpoint": "./dinov2_Liveness_detection_v2.2.3/checkpoint-512",
4
+ "epoch": 5.0,
5
+ "eval_steps": 64,
6
+ "global_step": 545,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 0.5871559633027523,
13
+ "grad_norm": 4.068049430847168,
14
+ "learning_rate": 4.422018348623854e-05,
15
+ "loss": 0.0562,
16
+ "step": 64
17
+ },
18
+ {
19
+ "epoch": 0.5871559633027523,
20
+ "eval_accuracy": 0.986015995402519,
21
+ "eval_f1": 0.9860480756099135,
22
+ "eval_loss": 0.03846299648284912,
23
+ "eval_precision": 0.9860352552892203,
24
+ "eval_recall": 0.986015995402519,
25
+ "eval_runtime": 217.7244,
26
+ "eval_samples_per_second": 95.906,
27
+ "eval_steps_per_second": 11.992,
28
+ "step": 64
29
+ },
30
+ {
31
+ "epoch": 1.1743119266055047,
32
+ "grad_norm": 2.0854928493499756,
33
+ "learning_rate": 3.834862385321101e-05,
34
+ "loss": 0.0328,
35
+ "step": 128
36
+ },
37
+ {
38
+ "epoch": 1.1743119266055047,
39
+ "eval_accuracy": 0.9884105167377041,
40
+ "eval_f1": 0.9883880032307305,
41
+ "eval_loss": 0.0350191667675972,
42
+ "eval_precision": 0.988510772434393,
43
+ "eval_recall": 0.9884105167377041,
44
+ "eval_runtime": 207.2244,
45
+ "eval_samples_per_second": 100.765,
46
+ "eval_steps_per_second": 12.6,
47
+ "step": 128
48
+ },
49
+ {
50
+ "epoch": 1.761467889908257,
51
+ "grad_norm": 7.789446830749512,
52
+ "learning_rate": 3.2477064220183487e-05,
53
+ "loss": 0.0251,
54
+ "step": 192
55
+ },
56
+ {
57
+ "epoch": 1.761467889908257,
58
+ "eval_accuracy": 0.9878837220439635,
59
+ "eval_f1": 0.9879027538320604,
60
+ "eval_loss": 0.031058767810463905,
61
+ "eval_precision": 0.9878842870124719,
62
+ "eval_recall": 0.9878837220439635,
63
+ "eval_runtime": 206.3437,
64
+ "eval_samples_per_second": 101.195,
65
+ "eval_steps_per_second": 12.654,
66
+ "step": 192
67
+ },
68
+ {
69
+ "epoch": 2.3486238532110093,
70
+ "grad_norm": 3.044827938079834,
71
+ "learning_rate": 2.6605504587155967e-05,
72
+ "loss": 0.0185,
73
+ "step": 256
74
+ },
75
+ {
76
+ "epoch": 2.3486238532110093,
77
+ "eval_accuracy": 0.9894641061251855,
78
+ "eval_f1": 0.9894535727205462,
79
+ "eval_loss": 0.02958873100578785,
80
+ "eval_precision": 0.9895000833022948,
81
+ "eval_recall": 0.9894641061251855,
82
+ "eval_runtime": 207.7816,
83
+ "eval_samples_per_second": 100.495,
84
+ "eval_steps_per_second": 12.566,
85
+ "step": 256
86
+ },
87
+ {
88
+ "epoch": 2.9357798165137616,
89
+ "grad_norm": 3.2054522037506104,
90
+ "learning_rate": 2.0733944954128444e-05,
91
+ "loss": 0.0166,
92
+ "step": 320
93
+ },
94
+ {
95
+ "epoch": 2.9357798165137616,
96
+ "eval_accuracy": 0.989703558258704,
97
+ "eval_f1": 0.9896806110545806,
98
+ "eval_loss": 0.03277856856584549,
99
+ "eval_precision": 0.9898218810126647,
100
+ "eval_recall": 0.989703558258704,
101
+ "eval_runtime": 208.2058,
102
+ "eval_samples_per_second": 100.29,
103
+ "eval_steps_per_second": 12.54,
104
+ "step": 320
105
+ },
106
+ {
107
+ "epoch": 3.522935779816514,
108
+ "grad_norm": 2.348264694213867,
109
+ "learning_rate": 1.486238532110092e-05,
110
+ "loss": 0.0109,
111
+ "step": 384
112
+ },
113
+ {
114
+ "epoch": 3.522935779816514,
115
+ "eval_accuracy": 0.9906134763660744,
116
+ "eval_f1": 0.9906023345002652,
117
+ "eval_loss": 0.03355810046195984,
118
+ "eval_precision": 0.9906567348383362,
119
+ "eval_recall": 0.9906134763660744,
120
+ "eval_runtime": 208.1416,
121
+ "eval_samples_per_second": 100.321,
122
+ "eval_steps_per_second": 12.544,
123
+ "step": 384
124
+ },
125
+ {
126
+ "epoch": 4.110091743119266,
127
+ "grad_norm": 1.7739728689193726,
128
+ "learning_rate": 8.990825688073395e-06,
129
+ "loss": 0.0098,
130
+ "step": 448
131
+ },
132
+ {
133
+ "epoch": 4.110091743119266,
134
+ "eval_accuracy": 0.9917149561802596,
135
+ "eval_f1": 0.9917071374247993,
136
+ "eval_loss": 0.024906398728489876,
137
+ "eval_precision": 0.9917439317129936,
138
+ "eval_recall": 0.9917149561802596,
139
+ "eval_runtime": 208.2528,
140
+ "eval_samples_per_second": 100.268,
141
+ "eval_steps_per_second": 12.538,
142
+ "step": 448
143
+ },
144
+ {
145
+ "epoch": 4.697247706422019,
146
+ "grad_norm": 0.5001527667045593,
147
+ "learning_rate": 3.119266055045872e-06,
148
+ "loss": 0.0069,
149
+ "step": 512
150
+ },
151
+ {
152
+ "epoch": 4.697247706422019,
153
+ "eval_accuracy": 0.993247449834778,
154
+ "eval_f1": 0.993242084550572,
155
+ "eval_loss": 0.022426238283514977,
156
+ "eval_precision": 0.9932676807197346,
157
+ "eval_recall": 0.993247449834778,
158
+ "eval_runtime": 221.0481,
159
+ "eval_samples_per_second": 94.464,
160
+ "eval_steps_per_second": 11.812,
161
+ "step": 512
162
+ },
163
+ {
164
+ "epoch": 5.0,
165
+ "step": 545,
166
+ "total_flos": 2.0799754853313946e+18,
167
+ "train_loss": 0.021147532474010362,
168
+ "train_runtime": 5927.6048,
169
+ "train_samples_per_second": 70.453,
170
+ "train_steps_per_second": 0.092
171
+ }
172
+ ],
173
+ "logging_steps": 64,
174
+ "max_steps": 545,
175
+ "num_input_tokens_seen": 0,
176
+ "num_train_epochs": 5,
177
+ "save_steps": 64,
178
+ "stateful_callbacks": {
179
+ "TrainerControl": {
180
+ "args": {
181
+ "should_epoch_stop": false,
182
+ "should_evaluate": false,
183
+ "should_log": false,
184
+ "should_save": true,
185
+ "should_training_stop": true
186
+ },
187
+ "attributes": {}
188
+ }
189
+ },
190
+ "total_flos": 2.0799754853313946e+18,
191
+ "train_batch_size": 768,
192
+ "trial_name": null,
193
+ "trial_params": null
194
+ }