Euanyu commited on
Commit
ad6c526
1 Parent(s): 734e567

Delete trainer_state.json

Browse files
Files changed (1) hide show
  1. trainer_state.json +0 -187
trainer_state.json DELETED
@@ -1,187 +0,0 @@
1
- {
2
- "best_metric": 0.1951880156993866,
3
- "best_model_checkpoint": "bioformer8L_caption_RTX6000/checkpoint-1230",
4
- "epoch": 5.0,
5
- "eval_steps": 500,
6
- "global_step": 6150,
7
- "is_hyper_param_search": false,
8
- "is_local_process_zero": true,
9
- "is_world_process_zero": true,
10
- "log_history": [
11
- {
12
- "epoch": 0.4065040650406504,
13
- "grad_norm": 6.299335956573486,
14
- "learning_rate": 2.75609756097561e-05,
15
- "loss": 0.2386,
16
- "step": 500
17
- },
18
- {
19
- "epoch": 0.8130081300813008,
20
- "grad_norm": 1.643288016319275,
21
- "learning_rate": 2.5121951219512197e-05,
22
- "loss": 0.1845,
23
- "step": 1000
24
- },
25
- {
26
- "epoch": 1.0,
27
- "eval_accuracy": 0.9235252019220939,
28
- "eval_f1": 0.9179996646545943,
29
- "eval_f1_medical": 0.9392857142857143,
30
- "eval_f1_non_medical": 0.8967136150234741,
31
- "eval_loss": 0.1951880156993866,
32
- "eval_precision": 0.9223852158649997,
33
- "eval_recall": 0.9142873862649601,
34
- "eval_runtime": 27.8883,
35
- "eval_samples_per_second": 350.72,
36
- "eval_steps_per_second": 10.972,
37
- "step": 1230
38
- },
39
- {
40
- "epoch": 1.2195121951219512,
41
- "grad_norm": 2.678163766860962,
42
- "learning_rate": 2.2682926829268295e-05,
43
- "loss": 0.1505,
44
- "step": 1500
45
- },
46
- {
47
- "epoch": 1.6260162601626016,
48
- "grad_norm": 2.3176321983337402,
49
- "learning_rate": 2.024390243902439e-05,
50
- "loss": 0.1284,
51
- "step": 2000
52
- },
53
- {
54
- "epoch": 2.0,
55
- "eval_accuracy": 0.9270013291074533,
56
- "eval_f1": 0.9224194379620252,
57
- "eval_f1_medical": 0.9412732357295608,
58
- "eval_f1_non_medical": 0.9035656401944895,
59
- "eval_loss": 0.2104455977678299,
60
- "eval_precision": 0.9225986393203021,
61
- "eval_recall": 0.9222416990354869,
62
- "eval_runtime": 28.2544,
63
- "eval_samples_per_second": 346.176,
64
- "eval_steps_per_second": 10.83,
65
- "step": 2460
66
- },
67
- {
68
- "epoch": 2.032520325203252,
69
- "grad_norm": 4.071255683898926,
70
- "learning_rate": 1.7804878048780488e-05,
71
- "loss": 0.1227,
72
- "step": 2500
73
- },
74
- {
75
- "epoch": 2.4390243902439024,
76
- "grad_norm": 14.561558723449707,
77
- "learning_rate": 1.5365853658536586e-05,
78
- "loss": 0.0809,
79
- "step": 3000
80
- },
81
- {
82
- "epoch": 2.845528455284553,
83
- "grad_norm": 5.630990982055664,
84
- "learning_rate": 1.2926829268292684e-05,
85
- "loss": 0.0881,
86
- "step": 3500
87
- },
88
- {
89
- "epoch": 3.0,
90
- "eval_accuracy": 0.9278192413863613,
91
- "eval_f1": 0.9233290940374888,
92
- "eval_f1_medical": 0.9418834376028976,
93
- "eval_f1_non_medical": 0.9047747504720799,
94
- "eval_loss": 0.25612133741378784,
95
- "eval_precision": 0.9232846377701289,
96
- "eval_recall": 0.9233736416754945,
97
- "eval_runtime": 27.9805,
98
- "eval_samples_per_second": 349.564,
99
- "eval_steps_per_second": 10.936,
100
- "step": 3690
101
- },
102
- {
103
- "epoch": 3.252032520325203,
104
- "grad_norm": 16.422693252563477,
105
- "learning_rate": 1.048780487804878e-05,
106
- "loss": 0.0643,
107
- "step": 4000
108
- },
109
- {
110
- "epoch": 3.658536585365854,
111
- "grad_norm": 3.8088247776031494,
112
- "learning_rate": 8.048780487804879e-06,
113
- "loss": 0.0567,
114
- "step": 4500
115
- },
116
- {
117
- "epoch": 4.0,
118
- "eval_accuracy": 0.9209692260505061,
119
- "eval_f1": 0.9165782775866363,
120
- "eval_f1_medical": 0.9357172557172557,
121
- "eval_f1_non_medical": 0.897439299456017,
122
- "eval_loss": 0.3461480140686035,
123
- "eval_precision": 0.9141722217469603,
124
- "eval_recall": 0.9193323694864739,
125
- "eval_runtime": 27.8584,
126
- "eval_samples_per_second": 351.097,
127
- "eval_steps_per_second": 10.984,
128
- "step": 4920
129
- },
130
- {
131
- "epoch": 4.065040650406504,
132
- "grad_norm": 3.315011739730835,
133
- "learning_rate": 5.609756097560976e-06,
134
- "loss": 0.0519,
135
- "step": 5000
136
- },
137
- {
138
- "epoch": 4.471544715447155,
139
- "grad_norm": 15.6904878616333,
140
- "learning_rate": 3.1707317073170736e-06,
141
- "loss": 0.0328,
142
- "step": 5500
143
- },
144
- {
145
- "epoch": 4.878048780487805,
146
- "grad_norm": 15.453346252441406,
147
- "learning_rate": 7.317073170731708e-07,
148
- "loss": 0.0358,
149
- "step": 6000
150
- },
151
- {
152
- "epoch": 5.0,
153
- "eval_accuracy": 0.9273080462120438,
154
- "eval_f1": 0.9227413256853779,
155
- "eval_f1_medical": 0.9415247964470762,
156
- "eval_f1_non_medical": 0.9039578549236796,
157
- "eval_loss": 0.3629767894744873,
158
- "eval_precision": 0.9229432788139431,
159
- "eval_recall": 0.9225412244408466,
160
- "eval_runtime": 27.7955,
161
- "eval_samples_per_second": 351.891,
162
- "eval_steps_per_second": 11.009,
163
- "step": 6150
164
- }
165
- ],
166
- "logging_steps": 500,
167
- "max_steps": 6150,
168
- "num_input_tokens_seen": 0,
169
- "num_train_epochs": 5,
170
- "save_steps": 500,
171
- "stateful_callbacks": {
172
- "TrainerControl": {
173
- "args": {
174
- "should_epoch_stop": false,
175
- "should_evaluate": false,
176
- "should_log": false,
177
- "should_save": true,
178
- "should_training_stop": true
179
- },
180
- "attributes": {}
181
- }
182
- },
183
- "total_flos": 1.3125933204124032e+16,
184
- "train_batch_size": 32,
185
- "trial_name": null,
186
- "trial_params": null
187
- }