lombardata committed on
Commit
361dec1
1 Parent(s): cfa1009

Evaluation on the test set completed on 2024_09_13.

Browse files
README.md ADDED
@@ -0,0 +1,75 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: microsoft/resnet-50
4
+ tags:
5
+ - generated_from_trainer
6
+ metrics:
7
+ - accuracy
8
+ model-index:
9
+ - name: resnet-50-2024_09_13-batch-size32_epochs150_freeze
10
+ results: []
11
+ ---
12
+
13
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
14
+ should probably proofread and complete it, then remove this comment. -->
15
+
16
+ # resnet-50-2024_09_13-batch-size32_epochs150_freeze
17
+
18
+ This model is a fine-tuned version of [microsoft/resnet-50](https://huggingface.co/microsoft/resnet-50) on an unspecified dataset.
19
+ It achieves the following results on the evaluation set:
20
+ - Loss: nan
21
+ - F1 Micro: 0.0002
22
+ - F1 Macro: 0.0002
23
+ - Roc Auc: 0.4995
24
+ - Accuracy: 0.0003
25
+ - Learning Rate: 0.0001
26
+
27
+ ## Model description
28
+
29
+ More information needed
30
+
31
+ ## Intended uses & limitations
32
+
33
+ More information needed
34
+
35
+ ## Training and evaluation data
36
+
37
+ More information needed
38
+
39
+ ## Training procedure
40
+
41
+ ### Training hyperparameters
42
+
43
+ The following hyperparameters were used during training:
44
+ - learning_rate: 0.001
45
+ - train_batch_size: 32
46
+ - eval_batch_size: 32
47
+ - seed: 42
48
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
49
+ - lr_scheduler_type: linear
50
+ - num_epochs: 150
51
+ - mixed_precision_training: Native AMP
52
+
53
+ ### Training results
54
+
55
+ | Training Loss | Epoch | Step | Validation Loss | F1 Micro | F1 Macro | Roc Auc | Accuracy | Learning Rate |
56
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:--------:|:-------:|:--------:|:------:|
57
+ | No log | 1.0 | 273 | nan | 0.0 | 0.0 | 0.4995 | 0.0 | 0.001 |
58
+ | 0.0 | 2.0 | 546 | nan | 0.0003 | 0.0004 | 0.4993 | 0.0007 | 0.001 |
59
+ | 0.0 | 3.0 | 819 | nan | 0.0008 | 0.0010 | 0.4994 | 0.0017 | 0.001 |
60
+ | 0.0 | 4.0 | 1092 | nan | 0.0 | 0.0 | 0.4991 | 0.0 | 0.001 |
61
+ | 0.0 | 5.0 | 1365 | nan | 0.0005 | 0.0006 | 0.4994 | 0.0010 | 0.001 |
62
+ | 0.0 | 6.0 | 1638 | nan | 0.0002 | 0.0002 | 0.4993 | 0.0003 | 0.001 |
63
+ | 0.0 | 7.0 | 1911 | nan | 0.0 | 0.0 | 0.4993 | 0.0 | 0.0001 |
64
+ | 0.0 | 8.0 | 2184 | nan | 0.0002 | 0.0002 | 0.4993 | 0.0003 | 0.0001 |
65
+ | 0.0 | 9.0 | 2457 | nan | 0.0 | 0.0 | 0.4994 | 0.0 | 0.0001 |
66
+ | 0.0 | 10.0 | 2730 | nan | 0.0003 | 0.0004 | 0.4994 | 0.0007 | 0.0001 |
67
+ | 0.0 | 11.0 | 3003 | nan | 0.0 | 0.0 | 0.4994 | 0.0 | 0.0001 |
68
+
69
+
70
+ ### Framework versions
71
+
72
+ - Transformers 4.41.1
73
+ - Pytorch 2.3.0+cu121
74
+ - Datasets 2.19.1
75
+ - Tokenizers 0.19.1
all_results.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 11.0,
3
+ "eval_accuracy": 0.00034602076124567473,
4
+ "eval_f1_macro": 0.0002346041055718475,
5
+ "eval_f1_micro": 0.00015795293002685197,
6
+ "eval_loss": NaN,
7
+ "eval_roc_auc": 0.49951383990145193,
8
+ "eval_runtime": 420.9492,
9
+ "eval_samples_per_second": 6.865,
10
+ "eval_steps_per_second": 0.216,
11
+ "learning_rate": 0.0001,
12
+ "total_flos": 1.09151596234231e+19,
13
+ "train_loss": 0.0,
14
+ "train_runtime": 18978.5009,
15
+ "train_samples_per_second": 68.888,
16
+ "train_steps_per_second": 2.158
17
+ }
logs/events.out.tfevents.1726211111.datavisu2 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4a472b78238fc927f2d5d81899c3cb6db75396f543284060e274090e6bec08d4
3
- size 12580
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de833b5c3fa8ee2e547eaa3da26af08dd80d3672f6589245868fde77d737ca98
3
+ size 14275
logs/events.out.tfevents.1726230522.datavisu2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:428cf977790a688a573d85efeae42c0dd9de9e76db0de8772420cd075a543ebe
3
+ size 40
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d4c9245b0000abe7d5e316dd8c2f5e1c33bc7f4f29eb0c3cf8b863ed7961ab3
3
  size 94540692
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a56cc264c89bf5c7bf218605581418f30601d5599835dd576b71e7c1bb9eb67
3
  size 94540692
test_results.json ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 11.0,
3
+ "eval_accuracy": 0.00034602076124567473,
4
+ "eval_f1_macro": 0.0002346041055718475,
5
+ "eval_f1_micro": 0.00015795293002685197,
6
+ "eval_loss": NaN,
7
+ "eval_roc_auc": 0.49951383990145193,
8
+ "eval_runtime": 420.9492,
9
+ "eval_samples_per_second": 6.865,
10
+ "eval_steps_per_second": 0.216,
11
+ "learning_rate": 0.0001
12
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 11.0,
3
+ "learning_rate": 0.0001,
4
+ "total_flos": 1.09151596234231e+19,
5
+ "train_loss": 0.0,
6
+ "train_runtime": 18978.5009,
7
+ "train_samples_per_second": 68.888,
8
+ "train_steps_per_second": 2.158
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,237 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": NaN,
3
+ "best_model_checkpoint": "/home/datawork-iot-nos/Seatizen/models/multilabel/fine_scale/resnet-50-2024_09_13-batch-size32_epochs150_freeze/checkpoint-273",
4
+ "epoch": 11.0,
5
+ "eval_steps": 500,
6
+ "global_step": 3003,
7
+ "is_hyper_param_search": false,
8
+ "is_local_process_zero": true,
9
+ "is_world_process_zero": true,
10
+ "log_history": [
11
+ {
12
+ "epoch": 1.0,
13
+ "eval_accuracy": 0.0,
14
+ "eval_f1_macro": 0.0,
15
+ "eval_f1_micro": 0.0,
16
+ "eval_loss": NaN,
17
+ "eval_roc_auc": 0.499453523472468,
18
+ "eval_runtime": 431.8634,
19
+ "eval_samples_per_second": 6.683,
20
+ "eval_steps_per_second": 0.211,
21
+ "learning_rate": 0.001,
22
+ "step": 273
23
+ },
24
+ {
25
+ "epoch": 1.8315018315018317,
26
+ "grad_norm": NaN,
27
+ "learning_rate": 0.001,
28
+ "loss": 0.0,
29
+ "step": 500
30
+ },
31
+ {
32
+ "epoch": 2.0,
33
+ "eval_accuracy": 0.000693000693000693,
34
+ "eval_f1_macro": 0.00040576181781294376,
35
+ "eval_f1_micro": 0.00031409501374165687,
36
+ "eval_loss": NaN,
37
+ "eval_roc_auc": 0.4992791043687002,
38
+ "eval_runtime": 437.2143,
39
+ "eval_samples_per_second": 6.601,
40
+ "eval_steps_per_second": 0.208,
41
+ "learning_rate": 0.001,
42
+ "step": 546
43
+ },
44
+ {
45
+ "epoch": 3.0,
46
+ "eval_accuracy": 0.0017325017325017325,
47
+ "eval_f1_macro": 0.0010049241282283187,
48
+ "eval_f1_micro": 0.0007850525985241011,
49
+ "eval_loss": NaN,
50
+ "eval_roc_auc": 0.4993980575804369,
51
+ "eval_runtime": 449.0005,
52
+ "eval_samples_per_second": 6.428,
53
+ "eval_steps_per_second": 0.203,
54
+ "learning_rate": 0.001,
55
+ "step": 819
56
+ },
57
+ {
58
+ "epoch": 3.663003663003663,
59
+ "grad_norm": NaN,
60
+ "learning_rate": 0.001,
61
+ "loss": 0.0,
62
+ "step": 1000
63
+ },
64
+ {
65
+ "epoch": 4.0,
66
+ "eval_accuracy": 0.0,
67
+ "eval_f1_macro": 0.0,
68
+ "eval_f1_micro": 0.0,
69
+ "eval_loss": NaN,
70
+ "eval_roc_auc": 0.49914125117102115,
71
+ "eval_runtime": 438.2382,
72
+ "eval_samples_per_second": 6.585,
73
+ "eval_steps_per_second": 0.208,
74
+ "learning_rate": 0.001,
75
+ "step": 1092
76
+ },
77
+ {
78
+ "epoch": 5.0,
79
+ "eval_accuracy": 0.0010395010395010396,
80
+ "eval_f1_macro": 0.0006430178973314757,
81
+ "eval_f1_micro": 0.00047177229124076113,
82
+ "eval_loss": NaN,
83
+ "eval_roc_auc": 0.4994358575523217,
84
+ "eval_runtime": 457.0913,
85
+ "eval_samples_per_second": 6.314,
86
+ "eval_steps_per_second": 0.199,
87
+ "learning_rate": 0.001,
88
+ "step": 1365
89
+ },
90
+ {
91
+ "epoch": 5.4945054945054945,
92
+ "grad_norm": NaN,
93
+ "learning_rate": 0.001,
94
+ "loss": 0.0,
95
+ "step": 1500
96
+ },
97
+ {
98
+ "epoch": 6.0,
99
+ "eval_accuracy": 0.0003465003465003465,
100
+ "eval_f1_macro": 0.000206782464846981,
101
+ "eval_f1_micro": 0.00015712153350616704,
102
+ "eval_loss": NaN,
103
+ "eval_roc_auc": 0.49927198166285536,
104
+ "eval_runtime": 425.3309,
105
+ "eval_samples_per_second": 6.785,
106
+ "eval_steps_per_second": 0.214,
107
+ "learning_rate": 0.001,
108
+ "step": 1638
109
+ },
110
+ {
111
+ "epoch": 7.0,
112
+ "eval_accuracy": 0.0,
113
+ "eval_f1_macro": 0.0,
114
+ "eval_f1_micro": 0.0,
115
+ "eval_loss": NaN,
116
+ "eval_roc_auc": 0.49929738732174456,
117
+ "eval_runtime": 423.0556,
118
+ "eval_samples_per_second": 6.822,
119
+ "eval_steps_per_second": 0.215,
120
+ "learning_rate": 0.0001,
121
+ "step": 1911
122
+ },
123
+ {
124
+ "epoch": 7.326007326007326,
125
+ "grad_norm": NaN,
126
+ "learning_rate": 0.0001,
127
+ "loss": 0.0,
128
+ "step": 2000
129
+ },
130
+ {
131
+ "epoch": 8.0,
132
+ "eval_accuracy": 0.0003465003465003465,
133
+ "eval_f1_macro": 0.0002061218179944347,
134
+ "eval_f1_micro": 0.00015710919088766695,
135
+ "eval_loss": NaN,
136
+ "eval_roc_auc": 0.49926547598990856,
137
+ "eval_runtime": 417.1408,
138
+ "eval_samples_per_second": 6.919,
139
+ "eval_steps_per_second": 0.218,
140
+ "learning_rate": 0.0001,
141
+ "step": 2184
142
+ },
143
+ {
144
+ "epoch": 9.0,
145
+ "eval_accuracy": 0.0,
146
+ "eval_f1_macro": 0.0,
147
+ "eval_f1_micro": 0.0,
148
+ "eval_loss": NaN,
149
+ "eval_roc_auc": 0.49944051212657437,
150
+ "eval_runtime": 408.1598,
151
+ "eval_samples_per_second": 7.071,
152
+ "eval_steps_per_second": 0.223,
153
+ "learning_rate": 0.0001,
154
+ "step": 2457
155
+ },
156
+ {
157
+ "epoch": 9.157509157509157,
158
+ "grad_norm": NaN,
159
+ "learning_rate": 0.0001,
160
+ "loss": 0.0,
161
+ "step": 2500
162
+ },
163
+ {
164
+ "epoch": 10.0,
165
+ "eval_accuracy": 0.000693000693000693,
166
+ "eval_f1_macro": 0.0004230565838180856,
167
+ "eval_f1_micro": 0.00031441597233139445,
168
+ "eval_loss": NaN,
169
+ "eval_roc_auc": 0.49936367811700877,
170
+ "eval_runtime": 430.9669,
171
+ "eval_samples_per_second": 6.697,
172
+ "eval_steps_per_second": 0.211,
173
+ "learning_rate": 0.0001,
174
+ "step": 2730
175
+ },
176
+ {
177
+ "epoch": 10.989010989010989,
178
+ "grad_norm": NaN,
179
+ "learning_rate": 0.0001,
180
+ "loss": 0.0,
181
+ "step": 3000
182
+ },
183
+ {
184
+ "epoch": 11.0,
185
+ "eval_accuracy": 0.0,
186
+ "eval_f1_macro": 0.0,
187
+ "eval_f1_micro": 0.0,
188
+ "eval_loss": NaN,
189
+ "eval_roc_auc": 0.49943400645362757,
190
+ "eval_runtime": 416.2683,
191
+ "eval_samples_per_second": 6.933,
192
+ "eval_steps_per_second": 0.219,
193
+ "learning_rate": 0.0001,
194
+ "step": 3003
195
+ },
196
+ {
197
+ "epoch": 11.0,
198
+ "learning_rate": 0.0001,
199
+ "step": 3003,
200
+ "total_flos": 1.09151596234231e+19,
201
+ "train_loss": 0.0,
202
+ "train_runtime": 18978.5009,
203
+ "train_samples_per_second": 68.888,
204
+ "train_steps_per_second": 2.158
205
+ }
206
+ ],
207
+ "logging_steps": 500,
208
+ "max_steps": 40950,
209
+ "num_input_tokens_seen": 0,
210
+ "num_train_epochs": 150,
211
+ "save_steps": 500,
212
+ "stateful_callbacks": {
213
+ "EarlyStoppingCallback": {
214
+ "args": {
215
+ "early_stopping_patience": 10,
216
+ "early_stopping_threshold": 0.0
217
+ },
218
+ "attributes": {
219
+ "early_stopping_patience_counter": 0
220
+ }
221
+ },
222
+ "TrainerControl": {
223
+ "args": {
224
+ "should_epoch_stop": false,
225
+ "should_evaluate": false,
226
+ "should_log": false,
227
+ "should_save": true,
228
+ "should_training_stop": true
229
+ },
230
+ "attributes": {}
231
+ }
232
+ },
233
+ "total_flos": 1.09151596234231e+19,
234
+ "train_batch_size": 32,
235
+ "trial_name": null,
236
+ "trial_params": null
237
+ }