{ "best_metric": NaN, "best_model_checkpoint": "/home/datawork-iot-nos/Seatizen/models/multilabel/fine_scale/resnet-50-2024_09_13-batch-size32_epochs150_freeze/checkpoint-273", "epoch": 11.0, "eval_steps": 500, "global_step": 3003, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.0, "eval_f1_macro": 0.0, "eval_f1_micro": 0.0, "eval_loss": NaN, "eval_roc_auc": 0.499453523472468, "eval_runtime": 431.8634, "eval_samples_per_second": 6.683, "eval_steps_per_second": 0.211, "learning_rate": 0.001, "step": 273 }, { "epoch": 1.8315018315018317, "grad_norm": NaN, "learning_rate": 0.001, "loss": 0.0, "step": 500 }, { "epoch": 2.0, "eval_accuracy": 0.000693000693000693, "eval_f1_macro": 0.00040576181781294376, "eval_f1_micro": 0.00031409501374165687, "eval_loss": NaN, "eval_roc_auc": 0.4992791043687002, "eval_runtime": 437.2143, "eval_samples_per_second": 6.601, "eval_steps_per_second": 0.208, "learning_rate": 0.001, "step": 546 }, { "epoch": 3.0, "eval_accuracy": 0.0017325017325017325, "eval_f1_macro": 0.0010049241282283187, "eval_f1_micro": 0.0007850525985241011, "eval_loss": NaN, "eval_roc_auc": 0.4993980575804369, "eval_runtime": 449.0005, "eval_samples_per_second": 6.428, "eval_steps_per_second": 0.203, "learning_rate": 0.001, "step": 819 }, { "epoch": 3.663003663003663, "grad_norm": NaN, "learning_rate": 0.001, "loss": 0.0, "step": 1000 }, { "epoch": 4.0, "eval_accuracy": 0.0, "eval_f1_macro": 0.0, "eval_f1_micro": 0.0, "eval_loss": NaN, "eval_roc_auc": 0.49914125117102115, "eval_runtime": 438.2382, "eval_samples_per_second": 6.585, "eval_steps_per_second": 0.208, "learning_rate": 0.001, "step": 1092 }, { "epoch": 5.0, "eval_accuracy": 0.0010395010395010396, "eval_f1_macro": 0.0006430178973314757, "eval_f1_micro": 0.00047177229124076113, "eval_loss": NaN, "eval_roc_auc": 0.4994358575523217, "eval_runtime": 457.0913, "eval_samples_per_second": 6.314, "eval_steps_per_second": 0.199, "learning_rate": 0.001, "step": 1365 }, { "epoch": 5.4945054945054945, "grad_norm": NaN, "learning_rate": 0.001, "loss": 0.0, "step": 1500 }, { "epoch": 6.0, "eval_accuracy": 0.0003465003465003465, "eval_f1_macro": 0.000206782464846981, "eval_f1_micro": 0.00015712153350616704, "eval_loss": NaN, "eval_roc_auc": 0.49927198166285536, "eval_runtime": 425.3309, "eval_samples_per_second": 6.785, "eval_steps_per_second": 0.214, "learning_rate": 0.001, "step": 1638 }, { "epoch": 7.0, "eval_accuracy": 0.0, "eval_f1_macro": 0.0, "eval_f1_micro": 0.0, "eval_loss": NaN, "eval_roc_auc": 0.49929738732174456, "eval_runtime": 423.0556, "eval_samples_per_second": 6.822, "eval_steps_per_second": 0.215, "learning_rate": 0.0001, "step": 1911 }, { "epoch": 7.326007326007326, "grad_norm": NaN, "learning_rate": 0.0001, "loss": 0.0, "step": 2000 }, { "epoch": 8.0, "eval_accuracy": 0.0003465003465003465, "eval_f1_macro": 0.0002061218179944347, "eval_f1_micro": 0.00015710919088766695, "eval_loss": NaN, "eval_roc_auc": 0.49926547598990856, "eval_runtime": 417.1408, "eval_samples_per_second": 6.919, "eval_steps_per_second": 0.218, "learning_rate": 0.0001, "step": 2184 }, { "epoch": 9.0, "eval_accuracy": 0.0, "eval_f1_macro": 0.0, "eval_f1_micro": 0.0, "eval_loss": NaN, "eval_roc_auc": 0.49944051212657437, "eval_runtime": 408.1598, "eval_samples_per_second": 7.071, "eval_steps_per_second": 0.223, "learning_rate": 0.0001, "step": 2457 }, { "epoch": 9.157509157509157, "grad_norm": NaN, "learning_rate": 0.0001, "loss": 0.0, "step": 2500 }, { "epoch": 10.0, "eval_accuracy": 0.000693000693000693, "eval_f1_macro": 0.0004230565838180856, "eval_f1_micro": 0.00031441597233139445, "eval_loss": NaN, "eval_roc_auc": 0.49936367811700877, "eval_runtime": 430.9669, "eval_samples_per_second": 6.697, "eval_steps_per_second": 0.211, "learning_rate": 0.0001, "step": 2730 }, { "epoch": 10.989010989010989, "grad_norm": NaN, "learning_rate": 0.0001, "loss": 0.0, "step": 3000 }, { "epoch": 11.0, "eval_accuracy": 0.0, "eval_f1_macro": 0.0, "eval_f1_micro": 0.0, "eval_loss": NaN, "eval_roc_auc": 0.49943400645362757, "eval_runtime": 416.2683, "eval_samples_per_second": 6.933, "eval_steps_per_second": 0.219, "learning_rate": 0.0001, "step": 3003 }, { "epoch": 11.0, "learning_rate": 0.0001, "step": 3003, "total_flos": 1.09151596234231e+19, "train_loss": 0.0, "train_runtime": 18978.5009, "train_samples_per_second": 68.888, "train_steps_per_second": 2.158 } ], "logging_steps": 500, "max_steps": 40950, "num_input_tokens_seen": 0, "num_train_epochs": 150, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 10, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.09151596234231e+19, "train_batch_size": 32, "trial_name": null, "trial_params": null }