|
{ |
|
"best_metric": 0.9424768686294556, |
|
"best_model_checkpoint": "diogopaes10/012-microsoft-deberta-v3-base-finetuned-yahoo-8000_2000/checkpoint-500", |
|
"epoch": 2.0, |
|
"global_step": 500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.0, |
|
"learning_rate": 1.9984e-05, |
|
"loss": 2.308, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 1.9200000000000003e-05, |
|
"loss": 2.2963, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_accuracy": 0.2015, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.807334899902344, |
|
"eval_f1": 0.12984294240667255, |
|
"eval_gpu_ram_allocated": 2.0898146629333496, |
|
"eval_gpu_ram_cached": 25.845703125, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 48, |
|
"eval_loss": 2.2150378227233887, |
|
"eval_precision": 0.20897251377917925, |
|
"eval_recall": 0.2015, |
|
"eval_runtime": 2.4064, |
|
"eval_samples_per_second": 831.127, |
|
"eval_steps_per_second": 26.181, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.9806594848632812, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 1.8400000000000003e-05, |
|
"loss": 1.8843, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_accuracy": 0.592, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.80740737915039, |
|
"eval_f1": 0.5588381140615875, |
|
"eval_gpu_ram_allocated": 2.0897889137268066, |
|
"eval_gpu_ram_cached": 25.84765625, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 49, |
|
"eval_loss": 1.4590158462524414, |
|
"eval_precision": 0.6417526665901784, |
|
"eval_recall": 0.592, |
|
"eval_runtime": 2.4022, |
|
"eval_samples_per_second": 832.564, |
|
"eval_steps_per_second": 26.226, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.9979324340820312, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"learning_rate": 1.7616000000000002e-05, |
|
"loss": 1.3348, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_accuracy": 0.668, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.80740737915039, |
|
"eval_f1": 0.6613366784391611, |
|
"eval_gpu_ram_allocated": 2.089787483215332, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 49, |
|
"eval_loss": 1.180911660194397, |
|
"eval_precision": 0.6736430562605106, |
|
"eval_recall": 0.668, |
|
"eval_runtime": 2.3835, |
|
"eval_samples_per_second": 839.093, |
|
"eval_steps_per_second": 26.431, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.983623504638672, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 1.6816e-05, |
|
"loss": 1.1501, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_accuracy": 0.695, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.807422637939453, |
|
"eval_f1": 0.6929220794455174, |
|
"eval_gpu_ram_allocated": 2.0897974967956543, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 51, |
|
"eval_loss": 1.0483959913253784, |
|
"eval_precision": 0.6981404124535453, |
|
"eval_recall": 0.695, |
|
"eval_runtime": 2.3606, |
|
"eval_samples_per_second": 847.255, |
|
"eval_steps_per_second": 26.689, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.9695281982421875, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 1.6016e-05, |
|
"loss": 1.0842, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.6905, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.80750274658203, |
|
"eval_f1": 0.6825102140466686, |
|
"eval_gpu_ram_allocated": 2.0897974967956543, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 50, |
|
"eval_loss": 1.0264948606491089, |
|
"eval_precision": 0.6893511728014889, |
|
"eval_recall": 0.6905, |
|
"eval_runtime": 2.3931, |
|
"eval_samples_per_second": 835.746, |
|
"eval_steps_per_second": 26.326, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.975543975830078, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"learning_rate": 1.5216000000000001e-05, |
|
"loss": 0.8618, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"eval_accuracy": 0.704, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.807506561279297, |
|
"eval_f1": 0.70238565521567, |
|
"eval_gpu_ram_allocated": 2.0897774696350098, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 50, |
|
"eval_loss": 0.9903561472892761, |
|
"eval_precision": 0.7048361105844692, |
|
"eval_recall": 0.704, |
|
"eval_runtime": 2.3588, |
|
"eval_samples_per_second": 847.898, |
|
"eval_steps_per_second": 26.709, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.97076416015625, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"learning_rate": 1.4416e-05, |
|
"loss": 0.9329, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"eval_accuracy": 0.686, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.807571411132812, |
|
"eval_f1": 0.6824952585178898, |
|
"eval_gpu_ram_allocated": 2.089780330657959, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 48, |
|
"eval_loss": 0.9927061796188354, |
|
"eval_precision": 0.6938911551302326, |
|
"eval_recall": 0.686, |
|
"eval_runtime": 2.3815, |
|
"eval_samples_per_second": 839.799, |
|
"eval_steps_per_second": 26.454, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.9594879150390625, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 1.3616e-05, |
|
"loss": 0.9053, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"eval_accuracy": 0.705, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.807575225830078, |
|
"eval_f1": 0.702067821848656, |
|
"eval_gpu_ram_allocated": 2.089798927307129, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 48, |
|
"eval_loss": 0.9795323610305786, |
|
"eval_precision": 0.7048247100554489, |
|
"eval_recall": 0.705, |
|
"eval_runtime": 2.405, |
|
"eval_samples_per_second": 831.614, |
|
"eval_steps_per_second": 26.196, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.9837112426757812, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"learning_rate": 1.2816000000000002e-05, |
|
"loss": 0.9173, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"eval_accuracy": 0.709, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.807697296142578, |
|
"eval_f1": 0.702389340359417, |
|
"eval_gpu_ram_allocated": 2.089791774749756, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 48, |
|
"eval_loss": 0.9748538136482239, |
|
"eval_precision": 0.7139968646595424, |
|
"eval_recall": 0.709, |
|
"eval_runtime": 2.4003, |
|
"eval_samples_per_second": 833.243, |
|
"eval_steps_per_second": 26.247, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.9850807189941406, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"learning_rate": 1.2016000000000002e-05, |
|
"loss": 0.9189, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.718, |
|
"eval_disk_space_total": 78.1898422241211, |
|
"eval_disk_space_used": 24.807697296142578, |
|
"eval_f1": 0.7137748110894239, |
|
"eval_gpu_ram_allocated": 2.0897889137268066, |
|
"eval_gpu_ram_cached": 25.85546875, |
|
"eval_gpu_ram_total": 39.56402587890625, |
|
"eval_gpu_utilization": 48, |
|
"eval_loss": 0.9424768686294556, |
|
"eval_precision": 0.718404095887314, |
|
"eval_recall": 0.718, |
|
"eval_runtime": 2.381, |
|
"eval_samples_per_second": 839.978, |
|
"eval_steps_per_second": 26.459, |
|
"eval_system_ram_total": 83.48073959350586, |
|
"eval_system_ram_used": 3.994873046875, |
|
"step": 500 |
|
} |
|
], |
|
"max_steps": 1250, |
|
"num_train_epochs": 5, |
|
"total_flos": 965391777104256.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|