update model

Files changed (8) hide show

all_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.24564219588448766,
-    "train_runtime": 262.0679,
     "train_samples": 8808,
-    "train_samples_per_second": 100.829,
-    "train_steps_per_second": 6.308
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.23321845325209195,
+    "train_runtime": 205.592,
     "train_samples": 8808,
+    "train_samples_per_second": 128.526,
+    "train_steps_per_second": 8.04
 }

config.json CHANGED Viewed

@@ -11,20 +11,20 @@
   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "id2label": {
-    "0": "LABEL_0",
-    "1": "LABEL_1",
-    "2": "LABEL_2",
-    "3": "LABEL_3",
-    "4": "LABEL_4"
   },
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "label2id": {
-    "LABEL_0": 0,
-    "LABEL_1": 1,
-    "LABEL_2": 2,
-    "LABEL_3": 3,
-    "LABEL_4": 4
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
@@ -39,7 +39,7 @@
   "pooler_type": "first_token_transform",
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",
-  "transformers_version": "4.36.2",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 119547

   "hidden_dropout_prob": 0.1,
   "hidden_size": 768,
   "id2label": {
+    "0": "B-Claim",
+    "1": "B-Premise",
+    "2": "I-Claim",
+    "3": "I-Premise",
+    "4": "O"
   },
   "initializer_range": 0.02,
   "intermediate_size": 3072,
   "label2id": {
+    "B-Claim": 0,
+    "B-Premise": 1,
+    "I-Claim": 2,
+    "I-Premise": 3,
+    "O": 4
   },
   "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
   "pooler_type": "first_token_transform",
   "position_embedding_type": "absolute",
   "torch_dtype": "float32",
+  "transformers_version": "4.40.0.dev0",
   "type_vocab_size": 2,
   "use_cache": true,
   "vocab_size": 119547

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d88e185b8f01e5d7aff8d660772f93e7497df7ea384348229e5a140bbc692235
 size 709090132

 version https://git-lfs.github.com/spec/v1
+oid sha256:7a11f26a1e60915fd8c58c74707dd728a37ce27f8b70d3f8814faf80ca5b5a46
 size 709090132

tokenizer.json CHANGED Viewed

@@ -2,7 +2,7 @@
   "version": "1.0",
   "truncation": {
     "direction": "Right",
-    "max_length": 512,
     "strategy": "LongestFirst",
     "stride": 0
   },

   "version": "1.0",
   "truncation": {
     "direction": "Right",
+    "max_length": 256,
     "strategy": "LongestFirst",
     "stride": 0
   },

tokenizer_config.json CHANGED Viewed

@@ -1,5 +1,4 @@
 {
-  "add_prefix_space": true,
   "added_tokens_decoder": {
     "0": {
       "content": "[PAD]",
@@ -52,5 +51,6 @@
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
   "unk_token": "[UNK]"
 }

 {
   "added_tokens_decoder": {
     "0": {
       "content": "[PAD]",
   "strip_accents": null,
   "tokenize_chinese_chars": true,
   "tokenizer_class": "BertTokenizer",
+  "truncation": true,
   "unk_token": "[UNK]"
 }

train_results.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
     "epoch": 3.0,
-    "train_loss": 0.24564219588448766,
-    "train_runtime": 262.0679,
     "train_samples": 8808,
-    "train_samples_per_second": 100.829,
-    "train_steps_per_second": 6.308
 }

 {
     "epoch": 3.0,
+    "train_loss": 0.23321845325209195,
+    "train_runtime": 205.592,
     "train_samples": 8808,
+    "train_samples_per_second": 128.526,
+    "train_steps_per_second": 8.04
 }

trainer_state.json CHANGED Viewed

@@ -10,30 +10,33 @@
   "log_history": [
     {
       "epoch": 0.91,
       "learning_rate": 3.487598306110103e-05,
-      "loss": 0.4056,
       "step": 500
     },
     {
       "epoch": 1.81,
       "learning_rate": 1.975196612220206e-05,
-      "loss": 0.2455,
       "step": 1000
     },
     {
       "epoch": 2.72,
       "learning_rate": 4.627949183303086e-06,
-      "loss": 0.1298,
       "step": 1500
     },
     {
       "epoch": 3.0,
       "step": 1653,
-      "total_flos": 1395101222261760.0,
-      "train_loss": 0.24564219588448766,
-      "train_runtime": 262.0679,
-      "train_samples_per_second": 100.829,
-      "train_steps_per_second": 6.308
     }
   ],
   "logging_steps": 500,
@@ -41,7 +44,7 @@
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
-  "total_flos": 1395101222261760.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

   "log_history": [
     {
       "epoch": 0.91,
+      "grad_norm": 4.16880989074707,
       "learning_rate": 3.487598306110103e-05,
+      "loss": 0.4004,
       "step": 500
     },
     {
       "epoch": 1.81,
+      "grad_norm": 1.7097141742706299,
       "learning_rate": 1.975196612220206e-05,
+      "loss": 0.2175,
       "step": 1000
     },
     {
       "epoch": 2.72,
+      "grad_norm": 0.8170027136802673,
       "learning_rate": 4.627949183303086e-06,
+      "loss": 0.1255,
       "step": 1500
     },
     {
       "epoch": 3.0,
       "step": 1653,
+      "total_flos": 1394635774789920.0,
+      "train_loss": 0.23321845325209195,
+      "train_runtime": 205.592,
+      "train_samples_per_second": 128.526,
+      "train_steps_per_second": 8.04
     }
   ],
   "logging_steps": 500,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 3,
   "save_steps": 500,
+  "total_flos": 1394635774789920.0,
   "train_batch_size": 16,
   "trial_name": null,
   "trial_params": null

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:de11250632abb8e8078d16652e77145ac8ead77ea6eca4e95f9eb9fc9d3743bf
-size 4664

 version https://git-lfs.github.com/spec/v1
+oid sha256:ed24ac9afab1bea179b4701674fefdacd7f3cebd1c81dd62a5bc0fdf71863ccd
+size 5048