AptaArkana committed on
Commit
6896039
1 Parent(s): 88fc14c

Training in progress, step 500

config.json CHANGED
@@ -1,37 +1,44 @@
 {
-  "_name_or_path": "lxyuan/distilbert-base-multilingual-cased-sentiments-student",
-  "activation": "gelu",
+  "_name_or_path": "naufalihsan/indonesian-sbert-large",
+  "_num_labels": 5,
   "architectures": [
-    "DistilBertForSequenceClassification"
+    "BertForSequenceClassification"
   ],
-  "attention_dropout": 0.1,
-  "dim": 768,
-  "dropout": 0.1,
-  "hidden_dim": 3072,
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "directionality": "bidi",
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 1024,
   "id2label": {
     "0": "negative",
     "1": "netral",
     "2": "positive"
   },
   "initializer_range": 0.02,
+  "intermediate_size": 4096,
   "label2id": {
     "negative": 0,
     "netral": 1,
     "positive": 2
   },
+  "layer_norm_eps": 1e-12,
   "max_position_embeddings": 512,
-  "max_split_size_mb": 100,
-  "model_type": "distilbert",
-  "n_heads": 12,
-  "n_layers": 6,
+  "model_type": "bert",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
   "output_past": true,
   "pad_token_id": 0,
+  "pooler_fc_size": 768,
+  "pooler_num_attention_heads": 12,
+  "pooler_num_fc_layers": 3,
+  "pooler_size_per_head": 128,
+  "pooler_type": "first_token_transform",
+  "position_embedding_type": "absolute",
   "problem_type": "single_label_classification",
-  "qa_dropout": 0.1,
-  "seq_classif_dropout": 0.2,
-  "sinusoidal_pos_embds": false,
-  "tie_weights_": true,
   "torch_dtype": "float32",
-  "transformers_version": "4.37.2",
-  "vocab_size": 119547
+  "transformers_version": "4.35.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
 }
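For context, this config change swaps the base checkpoint from lxyuan/distilbert-base-multilingual-cased-sentiments-student (DistilBERT: 6 layers, hidden size 768) to naufalihsan/indonesian-sbert-large (BERT-large: 24 layers, hidden size 1024, 16 heads), while keeping the same three sentiment labels ("netral" is the Indonesian spelling carried over from the dataset labels). A minimal sketch of how such a config is typically assembled for fine-tuning; the label maps mirror the config.json above, everything else is standard transformers API:

```python
from transformers import AutoConfig, AutoModelForSequenceClassification, AutoTokenizer

base = "naufalihsan/indonesian-sbert-large"

# Label maps copied from the new config.json above.
id2label = {0: "negative", 1: "netral", 2: "positive"}
label2id = {label: idx for idx, label in id2label.items()}

config = AutoConfig.from_pretrained(
    base,
    num_labels=3,
    id2label=id2label,
    label2id=label2id,
    problem_type="single_label_classification",
)
tokenizer = AutoTokenizer.from_pretrained(base)
# The sequence-classification head is freshly initialized on top of the encoder.
model = AutoModelForSequenceClassification.from_pretrained(base, config=config)
```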
model.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2d3cf7972da23d24bc6c61ff0a80d81ed459b03c3abf34c7116767bcc49a50e4
-size 541320452
+oid sha256:a413d2a8be19be7d7144f9d7b9e6c574691fb3f122beeec3ad9895fc73605a6e
+size 2681258616
runs/Feb23_04-31-13_153b43858746/events.out.tfevents.1708662676.153b43858746.6732.0 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:c794030a25a04b60553aa447ba27486f937a80da6cac1ae265924069ae085350
+size 5046
runs/Feb23_06-12-03_153b43858746/events.out.tfevents.1708668724.153b43858746.6732.1 ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:fb2966d49e910934d283a9bb2c0173db92191a31377a400c65bcd6b5791df5f1
+size 5203
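These two files are TensorBoard event logs written by the Trainer during the run. A sketch of inspecting them offline, assuming the tensorboard package is installed (the scalar tag names are illustrative; the actual tags depend on the Trainer version):

```python
from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

# Point the accumulator at one run directory and load its events.
ea = EventAccumulator("runs/Feb23_06-12-03_153b43858746")
ea.Reload()

print(ea.Tags()["scalars"])        # e.g. ["train/loss", "train/learning_rate", ...]
for event in ea.Scalars("train/loss"):
    print(event.step, event.value)
```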
special_tokens_map.json CHANGED
@@ -1,37 +1,7 @@
 {
-  "cls_token": {
-    "content": "[CLS]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "mask_token": {
-    "content": "[MASK]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "pad_token": {
-    "content": "[PAD]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "sep_token": {
-    "content": "[SEP]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  },
-  "unk_token": {
-    "content": "[UNK]",
-    "lstrip": false,
-    "normalized": false,
-    "rstrip": false,
-    "single_word": false
-  }
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
 }
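Both serializations load to the same special tokens: the verbose form spells out each token as an AddedToken dict, while the plain-string form relies on the defaults for the lstrip/rstrip/normalized flags. A quick sanity check, as a sketch assuming the repo's tokenizer files are in use:

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("naufalihsan/indonesian-sbert-large")
# The five special tokens resolve identically under either serialization.
print(tok.cls_token, tok.sep_token, tok.pad_token, tok.unk_token, tok.mask_token)
# Expected: [CLS] [SEP] [PAD] [UNK] [MASK]
```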
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -8,7 +8,7 @@
     "single_word": false,
     "special": true
   },
-  "100": {
+  "1": {
     "content": "[UNK]",
     "lstrip": false,
     "normalized": false,
@@ -16,7 +16,7 @@
     "single_word": false,
     "special": true
   },
-  "101": {
+  "2": {
     "content": "[CLS]",
     "lstrip": false,
     "normalized": false,
@@ -24,7 +24,7 @@
     "single_word": false,
     "special": true
   },
-  "102": {
+  "3": {
     "content": "[SEP]",
     "lstrip": false,
     "normalized": false,
@@ -32,7 +32,7 @@
     "single_word": false,
     "special": true
   },
-  "103": {
+  "4": {
     "content": "[MASK]",
     "lstrip": false,
     "normalized": false,
@@ -44,10 +44,10 @@
   "clean_up_tokenization_spaces": true,
   "cls_token": "[CLS]",
   "do_basic_tokenize": true,
-  "do_lower_case": false,
+  "do_lower_case": true,
   "mask_token": "[MASK]",
   "max_length": 512,
-  "model_max_length": 512,
+  "model_max_length": 1000000000000000019884624838656,
   "never_split": null,
   "pad_to_multiple_of": null,
   "pad_token": "[PAD]",
@@ -57,7 +57,7 @@
   "stride": 0,
   "strip_accents": null,
   "tokenize_chinese_chars": true,
-  "tokenizer_class": "DistilBertTokenizer",
+  "tokenizer_class": "BertTokenizer",
   "truncation_side": "right",
   "truncation_strategy": "longest_first",
   "unk_token": "[UNK]"
training_args.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:11bf066db97bce61d10cca02c8a5961d0917904ef5b22283d3f686b48d3816f6
-size 4664
+oid sha256:83046e28cccf1abc1c1cae120e6fe8bb463b8086565ed1d7bac02ff1cd2512ab
+size 4536
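training_args.bin is a pickled TrainingArguments object rather than a tensor file, so it needs full unpickling to load. A sketch, assuming a recent PyTorch where torch.load defaults to weights_only=True:

```python
import torch

# Full unpickling is required because this is a TrainingArguments pickle,
# not a tensor checkpoint; only do this for files you trust.
args = torch.load("training_args.bin", weights_only=False)
print(args.learning_rate, args.num_train_epochs, args.per_device_train_batch_size)
```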
vocab.txt CHANGED
The diff for this file is too large to render. See raw diff