fzanartu committed on
Commit
6e0d174
1 Parent(s): 1ef67df

End of training

Browse files
Files changed (25) hide show
  1. README.md +68 -0
  2. config.json +36 -0
  3. model.safetensors +3 -0
  4. runs/Aug15_14-52-42_8fa8d8970b4b/events.out.tfevents.1723733564.8fa8d8970b4b.490.0 +3 -0
  5. runs/Aug15_14-56-08_8fa8d8970b4b/events.out.tfevents.1723733770.8fa8d8970b4b.490.1 +3 -0
  6. runs/Aug15_15-03-12_8fa8d8970b4b/events.out.tfevents.1723734193.8fa8d8970b4b.490.2 +3 -0
  7. runs/Aug15_15-26-24_8fa8d8970b4b/events.out.tfevents.1723735585.8fa8d8970b4b.6054.0 +3 -0
  8. runs/Aug15_15-27-37_8fa8d8970b4b/events.out.tfevents.1723735657.8fa8d8970b4b.6054.1 +3 -0
  9. runs/Aug15_15-28-01_8fa8d8970b4b/events.out.tfevents.1723735682.8fa8d8970b4b.6054.2 +3 -0
  10. runs/Aug15_15-29-57_8fa8d8970b4b/events.out.tfevents.1723735798.8fa8d8970b4b.6054.3 +3 -0
  11. runs/Aug15_15-31-05_8fa8d8970b4b/events.out.tfevents.1723735866.8fa8d8970b4b.6054.4 +3 -0
  12. runs/Aug15_15-35-23_8fa8d8970b4b/events.out.tfevents.1723736125.8fa8d8970b4b.12007.0 +3 -0
  13. runs/Aug15_15-36-18_8fa8d8970b4b/events.out.tfevents.1723736179.8fa8d8970b4b.12007.1 +3 -0
  14. runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723736247.8fa8d8970b4b.12007.2 +3 -0
  15. runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723737112.8fa8d8970b4b.12007.3 +3 -0
  16. runs/Aug15_15-56-45_8fa8d8970b4b/events.out.tfevents.1723737407.8fa8d8970b4b.17631.0 +3 -0
  17. runs/Aug15_15-57-51_8fa8d8970b4b/events.out.tfevents.1723737471.8fa8d8970b4b.17631.1 +3 -0
  18. runs/Aug15_15-58-25_8fa8d8970b4b/events.out.tfevents.1723737506.8fa8d8970b4b.17631.2 +3 -0
  19. runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737547.8fa8d8970b4b.17631.3 +3 -0
  20. runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737875.8fa8d8970b4b.17631.4 +3 -0
  21. special_tokens_map.json +7 -0
  22. tokenizer.json +0 -0
  23. tokenizer_config.json +55 -0
  24. training_args.bin +3 -0
  25. vocab.txt +0 -0
README.md ADDED
@@ -0,0 +1,68 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: distilbert/distilbert-base-uncased
4
+ tags:
5
+ - generated_from_trainer
6
+ metrics:
7
+ - accuracy
8
+ - f1
9
+ - precision
10
+ - recall
11
+ model-index:
12
+ - name: my_awesome_model
13
+ results: []
14
+ ---
15
+
16
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
17
+ should probably proofread and complete it, then remove this comment. -->
18
+
19
+ # my_awesome_model
20
+
21
+ This model is a fine-tuned version of [distilbert/distilbert-base-uncased](https://huggingface.co/distilbert/distilbert-base-uncased) on an unspecified dataset.
22
+ It achieves the following results on the evaluation set:
23
+ - Loss: 0.2740
24
+ - Accuracy: 0.6975
25
+ - F1: 0.6768
26
+ - Precision: 0.6819
27
+ - Recall: 0.6975
28
+
29
+ ## Model description
30
+
31
+ More information needed
32
+
33
+ ## Intended uses & limitations
34
+
35
+ More information needed
36
+
37
+ ## Training and evaluation data
38
+
39
+ More information needed
40
+
41
+ ## Training procedure
42
+
43
+ ### Training hyperparameters
44
+
45
+ The following hyperparameters were used during training:
46
+ - learning_rate: 2e-05
47
+ - train_batch_size: 16
48
+ - eval_batch_size: 16
49
+ - seed: 42
50
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
51
+ - lr_scheduler_type: linear
52
+ - num_epochs: 3
53
+
54
+ ### Training results
55
+
56
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall |
57
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
58
+ | No log | 1.0 | 384 | 0.3141 | 0.6836 | 0.6113 | 0.6934 | 0.6836 |
59
+ | 0.3433 | 2.0 | 768 | 0.2599 | 0.7148 | 0.6995 | 0.7028 | 0.7148 |
60
+ | 0.2239 | 3.0 | 1152 | 0.2601 | 0.7018 | 0.7032 | 0.7067 | 0.7018 |
61
+
62
+
63
+ ### Framework versions
64
+
65
+ - Transformers 4.42.4
66
+ - Pytorch 2.3.1+cu121
67
+ - Datasets 2.21.0
68
+ - Tokenizers 0.19.1
config.json ADDED
@@ -0,0 +1,36 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "distilbert/distilbert-base-uncased",
3
+ "activation": "gelu",
4
+ "architectures": [
5
+ "DistilBertForSequenceClassification"
6
+ ],
7
+ "attention_dropout": 0.1,
8
+ "dim": 768,
9
+ "dropout": 0.1,
10
+ "hidden_dim": 3072,
11
+ "id2label": {
12
+ "0": "SUPPORTS",
13
+ "1": "REFUTES",
14
+ "2": "NOT_ENOUGH_INFO",
15
+ "3": "DISPUTED"
16
+ },
17
+ "initializer_range": 0.02,
18
+ "label2id": {
19
+ "DISPUTED": 2,
20
+ "NOT_ENOUGH_INFO": 3,
21
+ "REFUTES": 1,
22
+ "SUPPORTS": 0
23
+ },
24
+ "max_position_embeddings": 512,
25
+ "model_type": "distilbert",
26
+ "n_heads": 12,
27
+ "n_layers": 6,
28
+ "pad_token_id": 0,
29
+ "qa_dropout": 0.1,
30
+ "seq_classif_dropout": 0.2,
31
+ "sinusoidal_pos_embds": false,
32
+ "tie_weights_": true,
33
+ "torch_dtype": "float32",
34
+ "transformers_version": "4.42.4",
35
+ "vocab_size": 30522
36
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20fbc9160151807cc005a7b4873211eb2bc58d2a2c1a13d55f2add465645b152
3
+ size 267838720
runs/Aug15_14-52-42_8fa8d8970b4b/events.out.tfevents.1723733564.8fa8d8970b4b.490.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccd8fc2caa2aa831be41c5a159ee75f6a3b271f775268e83fbe4472a0bf957fc
3
+ size 6149
runs/Aug15_14-56-08_8fa8d8970b4b/events.out.tfevents.1723733770.8fa8d8970b4b.490.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f45e5cbaf21a7cbb564535e1d0cd9ebb3e65837bebd865b88d1534c1c997d85f
3
+ size 6563
runs/Aug15_15-03-12_8fa8d8970b4b/events.out.tfevents.1723734193.8fa8d8970b4b.490.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6b1c7ab847a1d6a23e72b9a7b66adcd0bf501f3541f5203258d5a8c1136ba593
3
+ size 6240
runs/Aug15_15-26-24_8fa8d8970b4b/events.out.tfevents.1723735585.8fa8d8970b4b.6054.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ba0472e66ac2e59b78d202fa484dad02bfd127ad285ebe4aacfbf925a0003c4
3
+ size 4941
runs/Aug15_15-27-37_8fa8d8970b4b/events.out.tfevents.1723735657.8fa8d8970b4b.6054.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fe57df0638509d5fbc64baa946236ee4ec9dc0f870127ed0706bb5e0d6d4119
3
+ size 4941
runs/Aug15_15-28-01_8fa8d8970b4b/events.out.tfevents.1723735682.8fa8d8970b4b.6054.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e1f75afdd09ac3c3e91802662c1001756a1e85829bd07c22dacab7feba4455ad
3
+ size 4941
runs/Aug15_15-29-57_8fa8d8970b4b/events.out.tfevents.1723735798.8fa8d8970b4b.6054.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc3a39bc5d8f2cf085d782fded4579ba5dad36dffefe2ded3ffe7032c2022dc4
3
+ size 4941
runs/Aug15_15-31-05_8fa8d8970b4b/events.out.tfevents.1723735866.8fa8d8970b4b.6054.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c414c8aaa058c889725cf7d13ba5474ceaa426fe2e9c313e44c9792d523e5157
3
+ size 6450
runs/Aug15_15-35-23_8fa8d8970b4b/events.out.tfevents.1723736125.8fa8d8970b4b.12007.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:255faa3604b9bb71140901a25832afa24509a8b9d35784703c09c5aaed4353bf
3
+ size 4942
runs/Aug15_15-36-18_8fa8d8970b4b/events.out.tfevents.1723736179.8fa8d8970b4b.12007.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a5798beccf0586bf3d6b42cc81273ad0e38f4f12af2430c8970dc1296ea782d
3
+ size 4942
runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723736247.8fa8d8970b4b.12007.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4521291d302573429442bda0579e2ba518d747e9bd0e333f83ad37b20012bdc6
3
+ size 11493
runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723737112.8fa8d8970b4b.12007.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9ab60251a5117e99a91bf4f05e27f085340e5ee00ae9f0779e730eb100d4fc2
3
+ size 560
runs/Aug15_15-56-45_8fa8d8970b4b/events.out.tfevents.1723737407.8fa8d8970b4b.17631.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:36fa43cf20879c9a32cd54053bab9cdee375648cdb4ed29a5f20bf86d6b71d11
3
+ size 4941
runs/Aug15_15-57-51_8fa8d8970b4b/events.out.tfevents.1723737471.8fa8d8970b4b.17631.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3adabff79967aa6804ba6bd0e7efc3e3a027afa75c2122919d245f5fb2f7d79c
3
+ size 4941
runs/Aug15_15-58-25_8fa8d8970b4b/events.out.tfevents.1723737506.8fa8d8970b4b.17631.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f5ff71f1d4c31e26b468196b93ddff072c8dea2b8e0f083d882de33f9269b801
3
+ size 4941
runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737547.8fa8d8970b4b.17631.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4e5d1d7f4e338bb26ffab1db480a3b38461b9dacfa471c46fd1fc810fa8ea85e
3
+ size 7133
runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737875.8fa8d8970b4b.17631.4 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:946a8dbf090865b639aabea0fa4a2bca70394e4ad765c62193efa445270f237b
3
+ size 560
special_tokens_map.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
7
+ }
tokenizer.json ADDED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
+ "lstrip": false,
38
+ "normalized": false,
39
+ "rstrip": false,
40
+ "single_word": false,
41
+ "special": true
42
+ }
43
+ },
44
+ "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_lower_case": true,
47
+ "mask_token": "[MASK]",
48
+ "model_max_length": 512,
49
+ "pad_token": "[PAD]",
50
+ "sep_token": "[SEP]",
51
+ "strip_accents": null,
52
+ "tokenize_chinese_chars": true,
53
+ "tokenizer_class": "DistilBertTokenizer",
54
+ "unk_token": "[UNK]"
55
+ }
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a06bc9f0f7c9142d173a0930cfd0d7387a0a0e7c4ae4fd7c225bcbea98a469a6
3
+ size 5112
vocab.txt ADDED
The diff for this file is too large to render. See raw diff