End of training
Browse files
- README.md +68 -0
- config.json +36 -0
- model.safetensors +3 -0
- runs/Aug15_14-52-42_8fa8d8970b4b/events.out.tfevents.1723733564.8fa8d8970b4b.490.0 +3 -0
- runs/Aug15_14-56-08_8fa8d8970b4b/events.out.tfevents.1723733770.8fa8d8970b4b.490.1 +3 -0
- runs/Aug15_15-03-12_8fa8d8970b4b/events.out.tfevents.1723734193.8fa8d8970b4b.490.2 +3 -0
- runs/Aug15_15-26-24_8fa8d8970b4b/events.out.tfevents.1723735585.8fa8d8970b4b.6054.0 +3 -0
- runs/Aug15_15-27-37_8fa8d8970b4b/events.out.tfevents.1723735657.8fa8d8970b4b.6054.1 +3 -0
- runs/Aug15_15-28-01_8fa8d8970b4b/events.out.tfevents.1723735682.8fa8d8970b4b.6054.2 +3 -0
- runs/Aug15_15-29-57_8fa8d8970b4b/events.out.tfevents.1723735798.8fa8d8970b4b.6054.3 +3 -0
- runs/Aug15_15-31-05_8fa8d8970b4b/events.out.tfevents.1723735866.8fa8d8970b4b.6054.4 +3 -0
- runs/Aug15_15-35-23_8fa8d8970b4b/events.out.tfevents.1723736125.8fa8d8970b4b.12007.0 +3 -0
- runs/Aug15_15-36-18_8fa8d8970b4b/events.out.tfevents.1723736179.8fa8d8970b4b.12007.1 +3 -0
- runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723736247.8fa8d8970b4b.12007.2 +3 -0
- runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723737112.8fa8d8970b4b.12007.3 +3 -0
- runs/Aug15_15-56-45_8fa8d8970b4b/events.out.tfevents.1723737407.8fa8d8970b4b.17631.0 +3 -0
- runs/Aug15_15-57-51_8fa8d8970b4b/events.out.tfevents.1723737471.8fa8d8970b4b.17631.1 +3 -0
- runs/Aug15_15-58-25_8fa8d8970b4b/events.out.tfevents.1723737506.8fa8d8970b4b.17631.2 +3 -0
- runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737547.8fa8d8970b4b.17631.3 +3 -0
- runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737875.8fa8d8970b4b.17631.4 +3 -0
- special_tokens_map.json +7 -0
- tokenizer.json +0 -0
- tokenizer_config.json +55 -0
- training_args.bin +3 -0
- vocab.txt +0 -0
README.md
ADDED
@@ -0,0 +1,68 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
license: apache-2.0
|
3 |
+
base_model: distilbert/distilbert-base-uncased
|
4 |
+
tags:
|
5 |
+
- generated_from_trainer
|
6 |
+
metrics:
|
7 |
+
- accuracy
|
8 |
+
- f1
|
9 |
+
- precision
|
10 |
+
- recall
|
11 |
+
model-index:
|
12 |
+
- name: my_awesome_model
|
13 |
+
results: []
|
14 |
+
---
|
15 |
+
|
16 |
+
<!-- This model card has been generated automatically according to the information the Trainer had access to. You
|
17 |
+
should probably proofread and complete it, then remove this comment. -->
|
18 |
+
|
19 |
+
# my_awesome_model
|
20 |
+
|
21 |
+
This model is a fine-tuned version of [distilbert/distilbert-base-uncased](https://huggingface.co/distilbert/distilbert-base-uncased) on an unspecified dataset.
|
22 |
+
It achieves the following results on the evaluation set:
|
23 |
+
- Loss: 0.2740
|
24 |
+
- Accuracy: 0.6975
|
25 |
+
- F1: 0.6768
|
26 |
+
- Precision: 0.6819
|
27 |
+
- Recall: 0.6975
|
28 |
+
|
29 |
+
## Model description
|
30 |
+
|
31 |
+
More information needed
|
32 |
+
|
33 |
+
## Intended uses & limitations
|
34 |
+
|
35 |
+
More information needed
|
36 |
+
|
37 |
+
## Training and evaluation data
|
38 |
+
|
39 |
+
More information needed
|
40 |
+
|
41 |
+
## Training procedure
|
42 |
+
|
43 |
+
### Training hyperparameters
|
44 |
+
|
45 |
+
The following hyperparameters were used during training:
|
46 |
+
- learning_rate: 2e-05
|
47 |
+
- train_batch_size: 16
|
48 |
+
- eval_batch_size: 16
|
49 |
+
- seed: 42
|
50 |
+
- optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
|
51 |
+
- lr_scheduler_type: linear
|
52 |
+
- num_epochs: 3
|
53 |
+
|
54 |
+
### Training results
|
55 |
+
|
56 |
+
| Training Loss | Epoch | Step | Validation Loss | Accuracy | F1 | Precision | Recall |
|
57 |
+
|:-------------:|:-----:|:----:|:---------------:|:--------:|:------:|:---------:|:------:|
|
58 |
+
| No log | 1.0 | 384 | 0.3141 | 0.6836 | 0.6113 | 0.6934 | 0.6836 |
|
59 |
+
| 0.3433 | 2.0 | 768 | 0.2599 | 0.7148 | 0.6995 | 0.7028 | 0.7148 |
|
60 |
+
| 0.2239 | 3.0 | 1152 | 0.2601 | 0.7018 | 0.7032 | 0.7067 | 0.7018 |
|
61 |
+
|
62 |
+
|
63 |
+
### Framework versions
|
64 |
+
|
65 |
+
- Transformers 4.42.4
|
66 |
+
- Pytorch 2.3.1+cu121
|
67 |
+
- Datasets 2.21.0
|
68 |
+
- Tokenizers 0.19.1
|
config.json
ADDED
@@ -0,0 +1,36 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "distilbert/distilbert-base-uncased",
|
3 |
+
"activation": "gelu",
|
4 |
+
"architectures": [
|
5 |
+
"DistilBertForSequenceClassification"
|
6 |
+
],
|
7 |
+
"attention_dropout": 0.1,
|
8 |
+
"dim": 768,
|
9 |
+
"dropout": 0.1,
|
10 |
+
"hidden_dim": 3072,
|
11 |
+
"id2label": {
|
12 |
+
"0": "SUPPORTS",
|
13 |
+
"1": "REFUTES",
|
14 |
+
"2": "NOT_ENOUGH_INFO",
|
15 |
+
"3": "DISPUTED"
|
16 |
+
},
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"label2id": {
|
19 |
+
"DISPUTED": 3,
|
20 |
+
"NOT_ENOUGH_INFO": 2,
|
21 |
+
"REFUTES": 1,
|
22 |
+
"SUPPORTS": 0
|
23 |
+
},
|
24 |
+
"max_position_embeddings": 512,
|
25 |
+
"model_type": "distilbert",
|
26 |
+
"n_heads": 12,
|
27 |
+
"n_layers": 6,
|
28 |
+
"pad_token_id": 0,
|
29 |
+
"qa_dropout": 0.1,
|
30 |
+
"seq_classif_dropout": 0.2,
|
31 |
+
"sinusoidal_pos_embds": false,
|
32 |
+
"tie_weights_": true,
|
33 |
+
"torch_dtype": "float32",
|
34 |
+
"transformers_version": "4.42.4",
|
35 |
+
"vocab_size": 30522
|
36 |
+
}
|
model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20fbc9160151807cc005a7b4873211eb2bc58d2a2c1a13d55f2add465645b152
|
3 |
+
size 267838720
|
runs/Aug15_14-52-42_8fa8d8970b4b/events.out.tfevents.1723733564.8fa8d8970b4b.490.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccd8fc2caa2aa831be41c5a159ee75f6a3b271f775268e83fbe4472a0bf957fc
|
3 |
+
size 6149
|
runs/Aug15_14-56-08_8fa8d8970b4b/events.out.tfevents.1723733770.8fa8d8970b4b.490.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f45e5cbaf21a7cbb564535e1d0cd9ebb3e65837bebd865b88d1534c1c997d85f
|
3 |
+
size 6563
|
runs/Aug15_15-03-12_8fa8d8970b4b/events.out.tfevents.1723734193.8fa8d8970b4b.490.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b1c7ab847a1d6a23e72b9a7b66adcd0bf501f3541f5203258d5a8c1136ba593
|
3 |
+
size 6240
|
runs/Aug15_15-26-24_8fa8d8970b4b/events.out.tfevents.1723735585.8fa8d8970b4b.6054.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ba0472e66ac2e59b78d202fa484dad02bfd127ad285ebe4aacfbf925a0003c4
|
3 |
+
size 4941
|
runs/Aug15_15-27-37_8fa8d8970b4b/events.out.tfevents.1723735657.8fa8d8970b4b.6054.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fe57df0638509d5fbc64baa946236ee4ec9dc0f870127ed0706bb5e0d6d4119
|
3 |
+
size 4941
|
runs/Aug15_15-28-01_8fa8d8970b4b/events.out.tfevents.1723735682.8fa8d8970b4b.6054.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e1f75afdd09ac3c3e91802662c1001756a1e85829bd07c22dacab7feba4455ad
|
3 |
+
size 4941
|
runs/Aug15_15-29-57_8fa8d8970b4b/events.out.tfevents.1723735798.8fa8d8970b4b.6054.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc3a39bc5d8f2cf085d782fded4579ba5dad36dffefe2ded3ffe7032c2022dc4
|
3 |
+
size 4941
|
runs/Aug15_15-31-05_8fa8d8970b4b/events.out.tfevents.1723735866.8fa8d8970b4b.6054.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c414c8aaa058c889725cf7d13ba5474ceaa426fe2e9c313e44c9792d523e5157
|
3 |
+
size 6450
|
runs/Aug15_15-35-23_8fa8d8970b4b/events.out.tfevents.1723736125.8fa8d8970b4b.12007.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:255faa3604b9bb71140901a25832afa24509a8b9d35784703c09c5aaed4353bf
|
3 |
+
size 4942
|
runs/Aug15_15-36-18_8fa8d8970b4b/events.out.tfevents.1723736179.8fa8d8970b4b.12007.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a5798beccf0586bf3d6b42cc81273ad0e38f4f12af2430c8970dc1296ea782d
|
3 |
+
size 4942
|
runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723736247.8fa8d8970b4b.12007.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4521291d302573429442bda0579e2ba518d747e9bd0e333f83ad37b20012bdc6
|
3 |
+
size 11493
|
runs/Aug15_15-37-26_8fa8d8970b4b/events.out.tfevents.1723737112.8fa8d8970b4b.12007.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9ab60251a5117e99a91bf4f05e27f085340e5ee00ae9f0779e730eb100d4fc2
|
3 |
+
size 560
|
runs/Aug15_15-56-45_8fa8d8970b4b/events.out.tfevents.1723737407.8fa8d8970b4b.17631.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36fa43cf20879c9a32cd54053bab9cdee375648cdb4ed29a5f20bf86d6b71d11
|
3 |
+
size 4941
|
runs/Aug15_15-57-51_8fa8d8970b4b/events.out.tfevents.1723737471.8fa8d8970b4b.17631.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3adabff79967aa6804ba6bd0e7efc3e3a027afa75c2122919d245f5fb2f7d79c
|
3 |
+
size 4941
|
runs/Aug15_15-58-25_8fa8d8970b4b/events.out.tfevents.1723737506.8fa8d8970b4b.17631.2
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5ff71f1d4c31e26b468196b93ddff072c8dea2b8e0f083d882de33f9269b801
|
3 |
+
size 4941
|
runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737547.8fa8d8970b4b.17631.3
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e5d1d7f4e338bb26ffab1db480a3b38461b9dacfa471c46fd1fc810fa8ea85e
|
3 |
+
size 7133
|
runs/Aug15_15-59-07_8fa8d8970b4b/events.out.tfevents.1723737875.8fa8d8970b4b.17631.4
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:946a8dbf090865b639aabea0fa4a2bca70394e4ad765c62193efa445270f237b
|
3 |
+
size 560
|
special_tokens_map.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"cls_token": "[CLS]",
|
3 |
+
"mask_token": "[MASK]",
|
4 |
+
"pad_token": "[PAD]",
|
5 |
+
"sep_token": "[SEP]",
|
6 |
+
"unk_token": "[UNK]"
|
7 |
+
}
|
tokenizer.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
tokenizer_config.json
ADDED
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"added_tokens_decoder": {
|
3 |
+
"0": {
|
4 |
+
"content": "[PAD]",
|
5 |
+
"lstrip": false,
|
6 |
+
"normalized": false,
|
7 |
+
"rstrip": false,
|
8 |
+
"single_word": false,
|
9 |
+
"special": true
|
10 |
+
},
|
11 |
+
"100": {
|
12 |
+
"content": "[UNK]",
|
13 |
+
"lstrip": false,
|
14 |
+
"normalized": false,
|
15 |
+
"rstrip": false,
|
16 |
+
"single_word": false,
|
17 |
+
"special": true
|
18 |
+
},
|
19 |
+
"101": {
|
20 |
+
"content": "[CLS]",
|
21 |
+
"lstrip": false,
|
22 |
+
"normalized": false,
|
23 |
+
"rstrip": false,
|
24 |
+
"single_word": false,
|
25 |
+
"special": true
|
26 |
+
},
|
27 |
+
"102": {
|
28 |
+
"content": "[SEP]",
|
29 |
+
"lstrip": false,
|
30 |
+
"normalized": false,
|
31 |
+
"rstrip": false,
|
32 |
+
"single_word": false,
|
33 |
+
"special": true
|
34 |
+
},
|
35 |
+
"103": {
|
36 |
+
"content": "[MASK]",
|
37 |
+
"lstrip": false,
|
38 |
+
"normalized": false,
|
39 |
+
"rstrip": false,
|
40 |
+
"single_word": false,
|
41 |
+
"special": true
|
42 |
+
}
|
43 |
+
},
|
44 |
+
"clean_up_tokenization_spaces": true,
|
45 |
+
"cls_token": "[CLS]",
|
46 |
+
"do_lower_case": true,
|
47 |
+
"mask_token": "[MASK]",
|
48 |
+
"model_max_length": 512,
|
49 |
+
"pad_token": "[PAD]",
|
50 |
+
"sep_token": "[SEP]",
|
51 |
+
"strip_accents": null,
|
52 |
+
"tokenize_chinese_chars": true,
|
53 |
+
"tokenizer_class": "DistilBertTokenizer",
|
54 |
+
"unk_token": "[UNK]"
|
55 |
+
}
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a06bc9f0f7c9142d173a0930cfd0d7387a0a0e7c4ae4fd7c225bcbea98a469a6
|
3 |
+
size 5112
|
vocab.txt
ADDED
The diff for this file is too large to render.
See raw diff
|
|