desdesmond committed on
Commit
4351348
1 Parent(s): 775d8c1

desdesmond/lora_training

Browse files
README.md CHANGED
@@ -1,11 +1,11 @@
1
  ---
2
- base_model: mnoukhov/gpt2-imdb-sentiment-classifier
3
  library_name: peft
4
- license: mit
5
- metrics:
6
- - accuracy
7
  tags:
8
  - generated_from_trainer
 
 
9
  model-index:
10
  - name: lora_training
11
  results: []
@@ -16,10 +16,10 @@ should probably proofread and complete it, then remove this comment. -->
16
 
17
  # lora_training
18
 
19
- This model is a fine-tuned version of [mnoukhov/gpt2-imdb-sentiment-classifier](https://huggingface.co/mnoukhov/gpt2-imdb-sentiment-classifier) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 1.1823
22
- - Accuracy: 0.5481
23
 
24
  ## Model description
25
 
@@ -42,7 +42,7 @@ The following hyperparameters were used during training:
42
  - train_batch_size: 16
43
  - eval_batch_size: 16
44
  - seed: 42
45
- - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
46
  - lr_scheduler_type: linear
47
  - num_epochs: 5
48
 
@@ -50,16 +50,17 @@ The following hyperparameters were used during training:
50
 
51
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
52
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
53
- | 1.9491 | 1.0 | 800 | 1.5683 | 0.3409 |
54
- | 1.4934 | 2.0 | 1600 | 1.4219 | 0.4922 |
55
- | 1.4128 | 3.0 | 2400 | 1.2784 | 0.5244 |
56
- | 1.2545 | 4.0 | 3200 | 1.2019 | 0.5441 |
57
- | 1.1988 | 5.0 | 4000 | 1.1823 | 0.5481 |
58
 
59
 
60
  ### Framework versions
61
 
62
  - PEFT 0.13.2
63
- - Transformers 4.44.2
64
  - Pytorch 2.5.0+cu121
65
- - Tokenizers 0.19.1
 
 
1
  ---
 
2
  library_name: peft
3
+ license: apache-2.0
4
+ base_model: ykacer/bert-base-cased-imdb-sequence-classification
 
5
  tags:
6
  - generated_from_trainer
7
+ metrics:
8
+ - accuracy
9
  model-index:
10
  - name: lora_training
11
  results: []
 
16
 
17
  # lora_training
18
 
19
+ This model is a fine-tuned version of [ykacer/bert-base-cased-imdb-sequence-classification](https://huggingface.co/ykacer/bert-base-cased-imdb-sequence-classification) on an unknown dataset.
20
  It achieves the following results on the evaluation set:
21
+ - Loss: 1.0969
22
+ - Accuracy: 0.5975
23
 
24
  ## Model description
25
 
 
42
  - train_batch_size: 16
43
  - eval_batch_size: 16
44
  - seed: 42
45
+ - optimizer: AdamW (adamw_torch) with betas=(0.9,0.999) and epsilon=1e-08; no additional optimizer arguments
46
  - lr_scheduler_type: linear
47
  - num_epochs: 5
48
 
 
50
 
51
  | Training Loss | Epoch | Step | Validation Loss | Accuracy |
52
  |:-------------:|:-----:|:----:|:---------------:|:--------:|
53
+ | 1.6038 | 1.0 | 800 | 1.5082 | 0.4547 |
54
+ | 1.305 | 2.0 | 1600 | 1.2096 | 0.5466 |
55
+ | 1.1727 | 3.0 | 2400 | 1.1352 | 0.5775 |
56
+ | 1.1199 | 4.0 | 3200 | 1.1062 | 0.5947 |
57
+ | 1.0959 | 5.0 | 4000 | 1.0969 | 0.5975 |
58
 
59
 
60
  ### Framework versions
61
 
62
  - PEFT 0.13.2
63
+ - Transformers 4.46.2
64
  - Pytorch 2.5.0+cu121
65
+ - Datasets 3.1.0
66
+ - Tokenizers 0.20.3
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "mnoukhov/gpt2-imdb-sentiment-classifier",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
@@ -23,7 +23,8 @@
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
- "c_proj"
 
27
  ],
28
  "task_type": "TOKEN_CLS",
29
  "use_dora": false,
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "ykacer/bert-base-cased-imdb-sequence-classification",
5
  "bias": "none",
6
  "fan_in_fan_out": false,
7
  "inference_mode": true,
 
23
  "rank_pattern": {},
24
  "revision": null,
25
  "target_modules": [
26
+ "query",
27
+ "value"
28
  ],
29
  "task_type": "TOKEN_CLS",
30
  "use_dora": false,
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:88860639b64eec2fbd7ff1e9225092efd27e8bdb4d8a6f44ff876e5145f0d037
3
- size 1056704
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:553082f5bf6bb7fe5c1ba6d0027c7dc097595e6626a4c2fc08766989495ce553
3
+ size 615128
special_tokens_map.json CHANGED
@@ -1,30 +1,7 @@
1
  {
2
- "bos_token": {
3
- "content": "<|endoftext|>",
4
- "lstrip": false,
5
- "normalized": false,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "eos_token": {
10
- "content": "<|endoftext|>",
11
- "lstrip": false,
12
- "normalized": false,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "<|endoftext|>",
18
- "lstrip": false,
19
- "normalized": false,
20
- "rstrip": false,
21
- "single_word": false
22
- },
23
- "unk_token": {
24
- "content": "<|endoftext|>",
25
- "lstrip": false,
26
- "normalized": false,
27
- "rstrip": false,
28
- "single_word": false
29
- }
30
  }
 
1
  {
2
+ "cls_token": "[CLS]",
3
+ "mask_token": "[MASK]",
4
+ "pad_token": "[PAD]",
5
+ "sep_token": "[SEP]",
6
+ "unk_token": "[UNK]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  }
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -1,8 +1,39 @@
1
  {
2
- "add_prefix_space": false,
3
  "added_tokens_decoder": {
4
- "50256": {
5
- "content": "<|endoftext|>",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  "lstrip": false,
7
  "normalized": false,
8
  "rstrip": false,
@@ -10,11 +41,17 @@
10
  "special": true
11
  }
12
  },
13
- "bos_token": "<|endoftext|>",
14
  "clean_up_tokenization_spaces": true,
15
- "eos_token": "<|endoftext|>",
16
- "model_max_length": 1024,
17
- "pad_token": "<|endoftext|>",
18
- "tokenizer_class": "GPT2Tokenizer",
19
- "unk_token": "<|endoftext|>"
 
 
 
 
 
 
 
20
  }
 
1
  {
 
2
  "added_tokens_decoder": {
3
+ "0": {
4
+ "content": "[PAD]",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false,
9
+ "special": true
10
+ },
11
+ "100": {
12
+ "content": "[UNK]",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false,
17
+ "special": true
18
+ },
19
+ "101": {
20
+ "content": "[CLS]",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false,
25
+ "special": true
26
+ },
27
+ "102": {
28
+ "content": "[SEP]",
29
+ "lstrip": false,
30
+ "normalized": false,
31
+ "rstrip": false,
32
+ "single_word": false,
33
+ "special": true
34
+ },
35
+ "103": {
36
+ "content": "[MASK]",
37
  "lstrip": false,
38
  "normalized": false,
39
  "rstrip": false,
 
41
  "special": true
42
  }
43
  },
 
44
  "clean_up_tokenization_spaces": true,
45
+ "cls_token": "[CLS]",
46
+ "do_basic_tokenize": true,
47
+ "do_lower_case": false,
48
+ "mask_token": "[MASK]",
49
+ "model_max_length": 512,
50
+ "never_split": null,
51
+ "pad_token": "[PAD]",
52
+ "sep_token": "[SEP]",
53
+ "strip_accents": null,
54
+ "tokenize_chinese_chars": true,
55
+ "tokenizer_class": "BertTokenizer",
56
+ "unk_token": "[UNK]"
57
  }
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:26dfbcc74eb94d53c0b93afd7c5b38640c092cb2e063fd48cd5f97363dcf0ad5
3
- size 5176
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:506faaa3ff61fda901e71fb517d5a38902a1b769b1aa5caae878b69178ce37bf
3
+ size 5240
vocab.txt ADDED
The diff for this file is too large to render. See raw diff