deopoler committed on
Commit
85e94fb
1 Parent(s): e6c02c2

End of training

Browse files
README.md ADDED
@@ -0,0 +1,86 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ license: apache-2.0
3
+ base_model: ntu-spml/distilhubert
4
+ tags:
5
+ - generated_from_trainer
6
+ datasets:
7
+ - keystrokes
8
+ metrics:
9
+ - accuracy
10
+ model-index:
11
+ - name: distilhubert-finetuned-keystrokes
12
+ results:
13
+ - task:
14
+ name: Audio Classification
15
+ type: audio-classification
16
+ dataset:
17
+ name: Keystrokes
18
+ type: keystrokes
19
+ config: default
20
+ split: train
21
+ args: default
22
+ metrics:
23
+ - name: Accuracy
24
+ type: accuracy
25
+ value: 0.5555555555555556
26
+ ---
27
+
28
+ <!-- This model card has been generated automatically according to the information the Trainer had access to. You
29
+ should probably proofread and complete it, then remove this comment. -->
30
+
31
+ # distilhubert-finetuned-keystrokes
32
+
33
+ This model is a fine-tuned version of [ntu-spml/distilhubert](https://huggingface.co/ntu-spml/distilhubert) on the Keystrokes dataset.
34
+ It achieves the following results on the evaluation set after the final epoch (epoch 10, step 900):
35
+ - Loss: 2.1861
36
+ - Accuracy: 0.5556
37
+
38
+ ## Model description
39
+
40
+ More information needed
41
+
42
+ ## Intended uses & limitations
43
+
44
+ More information needed
45
+
46
+ ## Training and evaluation data
47
+
48
+ More information needed
49
+
50
+ ## Training procedure
51
+
52
+ ### Training hyperparameters
53
+
54
+ The following hyperparameters were used during training:
55
+ - learning_rate: 5e-05
56
+ - train_batch_size: 8
57
+ - eval_batch_size: 8
58
+ - seed: 42
59
+ - optimizer: Adam with betas=(0.9,0.999) and epsilon=1e-08
60
+ - lr_scheduler_type: linear
61
+ - lr_scheduler_warmup_ratio: 0.1
62
+ - num_epochs: 10
63
+ - mixed_precision_training: Native AMP
64
+
65
+ ### Training results
66
+
67
+ | Training Loss | Epoch | Step | Validation Loss | Accuracy |
68
+ |:-------------:|:-----:|:----:|:---------------:|:--------:|
69
+ | 3.5798 | 1.0 | 90 | 3.5605 | 0.0722 |
70
+ | 3.396 | 2.0 | 180 | 3.3216 | 0.2722 |
71
+ | 3.1783 | 3.0 | 270 | 3.0565 | 0.3 |
72
+ | 2.8625 | 4.0 | 360 | 2.8097 | 0.3667 |
73
+ | 2.5934 | 5.0 | 450 | 2.6345 | 0.4222 |
74
+ | 2.4605 | 6.0 | 540 | 2.4812 | 0.4111 |
75
+ | 2.2524 | 7.0 | 630 | 2.3649 | 0.4444 |
76
+ | 2.1017 | 8.0 | 720 | 2.2739 | 0.5167 |
77
+ | 2.0619 | 9.0 | 810 | 2.2158 | 0.5222 |
78
+ | 2.0477 | 10.0 | 900 | 2.1861 | 0.5556 |
79
+
80
+
81
+ ### Framework versions
82
+
83
+ - Transformers 4.40.1
84
+ - Pytorch 2.2.1
85
+ - Datasets 2.19.0
86
+ - Tokenizers 0.19.1
config.json ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "ntu-spml/distilhubert",
3
+ "activation_dropout": 0.1,
4
+ "apply_spec_augment": false,
5
+ "architectures": [
6
+ "HubertForSequenceClassification"
7
+ ],
8
+ "attention_dropout": 0.1,
9
+ "bos_token_id": 1,
10
+ "classifier_proj_size": 256,
11
+ "conv_bias": false,
12
+ "conv_dim": [
13
+ 512,
14
+ 512,
15
+ 512,
16
+ 512,
17
+ 512,
18
+ 512,
19
+ 512
20
+ ],
21
+ "conv_kernel": [
22
+ 10,
23
+ 3,
24
+ 3,
25
+ 3,
26
+ 3,
27
+ 2,
28
+ 2
29
+ ],
30
+ "conv_stride": [
31
+ 5,
32
+ 2,
33
+ 2,
34
+ 2,
35
+ 2,
36
+ 2,
37
+ 2
38
+ ],
39
+ "ctc_loss_reduction": "sum",
40
+ "ctc_zero_infinity": false,
41
+ "do_stable_layer_norm": false,
42
+ "eos_token_id": 2,
43
+ "feat_extract_activation": "gelu",
44
+ "feat_extract_norm": "group",
45
+ "feat_proj_dropout": 0.0,
46
+ "feat_proj_layer_norm": false,
47
+ "final_dropout": 0.0,
48
+ "hidden_act": "gelu",
49
+ "hidden_dropout": 0.1,
50
+ "hidden_size": 768,
51
+ "id2label": {
52
+ "0": "0",
53
+ "1": "1",
54
+ "10": "A",
55
+ "11": "B",
56
+ "12": "C",
57
+ "13": "D",
58
+ "14": "E",
59
+ "15": "F",
60
+ "16": "G",
61
+ "17": "H",
62
+ "18": "I",
63
+ "19": "J",
64
+ "2": "2",
65
+ "20": "K",
66
+ "21": "L",
67
+ "22": "M",
68
+ "23": "N",
69
+ "24": "O",
70
+ "25": "P",
71
+ "26": "Q",
72
+ "27": "R",
73
+ "28": "S",
74
+ "29": "T",
75
+ "3": "3",
76
+ "30": "U",
77
+ "31": "V",
78
+ "32": "W",
79
+ "33": "X",
80
+ "34": "Y",
81
+ "35": "Z",
82
+ "4": "4",
83
+ "5": "5",
84
+ "6": "6",
85
+ "7": "7",
86
+ "8": "8",
87
+ "9": "9"
88
+ },
89
+ "initializer_range": 0.02,
90
+ "intermediate_size": 3072,
91
+ "label2id": {
92
+ "0": "0",
93
+ "1": "1",
94
+ "2": "2",
95
+ "3": "3",
96
+ "4": "4",
97
+ "5": "5",
98
+ "6": "6",
99
+ "7": "7",
100
+ "8": "8",
101
+ "9": "9",
102
+ "A": "10",
103
+ "B": "11",
104
+ "C": "12",
105
+ "D": "13",
106
+ "E": "14",
107
+ "F": "15",
108
+ "G": "16",
109
+ "H": "17",
110
+ "I": "18",
111
+ "J": "19",
112
+ "K": "20",
113
+ "L": "21",
114
+ "M": "22",
115
+ "N": "23",
116
+ "O": "24",
117
+ "P": "25",
118
+ "Q": "26",
119
+ "R": "27",
120
+ "S": "28",
121
+ "T": "29",
122
+ "U": "30",
123
+ "V": "31",
124
+ "W": "32",
125
+ "X": "33",
126
+ "Y": "34",
127
+ "Z": "35"
128
+ },
129
+ "layer_norm_eps": 1e-05,
130
+ "layerdrop": 0.0,
131
+ "mask_feature_length": 10,
132
+ "mask_feature_min_masks": 0,
133
+ "mask_feature_prob": 0.0,
134
+ "mask_time_length": 10,
135
+ "mask_time_min_masks": 2,
136
+ "mask_time_prob": 0.05,
137
+ "model_type": "hubert",
138
+ "num_attention_heads": 12,
139
+ "num_conv_pos_embedding_groups": 16,
140
+ "num_conv_pos_embeddings": 128,
141
+ "num_feat_extract_layers": 7,
142
+ "num_hidden_layers": 2,
143
+ "pad_token_id": 0,
144
+ "torch_dtype": "float32",
145
+ "transformers_version": "4.40.1",
146
+ "use_weighted_layer_sum": false,
147
+ "vocab_size": 32
148
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94699d5017759eeb18dd7a63f6bbb80dbe517541f2c71ce68fcf3ef4b4ddecb9
3
+ size 94798464
preprocessor_config.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "do_normalize": true,
3
+ "feature_extractor_type": "Wav2Vec2FeatureExtractor",
4
+ "feature_size": 1,
5
+ "padding_side": "right",
6
+ "padding_value": 0,
7
+ "return_attention_mask": true,
8
+ "sampling_rate": 16000
9
+ }
runs/May04_12-26-51_seonjin-MS-7C94/events.out.tfevents.1714793218.seonjin-MS-7C94.23556.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bae0c2f8748a1823860dfe40d1f6c3ab4c5f3024605a137493b8470277f9533e
3
+ size 48060
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:43ad9d9ed61bb67b09147ea97a9d38cf3ba0f93e8e8b77c63a40c9bb54718e8f
3
+ size 5048