St4n committed on
Commit
a021d4a
1 Parent(s): c9b151a

St4n/wav2vec2-base-self-331-colab

Browse files
alphabet.json DELETED
@@ -1 +0,0 @@
1
- {"labels": [" ", "a", "b", "c", "d", "e", "f", "g", "h", "i", "k", "l", "m", "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z", "\u2047", "", "<s>", "</s>"], "is_bpe": false}
 
 
language_model/5gram.bin DELETED
@@ -1,3 +0,0 @@
1
- version https://git-lfs.github.com/spec/v1
2
- oid sha256:d7bab2b9cbbbc0129a09e4ea49d8fc3054d7d9469cad97732e56584b41edb7db
3
- size 47141
 
 
 
 
language_model/attrs.json DELETED
@@ -1 +0,0 @@
1
- {"alpha": 0.5, "beta": 1.5, "unk_score_offset": -10.0, "score_boundary": true}
 
 
language_model/unigrams.txt DELETED
@@ -1,152 +0,0 @@
1
- </s>
2
- <s>
3
- a
4
- after
5
- air
6
- alive
7
- altimeter
8
- altitude
9
- and
10
- anti
11
- approach
12
- area
13
- arm
14
- around
15
- auto
16
- autobrake
17
- autothrottle
18
- bark
19
- before
20
- bleed
21
- brake
22
- brakes
23
- c
24
- cabin
25
- center
26
- central
27
- check
28
- checked
29
- checklist
30
- clear
31
- climb
32
- collection
33
- collision
34
- combine
35
- complete
36
- continuous
37
- control
38
- de
39
- descent
40
- doors
41
- down
42
- eight
43
- emergency
44
- engine
45
- equipment
46
- exist
47
- exit
48
- exterior
49
- external
50
- f
51
- feet
52
- fifteen
53
- five
54
- flap
55
- flaps
56
- flight
57
- four
58
- frequency
59
- fuel
60
- full
61
- gear
62
- generator
63
- generators
64
- give
65
- glideslope
66
- go
67
- green
68
- ground
69
- heading
70
- heat
71
- hundred
72
- hydraulic
73
- i
74
- ice
75
- initial
76
- instrument
77
- instruments
78
- isolation
79
- kilograms
80
- landing
81
- left
82
- level
83
- lever
84
- levers
85
- light
86
- lights
87
- localiser
88
- m
89
- mode
90
- model
91
- nav
92
- navy
93
- of
94
- off
95
- ok
96
- on
97
- one
98
- open
99
- p
100
- packets
101
- packs
102
- parking
103
- parks
104
- passenger
105
- pilot
106
- position
107
- positive
108
- preflight
109
- probe
110
- pump
111
- pumps
112
- r
113
- rate
114
- recall
115
- removed
116
- right
117
- roger
118
- run
119
- runway
120
- s
121
- secure
122
- selector
123
- selectors
124
- set
125
- shutdown
126
- signs
127
- sit
128
- six
129
- speed
130
- start
131
- switch
132
- switches
133
- take
134
- takeoff
135
- taking
136
- tax
137
- taxi
138
- thirty
139
- thousand
140
- three
141
- thrust
142
- trust
143
- turn
144
- two
145
- u
146
- up
147
- value
148
- valve
149
- wave
150
- waves
151
- window
152
- zero
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
preprocessor_config.json CHANGED
@@ -4,7 +4,6 @@
4
  "feature_size": 1,
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
- "processor_class": "Wav2Vec2ProcessorWithLM",
8
  "return_attention_mask": false,
9
  "sampling_rate": 16000
10
  }
 
4
  "feature_size": 1,
5
  "padding_side": "right",
6
  "padding_value": 0.0,
 
7
  "return_attention_mask": false,
8
  "sampling_rate": 16000
9
  }
special_tokens_map.json CHANGED
@@ -1,30 +1,6 @@
1
  {
2
- "bos_token": {
3
- "content": "<s>",
4
- "lstrip": false,
5
- "normalized": false,
6
- "rstrip": false,
7
- "single_word": false
8
- },
9
- "eos_token": {
10
- "content": "</s>",
11
- "lstrip": false,
12
- "normalized": false,
13
- "rstrip": false,
14
- "single_word": false
15
- },
16
- "pad_token": {
17
- "content": "[PAD]",
18
- "lstrip": true,
19
- "normalized": false,
20
- "rstrip": true,
21
- "single_word": false
22
- },
23
- "unk_token": {
24
- "content": "[UNK]",
25
- "lstrip": true,
26
- "normalized": false,
27
- "rstrip": true,
28
- "single_word": false
29
- }
30
- }
 
1
  {
2
+ "bos_token": "<s>",
3
+ "eos_token": "</s>",
4
+ "pad_token": "[PAD]",
5
+ "unk_token": "[UNK]"
6
+ }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
tokenizer_config.json CHANGED
@@ -39,7 +39,6 @@
39
  "eos_token": "</s>",
40
  "model_max_length": 1000000000000000019884624838656,
41
  "pad_token": "[PAD]",
42
- "processor_class": "Wav2Vec2ProcessorWithLM",
43
  "replace_word_delimiter_char": " ",
44
  "target_lang": null,
45
  "tokenizer_class": "Wav2Vec2CTCTokenizer",
 
39
  "eos_token": "</s>",
40
  "model_max_length": 1000000000000000019884624838656,
41
  "pad_token": "[PAD]",
 
42
  "replace_word_delimiter_char": " ",
43
  "target_lang": null,
44
  "tokenizer_class": "Wav2Vec2CTCTokenizer",