EzraWilliam commited on
Commit
ff6537d
1 Parent(s): e2987ae

Upload tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +26 -36
vocab.json CHANGED
@@ -1,41 +1,31 @@
1
  {
2
- "0": 13,
3
- "1": 22,
4
- "2": 25,
5
- "3": 3,
6
- "4": 20,
7
- "5": 6,
8
- "6": 11,
9
- "7": 10,
10
- "8": 33,
11
- "9": 29,
12
- "[PAD]": 38,
13
- "[UNK]": 37,
14
  "a": 1,
15
- "b": 32,
16
- "c": 19,
17
- "d": 23,
18
- "e": 12,
19
- "f": 28,
20
- "g": 5,
21
- "h": 4,
22
- "i": 27,
23
- "j": 9,
24
- "k": 26,
25
- "l": 24,
26
- "m": 18,
27
- "n": 34,
28
- "o": 36,
29
- "p": 14,
30
- "q": 16,
31
- "r": 17,
32
- "s": 8,
33
- "t": 15,
34
- "u": 35,
35
- "v": 30,
36
- "w": 7,
37
- "x": 31,
38
  "y": 2,
39
- "z": 21,
40
  "|": 0
41
  }
 
1
  {
2
+ "[PAD]": 28,
3
+ "[UNK]": 27,
 
 
 
 
 
 
 
 
 
 
4
  "a": 1,
5
+ "b": 23,
6
+ "c": 14,
7
+ "d": 16,
8
+ "e": 8,
9
+ "f": 20,
10
+ "g": 4,
11
+ "h": 3,
12
+ "i": 19,
13
+ "j": 7,
14
+ "k": 18,
15
+ "l": 17,
16
+ "m": 13,
17
+ "n": 24,
18
+ "o": 26,
19
+ "p": 9,
20
+ "q": 11,
21
+ "r": 12,
22
+ "s": 6,
23
+ "t": 10,
24
+ "u": 25,
25
+ "v": 21,
26
+ "w": 5,
27
+ "x": 22,
28
  "y": 2,
29
+ "z": 15,
30
  "|": 0
31
  }