EzraWilliam committed on
Commit
6f33fbc
1 Parent(s): 57b07a3

Upload tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +29 -27
vocab.json CHANGED
@@ -1,31 +1,33 @@
1
  {
2
- "[PAD]": 28,
3
- "[UNK]": 27,
4
- "a": 1,
5
- "b": 23,
6
- "c": 14,
7
- "d": 16,
8
- "e": 8,
 
 
9
  "f": 20,
10
- "g": 4,
11
- "h": 3,
12
- "i": 19,
13
- "j": 7,
14
- "k": 18,
15
- "l": 17,
16
- "m": 13,
17
- "n": 24,
18
  "o": 26,
19
- "p": 9,
20
- "q": 11,
21
- "r": 12,
22
- "s": 6,
23
- "t": 10,
24
- "u": 25,
25
- "v": 21,
26
- "w": 5,
27
- "x": 22,
28
- "y": 2,
29
- "z": 15,
30
- "|": 0
31
  }
 
1
  {
2
+ "\"": 8,
3
+ "'": 22,
4
+ "[PAD]": 30,
5
+ "[UNK]": 29,
6
+ "a": 24,
7
+ "b": 19,
8
+ "c": 5,
9
+ "d": 27,
10
+ "e": 23,
11
  "f": 20,
12
+ "g": 9,
13
+ "h": 16,
14
+ "i": 14,
15
+ "j": 28,
16
+ "k": 3,
17
+ "l": 1,
18
+ "m": 12,
19
+ "n": 2,
20
  "o": 26,
21
+ "p": 18,
22
+ "q": 25,
23
+ "r": 15,
24
+ "s": 21,
25
+ "t": 13,
26
+ "u": 10,
27
+ "v": 0,
28
+ "w": 17,
29
+ "x": 7,
30
+ "y": 4,
31
+ "z": 6,
32
+ "|": 11
33
  }