krishnagarg09 committed on
Commit
e66215f
1 Parent(s): 9074062

Update tokenizer to fast

Browse files
Files changed (3) hide show
  1. bpe.codes +0 -0
  2. pytorch_model.bin +1 -1
  3. tokenizer_config.json +1 -0
bpe.codes ADDED
The diff for this file is too large to render. See raw diff
 
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6011be27c16b36ba3735f24e474e0420b8836ad4add73dc032e697d12b43659b
3
  size 539679413
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a68ec6ff70460ae5325a5388a3dcc93b83c5f0b67074f5986d8c6c37d78e6d5a
3
  size 539679413
tokenizer_config.json CHANGED
@@ -2,6 +2,7 @@
2
  "bos_token": "<s>",
3
  "cls_token": "<s>",
4
  "eos_token": "</s>",
 
5
  "mask_token": "<mask>",
6
  "model_max_length": 128,
7
  "name_or_path": "vinai/bertweet-base",
 
2
  "bos_token": "<s>",
3
  "cls_token": "<s>",
4
  "eos_token": "</s>",
5
+ "is_fast": true,
6
  "mask_token": "<mask>",
7
  "model_max_length": 128,
8
  "name_or_path": "vinai/bertweet-base",