nbh-rjn committed on
Commit
a9756dd
·
verified ·
1 Parent(s): e239d3d

Upload tokenizer

Browse files
Files changed (2) hide show
  1. special_tokens_map.json +3 -21
  2. tokenizer_config.json +1 -1
special_tokens_map.json CHANGED
@@ -103,26 +103,8 @@
103
  "<unk_101>",
104
  "<unk_102>"
105
  ],
106
- "eos_token": {
107
- "content": "</s>",
108
- "lstrip": false,
109
- "normalized": false,
110
- "rstrip": false,
111
- "single_word": false
112
- },
113
  "mask_token": "<mask_2>",
114
- "pad_token": {
115
- "content": "<pad>",
116
- "lstrip": false,
117
- "normalized": false,
118
- "rstrip": false,
119
- "single_word": false
120
- },
121
- "unk_token": {
122
- "content": "<unk>",
123
- "lstrip": false,
124
- "normalized": false,
125
- "rstrip": false,
126
- "single_word": false
127
- }
128
  }
 
103
  "<unk_101>",
104
  "<unk_102>"
105
  ],
106
+ "eos_token": "</s>",
 
 
 
 
 
 
107
  "mask_token": "<mask_2>",
108
+ "pad_token": "<pad>",
109
+ "unk_token": "<unk>"
 
 
 
 
 
 
 
 
 
 
 
 
110
  }
tokenizer_config.json CHANGED
@@ -958,7 +958,7 @@
958
  "full_tokenizer_file": null,
959
  "mask_token": "<mask_2>",
960
  "mask_token_sent": "<mask_1>",
961
- "model_max_length": 512,
962
  "offset": 103,
963
  "pad_token": "<pad>",
964
  "sp_model_kwargs": {},
 
958
  "full_tokenizer_file": null,
959
  "mask_token": "<mask_2>",
960
  "mask_token_sent": "<mask_1>",
961
+ "model_max_length": 1024,
962
  "offset": 103,
963
  "pad_token": "<pad>",
964
  "sp_model_kwargs": {},