rtler committed on
Commit
e7875f0
·
1 Parent(s): 7b517ae

Upload tokenizer

Browse files
Files changed (2) hide show
  1. added_tokens.json +2 -2
  2. vocab.json +9 -11
added_tokens.json CHANGED
@@ -1,4 +1,4 @@
1
  {
2
- "</s>": 33,
3
- "<s>": 32
4
  }
 
1
  {
2
+ "</s>": 31,
3
+ "<s>": 30
4
  }
vocab.json CHANGED
@@ -1,6 +1,6 @@
1
  {
2
- "[PAD]": 31,
3
- "[UNK]": 30,
4
  "|": 0,
5
  "ا": 1,
6
  "ب": 2,
@@ -22,13 +22,11 @@
22
  "و": 18,
23
  "ِ": 19,
24
  "ّ": 20,
25
- "ْ": 21,
26
- "ٔ": 22,
27
- "پ": 23,
28
- "چ": 24,
29
- "ژ": 25,
30
- "ک": 26,
31
- "گ": 27,
32
- "ی": 28,
33
- "ﺩ": 29
34
  }
 
1
  {
2
+ "[PAD]": 29,
3
+ "[UNK]": 28,
4
  "|": 0,
5
  "ا": 1,
6
  "ب": 2,
 
22
  "و": 18,
23
  "ِ": 19,
24
  "ّ": 20,
25
+ "ٔ": 21,
26
+ "پ": 22,
27
+ "چ": 23,
28
+ "ژ": 24,
29
+ "ک": 25,
30
+ "گ": 26,
31
+ "ی": 27
 
 
32
  }