hadiqa123 committed on
Commit
697b7f6
1 Parent(s): d387f35

add tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +14 -14
vocab.json CHANGED
@@ -1,19 +1,19 @@
1
  {
 
2
  "[PAD]": 16,
3
  "[UNK]": 15,
4
- "|": 0,
5
- "ا": 2,
6
- "ب": 14,
7
- "ت": 13,
8
- "د": 1,
9
- "ز": 7,
10
- "س": 9,
11
- "ل": 11,
12
- "م": 12,
13
  "ڑ": 8,
14
- "ک": 5,
15
- "ھ": 6,
16
- "ہ": 4,
17
- "ی": 3,
18
- "ے": 10
19
  }
 
1
  {
2
+ " ": 11,
3
  "[PAD]": 16,
4
  "[UNK]": 15,
5
+ "ا": 4,
6
+ "ب": 5,
7
+ "ت": 14,
8
+ "د": 13,
9
+ "ز": 12,
10
+ "س": 3,
11
+ "ل": 9,
12
+ "م": 7,
 
13
  "ڑ": 8,
14
+ "ک": 2,
15
+ "ھ": 10,
16
+ "ہ": 6,
17
+ "ی": 0,
18
+ "ے": 1
19
  }