Sercan committed on
Commit
bd0587b
1 Parent(s): df080b4

Upload tokenizer

Browse files
Files changed (1) hide show
  1. vocab.json +43 -43
vocab.json CHANGED
@@ -1,47 +1,47 @@
1
  {
2
- "0": 41,
3
- "1": 8,
4
- "2": 6,
5
- "3": 21,
6
- "4": 28,
7
- "5": 12,
8
- "6": 2,
9
- "7": 16,
10
- "8": 25,
11
- "9": 24,
12
  "[PAD]": 44,
13
  "[UNK]": 43,
14
- "a": 22,
15
- "b": 32,
16
- "c": 13,
17
- "d": 15,
18
- "e": 9,
19
- "f": 29,
20
- "g": 5,
21
- "h": 33,
22
- "i": 34,
23
- "j": 37,
24
- "k": 40,
25
- "l": 23,
26
- "m": 42,
27
- "n": 30,
28
- "o": 31,
29
- "p": 11,
30
- "q": 35,
31
- "r": 20,
32
- "s": 17,
33
- "t": 18,
34
- "u": 10,
35
- "v": 26,
36
- "w": 38,
37
- "x": 14,
38
- "y": 19,
39
- "z": 36,
40
- "|": 1,
41
- "ç": 27,
42
- "ö": 39,
43
- "ü": 0,
44
- "ğ": 7,
45
- "ı": 4,
46
- "ş": 3
47
  }
 
1
  {
2
+ "0": 37,
3
+ "1": 7,
4
+ "2": 20,
5
+ "3": 1,
6
+ "4": 8,
7
+ "5": 4,
8
+ "6": 33,
9
+ "7": 11,
10
+ "8": 41,
11
+ "9": 6,
12
  "[PAD]": 44,
13
  "[UNK]": 43,
14
+ "a": 29,
15
+ "b": 19,
16
+ "c": 0,
17
+ "d": 28,
18
+ "e": 18,
19
+ "f": 38,
20
+ "g": 17,
21
+ "h": 16,
22
+ "i": 15,
23
+ "j": 32,
24
+ "k": 26,
25
+ "l": 27,
26
+ "m": 13,
27
+ "n": 14,
28
+ "o": 12,
29
+ "p": 5,
30
+ "q": 22,
31
+ "r": 3,
32
+ "s": 35,
33
+ "t": 2,
34
+ "u": 9,
35
+ "v": 25,
36
+ "w": 34,
37
+ "x": 39,
38
+ "y": 30,
39
+ "z": 31,
40
+ "|": 40,
41
+ "ç": 36,
42
+ "ö": 23,
43
+ "ü": 10,
44
+ "ğ": 42,
45
+ "ı": 21,
46
+ "ş": 24
47
  }