AshwinSankar commited on
Commit
1e1bace
·
verified ·
1 Parent(s): 2679972

Upload tokenizer

Browse files
Files changed (4) hide show
  1. special_tokens_map.json +16 -0
  2. tokenization_vits.py +195 -0
  3. tokenizer_config.json +37 -0
  4. vocab.json +1240 -0
special_tokens_map.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "pad_token": {
3
+ "content": "_",
4
+ "lstrip": false,
5
+ "normalized": false,
6
+ "rstrip": false,
7
+ "single_word": false
8
+ },
9
+ "unk_token": {
10
+ "content": "<unk>",
11
+ "lstrip": false,
12
+ "normalized": false,
13
+ "rstrip": false,
14
+ "single_word": false
15
+ }
16
+ }
tokenization_vits.py ADDED
@@ -0,0 +1,195 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """Tokenization class for VITS."""
2
+
3
+ import json
4
+ import os
5
+ import re
6
+ from typing import Any, Dict, List, Optional, Tuple, Union
7
+
8
+ from transformers.tokenization_utils import PreTrainedTokenizer
9
+ from transformers.utils import logging
10
+
11
+
12
+ logger = logging.get_logger(__name__)
13
+
14
+ VOCAB_FILES_NAMES = {"vocab_file": "vocab.json"}
15
+
16
+
17
+ def has_non_roman_characters(input_string):
18
+ # Find any character outside the ASCII range
19
+ non_roman_pattern = re.compile(r"[^\x00-\x7F]")
20
+
21
+ # Search the input string for non-Roman characters
22
+ match = non_roman_pattern.search(input_string)
23
+ has_non_roman = match is not None
24
+ return has_non_roman
25
+
26
+
27
+ class IndicVitsTokenizer(PreTrainedTokenizer):
28
+ """
29
+ Construct a VITS tokenizer.
30
+
31
+ This tokenizer inherits from [`PreTrainedTokenizer`] which contains most of the main methods. Users should refer to
32
+ this superclass for more information regarding those methods.
33
+
34
+ Args:
35
+ vocab_file (`str`):
36
+ Path to the vocabulary file.
37
+ language (`str`, *optional*):
38
+ Language identifier.
39
+ add_blank (`bool`, *optional*, defaults to `True`):
40
+ Whether to insert token id 0 in between the other tokens.
41
+ normalize (`bool`, *optional*, defaults to `True`):
42
+ Whether to normalize the input text by removing all casing and punctuation.
43
+ phonemize (`bool`, *optional*, defaults to `True`):
44
+ Whether to convert the input text into phonemes.
45
+ is_uroman (`bool`, *optional*, defaults to `False`):
46
+ Whether the `uroman` Romanizer needs to be applied to the input text prior to tokenizing.
47
+ """
48
+
49
+ vocab_files_names = VOCAB_FILES_NAMES
50
+ model_input_names = ["input_ids", "attention_mask"]
51
+
52
+ def __init__(
53
+ self,
54
+ vocab_file,
55
+ pad_token="<pad>",
56
+ unk_token="<unk>",
57
+ language=None,
58
+ add_blank=True,
59
+ normalize=True,
60
+ phonemize=True,
61
+ is_uroman=False,
62
+ **kwargs,
63
+ ) -> None:
64
+ with open(vocab_file, encoding="utf-8") as vocab_handle:
65
+ self.encoder = json.load(vocab_handle)
66
+
67
+ self.decoder = {v: k for k, v in self.encoder.items()}
68
+ self.language = language
69
+ self.add_blank = add_blank
70
+ self.normalize = normalize
71
+ self.phonemize = phonemize
72
+
73
+ self.is_uroman = is_uroman
74
+
75
+ super().__init__(
76
+ pad_token=pad_token,
77
+ unk_token=unk_token,
78
+ language=language,
79
+ add_blank=add_blank,
80
+ normalize=normalize,
81
+ phonemize=phonemize,
82
+ is_uroman=is_uroman,
83
+ **kwargs,
84
+ )
85
+
86
+ @property
87
+ def vocab_size(self):
88
+ return len(self.encoder)
89
+
90
+ def get_vocab(self):
91
+ vocab = {self.convert_ids_to_tokens(i): i for i in range(self.vocab_size)}
92
+ vocab.update(self.added_tokens_encoder)
93
+ return vocab
94
+
95
+ def normalize_text(self, input_string):
96
+ """Lowercase the input string, respecting any special token ids that may be part or entirely upper-cased."""
97
+ all_vocabulary = list(self.encoder.keys()) + list(self.added_tokens_encoder.keys())
98
+ filtered_text = ""
99
+
100
+ i = 0
101
+ while i < len(input_string):
102
+ found_match = False
103
+ for word in all_vocabulary:
104
+ if input_string[i : i + len(word)] == word:
105
+ filtered_text += word
106
+ i += len(word)
107
+ found_match = True
108
+ break
109
+
110
+ if not found_match:
111
+ filtered_text += input_string[i].lower()
112
+ i += 1
113
+
114
+ return filtered_text
115
+
116
+ def prepare_for_tokenization(
117
+ self, text: str, is_split_into_words: bool = False, normalize: Optional[bool] = None, **kwargs
118
+ ) -> Tuple[str, Dict[str, Any]]:
119
+ """
120
+ Performs any necessary transformations before tokenization.
121
+
122
+ This method should pop the arguments from kwargs and return the remaining `kwargs` as well. We test the
123
+ `kwargs` at the end of the encoding process to be sure all the arguments have been used.
124
+
125
+ Args:
126
+ text (`str`):
127
+ The text to prepare.
128
+ is_split_into_words (`bool`, *optional*, defaults to `False`):
129
+ Whether or not the input is already pre-tokenized (e.g., split into words). If set to `True`, the
130
+ tokenizer assumes the input is already split into words (for instance, by splitting it on whitespace)
131
+ which it will tokenize.
132
+ normalize (`bool`, *optional*, defaults to `None`):
133
+ Whether or not to apply punctuation and casing normalization to the text inputs. Typically, VITS is
134
+ trained on lower-cased and un-punctuated text. Hence, normalization is used to ensure that the input
135
+ text consists only of lower-case characters.
136
+ kwargs (`Dict[str, Any]`, *optional*):
137
+ Keyword arguments to use for the tokenization.
138
+
139
+ Returns:
140
+ `Tuple[str, Dict[str, Any]]`: The prepared text and the unused kwargs.
141
+ """
142
+ normalize = normalize if normalize is not None else self.normalize
143
+
144
+ if normalize:
145
+ # normalise for casing
146
+ text = self.normalize_text(text)
147
+
148
+ # strip any chars outside of the vocab (punctuation)
149
+ text = "".join(list(filter(lambda char: char in self.encoder, text))).strip()
150
+ return text, kwargs
151
+
152
+ def _tokenize(self, text: str) -> List[str]:
153
+ """Tokenize a string by inserting the `<pad>` token at the boundary between adjacent characters."""
154
+ tokens = list(text)
155
+
156
+ return tokens
157
+
158
+ def convert_tokens_to_string(self, tokens: List[str]) -> str:
159
+ if self.add_blank and len(tokens) > 1:
160
+ tokens = tokens[1::2]
161
+ return "".join(tokens)
162
+
163
+ def convert_tokens_to_ids(self, tokens: List[str]) -> List[int]:
164
+ ids = []
165
+ for token in tokens:
166
+ ids.append(self._convert_token_to_id(token))
167
+
168
+ if self.add_blank:
169
+ interspersed = [0] * (len(ids) * 2 + 1)
170
+ interspersed[1::2] = ids
171
+ ids = interspersed
172
+
173
+ return ids
174
+
175
+ def _convert_token_to_id(self, token):
176
+ """Converts a token (str) in an id using the vocab."""
177
+ return self.encoder.get(token, self.encoder.get(self.unk_token))
178
+
179
+ def _convert_id_to_token(self, index):
180
+ """Converts an index (integer) in a token (str) using the vocab."""
181
+ return self.decoder.get(index)
182
+
183
+ def save_vocabulary(self, save_directory: str, filename_prefix: Optional[str] = None) -> Union[Tuple[str], None]:
184
+ if not os.path.isdir(save_directory):
185
+ logger.error(f"Vocabulary path ({save_directory}) should be a directory")
186
+ return
187
+
188
+ vocab_file = os.path.join(
189
+ save_directory, (filename_prefix + "-" if filename_prefix else "") + VOCAB_FILES_NAMES["vocab_file"]
190
+ )
191
+
192
+ with open(vocab_file, "w", encoding="utf-8") as f:
193
+ f.write(json.dumps(self.encoder, indent=2, sort_keys=True, ensure_ascii=False) + "\n")
194
+
195
+ return (vocab_file,)
tokenizer_config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "add_blank": true,
3
+ "added_tokens_decoder": {
4
+ "95": {
5
+ "content": "_",
6
+ "lstrip": false,
7
+ "normalized": false,
8
+ "rstrip": false,
9
+ "single_word": false,
10
+ "special": true
11
+ },
12
+ "1218": {
13
+ "content": "<unk>",
14
+ "lstrip": false,
15
+ "normalized": false,
16
+ "rstrip": false,
17
+ "single_word": false,
18
+ "special": true
19
+ }
20
+ },
21
+ "auto_map": {
22
+ "AutoTokenizer": [
23
+ "tokenization_vits.IndicVitsTokenizer",
24
+ null
25
+ ]
26
+ },
27
+ "clean_up_tokenization_spaces": false,
28
+ "extra_special_tokens": {},
29
+ "is_uroman": false,
30
+ "language": null,
31
+ "model_max_length": 1000000000000000019884624838656,
32
+ "normalize": true,
33
+ "pad_token": "_",
34
+ "phonemize": false,
35
+ "tokenizer_class": "IndicVitsTokenizer",
36
+ "unk_token": "<unk>"
37
+ }
vocab.json ADDED
@@ -0,0 +1,1240 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ " ": 16,
3
+ "!": 69,
4
+ "\"": 70,
5
+ "#": 71,
6
+ "$": 72,
7
+ "%": 73,
8
+ "&": 74,
9
+ "'": 1247,
10
+ "(": 76,
11
+ ")": 77,
12
+ "*": 78,
13
+ "+": 79,
14
+ ",": 80,
15
+ "-": 81,
16
+ ".": 82,
17
+ "/": 83,
18
+ "0": 1250,
19
+ "1": 1251,
20
+ "2": 1252,
21
+ "3": 1253,
22
+ "4": 1254,
23
+ "5": 1255,
24
+ "6": 1256,
25
+ "7": 1257,
26
+ "8": 1258,
27
+ "9": 1259,
28
+ ":": 84,
29
+ ";": 85,
30
+ "<": 86,
31
+ "=": 87,
32
+ ">": 88,
33
+ "?": 89,
34
+ "@": 90,
35
+ "A": 17,
36
+ "B": 18,
37
+ "C": 19,
38
+ "D": 20,
39
+ "E": 21,
40
+ "F": 22,
41
+ "G": 23,
42
+ "H": 24,
43
+ "I": 25,
44
+ "J": 26,
45
+ "K": 27,
46
+ "L": 28,
47
+ "M": 29,
48
+ "N": 30,
49
+ "O": 31,
50
+ "P": 32,
51
+ "Q": 33,
52
+ "R": 34,
53
+ "S": 35,
54
+ "T": 36,
55
+ "U": 37,
56
+ "V": 38,
57
+ "W": 39,
58
+ "X": 40,
59
+ "Y": 41,
60
+ "Z": 42,
61
+ "[": 91,
62
+ "\\": 92,
63
+ "]": 93,
64
+ "^": 94,
65
+ "_": 95,
66
+ "`": 96,
67
+ "a": 43,
68
+ "b": 44,
69
+ "c": 45,
70
+ "d": 46,
71
+ "e": 47,
72
+ "f": 48,
73
+ "g": 49,
74
+ "h": 50,
75
+ "i": 51,
76
+ "j": 52,
77
+ "k": 53,
78
+ "l": 54,
79
+ "m": 55,
80
+ "n": 56,
81
+ "o": 57,
82
+ "p": 58,
83
+ "q": 59,
84
+ "r": 60,
85
+ "s": 61,
86
+ "t": 62,
87
+ "t̺": 97,
88
+ "u": 63,
89
+ "v": 64,
90
+ "w": 65,
91
+ "x": 66,
92
+ "y": 67,
93
+ "z": 68,
94
+ "{": 98,
95
+ "|": 99,
96
+ "}": 100,
97
+ "~": 101,
98
+ "¡": 102,
99
+ "¢": 103,
100
+ "£": 104,
101
+ "¤": 105,
102
+ "¥": 106,
103
+ "¦": 107,
104
+ "§": 108,
105
+ "¨": 109,
106
+ "©": 110,
107
+ "ª": 111,
108
+ "«": 112,
109
+ "¬": 113,
110
+ "®": 114,
111
+ "¯": 115,
112
+ "°": 116,
113
+ "±": 117,
114
+ "²": 118,
115
+ "³": 119,
116
+ "´": 120,
117
+ "µ": 121,
118
+ "¶": 122,
119
+ "·": 123,
120
+ "¸": 124,
121
+ "¹": 125,
122
+ "º": 126,
123
+ "»": 127,
124
+ "¼": 128,
125
+ "½": 129,
126
+ "¾": 130,
127
+ "¿": 131,
128
+ "Â": 132,
129
+ "Ã": 133,
130
+ "×": 134,
131
+ "â": 135,
132
+ "æ": 1143,
133
+ "ç": 1149,
134
+ "ð": 1152,
135
+ "ø": 1187,
136
+ "ā": 136,
137
+ "ħ": 1169,
138
+ "ŋ": 1183,
139
+ "œ": 1191,
140
+ "ǀ": 1223,
141
+ "ǁ": 1224,
142
+ "ǂ": 1225,
143
+ "ǃ": 1226,
144
+ "ɐ": 1141,
145
+ "ɑ": 1140,
146
+ "ɒ": 1142,
147
+ "ɓ": 1144,
148
+ "ɔ": 1147,
149
+ "ɕ": 1148,
150
+ "ɖ": 1151,
151
+ "ɗ": 1150,
152
+ "ɘ": 1155,
153
+ "ə": 1154,
154
+ "ɚ": 1156,
155
+ "ɛ": 1157,
156
+ "ɜ": 1158,
157
+ "ɝ": 1159,
158
+ "ɞ": 1160,
159
+ "ɟ": 1161,
160
+ "ɠ": 1164,
161
+ "ɡ": 1163,
162
+ "ɢ": 1165,
163
+ "ɣ": 1210,
164
+ "ɤ": 1211,
165
+ "ɥ": 1170,
166
+ "ɦ": 1167,
167
+ "ɧ": 1168,
168
+ "ɨ": 1172,
169
+ "ɪ": 1173,
170
+ "ɫ": 1177,
171
+ "ɬ": 1176,
172
+ "ɭ": 1175,
173
+ "ɮ": 1178,
174
+ "ɯ": 1181,
175
+ "ɰ": 1182,
176
+ "ɱ": 1180,
177
+ "ɲ": 1185,
178
+ "ɳ": 1184,
179
+ "ɴ": 1186,
180
+ "ɵ": 1188,
181
+ "ɶ": 1192,
182
+ "ɸ": 1189,
183
+ "ɹ": 1194,
184
+ "ɺ": 1195,
185
+ "ɻ": 1197,
186
+ "ɽ": 1200,
187
+ "ɾ": 1196,
188
+ "ʀ": 1198,
189
+ "ʁ": 1199,
190
+ "ʂ": 1201,
191
+ "ʃ": 1202,
192
+ "ʄ": 1162,
193
+ "ʈ": 1203,
194
+ "ʉ": 1205,
195
+ "ʊ": 1206,
196
+ "ʋ": 1207,
197
+ "ʌ": 1209,
198
+ "ʍ": 1212,
199
+ "ʎ": 1214,
200
+ "ʏ": 1215,
201
+ "ʐ": 1217,
202
+ "ʑ": 1216,
203
+ "ʒ": 1218,
204
+ "ʔ": 1219,
205
+ "ʕ": 1221,
206
+ "ʘ": 1193,
207
+ "ʙ": 1145,
208
+ "ʛ": 1166,
209
+ "ʜ": 1171,
210
+ "ʝ": 1174,
211
+ "ʟ": 1179,
212
+ "ʡ": 1220,
213
+ "ʢ": 1222,
214
+ "ʤ": 1153,
215
+ "ʧ": 1204,
216
+ "ʰ": 1233,
217
+ "ʱ": 1234,
218
+ "ʲ": 1235,
219
+ "ʴ": 1232,
220
+ "ʷ": 1236,
221
+ "ʼ": 1231,
222
+ "ˆ": 138,
223
+ "ˈ": 1227,
224
+ "ˌ": 1228,
225
+ "ː": 1229,
226
+ "ˑ": 1230,
227
+ "˞": 1239,
228
+ "ˠ": 1237,
229
+ "ˤ": 1238,
230
+ "̃": 1249,
231
+ "̩": 1246,
232
+ "β": 1146,
233
+ "θ": 1190,
234
+ "χ": 1213,
235
+ "،": 139,
236
+ "؛": 140,
237
+ "؟": 141,
238
+ "٪": 142,
239
+ "٫": 143,
240
+ "٬": 144,
241
+ "٭": 145,
242
+ "۔": 146,
243
+ "۔۔۔": 147,
244
+ "ऀ": 148,
245
+ "ँ": 149,
246
+ "ं": 150,
247
+ "ः": 151,
248
+ "ऄ": 152,
249
+ "अ": 153,
250
+ "आ": 154,
251
+ "इ": 155,
252
+ "ई": 156,
253
+ "उ": 157,
254
+ "ऊ": 158,
255
+ "ऋ": 159,
256
+ "ऌ": 160,
257
+ "ऍ": 161,
258
+ "ऎ": 162,
259
+ "ए": 163,
260
+ "ऐ": 164,
261
+ "ऑ": 165,
262
+ "ऒ": 166,
263
+ "ओ": 167,
264
+ "औ": 168,
265
+ "क": 169,
266
+ "ख": 170,
267
+ "ग": 171,
268
+ "घ": 172,
269
+ "ङ": 173,
270
+ "च": 174,
271
+ "छ": 175,
272
+ "ज": 176,
273
+ "झ": 177,
274
+ "ञ": 178,
275
+ "ट": 179,
276
+ "ठ": 180,
277
+ "ड": 181,
278
+ "ढ": 182,
279
+ "ण": 183,
280
+ "त": 184,
281
+ "थ": 185,
282
+ "द": 186,
283
+ "ध": 187,
284
+ "न": 188,
285
+ "ऩ": 189,
286
+ "प": 190,
287
+ "फ": 191,
288
+ "ब": 192,
289
+ "भ": 193,
290
+ "म": 194,
291
+ "य": 195,
292
+ "र": 196,
293
+ "ऱ": 197,
294
+ "ल": 198,
295
+ "ळ": 199,
296
+ "ऴ": 200,
297
+ "व": 201,
298
+ "श": 202,
299
+ "ष": 203,
300
+ "स": 204,
301
+ "ह": 205,
302
+ "ऺ": 206,
303
+ "ऻ": 207,
304
+ "़": 208,
305
+ "ऽ": 209,
306
+ "ा": 210,
307
+ "ि": 211,
308
+ "ी": 212,
309
+ "ु": 213,
310
+ "ू": 214,
311
+ "ृ": 215,
312
+ "ॄ": 216,
313
+ "ॅ": 217,
314
+ "ॆ": 218,
315
+ "े": 219,
316
+ "ै": 220,
317
+ "ॉ": 221,
318
+ "ॊ": 222,
319
+ "ो": 223,
320
+ "ौ": 224,
321
+ "्": 225,
322
+ "ॎ": 226,
323
+ "ॏ": 227,
324
+ "ॐ": 228,
325
+ "॑": 229,
326
+ "॒": 230,
327
+ "॓": 231,
328
+ "॔": 232,
329
+ "ॕ": 233,
330
+ "ॖ": 234,
331
+ "ॗ": 235,
332
+ "क़": 236,
333
+ "ख़": 237,
334
+ "ग़": 238,
335
+ "ज़": 239,
336
+ "ड़": 240,
337
+ "ढ़": 241,
338
+ "फ़": 242,
339
+ "य़": 243,
340
+ "ॠ": 244,
341
+ "ॡ": 245,
342
+ "ॢ": 246,
343
+ "ॣ": 247,
344
+ "।": 248,
345
+ "॥": 249,
346
+ "०": 250,
347
+ "१": 251,
348
+ "२": 252,
349
+ "३": 253,
350
+ "४": 254,
351
+ "५": 255,
352
+ "६": 256,
353
+ "७": 257,
354
+ "८": 258,
355
+ "९": 259,
356
+ "॰": 260,
357
+ "ॱ": 261,
358
+ "ॲ": 262,
359
+ "ॳ": 263,
360
+ "ॴ": 264,
361
+ "ॵ": 265,
362
+ "ॶ": 266,
363
+ "ॷ": 267,
364
+ "ॸ": 268,
365
+ "ॹ": 269,
366
+ "ॺ": 270,
367
+ "ॻ": 271,
368
+ "ॼ": 272,
369
+ "ॽ": 273,
370
+ "ॾ": 274,
371
+ "ॿ": 275,
372
+ "ঀ": 276,
373
+ "ঁ": 277,
374
+ "ং": 278,
375
+ "ঃ": 279,
376
+ "অ": 280,
377
+ "আ": 281,
378
+ "ই": 282,
379
+ "ঈ": 283,
380
+ "উ": 284,
381
+ "ঊ": 285,
382
+ "ঋ": 286,
383
+ "ঌ": 287,
384
+ "এ": 288,
385
+ "ঐ": 289,
386
+ "ও": 290,
387
+ "ঔ": 291,
388
+ "ক": 292,
389
+ "খ": 293,
390
+ "গ": 294,
391
+ "ঘ": 295,
392
+ "ঙ": 296,
393
+ "চ": 297,
394
+ "ছ": 298,
395
+ "জ": 299,
396
+ "ঝ": 300,
397
+ "ঞ": 301,
398
+ "ট": 302,
399
+ "ঠ": 303,
400
+ "ড": 304,
401
+ "ঢ": 305,
402
+ "ণ": 306,
403
+ "ত": 307,
404
+ "থ": 308,
405
+ "দ": 309,
406
+ "ধ": 310,
407
+ "ন": 311,
408
+ "প": 312,
409
+ "ফ": 313,
410
+ "ব": 314,
411
+ "ভ": 315,
412
+ "ম": 316,
413
+ "য": 317,
414
+ "র": 318,
415
+ "ল": 319,
416
+ "শ": 320,
417
+ "ষ": 321,
418
+ "স": 322,
419
+ "হ": 323,
420
+ "়": 324,
421
+ "ঽ": 325,
422
+ "া": 326,
423
+ "ি": 327,
424
+ "ী": 328,
425
+ "ু": 329,
426
+ "ূ": 330,
427
+ "ৃ": 331,
428
+ "ৄ": 332,
429
+ "ে": 333,
430
+ "ৈ": 334,
431
+ "ো": 335,
432
+ "ৌ": 336,
433
+ "্": 337,
434
+ "ৎ": 338,
435
+ "ৗ": 339,
436
+ "ড়": 340,
437
+ "ঢ়": 341,
438
+ "য়": 342,
439
+ "ৠ": 343,
440
+ "ৡ": 344,
441
+ "ৢ": 345,
442
+ "ৣ": 346,
443
+ "০": 347,
444
+ "১": 348,
445
+ "২": 349,
446
+ "৩": 350,
447
+ "৪": 351,
448
+ "৫": 352,
449
+ "৬": 353,
450
+ "৭": 354,
451
+ "৮": 355,
452
+ "৯": 356,
453
+ "ৰ": 357,
454
+ "ৱ": 358,
455
+ "৲": 359,
456
+ "৳": 360,
457
+ "৴": 361,
458
+ "৵": 362,
459
+ "৶": 363,
460
+ "৷": 364,
461
+ "৸": 365,
462
+ "৹": 366,
463
+ "৺": 367,
464
+ "৻": 368,
465
+ "ৼ": 369,
466
+ "৽": 370,
467
+ "৾": 371,
468
+ "ਁ": 372,
469
+ "ਂ": 373,
470
+ "ਃ": 374,
471
+ "ਅ": 375,
472
+ "ਆ": 376,
473
+ "ਇ": 377,
474
+ "ਈ": 378,
475
+ "ਉ": 379,
476
+ "ਊ": 380,
477
+ "ਏ": 381,
478
+ "ਐ": 382,
479
+ "ਓ": 383,
480
+ "ਔ": 384,
481
+ "ਕ": 385,
482
+ "ਖ": 386,
483
+ "ਗ": 387,
484
+ "ਘ": 388,
485
+ "ਙ": 389,
486
+ "ਚ": 390,
487
+ "ਛ": 391,
488
+ "ਜ": 392,
489
+ "ਝ": 393,
490
+ "ਞ": 394,
491
+ "ਟ": 395,
492
+ "ਠ": 396,
493
+ "ਡ": 397,
494
+ "ਢ": 398,
495
+ "ਣ": 399,
496
+ "ਤ": 400,
497
+ "ਥ": 401,
498
+ "ਦ": 402,
499
+ "ਧ": 403,
500
+ "ਨ": 404,
501
+ "ਪ": 405,
502
+ "ਫ": 406,
503
+ "ਬ": 407,
504
+ "ਭ": 408,
505
+ "ਮ": 409,
506
+ "ਯ": 410,
507
+ "ਰ": 411,
508
+ "ਲ": 412,
509
+ "ਲ਼": 413,
510
+ "ਵ": 414,
511
+ "ਸ਼": 415,
512
+ "ਸ": 416,
513
+ "ਹ": 417,
514
+ "਼": 418,
515
+ "ਾ": 419,
516
+ "ਿ": 420,
517
+ "ੀ": 421,
518
+ "ੁ": 422,
519
+ "ੂ": 423,
520
+ "ੇ": 424,
521
+ "ੈ": 425,
522
+ "ੋ": 426,
523
+ "ੌ": 427,
524
+ "੍": 428,
525
+ "ੑ": 429,
526
+ "ਖ਼": 430,
527
+ "ਗ਼": 431,
528
+ "ਜ਼": 432,
529
+ "ੜ": 433,
530
+ "ਫ਼": 434,
531
+ "੦": 435,
532
+ "੧": 436,
533
+ "੨": 437,
534
+ "੩": 438,
535
+ "੪": 439,
536
+ "੫": 440,
537
+ "੬": 441,
538
+ "੭": 442,
539
+ "੮": 443,
540
+ "੯": 444,
541
+ "ੰ": 445,
542
+ "ੱ": 446,
543
+ "ੲ": 447,
544
+ "ੳ": 448,
545
+ "ੴ": 449,
546
+ "ੵ": 450,
547
+ "੶": 451,
548
+ "ઁ": 452,
549
+ "ં": 453,
550
+ "ઃ": 454,
551
+ "અ": 455,
552
+ "આ": 456,
553
+ "ઇ": 457,
554
+ "ઈ": 458,
555
+ "ઉ": 459,
556
+ "ઊ": 460,
557
+ "ઋ": 461,
558
+ "ઌ": 462,
559
+ "ઍ": 463,
560
+ "એ": 464,
561
+ "ઐ": 465,
562
+ "ઑ": 466,
563
+ "ઓ": 467,
564
+ "ઔ": 468,
565
+ "ક": 469,
566
+ "ખ": 470,
567
+ "ગ": 471,
568
+ "ઘ": 472,
569
+ "ઙ": 473,
570
+ "ચ": 474,
571
+ "છ": 475,
572
+ "જ": 476,
573
+ "ઝ": 477,
574
+ "ઞ": 478,
575
+ "ટ": 479,
576
+ "ઠ": 480,
577
+ "ડ": 481,
578
+ "ઢ": 482,
579
+ "ણ": 483,
580
+ "ત": 484,
581
+ "થ": 485,
582
+ "દ": 486,
583
+ "ધ": 487,
584
+ "ન": 488,
585
+ "પ": 489,
586
+ "ફ": 490,
587
+ "બ": 491,
588
+ "ભ": 492,
589
+ "મ": 493,
590
+ "ય": 494,
591
+ "ર": 495,
592
+ "લ": 496,
593
+ "ળ": 497,
594
+ "વ": 498,
595
+ "શ": 499,
596
+ "ષ": 500,
597
+ "સ": 501,
598
+ "હ": 502,
599
+ "઼": 503,
600
+ "ઽ": 504,
601
+ "ા": 505,
602
+ "િ": 506,
603
+ "ી": 507,
604
+ "ુ": 508,
605
+ "ૂ": 509,
606
+ "ૃ": 510,
607
+ "ૄ": 511,
608
+ "ૅ": 512,
609
+ "ે": 513,
610
+ "ૈ": 514,
611
+ "ૉ": 515,
612
+ "ો": 516,
613
+ "ૌ": 517,
614
+ "્": 518,
615
+ "ૐ": 519,
616
+ "ૠ": 520,
617
+ "ૡ": 521,
618
+ "ૢ": 522,
619
+ "ૣ": 523,
620
+ "૦": 524,
621
+ "૧": 525,
622
+ "૨": 526,
623
+ "૩": 527,
624
+ "૪": 528,
625
+ "૫": 529,
626
+ "૬": 530,
627
+ "૭": 531,
628
+ "૮": 532,
629
+ "૯": 533,
630
+ "૰": 534,
631
+ "૱": 535,
632
+ "ૹ": 536,
633
+ "ૺ": 537,
634
+ "ૻ": 538,
635
+ "ૼ": 539,
636
+ "૽": 540,
637
+ "૾": 541,
638
+ "૿": 542,
639
+ "ଁ": 543,
640
+ "ଂ": 544,
641
+ "ଃ": 545,
642
+ "ଅ": 546,
643
+ "ଆ": 547,
644
+ "ଇ": 548,
645
+ "ଈ": 549,
646
+ "ଉ": 550,
647
+ "ଊ": 551,
648
+ "ଋ": 552,
649
+ "ଌ": 553,
650
+ "ଏ": 554,
651
+ "ଐ": 555,
652
+ "ଓ": 556,
653
+ "ଔ": 557,
654
+ "କ": 558,
655
+ "ଖ": 559,
656
+ "ଗ": 560,
657
+ "ଘ": 561,
658
+ "ଙ": 562,
659
+ "ଚ": 563,
660
+ "ଛ": 564,
661
+ "ଜ": 565,
662
+ "ଝ": 566,
663
+ "ଞ": 567,
664
+ "ଟ": 568,
665
+ "ଠ": 569,
666
+ "ଡ": 570,
667
+ "ଢ": 571,
668
+ "ଣ": 572,
669
+ "ତ": 573,
670
+ "ଥ": 574,
671
+ "ଦ": 575,
672
+ "ଧ": 576,
673
+ "ନ": 577,
674
+ "ପ": 578,
675
+ "ଫ": 579,
676
+ "ବ": 580,
677
+ "ଭ": 581,
678
+ "ମ": 582,
679
+ "ଯ": 583,
680
+ "ର": 584,
681
+ "ଲ": 585,
682
+ "ଳ": 586,
683
+ "ଵ": 587,
684
+ "ଶ": 588,
685
+ "ଷ": 589,
686
+ "ସ": 590,
687
+ "ହ": 591,
688
+ "଼": 592,
689
+ "ଽ": 593,
690
+ "ା": 594,
691
+ "ି": 595,
692
+ "ୀ": 596,
693
+ "ୁ": 597,
694
+ "ୂ": 598,
695
+ "ୃ": 599,
696
+ "ୄ": 600,
697
+ "େ": 601,
698
+ "ୈ": 602,
699
+ "ୋ": 603,
700
+ "ୌ": 604,
701
+ "୍": 605,
702
+ "୕": 606,
703
+ "ୖ": 607,
704
+ "ୗ": 608,
705
+ "ଡ଼": 609,
706
+ "ଢ଼": 610,
707
+ "ୟ": 611,
708
+ "ୠ": 612,
709
+ "ୡ": 613,
710
+ "ୢ": 614,
711
+ "ୣ": 615,
712
+ "୦": 616,
713
+ "୧": 617,
714
+ "୨": 618,
715
+ "୩": 619,
716
+ "୪": 620,
717
+ "୫": 621,
718
+ "୬": 622,
719
+ "୭": 623,
720
+ "୮": 624,
721
+ "୯": 625,
722
+ "୰": 626,
723
+ "ୱ": 627,
724
+ "୲": 628,
725
+ "୳": 629,
726
+ "୴": 630,
727
+ "୵": 631,
728
+ "୶": 632,
729
+ "୷": 633,
730
+ "ஂ": 634,
731
+ "ஃ": 635,
732
+ "அ": 636,
733
+ "ஆ": 637,
734
+ "இ": 638,
735
+ "ஈ": 639,
736
+ "உ": 640,
737
+ "ஊ": 641,
738
+ "எ": 642,
739
+ "ஏ": 643,
740
+ "ஐ": 644,
741
+ "ஒ": 645,
742
+ "ஓ": 646,
743
+ "ஔ": 647,
744
+ "க": 648,
745
+ "ங": 649,
746
+ "ச": 650,
747
+ "ஜ": 651,
748
+ "ஞ": 652,
749
+ "ட": 653,
750
+ "ண": 654,
751
+ "த": 655,
752
+ "ந": 656,
753
+ "ன": 657,
754
+ "ப": 658,
755
+ "ம": 659,
756
+ "ய": 660,
757
+ "ர": 661,
758
+ "ற": 662,
759
+ "ல": 663,
760
+ "ள": 664,
761
+ "ழ": 665,
762
+ "வ": 666,
763
+ "ஶ": 667,
764
+ "ஷ": 668,
765
+ "ஸ": 669,
766
+ "ஹ": 670,
767
+ "ா": 671,
768
+ "ி": 672,
769
+ "ீ": 673,
770
+ "ு": 674,
771
+ "ூ": 675,
772
+ "ெ": 676,
773
+ "ே": 677,
774
+ "ை": 678,
775
+ "ொ": 679,
776
+ "ோ": 680,
777
+ "ௌ": 681,
778
+ "்": 682,
779
+ "ௐ": 683,
780
+ "ௗ": 684,
781
+ "௦": 685,
782
+ "௧": 686,
783
+ "௨": 687,
784
+ "௩": 688,
785
+ "௪": 689,
786
+ "௫": 690,
787
+ "௬": 691,
788
+ "௭": 692,
789
+ "௮": 693,
790
+ "௯": 694,
791
+ "௰": 695,
792
+ "௱": 696,
793
+ "௲": 697,
794
+ "௳": 698,
795
+ "௴": 699,
796
+ "௵": 700,
797
+ "௶": 701,
798
+ "௷": 702,
799
+ "௸": 703,
800
+ "௹": 704,
801
+ "௺": 705,
802
+ "ఀ": 706,
803
+ "ఁ": 707,
804
+ "ం": 708,
805
+ "ః": 709,
806
+ "ఄ": 710,
807
+ "అ": 711,
808
+ "ఆ": 712,
809
+ "ఇ": 713,
810
+ "ఈ": 714,
811
+ "ఉ": 715,
812
+ "ఊ": 716,
813
+ "ఋ": 717,
814
+ "ఌ": 718,
815
+ "ఎ": 719,
816
+ "ఏ": 720,
817
+ "ఐ": 721,
818
+ "ఒ": 722,
819
+ "ఓ": 723,
820
+ "ఔ": 724,
821
+ "క": 725,
822
+ "ఖ": 726,
823
+ "గ": 727,
824
+ "ఘ": 728,
825
+ "ఙ": 729,
826
+ "చ": 730,
827
+ "ఛ": 731,
828
+ "జ": 732,
829
+ "ఝ": 733,
830
+ "ఞ": 734,
831
+ "ట": 735,
832
+ "ఠ": 736,
833
+ "డ": 737,
834
+ "ఢ": 738,
835
+ "ణ": 739,
836
+ "త": 740,
837
+ "థ": 741,
838
+ "ద": 742,
839
+ "ధ": 743,
840
+ "న": 744,
841
+ "ప": 745,
842
+ "ఫ": 746,
843
+ "బ": 747,
844
+ "భ": 748,
845
+ "మ": 749,
846
+ "య": 750,
847
+ "ర": 751,
848
+ "ఱ": 752,
849
+ "ల": 753,
850
+ "ళ": 754,
851
+ "ఴ": 755,
852
+ "వ": 756,
853
+ "శ": 757,
854
+ "ష": 758,
855
+ "స": 759,
856
+ "హ": 760,
857
+ "ఽ": 761,
858
+ "ా": 762,
859
+ "ి": 763,
860
+ "ీ": 764,
861
+ "ు": 765,
862
+ "ూ": 766,
863
+ "ృ": 767,
864
+ "ౄ": 768,
865
+ "ె": 769,
866
+ "ే": 770,
867
+ "ై": 771,
868
+ "ొ": 772,
869
+ "ో": 773,
870
+ "ౌ": 774,
871
+ "్": 775,
872
+ "ౕ": 776,
873
+ "ౖ": 777,
874
+ "ౘ": 778,
875
+ "ౙ": 779,
876
+ "ౚ": 780,
877
+ "ౠ": 781,
878
+ "ౡ": 782,
879
+ "ౢ": 783,
880
+ "ౣ": 784,
881
+ "౦": 785,
882
+ "౧": 786,
883
+ "౨": 787,
884
+ "౩": 788,
885
+ "౪": 789,
886
+ "౫": 790,
887
+ "౬": 791,
888
+ "౭": 792,
889
+ "౮": 793,
890
+ "౯": 794,
891
+ "౷": 795,
892
+ "౸": 796,
893
+ "౹": 797,
894
+ "౺": 798,
895
+ "౻": 799,
896
+ "౼": 800,
897
+ "౽": 801,
898
+ "౾": 802,
899
+ "౿": 803,
900
+ "ಀ": 804,
901
+ "ಁ": 805,
902
+ "ಂ": 806,
903
+ "ಃ": 807,
904
+ "಄": 808,
905
+ "ಅ": 809,
906
+ "ಆ": 810,
907
+ "ಇ": 811,
908
+ "ಈ": 812,
909
+ "ಉ": 813,
910
+ "ಊ": 814,
911
+ "ಋ": 815,
912
+ "ಌ": 816,
913
+ "ಎ": 817,
914
+ "ಏ": 818,
915
+ "ಐ": 819,
916
+ "ಒ": 820,
917
+ "ಓ": 821,
918
+ "ಔ": 822,
919
+ "ಕ": 823,
920
+ "ಖ": 824,
921
+ "ಗ": 825,
922
+ "ಘ": 826,
923
+ "ಙ": 827,
924
+ "ಚ": 828,
925
+ "ಛ": 829,
926
+ "ಜ": 830,
927
+ "ಝ": 831,
928
+ "ಞ": 832,
929
+ "ಟ": 833,
930
+ "ಠ": 834,
931
+ "ಡ": 835,
932
+ "ಢ": 836,
933
+ "ಣ": 837,
934
+ "ತ": 838,
935
+ "ಥ": 839,
936
+ "ದ": 840,
937
+ "ಧ": 841,
938
+ "ನ": 842,
939
+ "ಪ": 843,
940
+ "ಫ": 844,
941
+ "ಬ": 845,
942
+ "ಭ": 846,
943
+ "ಮ": 847,
944
+ "ಯ": 848,
945
+ "ರ": 849,
946
+ "ಱ": 850,
947
+ "ಲ": 851,
948
+ "ಳ": 852,
949
+ "ವ": 853,
950
+ "ಶ": 854,
951
+ "ಷ": 855,
952
+ "ಸ": 856,
953
+ "ಹ": 857,
954
+ "಼": 858,
955
+ "ಽ": 859,
956
+ "ಾ": 860,
957
+ "ಿ": 861,
958
+ "ೀ": 862,
959
+ "ು": 863,
960
+ "ೂ": 864,
961
+ "ೃ": 865,
962
+ "ೄ": 866,
963
+ "ೆ": 867,
964
+ "ೇ": 868,
965
+ "ೈ": 869,
966
+ "ೊ": 870,
967
+ "ೋ": 871,
968
+ "ೌ": 872,
969
+ "್": 873,
970
+ "ೕ": 874,
971
+ "ೖ": 875,
972
+ "ೞ": 876,
973
+ "ೠ": 877,
974
+ "ೡ": 878,
975
+ "ೢ": 879,
976
+ "ೣ": 880,
977
+ "೦": 881,
978
+ "೧": 882,
979
+ "೨": 883,
980
+ "೩": 884,
981
+ "೪": 885,
982
+ "೫": 886,
983
+ "೬": 887,
984
+ "೭": 888,
985
+ "೮": 889,
986
+ "೯": 890,
987
+ "ೱ": 891,
988
+ "ೲ": 892,
989
+ "ഀ": 893,
990
+ "ഁ": 894,
991
+ "ം": 895,
992
+ "ഃ": 896,
993
+ "ഄ": 897,
994
+ "അ": 898,
995
+ "ആ": 899,
996
+ "ഇ": 900,
997
+ "ഈ": 901,
998
+ "ഉ": 902,
999
+ "ഊ": 903,
1000
+ "ഋ": 904,
1001
+ "ഌ": 905,
1002
+ "എ": 906,
1003
+ "ഏ": 907,
1004
+ "ഐ": 908,
1005
+ "ഒ": 909,
1006
+ "ഓ": 910,
1007
+ "ഔ": 911,
1008
+ "ക": 912,
1009
+ "ഖ": 913,
1010
+ "ഗ": 914,
1011
+ "ഘ": 915,
1012
+ "ങ": 916,
1013
+ "ച": 917,
1014
+ "ഛ": 918,
1015
+ "ജ": 919,
1016
+ "ഝ": 920,
1017
+ "ഞ": 921,
1018
+ "ട": 922,
1019
+ "ഠ": 923,
1020
+ "ഡ": 924,
1021
+ "ഢ": 925,
1022
+ "ണ": 926,
1023
+ "ത": 927,
1024
+ "ഥ": 928,
1025
+ "ദ": 929,
1026
+ "ധ": 930,
1027
+ "ന": 931,
1028
+ "ഩ": 932,
1029
+ "പ": 933,
1030
+ "ഫ": 934,
1031
+ "ബ": 935,
1032
+ "ഭ": 936,
1033
+ "മ": 937,
1034
+ "യ": 938,
1035
+ "ര": 939,
1036
+ "റ": 940,
1037
+ "ല": 941,
1038
+ "ള": 942,
1039
+ "ഴ": 943,
1040
+ "വ": 944,
1041
+ "ശ": 945,
1042
+ "ഷ": 946,
1043
+ "സ": 947,
1044
+ "ഹ": 948,
1045
+ "ഺ": 949,
1046
+ "഻": 950,
1047
+ "഼": 951,
1048
+ "ഽ": 952,
1049
+ "ാ": 953,
1050
+ "ി": 954,
1051
+ "ീ": 955,
1052
+ "ു": 956,
1053
+ "ൂ": 957,
1054
+ "ൃ": 958,
1055
+ "ൄ": 959,
1056
+ "െ": 960,
1057
+ "േ": 961,
1058
+ "ൈ": 962,
1059
+ "ൊ": 963,
1060
+ "ോ": 964,
1061
+ "ൌ": 965,
1062
+ "്": 966,
1063
+ "ൎ": 967,
1064
+ "൏": 968,
1065
+ "ൔ": 969,
1066
+ "ൕ": 970,
1067
+ "ൖ": 971,
1068
+ "ൗ": 972,
1069
+ "൘": 973,
1070
+ "൙": 974,
1071
+ "൚": 975,
1072
+ "൛": 976,
1073
+ "൜": 977,
1074
+ "൝": 978,
1075
+ "൞": 979,
1076
+ "ൟ": 980,
1077
+ "ൠ": 981,
1078
+ "ൡ": 982,
1079
+ "ൢ": 983,
1080
+ "ൣ": 984,
1081
+ "൦": 985,
1082
+ "൧": 986,
1083
+ "൨": 987,
1084
+ "൩": 988,
1085
+ "൪": 989,
1086
+ "൫": 990,
1087
+ "൬": 991,
1088
+ "൭": 992,
1089
+ "൮": 993,
1090
+ "൯": 994,
1091
+ "൰": 995,
1092
+ "൱": 996,
1093
+ "൲": 997,
1094
+ "൳": 998,
1095
+ "൴": 999,
1096
+ "൵": 1000,
1097
+ "൶": 1001,
1098
+ "൷": 1002,
1099
+ "൸": 1003,
1100
+ "൹": 1004,
1101
+ "ൺ": 1005,
1102
+ "ൻ": 1006,
1103
+ "ർ": 1007,
1104
+ "ൽ": 1008,
1105
+ "ൾ": 1009,
1106
+ "ൿ": 1010,
1107
+ "ᰀ": 1011,
1108
+ "ᰁ": 1012,
1109
+ "ᰂ": 1013,
1110
+ "ᰃ": 1014,
1111
+ "ᰄ": 1015,
1112
+ "ᰅ": 1016,
1113
+ "ᰆ": 1017,
1114
+ "ᰇ": 1018,
1115
+ "ᰈ": 1019,
1116
+ "ᰉ": 1020,
1117
+ "ᰊ": 1021,
1118
+ "ᰋ": 1022,
1119
+ "ᰌ": 1023,
1120
+ "ᰍ": 1024,
1121
+ "ᰎ": 1025,
1122
+ "ᰏ": 1026,
1123
+ "ᰐ": 1027,
1124
+ "ᰑ": 1028,
1125
+ "ᰒ": 1029,
1126
+ "ᰓ": 1030,
1127
+ "ᰔ": 1031,
1128
+ "ᰕ": 1032,
1129
+ "ᰖ": 1033,
1130
+ "ᰗ": 1034,
1131
+ "ᰘ": 1035,
1132
+ "ᰙ": 1036,
1133
+ "ᰚ": 1037,
1134
+ "ᰛ": 1038,
1135
+ "ᰜ": 1039,
1136
+ "ᰝ": 1040,
1137
+ "ᰞ": 1041,
1138
+ "ᰟ": 1042,
1139
+ "ᰠ": 1043,
1140
+ "ᰡ": 1044,
1141
+ "ᰢ": 1045,
1142
+ "ᰣ": 1046,
1143
+ "ᰤ": 1047,
1144
+ "ᰥ": 1048,
1145
+ "ᰦ": 1049,
1146
+ "ᰧ": 1050,
1147
+ "ᰨ": 1051,
1148
+ "ᰩ": 1052,
1149
+ "ᰪ": 1053,
1150
+ "ᰫ": 1054,
1151
+ "ᰬ": 1055,
1152
+ "ᰭ": 1056,
1153
+ "ᰮ": 1057,
1154
+ "ᰯ": 1058,
1155
+ "ᰰ": 1059,
1156
+ "ᰱ": 1060,
1157
+ "ᰲ": 1061,
1158
+ "ᰳ": 1062,
1159
+ "ᰴ": 1063,
1160
+ "ᰵ": 1064,
1161
+ "ᰶ": 1065,
1162
+ "᰷": 1066,
1163
+ "᰻": 1067,
1164
+ "᰼": 1068,
1165
+ "᰽": 1069,
1166
+ "᰾": 1070,
1167
+ "᰿": 1071,
1168
+ "᱀": 1072,
1169
+ "᱁": 1073,
1170
+ "᱂": 1074,
1171
+ "᱃": 1075,
1172
+ "᱄": 1076,
1173
+ "᱅": 1077,
1174
+ "᱆": 1078,
1175
+ "᱇": 1079,
1176
+ "᱈": 1080,
1177
+ "᱉": 1081,
1178
+ "ᱍ": 1082,
1179
+ "ᱎ": 1083,
1180
+ "ᱏ": 1084,
1181
+ "ᵻ": 1248,
1182
+ "–": 1085,
1183
+ "—": 1086,
1184
+ "‘": 1087,
1185
+ "“": 1088,
1186
+ "”": 1089,
1187
+ "†": 1090,
1188
+ "‡": 1091,
1189
+ "•": 1092,
1190
+ "…": 1093,
1191
+ "‰": 1094,
1192
+ "′": 1095,
1193
+ "″": 1096,
1194
+ "‽": 1097,
1195
+ "₠": 1098,
1196
+ "₡": 1099,
1197
+ "₢": 1100,
1198
+ "₣": 1101,
1199
+ "₤": 1102,
1200
+ "₥": 1103,
1201
+ "₦": 1104,
1202
+ "₧": 1105,
1203
+ "₨": 1106,
1204
+ "₩": 1107,
1205
+ "₪": 1108,
1206
+ "₫": 1109,
1207
+ "€": 1110,
1208
+ "₵": 1111,
1209
+ "₹": 1112,
1210
+ "₺": 1113,
1211
+ "₽": 1114,
1212
+ "₿": 1115,
1213
+ "℅": 1116,
1214
+ "№": 1117,
1215
+ "™": 1118,
1216
+ "⅛": 1119,
1217
+ "⅜": 1120,
1218
+ "⅝": 1121,
1219
+ "⅞": 1122,
1220
+ "←": 1123,
1221
+ "↑": 1241,
1222
+ "→": 1242,
1223
+ "↓": 1240,
1224
+ "↗": 1243,
1225
+ "↘": 1244,
1226
+ "↵": 1127,
1227
+ "⇒": 1128,
1228
+ "−": 1129,
1229
+ "∩": 1130,
1230
+ "≡": 1131,
1231
+ "≤": 1132,
1232
+ "Ⓡ": 1133,
1233
+ "█": 1134,
1234
+ "●": 1135,
1235
+ "☞": 1136,
1236
+ "❀": 1137,
1237
+ "ⱱ": 1208,
1238
+ "?": 1138,
1239
+ "": 1139
1240
+ }