Omnibus committed on
Commit
3ff693b
·
1 Parent(s): 673c5fb

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +128 -106
app.py CHANGED
@@ -13,113 +13,135 @@ tokenizer = M2M100Tokenizer.from_pretrained("facebook/m2m100_1.2B")
13
  model = M2M100ForConditionalGeneration.from_pretrained("facebook/m2m100_1.2B").to(device)
14
  model.eval()
15
 
16
- lang_id = {
 
 
 
 
 
 
 
 
 
 
 
17
  "":"",
18
- "Afrikaans": "af",
19
- "Albanian": "sq",
20
- "Amharic": "am",
21
- "Arabic": "ar",
22
- "Armenian": "hy",
23
- "Asturian": "ast",
24
- "Azerbaijani": "az",
25
- "Bashkir": "ba",
26
- "Belarusian": "be",
27
- "Bulgarian": "bg",
28
- "Bengali": "bn",
29
- "Breton": "br",
30
- "Bosnian": "bs",
31
- "Burmese": "my",
32
- "Catalan": "ca",
33
- "Cebuano": "ceb",
34
- "Chinese": "zh",
35
- "Chinese (simplified)": "zh",
36
- "Chinese (traditional)": "zh",
37
- "Croatian": "hr",
38
- "Czech": "cs",
39
- "Danish": "da",
40
- "Dutch": "nl",
41
- "English": "en",
42
- "Estonian": "et",
43
- "Fulah": "ff",
44
- "Finnish": "fi",
45
- "French": "fr",
46
- "Western Frisian": "fy",
47
- "Gaelic": "gd",
48
- "Galician": "gl",
49
- "Georgian": "ka",
50
- "German": "de",
51
- "Greek": "el",
52
- "Gujarati": "gu",
53
- "Hausa": "ha",
54
- "Hebrew": "he",
55
- "Hindi": "hi",
56
- "Haitian": "ht",
57
- "Hungarian": "hu",
58
- "Irish": "ga",
59
- "Indonesian": "id",
60
- "Igbo": "ig",
61
- "Iloko": "ilo",
62
- "Icelandic": "is",
63
- "Italian": "it",
64
- "Japanese": "ja",
65
- "Javanese": "jv",
66
- "Kazakh": "kk",
67
- "Central Khmer": "km",
68
- "Kannada": "kn",
69
- "Korean": "ko",
70
- "Luxembourgish": "lb",
71
- "Ganda": "lg",
72
- "Lingala": "ln",
73
- "Lao": "lo",
74
- "Lithuanian": "lt",
75
- "Latvian": "lv",
76
- "Malagasy": "mg",
77
- "Macedonian": "mk",
78
- "Malayalam": "ml",
79
- "Mongolian": "mn",
80
- "Marathi": "mr",
81
- "Malay": "ms",
82
- "Nepali": "ne",
83
- "Norwegian": "no",
84
- "Northern Sotho": "ns",
85
- "Occitan": "oc",
86
- "Oriya": "or",
87
- "Panjabi": "pa",
88
- "Persian": "fa",
89
- "Polish": "pl",
90
- "Pushto": "ps",
91
- "Portuguese": "pt",
92
- "Romanian": "ro",
93
- "Russian": "ru",
94
- "Sindhi": "sd",
95
- "Sinhala": "si",
96
- "Slovak": "sk",
97
- "Slovenian": "sl",
98
- "Spanish": "es",
99
- "Somali": "so",
100
- "Serbian": "sr",
101
- "Serbian (cyrillic)": "sr",
102
- "Serbian (latin)": "sr",
103
- "Swati": "ss",
104
- "Sundanese": "su",
105
- "Swedish": "sv",
106
- "Swahili": "sw",
107
- "Tamil": "ta",
108
- "Thai": "th",
109
- "Tagalog": "tl",
110
- "Tswana": "tn",
111
- "Turkish": "tr",
112
- "Ukrainian": "uk",
113
- "Urdu": "ur",
114
- "Uzbek": "uz",
115
- "Vietnamese": "vi",
116
- "Welsh": "cy",
117
- "Wolof": "wo",
118
- "Xhosa": "xh",
119
- "Yiddish": "yi",
120
- "Yoruba": "yo",
121
- "Zulu": "zu",
122
- }
 
 
 
 
 
 
 
 
 
 
 
123
 
124
  def trans_page(input,input1,trg):
125
  src_lang = lang_id["English"]
 
13
  model = M2M100ForConditionalGeneration.from_pretrained("facebook/m2m100_1.2B").to(device)
14
  model.eval()
15
 
16
+ l1="Afrikaans"
17
+ class Language:
18
+ def __init__(self, name, code):
19
+ self.name = name
20
+ self.code = code
21
+
22
+
23
+
24
+
25
+
26
+
27
+ lang_id = [
28
  "":"",
29
+ Language("Afrikaans", "af"),
30
+ Language("Albanian", "sq"),
31
+ Language("Amharic", "am"),
32
+ Language("Arabic", "ar"),
33
+ Language("Armenian", "hy"),
34
+ Language("Asturian", "ast"),
35
+ Language("Azerbaijani", "az"),
36
+ Language("Bashkir", "ba"),
37
+ Language("Belarusian", "be"),
38
+ Language("Bulgarian", "bg"),
39
+ Language("Bengali", "bn"),
40
+ Language("Breton", "br"),
41
+ Language("Bosnian", "bs"),
42
+ Language("Burmese", "my"),
43
+ Language("Catalan", "ca"),
44
+ Language("Cebuano", "ceb"),
45
+ Language("Chinese","zh"),
46
+ Language("Croatian","hr"),
47
+ Language("Czech","cs"),
48
+ Language("Danish","da"),
49
+ Language("Dutch","nl"),
50
+ Language("English","en"),
51
+ Language("Estonian","et"),
52
+ Language("Fulah","ff"),
53
+ Language("Finnish","fi"),
54
+ Language("French","fr"),
55
+ Language("Western Frisian","fy"),
56
+ Language("Gaelic","gd"),
57
+ Language("Galician","gl"),
58
+ Language("Georgian","ka"),
59
+ Language("German","de"),
60
+ Language("Greek","el"),
61
+ Language("Gujarati","gu"),
62
+ Language("Hausa","ha"),
63
+ Language("Hebrew","he"),
64
+ Language("Hindi","hi"),
65
+ Language("Haitian","ht"),
66
+ Language("Hungarian","hu"),
67
+ Language("Irish","ga"),
68
+ Language("Indonesian","id"),
69
+ Language("Igbo","ig"),
70
+ Language("",""),
71
+ Language("",""),
72
+ Language("",""),
73
+ Language("",""),
74
+ Language("",""),
75
+ Language("",""),
76
+ Language("",""),
77
+ Language("",""),
78
+ Language("",""),
79
+ Language("",""),
80
+ Language("",""),
81
+ Language("",""),
82
+ Language("",""),
83
+ "Iloko": "ilo",
84
+ "Icelandic": "is",
85
+ "Italian": "it",
86
+ "Japanese": "ja",
87
+ "Javanese": "jv",
88
+ "Kazakh": "kk",
89
+ "Central Khmer": "km",
90
+ "Kannada": "kn",
91
+ "Korean": "ko",
92
+ "Luxembourgish": "lb",
93
+ "Ganda": "lg",
94
+ "Lingala": "ln",
95
+ "Lao": "lo",
96
+ "Lithuanian": "lt",
97
+ "Latvian": "lv",
98
+ "Malagasy": "mg",
99
+ "Macedonian": "mk",
100
+ "Malayalam": "ml",
101
+ "Mongolian": "mn",
102
+ "Marathi": "mr",
103
+ "Malay": "ms",
104
+ "Nepali": "ne",
105
+ "Norwegian": "no",
106
+ "Northern Sotho": "ns",
107
+ "Occitan": "oc",
108
+ "Oriya": "or",
109
+ "Panjabi": "pa",
110
+ "Persian": "fa",
111
+ "Polish": "pl",
112
+ "Pushto": "ps",
113
+ "Portuguese": "pt",
114
+ "Romanian": "ro",
115
+ "Russian": "ru",
116
+ "Sindhi": "sd",
117
+ "Sinhala": "si",
118
+ "Slovak": "sk",
119
+ "Slovenian": "sl",
120
+ "Spanish": "es",
121
+ "Somali": "so",
122
+ "Serbian": "sr",
123
+ "Serbian (cyrillic)": "sr",
124
+ "Serbian (latin)": "sr",
125
+ "Swati": "ss",
126
+ "Sundanese": "su",
127
+ "Swedish": "sv",
128
+ "Swahili": "sw",
129
+ "Tamil": "ta",
130
+ "Thai": "th",
131
+ "Tagalog": "tl",
132
+ "Tswana": "tn",
133
+ "Turkish": "tr",
134
+ "Ukrainian": "uk",
135
+ "Urdu": "ur",
136
+ "Uzbek": "uz",
137
+ "Vietnamese": "vi",
138
+ "Welsh": "cy",
139
+ "Wolof": "wo",
140
+ "Xhosa": "xh",
141
+ "Yiddish": "yi",
142
+ "Yoruba": "yo",
143
+ "Zulu": "zu",
144
+ ]
145
 
146
  def trans_page(input,input1,trg):
147
  src_lang = lang_id["English"]