clui committed on
Commit
0aeb96c
verified
1 Parent(s): 9dfe1e3

baseline app

Browse files
Files changed (1) hide show
  1. app.py +14 -23
app.py CHANGED
@@ -5,28 +5,15 @@ from datasets import load_dataset
5
  # Załaduj dataset z Hugging Face
6
  dataset = load_dataset("clui/lyricsgenius")
7
 
8
- # Funkcja do ładowania modeli tłumaczeniowych z cache
9
- @st.cache_resource
10
- def load_translation_models():
11
- model_name_it_en = "Helsinki-NLP/opus-mt-it-en"
12
- tokenizer_it_en = AutoTokenizer.from_pretrained(model_name_it_en)
13
- model_it_en = AutoModelForSeq2SeqLM.from_pretrained(model_name_it_en)
14
 
15
- model_name_en_pl = "gsarti/opus-mt-tc-en-pl"
16
- tokenizer_en_pl = AutoTokenizer.from_pretrained(model_name_en_pl)
17
- model_en_pl = AutoModelForSeq2SeqLM.from_pretrained(model_name_en_pl)
18
-
19
- return tokenizer_it_en, model_it_en, tokenizer_en_pl, model_en_pl
20
-
21
- # Załaduj modele tłumaczeniowe
22
- tokenizer_it_en, model_it_en, tokenizer_en_pl, model_en_pl = load_translation_models()
23
-
24
- # Funkcja do tłumaczenia tekstu
25
- def translate(text, tokenizer, model):
26
- input_ids = tokenizer(text, return_tensors="pt", padding=True).input_ids
27
- outputs = model.generate(input_ids)
28
- translated_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
29
- return translated_text
30
 
31
  # Pole do wprowadzania nazwy artysty
32
  st.title("Neural Notes")
@@ -68,7 +55,9 @@ if artist_name:
68
 
69
  for line in lines:
70
  if line.strip():
71
- translated_text = translate(line, tokenizer_it_en, model_it_en)
 
 
72
  translated_lines_en.append(translated_text)
73
  else:
74
  translated_lines_en.append("")
@@ -84,7 +73,9 @@ if artist_name:
84
 
85
  for line in translated_lines_en:
86
  if line.strip():
87
- translated_text = translate(line, tokenizer_en_pl, model_en_pl)
 
 
88
  translated_lines_pl.append(translated_text)
89
  else:
90
  translated_lines_pl.append("")
 
5
  # Załaduj dataset z Hugging Face
6
  dataset = load_dataset("clui/lyricsgenius")
7
 
8
+ # Wybór modelu do tłumaczenia z włoskiego na angielski
9
+ model_name_it_en = "Helsinki-NLP/opus-mt-it-en"
10
+ tokenizer_it_en = AutoTokenizer.from_pretrained(model_name_it_en)
11
+ model_it_en = AutoModelForSeq2SeqLM.from_pretrained(model_name_it_en)
 
 
12
 
13
+ # Wybór modelu do tłumaczenia z angielskiego na polski
14
+ model_name_en_pl = "sdadas/mt5-base-translator-en-pl"
15
+ tokenizer_en_pl = AutoTokenizer.from_pretrained(model_name_en_pl)
16
+ model_en_pl = AutoModelForSeq2SeqLM.from_pretrained(model_name_en_pl)
 
 
 
 
 
 
 
 
 
 
 
17
 
18
  # Pole do wprowadzania nazwy artysty
19
  st.title("Neural Notes")
 
55
 
56
  for line in lines:
57
  if line.strip():
58
+ inputs = tokenizer_it_en(line, return_tensors="pt", padding=True)
59
+ translated_outputs = model_it_en.generate(**inputs)
60
+ translated_text = tokenizer_it_en.decode(translated_outputs[0], skip_special_tokens=True)
61
  translated_lines_en.append(translated_text)
62
  else:
63
  translated_lines_en.append("")
 
73
 
74
  for line in translated_lines_en:
75
  if line.strip():
76
+ inputs = tokenizer_en_pl(line, return_tensors="pt", padding=True)
77
+ translated_outputs = model_en_pl.generate(**inputs)
78
+ translated_text = tokenizer_en_pl.decode(translated_outputs[0], skip_special_tokens=True)
79
  translated_lines_pl.append(translated_text)
80
  else:
81
  translated_lines_pl.append("")