Spaces:
Sleeping
Sleeping
Commit
·
5869c97
1
Parent(s):
88413ab
troubleshooting the detect language part
Browse files
app.py
CHANGED
@@ -39,14 +39,18 @@ def predict(audio, language, mic_audio=None):
|
|
39 |
else:
|
40 |
return "(please provide audio)"
|
41 |
|
|
|
42 |
audio = whisper.load_audio(input_audio)
|
43 |
audio = whisper.pad_or_trim(audio)
|
44 |
|
|
|
45 |
mel = whisper.log_mel_spectrogram(audio).to(model.device)
|
46 |
-
|
|
|
47 |
if(language == "Detect Language"):
|
48 |
-
|
49 |
-
|
|
|
50 |
else:
|
51 |
outLanguage = language_id_lookup[language.split()[0]]
|
52 |
|
|
|
39 |
else:
|
40 |
return "(please provide audio)"
|
41 |
|
42 |
+
# Uses the model's preprocessing methods to preprocess audio
|
43 |
audio = whisper.load_audio(input_audio)
|
44 |
audio = whisper.pad_or_trim(audio)
|
45 |
|
46 |
+
# Calculates the mel frequency spectrogram
|
47 |
mel = whisper.log_mel_spectrogram(audio).to(model.device)
|
48 |
+
outLanguage = 'ma'
|
49 |
+
# If "Detect Language" is selected, detect the language from the audio
|
50 |
if(language == "Detect Language"):
|
51 |
+
lang_token, lang_probs = model.detect_language(mel)
|
52 |
+
languages = [max(probs, key=probs.get) for probs in lang_probs]
|
53 |
+
print("Detected language is: " + languages)
|
54 |
else:
|
55 |
outLanguage = language_id_lookup[language.split()[0]]
|
56 |
|