Spaces:

ruslanmv
/

Youtube-Video-Translator

Running

App Files Community

ruslanmv committed on 18 days ago

Commit

d652e80

verified ·

1 Parent(s): ecabf05

Update app.py

Browse files

Files changed (1) hide show

app.py +43 -47

app.py CHANGED Viewed

@@ -5,6 +5,7 @@
 # importing all necessary libraries
 import httpcore
 import pathlib
 import sys, os
 from gtts import gTTS
@@ -32,13 +33,13 @@ def download_video(url):
 def validate_youtube(url):
     #This creates a youtube objet
     try:
-        yt = YouTube(url)
     except Exception:
         print("Hi there URL seems invalid")
         return True
     #This will return the length of the video in sec as an int
     video_length = yt.length
-    if   video_length > 600:
         print("Your video is larger than 10 minutes")
         return True
     else:
@@ -51,7 +52,7 @@ def validate_url(url):
         print("Hi there URL seems invalid ")
         return True
     else:
-        return False
 def cleanup():
@@ -62,16 +63,16 @@ def cleanup():
     junks = []
     for files in types:
         junks.extend(glob.glob(files))
-    try:
         # Deleting those files
         for junk in junks:
             print("Deleting",junk)
             # Setting the path for the file to delete
             file = pathlib.Path(junk)
             # Calling the unlink method on the path
-            file.unlink()
     except Exception:
-        print("I cannot delete the file because it is being used by another process")
 def getSize(filename):
     st = os.stat(filename)
@@ -82,33 +83,33 @@ def clean_transcript(transcript_list):
     script = ""
     for text in transcript_list:
         t = text["text"]
-        if( (t != '[music]')  and  \
-            (t != '[Music]')  and  \
-            (t != '[музыка]') and  \
-            (t != '[Музыка]') and  \
-            (t != '[musik]')  and  \
-            (t != '[Musik]')  and  \
-            (t != '[musica]') and  \
-            (t != '[Musica]') and  \
-            (t != '[música]') and  \
-            (t != '[Música]') and  \
             (t != '[音楽]')   and \
-            (t != '[音乐]')
-          ) :
             script += t + " "
     return script
 def get_transcript(url,desired_language):
     id_you= url[url.index("=")+1:]
-    try:
         # retrieve the available transcripts
         transcript_list = YouTubeTranscriptApi.list_transcripts(id_you)
     except Exception:
         print('TranscriptsDisabled:')
         is_translated = False
-        return " ", " ", is_translated
     lista=[]
     transcript_translation_languages=[]
@@ -130,12 +131,12 @@ def get_transcript(url,desired_language):
     matrix=matrix.tolist()
     is_manually=False
     is_automatic=False
-    for lista in matrix:
         #print(lista)
         language_code=lista[0]
         is_generated=lista[1]
         is_translatable=lista[2]
-        if not is_generated and is_translatable :
             print("Script found manually generated")
             is_manually=True
             language_code_man=language_code
@@ -143,12 +144,12 @@ def get_transcript(url,desired_language):
             print("Script found automatic generated")
             is_automatic=True
             language_code_au=language_code
     if  is_manually:
         # we try filter for manually created transcripts
         print('We extract manually created transcripts')
-        transcript = transcript_list.find_manually_created_transcript([language_code])
     elif is_automatic:
         print('We  extract generated transcript')
         # or automatically generated ones, but not translated
@@ -168,13 +169,13 @@ def get_transcript(url,desired_language):
                 transcript_translated=transcript_translated.fetch()
                 translated=clean_transcript(transcript_translated)
                 is_translated = True
-    script_translated = ""
     if is_translated :
         script_translated = translated
     transcript=transcript.fetch()
     script = clean_transcript(transcript)
     return script, script_translated, is_translated
 # Set environment variables
@@ -225,7 +226,7 @@ def video_to_translate(url,initial_language,final_language):
     elif final_language == "Vietnamese":
         lang='vi'
     elif final_language == "Japanese":
-        lang='ja'
     # Initial directory
     home_dir= os.getenv('home_dir')
     print('Initial directory:',home_dir)
@@ -271,15 +272,15 @@ def video_to_translate(url,initial_language,final_language):
                     text=text+text_chunk+" "
                 text=str(text)
                 print(type(text))
             else:
                 try:
                         text = r.recognize_google(audio_data, language = lang_in)
                 except Exception:
-                        print("This video cannot be recognized")
-                        cleanup()
-                        return "./demo/tryagain.mp4"
         #print(text)
         print("Destination language ",lang)
@@ -293,20 +294,20 @@ def video_to_translate(url,initial_language,final_language):
             print("This text cannot be translated")
             cleanup()
             return "./demo/tryagain.mp4"
         #translation.text
         trans=translation.text
-    myobj = gTTS(text=trans, lang=lang, slow=False)
-    myobj.save("audio.wav")
     # loading audio file
     audioclip = AudioFileClip("audio.wav")
     # adding audio to the video clip
     new_audioclip = CompositeAudioClip([audioclip])
     videoclip.audio = new_audioclip
     new_video="video_translated_"+lang+".mp4"
     # Return back to main directory
     os.chdir(home_dir)
     print('Final directory',os.getcwd())
@@ -326,7 +327,7 @@ gr.Interface(
     fn=video_to_translate,
     inputs=[url, initial_language, final_language],
     outputs='video',
-    #verbose=True, # This parameter has been removed from gr.Interface
     title='Video Youtube Translator',
     description='A simple application that translates Youtube small videos from English, Italian, Japanese, Russian, Spanish, and German to Italian, Spanish, Russian, English, and Japanese. Wait one minute to process.',
     article='''<div>
@@ -335,11 +336,6 @@ gr.Interface(
         </p>
     </div>''',
     examples=[
-        ["https://www.youtube.com/watch?v=uLVRZE8OAI4", "English", "Spanish"],
-        ["https://www.youtube.com/watch?v=fkGCLIQx1MI", "English", "Russian"],
-        ["https://www.youtube.com/watch?v=6Q6hFtitthQ", "Italian", "English"],
-        ["https://www.youtube.com/watch?v=s5XvjAC7ai8", "Russian", "English"],
-        ["https://www.youtube.com/watch?v=qzzweIQoIOU", "Japanese", "English"],
-        ["https://www.youtube.com/watch?v=nOGZvu6tJFE", "German", "Spanish"]
     ]
 ).launch()

 # importing all necessary libraries
 import httpcore
+#setattr(httpcore, 'SyncHTTPTransport', 'AsyncHTTPProxy') # This line is problematic and should be removed or corrected based on the intended use.
 import pathlib
 import sys, os
 from gtts import gTTS
 def validate_youtube(url):
     #This creates a youtube objet
     try:
+        yt = YouTube(url)
     except Exception:
         print("Hi there URL seems invalid")
         return True
     #This will return the length of the video in sec as an int
     video_length = yt.length
+    if  video_length > 600:
         print("Your video is larger than 10 minutes")
         return True
     else:
         print("Hi there URL seems invalid ")
         return True
     else:
+        return False
 def cleanup():
     junks = []
     for files in types:
         junks.extend(glob.glob(files))
+    try:
         # Deleting those files
         for junk in junks:
             print("Deleting",junk)
             # Setting the path for the file to delete
             file = pathlib.Path(junk)
             # Calling the unlink method on the path
+            file.unlink()
     except Exception:
+        print("I cannot delete the file because it is being used by another process")
 def getSize(filename):
     st = os.stat(filename)
     script = ""
     for text in transcript_list:
         t = text["text"]
+        if( (t != '[music]')  and \
+            (t != '[Music]')  and \
+            (t != '[музыка]') and \
+            (t != '[Музыка]') and \
+            (t != '[musik]')  and \
+            (t != '[Musik]')  and \
+            (t != '[musica]') and \
+            (t != '[Musica]') and \
+            (t != '[música]') and \
+            (t != '[Música]') and \
             (t != '[音楽]')   and \
+            (t != '[音乐]')
+        ) :
             script += t + " "
     return script
 def get_transcript(url,desired_language):
     id_you= url[url.index("=")+1:]
+    try:
         # retrieve the available transcripts
         transcript_list = YouTubeTranscriptApi.list_transcripts(id_you)
     except Exception:
         print('TranscriptsDisabled:')
         is_translated = False
+        return " ", " ", is_translated
     lista=[]
     transcript_translation_languages=[]
     matrix=matrix.tolist()
     is_manually=False
     is_automatic=False
+    for lista in matrix:
         #print(lista)
         language_code=lista[0]
         is_generated=lista[1]
         is_translatable=lista[2]
+        if not is_generated and is_translatable :
             print("Script found manually generated")
             is_manually=True
             language_code_man=language_code
             print("Script found automatic generated")
             is_automatic=True
             language_code_au=language_code
     if  is_manually:
         # we try filter for manually created transcripts
         print('We extract manually created transcripts')
+        transcript = transcript_list.find_manually_created_transcript([language_code])
     elif is_automatic:
         print('We  extract generated transcript')
         # or automatically generated ones, but not translated
                 transcript_translated=transcript_translated.fetch()
                 translated=clean_transcript(transcript_translated)
                 is_translated = True
+    script_translated = ""
     if is_translated :
         script_translated = translated
     transcript=transcript.fetch()
     script = clean_transcript(transcript)
     return script, script_translated, is_translated
 # Set environment variables
     elif final_language == "Vietnamese":
         lang='vi'
     elif final_language == "Japanese":
+        lang='ja'
     # Initial directory
     home_dir= os.getenv('home_dir')
     print('Initial directory:',home_dir)
                     text=text+text_chunk+" "
                 text=str(text)
                 print(type(text))
             else:
                 try:
                         text = r.recognize_google(audio_data, language = lang_in)
                 except Exception:
+                    print("This video cannot be recognized")
+                    cleanup()
+                    return "./demo/tryagain.mp4"
         #print(text)
         print("Destination language ",lang)
             print("This text cannot be translated")
             cleanup()
             return "./demo/tryagain.mp4"
         #translation.text
         trans=translation.text
+    myobj = gTTS(text=trans, lang=lang, slow=False)
+    myobj.save("audio.wav")
     # loading audio file
     audioclip = AudioFileClip("audio.wav")
     # adding audio to the video clip
     new_audioclip = CompositeAudioClip([audioclip])
     videoclip.audio = new_audioclip
     new_video="video_translated_"+lang+".mp4"
     # Return back to main directory
     os.chdir(home_dir)
     print('Final directory',os.getcwd())
     fn=video_to_translate,
     inputs=[url, initial_language, final_language],
     outputs='video',
+    #verbose=True, # Removed verbose as it's no longer a valid parameter
     title='Video Youtube Translator',
     description='A simple application that translates Youtube small videos from English, Italian, Japanese, Russian, Spanish, and German to Italian, Spanish, Russian, English, and Japanese. Wait one minute to process.',
     article='''<div>
         </p>
     </div>''',
     examples=[
+        ["https://www.youtube.com/watch?v=uLVRZE8OAI4", "English", "Spanish"]
     ]
 ).launch()