# File size: 5,861 Bytes
# 23d4cfa 0b484f3 23d4cfa 684e901 23d4cfa 3f4d8ed 23d4cfa 3f4d8ed 23d4cfa 4927d22 23d4cfa 0aa9031 3f4d8ed |
# 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 |
import json
import math
import os
import time

import arabic_reshaper  # pip install arabic-reshaper
import ffmpeg
import gradio as gr
import pysrt
import requests
from bidi.algorithm import get_display  # pip install python-bidi
from faster_whisper import WhisperModel
from moviepy import VideoFileClip, TextClip, CompositeVideoClip
from pytubefix import YouTube
from pytubefix.cli import on_progress
# NOTE(review): this token is committed to source control and should be
# rotated. Setting ONE_API_TOKEN in the environment overrides it without
# editing the file; the literal is kept only as a backward-compatible fallback.
api_key = os.environ.get("ONE_API_TOKEN", "268976:66f4f58a2a905")
# Define your functions here
def yt_download(url):
    """Download the highest-resolution stream of a YouTube video.

    Args:
        url: Address of the video, passed straight to ``YouTube``.

    Returns:
        A ``(video_path, title)`` tuple: the local ``.mp4`` file name the
        stream was saved under, and the video's unmodified title.
    """
    yt = YouTube(url)
    # Titles may contain characters that are illegal in file names or that
    # would be read as path separators, so neutralise them before use.
    safe_title = "".join("_" if ch in '\\/:*?"<>|' else ch for ch in yt.title)
    video_path = f"{safe_title}.mp4"
    ys = yt.streams.get_highest_resolution()
    # Persist the stream under the chosen name so that the later pipeline
    # steps (audio extraction, compositing) find the file on disk.
    ys.download(filename=video_path)
    return video_path, yt.title
def insta_download(shortcode, id_1):
    """Query the remote API for an Instagram post.

    The request is authenticated with the module-level ``api_key`` through
    the ``one-api-token`` header.

    Args:
        shortcode: Value sent as the ``shortcode`` field of the JSON body.
        id_1: Value sent as the ``id`` field of the JSON body.

    Returns:
        The ``result`` entry of the JSON response on HTTP 200, otherwise
        ``None`` (after printing the status code and response text).
    """
    # NOTE(review): the endpoint URL is blank in this file; requests cannot
    # send to an empty URL, so the real address must be filled in here.
    url = ""
    request_body = {"shortcode": shortcode, "id": id_1}
    headers = {"one-api-token": api_key, "Content-Type": "application/json"}
    # A timeout keeps a stalled connection from hanging the caller forever.
    response = requests.post(url, headers=headers, json=request_body, timeout=30)
    if response.status_code == 200:
        return response.json()["result"]
    print(f"Error: {response.status_code}, {response.text}")
    return None
def extract_audio(input_video_name):
    """Extract the audio track of ``<input_video_name>.mp4`` into a WAV file.

    Args:
        input_video_name: Video file name without its ``.mp4`` extension.

    Returns:
        The name of the written audio file, ``audio-<input_video_name>.wav``.
    """
    # The caller strips ".mp4" before passing the name in, so the container
    # file name has to be rebuilt here.
    input_video = f"{input_video_name}.mp4"
    extracted_audio = f"audio-{input_video_name}.wav"
    stream = ffmpeg.input(input_video)
    stream = ffmpeg.output(stream, extracted_audio)
    # Building the graph does nothing on its own; run() executes ffmpeg.
    ffmpeg.run(stream, overwrite_output=True)
    return extracted_audio
def transcribe(audio, model_size="tiny"):
    """Transcribe an audio file with faster-whisper and echo each segment.

    Args:
        audio: Audio input handed to ``WhisperModel.transcribe``.
        model_size: Model identifier passed to ``WhisperModel``; defaults to
            ``"tiny"``.

    Returns:
        A list of the segments produced by the model. Each one is printed
        as ``[start -> end] text`` before the list is returned.
    """
    model = WhisperModel(model_size)
    segments, _info = model.transcribe(audio)
    # Materialise once so the segments can be both printed and returned.
    segments = list(segments)
    for segment in segments:
        print("[%.2fs -> %.2fs] %s" % (segment.start, segment.end, segment.text))
    return segments
def format_time(seconds):
    """Format a duration in seconds as an SRT timestamp ``HH:MM:SS,mmm``.

    Args:
        seconds: Non-negative duration in seconds (int or float).

    Returns:
        The timestamp string, with every field zero-padded.
    """
    # Round to whole milliseconds first so that a fraction such as 1.9996
    # carries into the seconds field instead of yielding ",1000".
    total_ms = int(round(seconds * 1000))
    total_seconds, milliseconds = divmod(total_ms, 1000)
    total_minutes, secs = divmod(total_seconds, 60)
    hours, minutes = divmod(total_minutes, 60)
    return f"{hours:02d}:{minutes:02d}:{secs:02d},{milliseconds:03d}"
def generate_subtitle_file(language, segments, input_video_name):
    """Write transcription segments to an SRT file.

    Args:
        language: Language tag embedded in the output file name.
        segments: Iterable of objects with ``start``, ``end`` and ``text``
            attributes.
        input_video_name: Video name (without extension) used in the file
            name.

    Returns:
        The name of the written file, ``sub-<input_video_name>.<language>.srt``.
    """
    subtitle_file = f"sub-{input_video_name}.{language}.srt"
    entries = []
    # SRT cue numbers start at 1.
    for index, segment in enumerate(segments, start=1):
        segment_start = format_time(segment.start)
        segment_end = format_time(segment.end)
        entries.append(
            f"{index} \n"
            f"{segment_start} --> {segment_end} \n"
            f"{segment.text} \n"
            "\n"
        )
    # The context manager guarantees the content is flushed and the handle
    # closed before the path is handed back to the caller.
    with open(subtitle_file, "w", encoding="utf8") as f:
        f.write("".join(entries))
    return subtitle_file
def read_srt_file(file_path):
    """Read a UTF-8 text file and return its content.

    Args:
        file_path: Path of the file to read.

    Returns:
        The file content as a string, or ``None`` when the file is missing
        or cannot be read (a message is printed in either case).
    """
    try:
        with open(file_path, 'r', encoding='utf-8') as file:
            return file.read()
    except FileNotFoundError:
        print(f"The file {file_path} was not found.")
    except Exception as e:
        # Deliberately broad: this is a best-effort read that reports the
        # problem and signals failure through the None return value.
        print(f"An error occurred: {e}")
    return None
def translate_text(api_key, source_lang, target_lang, text):
    """Translate text through the remote translation API.

    Args:
        api_key: Token sent in the ``one-api-token`` header.
        source_lang: Value sent as the ``source`` field of the JSON body.
        target_lang: Value sent as the ``target`` field of the JSON body.
        text: Text to translate.

    Returns:
        The ``result`` entry of the JSON response on HTTP 200, otherwise
        ``None`` (after printing the status code and response text).
    """
    # NOTE(review): the endpoint URL is blank in this file; requests cannot
    # send to an empty URL, so the real address must be filled in here.
    url = ""
    request_body = {"source": source_lang, "target": target_lang, "text": text}
    headers = {"one-api-token": api_key, "Content-Type": "application/json"}
    # A generous timeout, since whole subtitle files are sent in one request,
    # while still preventing an indefinite hang.
    response = requests.post(url, headers=headers, json=request_body, timeout=120)
    if response.status_code == 200:
        return response.json()["result"]
    print(f"Error: {response.status_code}, {response.text}")
    return None
def write_google(google_translate, output_path="google_translate.srt"):
    """Write translated subtitle text to a UTF-8 file.

    Args:
        google_translate: Translated text to store.
        output_path: Destination file. NOTE(review): the original target
            path is blank in this file, so this default is a placeholder —
            confirm the intended location.

    Returns:
        The path that was written.
    """
    with open(output_path, 'w', encoding="utf-8") as f:
        f.write(google_translate)
    return output_path
def time_to_seconds(time_obj):
    """Convert a timestamp object to a number of seconds.

    Args:
        time_obj: Object exposing ``hours``, ``minutes``, ``seconds`` and
            ``milliseconds`` attributes (presumably a pysrt time value —
            confirm against the caller).

    Returns:
        The total duration in seconds, including the fractional part.
    """
    whole_seconds = time_obj.hours * 3600 + time_obj.minutes * 60 + time_obj.seconds
    return whole_seconds + time_obj.milliseconds / 1000
def create_subtitle_clips(subtitles, videosize, fontsize=24, font='/content/arial-unicode-ms.ttf', color='yellow', debug=False):
    """Build one positioned text clip per subtitle entry.

    Args:
        subtitles: Iterable of entries with ``start``, ``end`` and ``text``
            attributes.
        videosize: ``(width, height)`` of the target video.
        fontsize: Font size of the rendered text.
        font: Path of the font file used for rendering.
        color: Text colour.
        debug: Currently unused; kept for interface compatibility.

    Returns:
        A list of text clips, each timed to its subtitle and placed
        horizontally centred at four fifths of the video height.
    """
    video_width, video_height = videosize
    text_position = ('center', video_height * 4 / 5)
    # Text box is three quarters of the frame width; height is left free.
    text_box = (int(video_width * 3 / 4), None)

    subtitle_clips = []
    for subtitle in subtitles:
        start_time = time_to_seconds(subtitle.start)
        duration = time_to_seconds(subtitle.end) - start_time
        if duration <= 0:
            # A cue that ends at or before its start has nothing to show.
            continue
        # Join the letters into their contextual forms, then reorder for
        # right-to-left display, because the renderer draws left-to-right.
        reshaped_text = arabic_reshaper.reshape(subtitle.text)
        bidi_text = get_display(reshaped_text)
        # The file imports from the top-level ``moviepy`` package (2.x), so
        # the 2.x keyword names and ``with_*`` methods are used here.
        text_clip = (
            TextClip(
                font=font,
                text=bidi_text,
                font_size=fontsize,
                color=color,
                bg_color='black',
                size=text_box,
                method='label',
                text_align='left',
            )
            .with_start(start_time)
            .with_duration(duration)
            .with_position(text_position)
        )
        subtitle_clips.append(text_clip)
    return subtitle_clips
def process_video(url, api_key):
    """Run the full pipeline: download, transcribe, translate, burn subtitles.

    Args:
        url: Address of the YouTube video to process.
        api_key: Token forwarded to ``translate_text``.

    Returns:
        The file name of the subtitled video, ``<name>_subtitled.mp4``.

    Raises:
        RuntimeError: If the generated subtitle file cannot be read back or
            the translation request fails.
    """
    input_video, _title = yt_download(url)
    input_video_name = input_video.replace(".mp4", "")
    extracted_audio = extract_audio(input_video_name)
    segments = transcribe(audio=extracted_audio)
    language = "fa"
    subtitle_file = generate_subtitle_file(language=language, segments=segments, input_video_name=input_video_name)
    source_language = "en"
    target_language = "fa"

    srt_string = read_srt_file(subtitle_file)
    if srt_string is None:
        raise RuntimeError(f"Could not read subtitle file {subtitle_file}")
    google_translate = translate_text(api_key, source_language, target_language, srt_string)
    if google_translate is None:
        raise RuntimeError("Translation request failed; no subtitles to render")

    # Parse the translated SRT text directly, so no intermediate file path
    # is needed.
    subtitles = pysrt.from_string(google_translate)
    output_video_file = input_video_name + '_subtitled' + ".mp4"

    video = VideoFileClip(input_video)
    try:
        subtitle_clips = create_subtitle_clips(subtitles, video.size)
        final_video = CompositeVideoClip([video] + subtitle_clips)
        final_video.write_videofile(output_video_file, codec="libx264", audio_codec="aac")
    finally:
        # Release the reader resources held by the clip even when rendering
        # fails.
        video.close()
    return output_video_file
def download_file(file_path):
    """Return a Gradio update that sets a file component's value.

    Args:
        file_path: Path of the file to expose.

    Returns:
        The update object produced by ``gr.update``.
    """
    # ``gr.File.update`` no longer exists in Gradio 4; ``gr.update`` is
    # available in both the 3.x and 4.x lines.
    return gr.update(value=file_path)
# The two text inputs map positionally onto process_video(url, api_key);
# the returned path is offered to the user as a file.
iface = gr.Interface(
    fn=process_video,
    inputs=["text", "text"],
    outputs="file",
)