Spaces:

2506minecraft
/

Arabic-Chatbot

Running

App Files Files Community

2506minecraft committed 14 days ago

Commit

d6e8610

verified ·

1 Parent(s): ace34fb

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -57

app.py CHANGED Viewed

@@ -3,15 +3,16 @@ import logging
 import threading
 import numpy as np
 import torch
-import librosa
 import soundfile as sf
 from pydub import AudioSegment
 from telegram import Update
 from telegram.ext import ApplicationBuilder, MessageHandler, filters, CommandHandler
-from transformers import pipeline, AutoTokenizer, VitsModel
 from huggingface_hub import login
 import asyncio
-from collections import defaultdict
 # ===== تهيئة التوكن =====
 login(token=os.getenv("HF_TOKEN"))
@@ -25,39 +26,29 @@ logger = logging.getLogger(__name__)
 # ===== تحميل النماذج =====
 try:
-    # 1. نموذج التعرف على الكلام
-    asr_pipeline = pipeline(
-        "automatic-speech-recognition",
-        model="jonatasgrosman/wav2vec2-large-xlsr-53-arabic",
-        token=os.getenv("HF_TOKEN")
-    )
-    # 2. نموذج توليف الصوت الأنثوي (الاسم الصحيح)
-    tts_tokenizer = AutoTokenizer.from_pretrained(
-        "facebook/mms-tts-ara",  # تم تغيير النموذج إلى فيسبوك MMS
-        token=os.getenv("HF_TOKEN")
-    )
-    tts_model = VitsModel.from_pretrained(
-        "facebook/mms-tts-ara",
-        token=os.getenv("HF_TOKEN")
-    )
 except Exception as e:
     logger.error(f"فشل تحميل النماذج: {str(e)}")
     raise
 # ===== ذاكرة المحادثة =====
-conversation_history = defaultdict(list)
 # ===== دوال معالجة الصوت =====
 def enhance_audio(input_path: str, output_path: str) -> bool:
     try:
-        audio = AudioSegment.from_wav(input_path)
-        audio = audio.low_pass_filter(3000)
-        audio = audio.high_pass_filter(100)
-        audio = audio.normalize()
-        audio = audio.fade_in(150).fade_out(150)
-        audio.export(output_path, format="wav")
         return True
     except Exception as e:
         logger.error(f"خطأ في تحسين الصوت: {str(e)}")
@@ -65,65 +56,73 @@ def enhance_audio(input_path: str, output_path: str) -> bool:
 async def speech_to_text(audio_path: str) -> str:
     try:
-        audio, sr = librosa.load(audio_path, sr=16000)
-        sf.write("temp.wav", audio, sr)
-        result = asr_pipeline("temp.wav")
-        return result["text"]
     except Exception as e:
         logger.error(f"فشل التعرف على الصوت: {str(e)}")
         return ""
 async def generate_response(text: str, user_id: str) -> str:
     try:
-        # تحديث ذاكرة المحادثة
-        conversation_history[user_id].append(text)
-        context = "\n".join(conversation_history[user_id][-3:])
-        chatbot = pipeline(
-            "text-generation",
-            model="aubmindlab/aragpt2-base",
-            token=os.getenv("HF_TOKEN"),
-            max_length=50,
-            temperature=0.7,
-        )
-        response = chatbot(
-            context,
             num_return_sequences=1,
-            pad_token_id=50256
         )
-        return response[0]['generated_text']
     except Exception as e:
         logger.error(f"فشل توليد الرد: {str(e)}")
-        return "حدث خطأ في توليد الرد."
 async def text_to_speech(text: str) -> None:
     try:
-        inputs = tts_tokenizer(text, return_tensors="pt")
-        with torch.no_grad():
-            output = tts_model(**inputs, speaker_id=1)  # اختيار الصوت الأنثوي
-        waveform = output.waveform[0].numpy()
-        sf.write("bot_response.wav", waveform, tts_model.config.sampling_rate)
     except Exception as e:
         logger.error(f"فشل تحويل النص إلى صوت: {str(e)}")
 # ===== دوال التفاعل مع المستخدم =====
 async def start(update: Update, context):
-    await update.message.reply_text("مرحبًا! أنا بوت الدردشة الصوتية الأنثوي 🎤\nأرسل لي رسالة صوتية وسأرد عليك بصوت أنثوي واضح.")
 async def process_voice(update: Update, context):
     try:
-        user_id = update.message.from_user.id
         voice_file = await update.message.voice.get_file()
         await voice_file.download_to_drive("user_voice.ogg")
         user_text = await speech_to_text("user_voice.ogg")
         if not user_text:
             await update.message.reply_text("لم أتمكن من فهم الصوت. يرجى المحاولة مرة أخرى.")
             return
-        bot_response = await generate_response(user_text, str(user_id))
         await text_to_speech(bot_response)
         if enhance_audio("bot_response.wav", "bot_response_enhanced.wav"):
             await update.message.reply_voice("bot_response_enhanced.wav")
         else:
@@ -142,10 +141,7 @@ def run_bot():
     application.add_handler(CommandHandler("start", start))
     application.add_handler(MessageHandler(filters.VOICE, process_voice))
-    application.run_polling(
-        close_loop=False,
-        stop_signals=[]
-    )
 if __name__ == "__main__":
     bot_thread = threading.Thread(target=run_bot, daemon=True)

 import threading
 import numpy as np
 import torch
 import soundfile as sf
 from pydub import AudioSegment
 from telegram import Update
 from telegram.ext import ApplicationBuilder, MessageHandler, filters, CommandHandler
+from transformers import AutoTokenizer, AutoModelForCausalLM
+from TTS.api import TTS
 from huggingface_hub import login
 import asyncio
+import noisereduce as nr
+from scipy.io import wavfile
 # ===== تهيئة التوكن =====
 login(token=os.getenv("HF_TOKEN"))
 # ===== Load models (runs at import time; any failure is logged and re-raised) =====
 try:
+    # 1. Speech model: Coqui XTTS v2 on CPU. NOTE(review): this comment used to say "speech recognition", but the line below builds a TTS (speech synthesis) object.
+    tts = TTS(model_name="tts_models/multilingual/multi-dataset/xtts_v2", progress_bar=False, gpu=False)
+    # 2. Language model and its tokenizer (AraGPT2 mega checkpoint), used to generate replies
+    tokenizer = AutoTokenizer.from_pretrained("aubmindlab/aragpt2-mega")
+    model = AutoModelForCausalLM.from_pretrained("aubmindlab/aragpt2-mega")
 except Exception as e:
     logger.error(f"فشل تحميل النماذج: {str(e)}")
     raise
 # ===== Conversation memory =====
+conversation_history = {}  # user id -> list of that user's most recent messages
+MAX_HISTORY = 3  # number of recent messages kept per user
 # ===== دوال معالجة الصوت =====
 def enhance_audio(input_path: str, output_path: str) -> bool:
     try:
+        # تقليل الضوضاء وتحسين الجودة
+        rate, data = wavfile.read(input_path)
+        reduced_noise = nr.reduce_noise(y=data, sr=rate, stationary=True)
+        normalized = reduced_noise / np.max(np.abs(reduced_noise))
+        wavfile.write(output_path, rate, normalized)
         return True
     except Exception as e:
         logger.error(f"خطأ في تحسين الصوت: {str(e)}")
 async def speech_to_text(audio_path: str) -> str:
     """Transcribe the Arabic speech in *audio_path* and return the text.

     The previous body called ``tts.transcribe(...)``, but the Coqui ``TTS``
     object only synthesizes speech and has no such method, so every call
     raised and the function always returned "". Recognition now goes through
     the ``transformers`` automatic-speech-recognition pipeline with the
     wav2vec2 Arabic checkpoint used by the previous revision of this file.

     Args:
         audio_path: Path to the audio file. The pipeline decodes it with
             ffmpeg, so ffmpeg must be installed on the host.

     Returns:
         The recognized text, or "" if loading or recognition fails.
     """
     try:
         # Local import: transformers is already a dependency of this file,
         # but `pipeline` is not among the names imported at the top.
         from transformers import pipeline

         # Build the recognizer on first use and cache it on the function so
         # the checkpoint is loaded only once per process.
         recognizer = getattr(speech_to_text, "_recognizer", None)
         if recognizer is None:
             recognizer = pipeline(
                 "automatic-speech-recognition",
                 model="jonatasgrosman/wav2vec2-large-xlsr-53-arabic",
             )
             speech_to_text._recognizer = recognizer

         result = recognizer(audio_path)
         return result["text"].strip()
     except Exception as e:
         logger.error(f"فشل التعرف على الصوت: {str(e)}")
         return ""
 async def generate_response(text: str, user_id: str) -> str:
     """Generate the bot's reply to *text* using the user's recent messages.

     The user's last ``MAX_HISTORY`` messages are stored in
     ``conversation_history`` and rendered into a prompt that ends with the
     bot's speaker label, so the model continues with the bot's turn.

     Args:
         text: The user's latest (transcribed) message.
         user_id: Key under which this user's history is stored.

     Returns:
         The first line of the generated continuation, or a fixed apology
         message if generation fails or produces no text.
     """
     fallback = "عذرًا، حدث خطأ ما. يرجى المحاولة لاحقًا."
     try:
         # Conversation memory: append the new message, keep the newest ones.
         history = (conversation_history.get(user_id, []) + [text])[-MAX_HISTORY:]
         conversation_history[user_id] = history

         prompt = "المحادثة:\n" + "\n".join(f"أنت: {msg}" for msg in history) + "\nالبوت:"

         # Calling the tokenizer (rather than .encode) also yields the
         # attention mask, which generate() needs because pad == eos here.
         encoded = tokenizer(prompt, return_tensors="pt", max_length=512, truncation=True)
         prompt_len = encoded["input_ids"].shape[-1]

         outputs = model.generate(
             encoded["input_ids"],
             attention_mask=encoded["attention_mask"],
             # max_length counted the prompt too, so a prompt of 200+ tokens
             # left no room for a reply; budget the new tokens instead.
             max_new_tokens=200,
             # temperature has no effect unless sampling is enabled.
             do_sample=True,
             num_return_sequences=1,
             temperature=0.7,
             repetition_penalty=1.5,
             pad_token_id=tokenizer.eos_token_id,
         )

         # Decode only the newly generated tokens so the prompt can never
         # leak into the reply, then keep the first line (the bot's turn).
         generated = tokenizer.decode(outputs[0][prompt_len:], skip_special_tokens=True)
         lines = generated.strip().split("\n")
         reply = lines[0].strip()

         # An empty reply would make the text-to-speech step fail downstream.
         return reply if reply else fallback
     except Exception as e:
         logger.error(f"فشل توليد الرد: {str(e)}")
         return fallback
 async def text_to_speech(text: str) -> None:
     """Synthesize *text* as Arabic speech into ``bot_response.wav``.

     Any previous ``bot_response.wav`` is removed first, so that a failed
     synthesis cannot leave a stale reply on disk for the caller to send.
     Failures are logged, not raised; the absence of the output file is the
     only signal of failure.

     Args:
         text: The reply to speak. Blank text is rejected without calling
             the model.
     """
     import os  # local import: only this block needs it for file cleanup

     output_path = "bot_response.wav"
     try:
         if os.path.exists(output_path):
             os.remove(output_path)

         if not text or not text.strip():
             logger.error("فشل تحويل النص إلى صوت: نص فارغ")
             return

         tts.tts_to_file(
             text=text,
             file_path=output_path,
             # XTTS v2 ships named studio speakers; "ar_female_1" is not one
             # of them and made every call raise. "Ana Florence" is a
             # built-in female voice.
             speaker="Ana Florence",
             language="ar",
         )
     except Exception as e:
         logger.error(f"فشل تحويل النص إلى صوت: {str(e)}")
 # ===== دوال التفاعل مع المستخدم =====
 async def start(update: Update, context):
     """Handle the /start command by replying with the bot's Arabic greeting."""
     greeting = (
         "مرحبًا! أنا البوت الصوتي الأنثوي 🎤\n"
         "أرسل لي رسالة صوتية وسأرد عليك بصوت أنثوي واضح."
     )
     await update.message.reply_text(greeting)
 async def process_voice(update: Update, context):
     try:
+        user_id = str(update.message.from_user.id)
         voice_file = await update.message.voice.get_file()
         await voice_file.download_to_drive("user_voice.ogg")
+        # تحويل الصوت إلى نص
         user_text = await speech_to_text("user_voice.ogg")
         if not user_text:
             await update.message.reply_text("لم أتمكن من فهم الصوت. يرجى المحاولة مرة أخرى.")
             return
+        # توليد الرد
+        bot_response = await generate_response(user_text, user_id)
+        # تحويل الرد إلى صوت
         await text_to_speech(bot_response)
+        # تحسين الصوت
         if enhance_audio("bot_response.wav", "bot_response_enhanced.wav"):
             await update.message.reply_voice("bot_response_enhanced.wav")
         else:
     application.add_handler(CommandHandler("start", start))
     application.add_handler(MessageHandler(filters.VOICE, process_voice))
+    application.run_polling()
 if __name__ == "__main__":
     bot_thread = threading.Thread(target=run_bot, daemon=True)