Spaces:

2506minecraft
/

Arabic-Chatbot

Running

App Files Files Community

2506minecraft committed 13 days ago

Commit

fd24c4a

verified ·

1 Parent(s): c51d569

Update app.py

Browse files

Files changed (1) hide show

app.py +17 -11

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ import soundfile as sf
 from pydub import AudioSegment
 from telegram import Update
 from telegram.ext import ApplicationBuilder, MessageHandler, filters, CommandHandler
-from transformers import pipeline
 from huggingface_hub import login
 import asyncio
 from collections import defaultdict
@@ -32,8 +32,15 @@ try:
         token=os.getenv("HF_TOKEN")
     )
-    # 2. نموذج توليف الصوت
-    tts_pipeline = pipeline("text-to-speech", model="mohamedhossam/arabic-tts", token=os.getenv("HF_TOKEN"))
 except Exception as e:
     logger.error(f"فشل تحميل النماذج: {str(e)}")
@@ -84,15 +91,18 @@ async def generate_response(text: str, user_id: str) -> str:
             num_return_sequences=1,
             pad_token_id=50256
         )
-        return response[0]['generated_text'].strip()  # إزالة المسافات الزائدة
     except Exception as e:
         logger.error(f"فشل توليد الرد: {str(e)}")
         return "حدث خطأ في توليد الرد."
 async def text_to_speech(text: str) -> None:
     try:
-        audio = tts_pipeline(text)
-        sf.write("bot_response.wav", audio["audio"], 22050)  # تأكد من استخدام معدل العينة الصحيح
     except Exception as e:
         logger.error(f"فشل تحويل النص إلى صوت: {str(e)}")
@@ -107,12 +117,8 @@ async def process_voice(update: Update, context):
         await voice_file.download_to_drive("user_voice.ogg")
         user_text = await speech_to_text("user_voice.ogg")
-        if not user_text:
-            await update.message.reply_text("لم أتمكن من فهم الصوت. يرجى المحاولة مرة أخرى.")
-            return
         bot_response = await generate_response(user_text, str(user_id))
-        await text_to speech(bot_response)
         if enhance_audio("bot_response.wav", "bot_response_enhanced.wav"):
             await update.message.reply_voice("bot_response_enhanced.wav")

 from pydub import AudioSegment
 from telegram import Update
 from telegram.ext import ApplicationBuilder, MessageHandler, filters, CommandHandler
+from transformers import pipeline, AutoTokenizer, VitsModel
 from huggingface_hub import login
 import asyncio
 from collections import defaultdict
         token=os.getenv("HF_TOKEN")
     )
+    # 2. نموذج توليف الصوت الأنثوي (الاسم الصحيح)
+    tts_tokenizer = AutoTokenizer.from_pretrained(
+        "facebook/mms-tts-ara",  # تم تغيير النموذج إلى فيسبوك MMS
+        token=os.getenv("HF_TOKEN")
+    )
+    tts_model = VitsModel.from_pretrained(
+        "facebook/mms-tts-ara",
+        token=os.getenv("HF_TOKEN")
+    )
 except Exception as e:
     logger.error(f"فشل تحميل النماذج: {str(e)}")
             num_return_sequences=1,
             pad_token_id=50256
         )
+        return response[0]['generated_text']
     except Exception as e:
         logger.error(f"فشل توليد الرد: {str(e)}")
         return "حدث خطأ في توليد الرد."
 async def text_to_speech(text: str) -> None:
     try:
+        inputs = tts_tokenizer(text, return_tensors="pt")
+        with torch.no_grad():
+            output = tts_model(**inputs, speaker_id=1)  # اختيار الصوت الأنثوي
+        waveform = output.waveform[0].numpy()
+        sf.write("bot_response.wav", waveform, tts_model.config.sampling_rate)
     except Exception as e:
         logger.error(f"فشل تحويل النص إلى صوت: {str(e)}")
         await voice_file.download_to_drive("user_voice.ogg")
         user_text = await speech_to_text("user_voice.ogg")
         bot_response = await generate_response(user_text, str(user_id))
+        await text_to_speech(bot_response)
         if enhance_audio("bot_response.wav", "bot_response_enhanced.wav"):
             await update.message.reply_voice("bot_response_enhanced.wav")