Spaces:

AvtnshM
/

Indic_ASR

Runtime error

App Files Community

AvtnshM committed on Aug 29

Commit

96f2af5

verified ·

1 Parent(s): ffdd72d

V6.0

Browse files

Files changed (1) hide show

app.py +41 -4

app.py CHANGED Viewed

@@ -13,12 +13,29 @@ def load_model():
     """Load the AI4Bharat IndicConformer model"""
     try:
         print("Loading AI4Bharat IndicConformer model...")
-        model = AutoModel.from_pretrained(model_name, trust_remote_code=True)
         print("✅ Model loaded successfully!")
         return model
     except Exception as e:
         print(f"❌ Error loading model: {e}")
-        return None
 # Load the model
 model = load_model()
@@ -137,6 +154,8 @@ with gr.Blocks(title="भारतीय भाषा स्पीच टू ट
         **मॉडल स्थिति (Model Status):** {model_status}
         AI4Bharat के बहुभाषी मॉडल का उपयोग करके भाषण को टेक्स्ट में बदलें।
         (Convert speech to text using AI4Bharat's multilingual model.)
@@ -190,6 +209,7 @@ with gr.Blocks(title="भारतीय भाषा स्पीच टू ट
                 with gr.Row():
                     mic_submit_btn = gr.Button("🔄 ट्रांसक्राइब करें", variant="primary", size="lg")
                     clear_mic_btn = gr.Button("🗑️ साफ़ करें", variant="secondary")
             with gr.Column(scale=1):
                 mic_output = gr.Textbox(
@@ -197,7 +217,8 @@ with gr.Blocks(title="भारतीय भाषा स्पीच टू ट
                     placeholder="रिकॉर्डिंग के बाद आपका ट्रांस्क्रिप्शन यहाँ दिखाई देगा...",
                     lines=8,
                     max_lines=15,
-                    interactive=False
                 )
         # Button actions for microphone tab
@@ -218,6 +239,13 @@ with gr.Blocks(title="भारतीय भाषा स्पीच टू ट
             lambda: (None, ""),
             outputs=[microphone_input, mic_output]
         )
     with gr.Tab("📁 फ़ाइल अपलोड (File Upload)"):
         gr.Markdown("### ट्रांस्क्रिप्शन के लिए एक ऑडियो फ़ाइल अपलोड करें")
@@ -235,6 +263,7 @@ with gr.Blocks(title="भारतीय भाषा स्पीच टू ट
                 with gr.Row():
                     file_submit_btn = gr.Button("🔄 फ़ाइल ट्रांसक्राइब करें", variant="primary", size="lg")
                     clear_file_btn = gr.Button("🗑️ साफ़ करें", variant="secondary")
             with gr.Column(scale=1):
                 file_output = gr.Textbox(
@@ -242,7 +271,8 @@ with gr.Blocks(title="भारतीय भाषा स्पीच टू ट
                     placeholder="एक ऑडियो फ़ाइल अपलोड करें और ट्रांसक्राइब पर क्लिक करें...",
                     lines=8,
                     max_lines=15,
-                    interactive=False
                 )
         # Button actions for file tab
@@ -256,6 +286,13 @@ with gr.Blocks(title="भारतीय भाषा स्पीच टू ट
             lambda: (None, ""),
             outputs=[file_input, file_output]
         )
     gr.Markdown(
         f"""

     """Load the AI4Bharat IndicConformer model"""
     try:
         print("Loading AI4Bharat IndicConformer model...")
+        print("This may take 2-3 minutes for first time download...")
+        # Load model with low memory usage
+        model = AutoModel.from_pretrained(
+            model_name,
+            trust_remote_code=True,
+            torch_dtype=torch.float32,
+            low_cpu_mem_usage=True
+        )
         print("✅ Model loaded successfully!")
         return model
     except Exception as e:
         print(f"❌ Error loading model: {e}")
+        print("Trying alternative loading method...")
+        try:
+            # Fallback: Load without low memory optimization
+            model = AutoModel.from_pretrained(model_name, trust_remote_code=True)
+            print("✅ Model loaded with fallback method!")
+            return model
+        except Exception as e2:
+            print(f"❌ All loading methods failed: {e2}")
+            return None
 # Load the model
 model = load_model()
         **मॉडल स्थिति (Model Status):** {model_status}
+        {'⏳ **पहली बार लोड हो रहा है - कृपया 2-3 मिनट प्रतीक्षा करें (First time loading - please wait 2-3 minutes)**' if model is None else ''}
         AI4Bharat के बहुभाषी मॉडल का उपयोग करके भाषण को टेक्स्ट में बदलें।
         (Convert speech to text using AI4Bharat's multilingual model.)
                 with gr.Row():
                     mic_submit_btn = gr.Button("🔄 ट्रांसक्राइब करें", variant="primary", size="lg")
                     clear_mic_btn = gr.Button("🗑️ साफ़ करें", variant="secondary")
+                    copy_mic_btn = gr.Button("📋 कॉपी करें", variant="secondary")
             with gr.Column(scale=1):
                 mic_output = gr.Textbox(
                     placeholder="रिकॉर्डिंग के बाद आपका ट्रांस्क्रिप्शन यहाँ दिखाई देगा...",
                     lines=8,
                     max_lines=15,
+                    interactive=True,  # Enable text selection and copying
+                    show_copy_button=True  # Add copy button
                 )
         # Button actions for microphone tab
             lambda: (None, ""),
             outputs=[microphone_input, mic_output]
         )
+        # Copy functionality for microphone tab
+        copy_mic_btn.click(
+            lambda x: x,  # Return the same text to enable copying
+            inputs=mic_output,
+            outputs=mic_output
+        )
     with gr.Tab("📁 फ़ाइल अपलोड (File Upload)"):
         gr.Markdown("### ट्रांस्क्रिप्शन के लिए एक ऑडियो फ़ाइल अपलोड करें")
                 with gr.Row():
                     file_submit_btn = gr.Button("🔄 फ़ाइल ट्रांसक्राइब करें", variant="primary", size="lg")
                     clear_file_btn = gr.Button("🗑️ साफ़ करें", variant="secondary")
+                    copy_file_btn = gr.Button("📋 कॉपी करें", variant="secondary")
             with gr.Column(scale=1):
                 file_output = gr.Textbox(
                     placeholder="एक ऑडियो फ़ाइल अपलोड करें और ट्रांसक्राइब पर क्लिक करें...",
                     lines=8,
                     max_lines=15,
+                    interactive=True,  # Enable text selection and copying
+                    show_copy_button=True  # Add copy button
                 )
         # Button actions for file tab
             lambda: (None, ""),
             outputs=[file_input, file_output]
         )
+        # Copy functionality for file tab
+        copy_file_btn.click(
+            lambda x: x,  # Return the same text to enable copying
+            inputs=file_output,
+            outputs=file_output
+        )
     gr.Markdown(
         f"""