Commit · 37f38b2
1 Parent(s): 6909f3d

feat: add coop in header
app.py CHANGED
@@ -1,24 +1,27 @@
 import json
 
 import gradio as gr
-from omegaconf import OmegaConf
 from huggingface_hub import snapshot_download
-from …
+from omegaconf import OmegaConf
+from vosk import KaldiRecognizer, Model
+
 
 def load_vosk(model_id: str):
     model_dir = snapshot_download(model_id)
     return Model(model_path=model_dir)
 
+
 OmegaConf.register_new_resolver("load_vosk", load_vosk)
 
 models_config = OmegaConf.to_object(OmegaConf.load("configs/models.yaml"))
 
+
 def automatic_speech_recognition(model_id: str, dialect_id: str, audio_data: str):
     if isinstance(models_config[model_id]["model"], dict):
         model = models_config[model_id]["model"][dialect_id]
-    else:
+    else:
         model = models_config[model_id]["model"]
-
+
     sample_rate, audio_array = audio_data
     if audio_array.ndim == 2:
         audio_array = audio_array[:, 0]
@@ -30,14 +33,14 @@ def automatic_speech_recognition(model_id: str, dialect_id: str, audio_data: str
     rec.SetWords(True)
 
     results = []
-
+
     for start in range(0, len(audio_bytes), 4000):
         end = min(start + 4000, len(audio_bytes))
         data = audio_bytes[start:end]
         if rec.AcceptWaveform(data):
             raw_result = json.loads(rec.Result())
             results.append(raw_result)
-
+
     final_result = json.loads(rec.FinalResult())
     results.append(final_result)
 
@@ -48,7 +51,6 @@ def automatic_speech_recognition(model_id: str, dialect_id: str, audio_data: str
         if len(result["text"]) > 0:
             filtered_lines.append(result["text"])
 
-
     return "，".join(filtered_lines) + "。"
 
 
@@ -113,6 +115,8 @@ with demo:
         ### 研發
         - **[李鴻欣 Hung-Shin Lee](mailto:[email protected])([聯和科創](https://www.104.com.tw/company/1a2x6bmu75))**
        - **[陳力瑋 Li-Wei Chen](mailto:[email protected])([聯和科創](https://www.104.com.tw/company/1a2x6bmu75))**
+        ### 合作單位
+        - **[國立聯合大學智慧客家實驗室](https://www.gohakka.org)**
         """
     )
     gr.Interface(
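The hunks above show only the changed lines. Two things they depend on are not visible in the diff: the configs/models.yaml entries that hand a Vosk model to the app through the new load_vosk resolver, and the conversion of Gradio's audio tuple into the audio_bytes fed to KaldiRecognizer. The following is a minimal sketch of how those pieces might fit together; the repository id is a placeholder, and the in-memory config merely stands in for configs/models.yaml.

import json

import numpy as np
from huggingface_hub import snapshot_download
from omegaconf import OmegaConf
from vosk import KaldiRecognizer, Model


def load_vosk(model_id: str):
    # Download the model repository from the Hub and point Vosk at the local copy.
    model_dir = snapshot_download(model_id)
    return Model(model_path=model_dir)


OmegaConf.register_new_resolver("load_vosk", load_vosk)

# Stand-in for configs/models.yaml: ${load_vosk:...} is evaluated when the config
# is materialised, so the value becomes a loaded vosk.Model instance.
# "some-org/some-vosk-model" is a placeholder, not a real repository.
config = OmegaConf.create(
    {"demo-model": {"model": "${load_vosk:some-org/some-vosk-model}"}}
)
models_config = OmegaConf.to_object(config)

# Gradio's numpy audio component yields (sample_rate, int16 array); Vosk expects
# 16-bit mono PCM bytes at that sample rate, fed in small chunks.
sample_rate = 16000
audio_array = np.zeros(sample_rate, dtype=np.int16)  # one second of silence
audio_bytes = audio_array.tobytes()

rec = KaldiRecognizer(models_config["demo-model"]["model"], sample_rate)
rec.SetWords(True)

results = []
for start in range(0, len(audio_bytes), 4000):
    data = audio_bytes[start:start + 4000]
    if rec.AcceptWaveform(data):
        results.append(json.loads(rec.Result()))
results.append(json.loads(rec.FinalResult()))

print([r.get("text", "") for r in results])

The 4000-byte step mirrors the chunk size used in app.py; at 16 kHz, 16-bit mono audio that is 125 ms per call to AcceptWaveform.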