guangyil committed on
Commit
5cf1b23
·
verified ·
1 Parent(s): 6127bfe

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +18 -29
app.py CHANGED
@@ -27,34 +27,27 @@ from huggingface_hub import hf_hub_download
27
  from infer import load_model, eval_model
28
  from spkr import SpeakerEmbedding
29
 
30
- @spaces.GPU
31
- def spkr_model_init():
32
- spkr_model = SpeakerEmbedding(device="cuda")
33
- return spkr_model
34
-
35
- def init_models():
36
- global spkr_model, model, tokenizer, tokenizer_voila, model_type
37
- global default_ref_emb_mask_list, million_voice_ref_emb_mask_list
38
-
39
- spkr_model = spkr_model_init()
40
- model, tokenizer, tokenizer_voila, model_type = load_model("maitrix-org/Voila-chat", "maitrix-org/Voila-Tokenizer")
41
- default_ref_file = "examples/character_ref_emb_demo.pkl"
42
- million_voice_ref_file = hf_hub_download(repo_id="maitrix-org/Voila-million-voice", filename="character_ref_emb_chunk0.pkl", repo_type="dataset")
43
-
44
- default_ref_emb_mask_list = pickle.load(open(default_ref_file, "rb"))
45
- million_voice_ref_emb_mask_list = pickle.load(open(million_voice_ref_file, "rb"))
46
 
47
  instruction = "You are a smart AI agent created by Maitrix.org."
48
  save_path = os.environ.get("GRADIO_TEMP_DIR", tempfile.gettempdir())
49
- default_ref_name = "Homer Simpson"
50
 
51
  intro = """**Voila**
52
 
53
  For more demos, please goto [https://voila.maitrix.org](https://voila.maitrix.org)."""
54
 
 
 
 
55
  def get_ref_embs(ref_audio):
56
  wav, sr = torchaudio.load(ref_audio)
 
57
  ref_embs = spkr_model(wav, sr).cpu()
 
58
  return ref_embs
59
 
60
  def delete_directory(request: gr.Request):
@@ -258,18 +251,14 @@ def get_asr_tab():
258
  )
259
  return asr_tab
260
 
261
- def create_demo():
262
- with gr.Blocks(fill_height=True) as demo:
263
- with gr.Tab("Chat"):
264
- chat_tab = get_chat_tab()
265
- with gr.Tab("TTS"):
266
- tts_tab = get_tts_tab()
267
- with gr.Tab("ASR"):
268
- asr_tab = get_asr_tab()
269
- demo.unload(delete_directory)
270
- return demo
271
 
272
  if __name__ == "__main__":
273
- init_models()
274
- demo = create_demo()
275
  demo.launch()
 
27
  from infer import load_model, eval_model
28
  from spkr import SpeakerEmbedding
29
 
30
+ spkr_model = SpeakerEmbedding(device="cpu")
31
+ model, tokenizer, tokenizer_voila, model_type = load_model("maitrix-org/Voila-chat", "maitrix-org/Voila-Tokenizer")
32
+ default_ref_file = "examples/character_ref_emb_demo.pkl"
33
+ default_ref_name = "Homer Simpson"
34
+ million_voice_ref_file = hf_hub_download(repo_id="maitrix-org/Voila-million-voice", filename="character_ref_emb_chunk0.pkl", repo_type="dataset")
 
 
 
 
 
 
 
 
 
 
 
35
 
36
  instruction = "You are a smart AI agent created by Maitrix.org."
37
  save_path = os.environ.get("GRADIO_TEMP_DIR", tempfile.gettempdir())
 
38
 
39
  intro = """**Voila**
40
 
41
  For more demos, please goto [https://voila.maitrix.org](https://voila.maitrix.org)."""
42
 
43
+ default_ref_emb_mask_list = pickle.load(open(default_ref_file, "rb"))
44
+ million_voice_ref_emb_mask_list = pickle.load(open(million_voice_ref_file, "rb"))
45
+
46
  def get_ref_embs(ref_audio):
47
  wav, sr = torchaudio.load(ref_audio)
48
+ spkr_model.to("cuda")
49
  ref_embs = spkr_model(wav, sr).cpu()
50
+ spkr_model.to("cpu")
51
  return ref_embs
52
 
53
  def delete_directory(request: gr.Request):
 
251
  )
252
  return asr_tab
253
 
254
+ with gr.Blocks(fill_height=True) as demo:
255
+ with gr.Tab("Chat"):
256
+ chat_tab = get_chat_tab()
257
+ with gr.Tab("TTS"):
258
+ tts_tab = get_tts_tab()
259
+ with gr.Tab("ASR"):
260
+ asr_tab = get_asr_tab()
261
+ demo.unload(delete_directory)
 
 
262
 
263
  if __name__ == "__main__":
 
 
264
  demo.launch()