Gregniuki committed on
Commit
a3f47ba
·
verified ·
1 Parent(s): 23673a8

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -8
app.py CHANGED
@@ -52,7 +52,7 @@ vocos = Vocos.from_pretrained("charactr/vocos-mel-24khz")
52
  target_sample_rate = 24000
53
  n_mel_channels = 100
54
  hop_length = 256
55
- target_rms = 0.15
56
  nfe_step = 8 # 16, 32
57
  cfg_strength = 2.0
58
  ode_method = "euler"
@@ -274,13 +274,7 @@ def infer(ref_audio_orig, ref_text, gen_text, exp_name, remove_silence, cross_fa
274
 
275
  if not ref_text.strip():
276
  gr.Info("No reference text provided, transcribing reference audio...")
277
- ref_text = pipe(
278
- ref_audio,
279
- chunk_length_s=30,
280
- batch_size=128,
281
- generate_kwargs={"task": "transcribe"},
282
- return_timestamps=False,
283
- )["text"].strip()
284
  gr.Info("Finished transcription")
285
  else:
286
  gr.Info("Using custom reference text...")
 
52
  target_sample_rate = 24000
53
  n_mel_channels = 100
54
  hop_length = 256
55
+ target_rms = 0.1
56
  nfe_step = 8 # 16, 32
57
  cfg_strength = 2.0
58
  ode_method = "euler"
 
274
 
275
  if not ref_text.strip():
276
  gr.Info("No reference text provided, transcribing reference audio...")
277
+ ref_text = gen_text
 
 
 
 
 
 
278
  gr.Info("Finished transcription")
279
  else:
280
  gr.Info("Using custom reference text...")