Spaces:
Running
Running
File size: 1,796 Bytes
17263d1 ba051ef 17263d1 ba051ef 17263d1 ba051ef 17263d1 ba051ef 17263d1 ba051ef 17263d1 ba051ef 17263d1 ba051ef 17263d1 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 |
#!/usr/bin/python3
# -*- coding: utf-8 -*-
import argparse
import shutil
from gradio_client import Client, handle_file
# Active language pair. Both names are interpolated into the default file
# paths built in get_args(): language1 is the folder name and language2 is
# used in the wav file names.
#
# Other pairs that have been used (swap one in to switch language):
#   "英语",     "English"
#   "西班牙语", "Spanish"
#   "葡萄牙语", "Portuguese"
#   "韩语",     "Korean"
#   "阿拉伯语", "Arabic"
#   "中国台湾", "Chinese"
language1, language2 = "日语", "Japanese"
def get_args() -> argparse.Namespace:
    """Parse the command-line options of this script.

    Options (all optional, all strings):
        --text         Text to synthesise.
        --reference    Path of the reference wav used for voice cloning.
        --output_file  Path the synthesised wav is written to.

    The default paths are derived from the module-level ``language1``
    (folder name) and ``language2`` (file-name part).

    Returns:
        The namespace produced by ``ArgumentParser.parse_args()``.
    """
    # Sample texts used for other languages:
    #   "thirty-three dollars and seventy-two cents"
    #   "treinta y tres euros con setenta y dos céntimos"
    #   "33.72 درهم"
    #   "三十三元七角两分"
    default_text = "33.72円"
    default_reference = rf"E:\牛信文档\语音克隆\多语种语音克隆\money_num\{language1}\{language2}_1.wav"
    default_output = rf"E:\牛信文档\语音克隆\多语种语音克隆\money_num\{language1}\xtts_v2_{language2.lower()}_2.wav"

    arg_parser = argparse.ArgumentParser()
    arg_parser.add_argument("--text", default=default_text, type=str)
    arg_parser.add_argument("--reference", default=default_reference, type=str)
    arg_parser.add_argument("--output_file", default=default_output, type=str)
    return arg_parser.parse_args()
def main():
    """Synthesise the requested text with the hosted XTTS Space and save it.

    Reads the options from get_args(), sends a single prediction request to
    the Gradio Space and moves the returned audio file to
    ``args.output_file``.

    Raises:
        OSError: if the destination folder cannot be created or the
            synthesised file cannot be moved.
    """
    # Local import so this function does not depend on the module's import block.
    from pathlib import Path

    args = get_args()

    # Create the destination folder before the (slow) remote call, so an
    # unusable output path fails early instead of after the synthesis.
    Path(args.output_file).parent.mkdir(parents=True, exist_ok=True)

    # NOTE(review): this is a replica-specific URL and may stop resolving
    # when the Space restarts - confirm it is still valid.
    client = Client("https://coqui-xtts.hf.space/--replicas/o7bhl/")

    # Four values come back; only the second one is used, as a file path.
    _, synthesised_audio, _, _ = client.predict(
        args.text,
        # Language code sent to the Space. Codes used for the other
        # languages: "en", "es", "pt", "ko", "ar", "zh-cn".
        # NOTE(review): presumably must match language2 - keep in sync.
        "ja",
        # The reference wav is passed twice.
        # NOTE(review): presumably the uploaded-file and microphone inputs.
        args.reference,
        args.reference,
        # NOTE(review): meaning of these four flags is not visible here;
        # confirm against the Space's API page.
        False, False, True, True,
        fn_index=1,
    )

    shutil.move(synthesised_audio, args.output_file)
# Run the synthesis only when this file is executed as a script.
if __name__ == "__main__":
    main()
|