Spaces:

atsushieee
/

sovits-test

Running

App Files Files Community

atsushieee committed on Dec 8, 2024

Commit

11646d7

1 Parent(s): 770369d

Update main.py

Browse files

Files changed (1) hide show

main.py +113 -5

main.py CHANGED Viewed

@@ -28,8 +28,116 @@ data = {
 df = pd.DataFrame(data)
-# 入力音声のアップロード
-    input_audio = gr.Audio(
-        label="変換したい音声をアップロード",
-        type="filepath"  # ファイルパスとして取得
-    )

 df = pd.DataFrame(data)
+def create_plot():
+    """Build the interactive scatter plot of the module-level ``df``.
+
+    Column ``x`` is plotted against column ``y`` and every point is
+    labelled with its ``id`` value.
+
+    Returns:
+        The figure created by ``px.scatter`` after styling.
+    """
+    # Purple markers with a darker purple outline.
+    marker_style = dict(
+        size=10,
+        color='#663399',
+        line=dict(color='#4B0082', width=1),
+    )
+    # Both axes show the grid and the zero line; only the fixed ranges differ.
+    x_axis = dict(showgrid=True, zeroline=True, range=[-35, 35])
+    y_axis = dict(showgrid=True, zeroline=True, range=[-30, 30])
+
+    figure = px.scatter(
+        df,
+        x='x',
+        y='y',
+        text='id',
+        title='Interactive Numeric Scatter Plot',
+    )
+    figure.update_traces(marker=marker_style, textposition='top center')
+    # Layout: fixed canvas size, click selection, background colours, axes.
+    figure.update_layout(
+        height=600,
+        width=800,
+        clickmode='event+select',
+        plot_bgcolor='#eeeeee',
+        paper_bgcolor='white',
+        xaxis=x_axis,
+        yaxis=y_axis,
+    )
+    return figure
+def run_main(audio_file, shift, speaker_id):
+    """Run the conversion entry point ``main`` on an uploaded audio file.
+
+    Args:
+        audio_file: Path of the input audio; passed to ``main`` as ``args.wave``.
+        shift: Pitch shift value; passed to ``main`` as ``args.shift``.
+        speaker_id: Speaker number used to pick
+            ``./configs/singers/singerNNNN.npy`` (zero-padded to 4 digits).
+
+    Returns:
+        ``"svc_out.wav"`` when ``main`` finishes without raising, otherwise
+        ``None`` (invalid ``speaker_id`` or any exception from ``main``).
+    """
+    import traceback
+    from types import SimpleNamespace
+
+    print(audio_file)
+
+    # A numeric UI widget may deliver a float (e.g. 1.0) or None; the ``04d``
+    # format spec rejects both, so coerce to int before building the name.
+    try:
+        speaker_str = f"{int(speaker_id):04d}"
+    except (TypeError, ValueError):
+        print(f"Invalid speaker_id: {speaker_id!r}")
+        return None
+
+    args = SimpleNamespace(
+        # Fixed arguments.
+        config="configs/base.yaml",
+        model="./vits_pretrain/sovits5.0.pretrain.pth",
+        spk=f"./configs/singers/singer{speaker_str}.npy",
+        wave=audio_file,
+        shift=shift,
+        # Default values for the optional parameters.
+        ppg=None,
+        vec=None,
+        pit=None,
+        enable_retrieval=False,
+        retrieval_index_prefix="",
+        retrieval_ratio=0.5,
+        n_retrieval_vectors=3,
+        hubert_index_path=None,
+        whisper_index_path=None,
+        debug=False,
+    )
+
+    try:
+        main(args)
+    except Exception:
+        # Keep the "return None on failure" contract, but leave a trace in
+        # the logs instead of discarding the error silently.
+        traceback.print_exc()
+        return None
+    # Path of the audio file handed back to the UI
+    # (presumably written by ``main`` -- confirm).
+    return "svc_out.wav"
+# Build the Gradio interface: plot on the left, conversion controls on the
+# right, converted audio underneath.
+with gr.Blocks() as demo:
+    gr.Markdown("# SVC 音声変換システム")
+    with gr.Row():
+        # Column scales are expected to be integers; 23:20 keeps the
+        # original 1.15:1 width ratio.
+        with gr.Column(scale=23):
+            plot = gr.Plot(value=create_plot())
+        with gr.Column(scale=20):
+            # Upload widget for the input audio.
+            input_audio = gr.Audio(
+                label="変換したい音声をアップロード",
+                type="filepath"  # hand the handler a file path
+            )
+            # Speaker ID selection; precision=0 makes the value an int so it
+            # can be formatted with an integer format spec by the handler.
+            speaker_id = gr.Number(
+                label="Speaker ID (1-56)",
+                value=1,
+                minimum=1,
+                maximum=56,
+                step=1,
+                precision=0
+            )
+            # Pitch shift slider.
+            shift = gr.Slider(
+                minimum=-12,
+                maximum=12,
+                value=0,
+                step=1,
+                label="Pitch Shift（-12から+12の半音）"
+            )
+            # Button that triggers the conversion.
+            run_btn = gr.Button(value="音声変換を実行", variant="primary", size="lg")
+    # Player for the converted audio.
+    output_audio = gr.Audio(label="変換後の音声")
+    run_btn.click(
+        fn=run_main,
+        inputs=[input_audio, shift, speaker_id],
+        outputs=[output_audio]
+    )
+# Launch the application when executed as a script.
+if __name__ == "__main__":
+    demo.launch()