atlury committed
Commit 0f941de · verified · 1 Parent(s): 59ff6b9

Update index.html

Files changed (1)
  1. index.html +106 -62
index.html CHANGED
@@ -1,63 +1,107 @@
- <!DOCTYPE html>
- <html lang="en">
- <head>
- <meta charset="UTF-8">
- <meta name="viewport" content="width=device-width, initial-scale=1.0">
- <title>Voice Activity Detection Demo</title>
- <script src="https://cdn.jsdelivr.net/npm/onnxruntime-web/dist/ort.min.js"></script>
- <script src="https://cdn.tailwindcss.com"></script>
- <script>
- ort.env.wasm.wasmPaths = 'https://cdn.jsdelivr.net/npm/onnxruntime-web/dist/';
- </script>
- </head>
- <body>
- <main class="flex min-h-screen flex-col items-center justify-between p-24">
- <div class="text-center">
- <div id="status" class="text-4xl mb-4">🔇 Not Listening</div>
- <div id="audioList" class="space-y-4"></div>
- </div>
- </main>
-
- <script type="module">
- import { SpeechChunks } from './SpeechChunks.js';
-
- let speechChunks;
-
- function updateStatus(isListening) {
- document.getElementById('status').textContent = isListening ? "🎙️ Listening..." : "🔇 Not Listening";
- }
-
- function addAudioToList(blob) {
- const audioList = document.getElementById('audioList');
- const audio = document.createElement('audio');
- audio.controls = true;
- audio.src = URL.createObjectURL(blob);
- audio.onended = () => URL.revokeObjectURL(audio.src);
- audioList.appendChild(audio);
- }
-
- async function initializeSpeechChunks() {
- try {
- speechChunks = new SpeechChunks(
- () => {
- console.log("speech start");
- updateStatus(true);
- },
- (blob) => {
- console.log("speech end");
- updateStatus(false);
- addAudioToList(blob);
- }
- );
- await speechChunks.start();
- } catch (error) {
- console.error("Error initializing SpeechChunks:", error);
- updateStatus(false);
- document.getElementById('status').textContent = "Error: " + error.message;
- }
- }
-
- initializeSpeechChunks();
- </script>
- </body>
+ <!DOCTYPE html>
+ <html lang="en">
+ <head>
+ <meta charset="UTF-8">
+ <meta name="viewport" content="width=device-width, initial-scale=1.0">
+ <title>Voice Chat Bot</title>
+ <script src="https://cdn.jsdelivr.net/npm/onnxruntime-web/dist/ort.js"></script>
+ <script src="https://cdn.jsdelivr.net/npm/@ricky0123/vad-web/dist/bundle.min.js"></script>
+ <script src="https://cdn.jsdelivr.net/npm/@xenova/transformers"></script>
+ <style>
+ body { font-family: Arial, sans-serif; max-width: 800px; margin: 0 auto; padding: 20px; }
+ button { font-size: 18px; padding: 10px 20px; margin: 10px 0; }
+ #conversation { border: 1px solid #ccc; padding: 10px; height: 300px; overflow-y: scroll; margin-bottom: 10px; }
+ </style>
+ </head>
+ <body>
+ <h1>Voice Chat Bot</h1>
+ <div id="conversation"></div>
+ <button id="startButton">Start Listening</button>
+ <button id="stopButton" disabled>Stop Listening</button>
+
+ <script type="module">
+ import { pipeline } from 'https://cdn.jsdelivr.net/npm/@xenova/transformers';
+
+ const conversationDiv = document.getElementById('conversation');
+ const startButton = document.getElementById('startButton');
+ const stopButton = document.getElementById('stopButton');
+
+ let myvad;
+ let sttPipeline;
+ let ttsPipeline;
+
+ async function initializePipelines() {
+ sttPipeline = await pipeline('automatic-speech-recognition', 'Xenova/whisper-tiny.en');
+ ttsPipeline = await pipeline('text-to-speech', 'Xenova/speecht5_tts');
+ }
+
+ async function processSpeech(audio) {
+ try {
+ const transcription = await sttPipeline(audio);
+ addMessage('User', transcription.text);
+
+ // Placeholder for LLM response
+ const botResponse = `I heard you say: "${transcription.text}". This is a placeholder response.`;
+ addMessage('Bot', botResponse);
+
+ const speechOutput = await ttsPipeline(botResponse);
+ playAudio(speechOutput.audio);
+ } catch (error) {
+ console.error('Error processing speech:', error);
+ }
+ }
+
+ function addMessage(sender, message) {
+ const messageElement = document.createElement('p');
+ messageElement.innerHTML = `<strong>${sender}:</strong> ${message}`;
+ conversationDiv.appendChild(messageElement);
+ conversationDiv.scrollTop = conversationDiv.scrollHeight;
+ }
+
+ function playAudio(audioArray) {
+ const audioContext = new (window.AudioContext || window.webkitAudioContext)();
+ const audioBuffer = audioContext.createBuffer(1, audioArray.length, 16000);
+ const channelData = audioBuffer.getChannelData(0);
+ channelData.set(audioArray);
+
+ const source = audioContext.createBufferSource();
+ source.buffer = audioBuffer;
+ source.connect(audioContext.destination);
+ source.start();
+ }
+
+ async function startListening() {
+ try {
+ myvad = await vad.MicVAD.new({
+ onSpeechEnd: (audio) => {
+ processSpeech(audio);
+ }
+ });
+ await myvad.start();
+ startButton.disabled = true;
+ stopButton.disabled = false;
+ addMessage('System', 'Listening...');
+ } catch (error) {
+ console.error('Error starting VAD:', error);
+ }
+ }
+
+ function stopListening() {
+ if (myvad) {
+ myvad.stop();
+ startButton.disabled = false;
+ stopButton.disabled = true;
+ addMessage('System', 'Stopped listening.');
+ }
+ }
+
+ startButton.addEventListener('click', startListening);
+ stopButton.addEventListener('click', stopListening);
+
+ // Initialize pipelines when the page loads
+ initializePipelines().then(() => {
+ addMessage('System', 'Voice Chat Bot initialized. Click "Start Listening" to begin.');
+ });
+ </script>
+ </body>
  </html>
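
Two notes on the new audio path; neither is part of this commit. In transformers.js, the SpeechT5 text-to-speech pipeline takes speaker embeddings as a call-time option, and its output object reports its own sampling rate. A minimal sketch of a synthesis call that accounts for both, assuming the example x-vector file from the transformers.js docs (any 512-dimensional speaker embedding should work):

// Sketch only, not part of the commit above.
// The embeddings URL is the example file from the transformers.js docs.
const speaker_embeddings = 'https://huggingface.co/datasets/Xenova/transformers.js-docs/resolve/main/speaker_embeddings.bin';
const speechOutput = await ttsPipeline(botResponse, { speaker_embeddings });

// The result is { audio: Float32Array, sampling_rate: number }, so playback
// can use the reported rate rather than the hard-coded 16000 in playAudio().
const ctx = new (window.AudioContext || window.webkitAudioContext)();
const buffer = ctx.createBuffer(1, speechOutput.audio.length, speechOutput.sampling_rate);
buffer.getChannelData(0).set(speechOutput.audio);
const source = ctx.createBufferSource();
source.buffer = buffer;
source.connect(ctx.destination);
source.start();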
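
On the input side, vad.MicVAD's onSpeechEnd callback hands over the captured utterance as a Float32Array of 16 kHz samples, which is the raw-audio format the Whisper pipeline accepts directly, so processSpeech(audio) should need no decoding or resampling step in between.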