Spaces:

GamerC0der
/

test-2

Sleeping

App Files Community

GamerC0der committed on Jan 8

Commit

afc5457

verified ·

1 Parent(s): 93e926b

Update app.py

Browse files

Files changed (1) hide show

app.py +119 -3

app.py CHANGED Viewed

@@ -32,7 +32,7 @@ MAIN_HTML = """
     <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css">
 </head>
 <body>
-    <h1>Multi-Modal Playground (No JS)</h1>
     <h2>STT (Nova-3)</h2>
     <form action="/stt" method="post" enctype="multipart/form-data">
@@ -55,12 +55,125 @@ MAIN_HTML = """
         <button type="submit">Send</button>
     </form>
     <hr>
     <a href="/">Refresh Playground</a>
 </body>
 </html>
 """
 STT_RESULT_HTML = """
 <!DOCTYPE html>
 <html>
@@ -110,12 +223,16 @@ class Handler(http.server.BaseHTTPRequestHandler):
             self.send_header("Content-type", "text/html")
             self.end_headers()
             self.wfile.write(MAIN_HTML.encode())
         else:
             self.send_error(404)
     def do_POST(self):
         if self.path == '/api/stt':
-            # Keep old API endpoint for compatibility (though not used in JS-less)
             content_length = int(self.headers['Content-Length'])
             body = self.rfile.read(content_length)
             r = requests.post(STT_URL, data=body, impersonate="chrome")
@@ -200,7 +317,6 @@ class Handler(http.server.BaseHTTPRequestHandler):
                     return
             self.send_error(400, "No message provided")
-        # Keep old /api/tts and /api/chat for compatibility (though not used)
         elif self.path == '/api/tts':
             content_length = int(self.headers['Content-Length'])
             body_str = self.rfile.read(content_length).decode('utf-8')

     <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css">
 </head>
 <body>
+    <h1>Multi-Modal Playground</h1>
     <h2>STT (Nova-3)</h2>
     <form action="/stt" method="post" enctype="multipart/form-data">
         <button type="submit">Send</button>
     </form>
+    <h2>Voice Chat</h2>
+    <p><a href="/voicechat">Go to Voice Chat</a></p>
     <hr>
     <a href="/">Refresh Playground</a>
 </body>
 </html>
 """
+# Voice chat page: records microphone audio in the browser, then calls
+# /api/stt, /api/chat and /api/tts in turn and plays the returned audio.
+# This must be a raw string so the JavaScript regex escapes (\*, \n) reach
+# the browser verbatim; in a normal string Python would turn \n into a real
+# newline inside the /\n/g literal, which is a JavaScript syntax error.
+VOICECHAT_HTML = r"""
+<!DOCTYPE html>
+<html>
+<head>
+    <title>Voice Chat</title>
+    <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css">
+</head>
+<body>
+    <h1>Voice Chat</h1>
+    <div id="messages" style="height:300px;overflow-y:scroll;border:1px solid #ccc;padding:10px;margin-bottom:10px;background:#eee;"></div>
+    <button id="micBtn" onclick="toggleRecord()" style="font-size:48px;"><i class="fas fa-microphone"></i></button>
+    <p>Status: <span id="statusVoice">Click to start recording</span></p>
+    <audio id="voicePlayer" style="display:none;"></audio>
+    <p><a href="/">Back to Playground</a></p>
+    <script>
+        let chatMessages = [];
+        let mediaRecorder;
+        let audioChunks = [];
+        let voiceStream;
+        // Neutralise HTML metacharacters so transcript/model text cannot inject markup.
+        function escapeHTML(text) {
+            return text.replace(/&/g, '&amp;')
+                       .replace(/</g, '&lt;')
+                       .replace(/>/g, '&gt;');
+        }
+        // Minimal markdown: **bold**, *italic*, `code` and line breaks.
+        // Escaping happens first; the tags added below are the only markup emitted.
+        function renderMD(text) {
+            return escapeHTML(text).replace(/\*\*(.*?)\*\*/g, '<b>$1</b>')
+                       .replace(/\*(.*?)\*/g, '<i>$1</i>')
+                       .replace(/`(.*?)`/g, '<code>$1</code>')
+                       .replace(/\n/g, '<br>');
+        }
+        function addMessage(role, content) {
+            const div = document.getElementById('messages');
+            const msg = document.createElement('div');
+            msg.innerHTML = `<strong>${role}:</strong> ${renderMD(content)}`;
+            div.appendChild(msg);
+            div.scrollTop = div.scrollHeight;
+        }
+        // Start recording when idle; otherwise stop, which triggers processVoice via onstop.
+        async function toggleRecord() {
+            const btn = document.getElementById('micBtn');
+            if (!mediaRecorder || mediaRecorder.state === 'inactive') {
+                try {
+                    voiceStream = await navigator.mediaDevices.getUserMedia({audio: true});
+                    mediaRecorder = new MediaRecorder(voiceStream);
+                    audioChunks = [];
+                    mediaRecorder.ondataavailable = e => audioChunks.push(e.data);
+                    mediaRecorder.onstop = processVoice;
+                    mediaRecorder.start();
+                    btn.style.color = 'red';
+                    document.getElementById('statusVoice').innerText = 'Recording... Click to stop';
+                } catch (e) {
+                    console.error('Mic error:', e);
+                    document.getElementById('statusVoice').innerText = 'Error accessing mic';
+                }
+            } else {
+                mediaRecorder.stop();
+                btn.style.color = 'black';
+                document.getElementById('statusVoice').innerText = 'Processing...';
+            }
+        }
+        // Pipeline for one utterance: speech-to-text, chat completion, text-to-speech, playback.
+        async function processVoice() {
+            const audioBlob = new Blob(audioChunks, {type: 'audio/webm'});
+            // Release the microphone as soon as the recording has been captured.
+            if (voiceStream) {
+                voiceStream.getTracks().forEach(track => track.stop());
+            }
+            document.getElementById('statusVoice').innerText = 'Transcribing...';
+            try {
+                const sttRes = await fetch('/api/stt', {method: 'POST', body: audioBlob});
+                const sttData = await sttRes.json();
+                let userText = '';
+                if (sttData.results && sttData.results.channels && sttData.results.channels[0] &&
+                    sttData.results.channels[0].alternatives && sttData.results.channels[0].alternatives[0]) {
+                    userText = sttData.results.channels[0].alternatives[0].transcript;
+                }
+                if (!userText) {
+                    document.getElementById('statusVoice').innerText = 'No speech detected';
+                    return;
+                }
+                addMessage('user', userText);
+                chatMessages.push({role: 'user', content: userText});
+                document.getElementById('statusVoice').innerText = 'Thinking...';
+                const chatRes = await fetch('/api/chat', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json'},
+                    body: JSON.stringify({messages: chatMessages})
+                });
+                const chatData = await chatRes.json();
+                const response = chatData.response;
+                addMessage('assistant', response);
+                chatMessages.push({role: 'assistant', content: response});
+                document.getElementById('statusVoice').innerText = 'Generating speech...';
+                const ttsRes = await fetch('/api/tts', {
+                    method: 'POST',
+                    headers: {'Content-Type': 'application/json'},
+                    body: JSON.stringify({text: response})
+                });
+                const ttsData = await ttsRes.json();
+                const audioPlayer = document.getElementById('voicePlayer');
+                audioPlayer.src = 'data:audio/webm;base64,' + ttsData.audio;
+                audioPlayer.play();
+                document.getElementById('statusVoice').innerText = 'Done';
+            } catch (e) {
+                console.error('Voice process error:', e);
+                document.getElementById('statusVoice').innerText = 'Error';
+            }
+        }
+    </script>
+</body>
+</html>
+"""
 STT_RESULT_HTML = """
 <!DOCTYPE html>
 <html>
             self.send_header("Content-type", "text/html")
             self.end_headers()
             self.wfile.write(MAIN_HTML.encode())
+        elif self.path.split('?')[0] == '/voicechat':
+            self.send_response(200)
+            self.send_header("Content-type", "text/html")
+            self.end_headers()
+            self.wfile.write(VOICECHAT_HTML.encode())
         else:
             self.send_error(404)
     def do_POST(self):
         if self.path == '/api/stt':
             content_length = int(self.headers['Content-Length'])
             body = self.rfile.read(content_length)
             r = requests.post(STT_URL, data=body, impersonate="chrome")
                     return
             self.send_error(400, "No message provided")
         elif self.path == '/api/tts':
             content_length = int(self.headers['Content-Length'])
             body_str = self.rfile.read(content_length).decode('utf-8')