Demo Update 21
@@ -1,86 +1,225 @@
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Voice Assistant - CSM & Whisper</title>
    <script src="https://cdn.socket.io/4.6.0/socket.io.min.js"></script>
    <style>
        body {
            font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
            max-width: 800px;
            margin: 0 auto;
            padding: 20px;
            background-color: #f5f7fa;
            color: #333;
        }

        h1 {
            color: #2c3e50;
            text-align: center;
            margin-bottom: 30px;
        }

        #conversation {
            height: 400px;
            border: 1px solid #ddd;
            border-radius: 10px;
            padding: 20px;
            margin-bottom: 20px;
            overflow-y: auto;
            background-color: white;
            box-shadow: 0 2px 5px rgba(0,0,0,0.1);
        }

        .message-container {
            display: flex;
            flex-direction: column;
            margin-bottom: 15px;
        }

        .user-message-container {
            align-items: flex-end;
        }

        .bot-message-container {
            align-items: flex-start;
        }

        .message {
            max-width: 80%;
            padding: 12px;
            border-radius: 18px;
            position: relative;
            word-break: break-word;
        }

        .user-message {
            align-self: flex-end;
            background-color: #dcf8c6;
            color: #000;
            border-bottom-right-radius: 4px;
        }

        .bot-message {
            background-color: #f1f0f0;
            color: #000;
            border-bottom-left-radius: 4px;
        }

        .message-label {
            font-size: 0.8em;
            margin-bottom: 4px;
            color: #657786;
        }

        #controls {
            display: flex;
            gap: 10px;
            justify-content: center;
            margin-bottom: 15px;
        }

        button {
            padding: 12px 24px;
            font-size: 16px;
            cursor: pointer;
            border-radius: 50px;
            border: none;
            outline: none;
            transition: all 0.3s ease;
        }

        #recordButton {
            background-color: #4CAF50;
            color: white;
            width: 200px;
            box-shadow: 0 4px 8px rgba(76, 175, 80, 0.3);
        }

        #recordButton:hover {
            background-color: #45a049;
            transform: translateY(-2px);
        }

        #recordButton.recording {
            background-color: #f44336;
            animation: pulse 1.5s infinite;
            box-shadow: 0 4px 8px rgba(244, 67, 54, 0.3);
        }

        @keyframes pulse {
            0% {
                transform: scale(1);
            }
            50% {
                transform: scale(1.05);
            }
            100% {
                transform: scale(1);
            }
        }

        #status {
            text-align: center;
            margin-top: 15px;
            font-style: italic;
            color: #657786;
        }

        .audio-wave {
            display: flex;
            justify-content: center;
            align-items: center;
            height: 40px;
            gap: 3px;
        }

        .audio-wave span {
            display: block;
            width: 3px;
            height: 100%;
            background-color: #4CAF50;
            animation: wave 1.5s infinite ease-in-out;
            border-radius: 6px;
        }

        .audio-wave span:nth-child(2) {
            animation-delay: 0.2s;
        }
        .audio-wave span:nth-child(3) {
            animation-delay: 0.4s;
        }
        .audio-wave span:nth-child(4) {
            animation-delay: 0.6s;
        }
        .audio-wave span:nth-child(5) {
            animation-delay: 0.8s;
        }

        @keyframes wave {
            0%, 100% {
                height: 8px;
            }
            50% {
                height: 30px;
            }
        }

        .hidden {
            display: none;
        }

        .transcription-info {
            font-size: 0.8em;
            color: #888;
            margin-top: 4px;
            text-align: right;
        }
    </style>
</head>
<body>
    <h1>Voice Assistant with CSM & Whisper</h1>
    <div id="conversation"></div>

    <div id="controls">
        <button id="recordButton">Hold to Speak</button>
    </div>

    <div id="audioWave" class="audio-wave hidden">
        <span></span>
        <span></span>
        <span></span>
        <span></span>
        <span></span>
    </div>

    <div id="status">Connecting to server...</div>

    <script>
        const socket = io();
        const recordButton = document.getElementById('recordButton');
        const conversation = document.getElementById('conversation');
        const status = document.getElementById('status');
        const audioWave = document.getElementById('audioWave');

        let mediaRecorder;
        let audioChunks = [];
        let isRecording = false;
        let audioSendInterval;
        let sessionActive = false;

        // Initialize audio context
        const audioContext = new (window.AudioContext || window.webkitAudioContext)();

        // Connect to server
        socket.on('connect', () => {
            status.textContent = 'Connected to server';
            sessionActive = true;
        });

        socket.on('disconnect', () => {
            status.textContent = 'Disconnected from server';
            sessionActive = false;
        });

        socket.on('ready', (data) => {
@@ -90,28 +229,59 @@

        socket.on('transcription', (data) => {
            addMessage('user', data.text);
            status.textContent = 'Assistant is thinking...';
        });

        socket.on('audio_response', (data) => {
            // Play audio
            status.textContent = 'Playing response...';
            const audio = new Audio('data:audio/wav;base64,' + data.audio);

            audio.onended = () => {
                status.textContent = 'Ready to record';
            };

            audio.onerror = () => {
                status.textContent = 'Error playing audio';
                console.error('Error playing audio response');
            };

            audio.play().catch(err => {
                status.textContent = 'Error playing audio: ' + err.message;
                console.error('Error playing audio:', err);
            });

            // Display text
            addMessage('bot', data.text);
        });
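
        // Note: the handler above plays audio through a base64 data: URI,
        // which is simple but copies the whole payload into one URL string.
        // A variant (an assumption, not part of this commit) would decode to
        // a Blob and play from an object URL instead:
        //
        //   const bytes = Uint8Array.from(atob(data.audio), c => c.charCodeAt(0));
        //   const url = URL.createObjectURL(new Blob([bytes], { type: 'audio/wav' }));
        //   new Audio(url).play();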

        socket.on('error', (data) => {
            status.textContent = 'Error: ' + data.message;
            console.error('Server error:', data.message);
        });
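
        // Event contract assumed by this client (the CSM/Whisper backend is
        // not part of this commit): the client emits 'start_speaking',
        // 'audio_chunk' ({ audio: base64-encoded Float32 samples }) and
        // 'stop_speaking'; the server emits 'ready', 'transcription'
        // ({ text }), 'audio_response' ({ audio: base64 WAV, text }) and
        // 'error' ({ message }).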

        function setupAudioRecording() {
            // Check if browser supports required APIs
            if (!navigator.mediaDevices || !navigator.mediaDevices.getUserMedia) {
                status.textContent = 'Your browser does not support audio recording';
                return;
            }

            // Get user media
            navigator.mediaDevices.getUserMedia({ audio: true })
                .then(stream => {
                    // Setup recording with better audio quality
                    const options = {
                        mimeType: 'audio/webm',
                        audioBitsPerSecond: 128000
                    };

                    try {
                        mediaRecorder = new MediaRecorder(stream, options);
                    } catch (e) {
                        // Fall back if the specified options aren't supported
                        mediaRecorder = new MediaRecorder(stream);
                    }
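
                    // A possible refinement (an assumption, not in this
                    // commit): MediaRecorder.isTypeSupported('audio/webm')
                    // could be checked up front instead of relying on the
                    // try/catch fallback above.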

                    mediaRecorder.ondataavailable = event => {
                        if (event.data.size > 0) {
                            // Reconstructed: the diff view elides two lines
                            // here, almost certainly the standard pattern:
                            audioChunks.push(event.data);
                        }
                    };

                    mediaRecorder.onstop = () => {
                        isRecording = false;
                        processRecording();
                    };

                    // Create audio analyzer for visualization
                    const source = audioContext.createMediaStreamSource(stream);
                    const analyzer = audioContext.createAnalyser();
                    analyzer.fftSize = 2048;
                    source.connect(analyzer);

                    // Setup button handlers with better touch handling
                    recordButton.addEventListener('mousedown', startRecording);
                    recordButton.addEventListener('touchstart', (e) => {
                        e.preventDefault(); // Prevent default touch behavior
                        startRecording();
                    });

                    recordButton.addEventListener('mouseup', stopRecording);
                    recordButton.addEventListener('touchend', (e) => {
                        e.preventDefault();
                        stopRecording();
                    });

                    recordButton.addEventListener('mouseleave', stopRecording);

                    status.textContent = 'Ready to record';
@@ -161,12 +323,13 @@
        }

        function startRecording() {
            if (!isRecording && sessionActive) {
                audioChunks = [];
                mediaRecorder.start(100); // Collect data in 100ms chunks
                recordButton.classList.add('recording');
                recordButton.textContent = 'Release to Stop';
                status.textContent = 'Recording...';
                audioWave.classList.remove('hidden');
                isRecording = true;

                socket.emit('start_speaking');
@@ -186,15 +349,82 @@
                mediaRecorder.stop();
                recordButton.classList.remove('recording');
                recordButton.textContent = 'Hold to Speak';
                status.textContent = 'Processing speech...';
                audioWave.classList.add('hidden');
                isRecording = false;
            }
        }

        function processRecording() {
            if (audioChunks.length === 0) {
                status.textContent = 'No audio recorded';
                return;
            }

            const audioBlob = new Blob(audioChunks, { type: 'audio/webm' });

            // Convert to ArrayBuffer for processing
            const fileReader = new FileReader();
            fileReader.onloadend = () => {
                try {
                    const arrayBuffer = fileReader.result;
                    // Convert to Float32Array - this works better with the Web Audio API
                    const audioData = convertToFloat32(arrayBuffer);

                    // Convert to base64 for sending
                    const base64String = arrayBufferToBase64(audioData.buffer);
                    socket.emit('audio_chunk', { audio: base64String });

                    // Signal end of speech
                    socket.emit('stop_speaking');
                } catch (e) {
                    console.error('Error processing audio:', e);
                    status.textContent = 'Error processing audio';
                }
            };

            fileReader.onerror = () => {
                status.textContent = 'Error reading audio data';
            };

            fileReader.readAsArrayBuffer(audioBlob);
        }

        function convertToFloat32(arrayBuffer) {
            // Get raw audio data as Int16 (common format for audio)
            const int16Array = new Int16Array(arrayBuffer);

            // Convert to Float32 (normalize between -1 and 1)
            const float32Array = new Float32Array(int16Array.length);
            for (let i = 0; i < int16Array.length; i++) {
                float32Array[i] = int16Array[i] / 32768.0;
            }

            return float32Array;
        }
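
        // Caveat worth noting: the bytes handled above are the encoded
        // audio/webm container produced by MediaRecorder, not raw PCM, so
        // reading them as Int16 assumes the backend expects exactly this
        // client-side reinterpretation rather than decoded samples.
        //
        // For illustration only (an assumption, not part of this commit),
        // a Node-style receiver would unpack the emitted payload like so:
        //
        //   const buf = Buffer.from(data.audio, 'base64');
        //   const samples = new Float32Array(buf.buffer, buf.byteOffset,
        //                                    buf.byteLength / 4);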

        function addMessage(sender, text) {
            const containerDiv = document.createElement('div');
            containerDiv.className = sender === 'user' ? 'message-container user-message-container' : 'message-container bot-message-container';

            const labelDiv = document.createElement('div');
            labelDiv.className = 'message-label';
            labelDiv.textContent = sender === 'user' ? 'You' : 'Assistant';
            containerDiv.appendChild(labelDiv);

            const messageDiv = document.createElement('div');
            messageDiv.className = sender === 'user' ? 'message user-message' : 'message bot-message';
            messageDiv.textContent = text;
            containerDiv.appendChild(messageDiv);

            if (sender === 'user') {
                const infoDiv = document.createElement('div');
                infoDiv.className = 'transcription-info';
                infoDiv.textContent = 'Transcribed with Whisper';
                containerDiv.appendChild(infoDiv);
            }

            conversation.appendChild(containerDiv);
            conversation.scrollTop = conversation.scrollHeight;
        }

        // Reconstructed: the diff view elides the opening of this helper;
        // the visible tail (the loop's closing brace and window.btoa)
        // implies the standard byte-to-binary-string pattern:
        function arrayBufferToBase64(buffer) {
            let binary = '';
            const bytes = new Uint8Array(buffer);
            for (let i = 0; i < bytes.byteLength; i++) {
                binary += String.fromCharCode(bytes[i]);
            }
            return window.btoa(binary);
        }

        // Handle page visibility change to avoid issues with background tabs
        document.addEventListener('visibilitychange', () => {
            if (document.hidden && isRecording) {
                stopRecording();
            }
        });

        // Clean disconnection when page is closed
        window.addEventListener('beforeunload', () => {
            if (socket && socket.connected) {
                socket.disconnect();
            }
        });
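
        // For exercising this page without the real backend, a minimal mock
        // server sketch (an assumption, not part of this commit; requires
        // Node.js with the socket.io package):
        //
        //   const io = require('socket.io')(3000, { cors: { origin: '*' } });
        //   io.on('connection', (sock) => {
        //     sock.emit('ready', {});
        //     sock.on('stop_speaking', () => {
        //       sock.emit('transcription', { text: '(mock transcript)' });
        //       sock.emit('audio_response', { audio: '', text: '(mock reply)' });
        //     });
        //   });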
    </script>
</body>
</html>