Spaces:

awacke1
/

InstantASRforYouNow

Running

App Files Community

awacke1 committed on Nov 26, 2024

Commit

0145c6e

verified ·

1 Parent(s): 17b0e6f

Update index.html

Browse files

Files changed (1) hide show

index.html +131 -21

index.html CHANGED Viewed

@@ -1,29 +1,139 @@
 <!DOCTYPE html>
 <html lang="en">
 <head>
-    <meta charset="UTF-8" />
-    <link rel="stylesheet" href="style.css" />
-    <meta name="viewport" content="width=device-width, initial-scale=1.0" />
-    <title>Transformers.js - Object Detection</title>
 </head>
 <body>
-    <h1>Object Detection w/ 🤗 Transformers.js</h1>
-    <label id="container" for="upload">
-        <svg width="25" height="25" viewBox="0 0 25 25" fill="none" xmlns="http://www.w3.org/2000/svg">
-            <path fill="#000"
-                d="M3.5 24.3a3 3 0 0 1-1.9-.8c-.5-.5-.8-1.2-.8-1.9V2.9c0-.7.3-1.3.8-1.9.6-.5 1.2-.7 2-.7h18.6c.7 0 1.3.2 1.9.7.5.6.7 1.2.7 2v18.6c0 .7-.2 1.4-.7 1.9a3 3 0 0 1-2 .8H3.6Zm0-2.7h18.7V2.9H3.5v18.7Zm2.7-2.7h13.3c.3 0 .5 0 .6-.3v-.7l-3.7-5a.6.6 0 0 0-.6-.2c-.2 0-.4 0-.5.3l-3.5 4.6-2.4-3.3a.6.6 0 0 0-.6-.3c-.2 0-.4.1-.5.3l-2.7 3.6c-.1.2-.2.4 0 .7.1.2.3.3.6.3Z">
-            </path>
-        </svg>
-        Click to upload image
-        <label id="example">(or try example)</label>
-    </label>
-    <label id="status">Loading model...</label>
-    <input id="upload" type="file" accept="image/*" />
-    <script src="index.js" type="module"></script>
-</body>
 </html>

 <!DOCTYPE html>
 <html lang="en">
 <head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>ASR Client</title>
+    <!-- Transformers.js is imported once, as an ES module, by the inline module
+         script in <body>; no separate classic <script> include is needed.
+         Preconnect warms up the connection to the CDN that serves that module. -->
+    <link rel="preconnect" href="https://cdn.jsdelivr.net" crossorigin>
+    <style>
+        /* Page shell: a centred, readable column. */
+        body {
+            font-family: system-ui, -apple-system, sans-serif;
+            max-width: 800px;
+            margin: 2rem auto;
+            padding: 0 1rem;
+        }
+        /* Vertical stack holding the heading, status banner, button and transcript. */
+        .container {
+            display: flex;
+            flex-direction: column;
+            gap: 1rem;
+            align-items: center;
+        }
+        /* Status banner; its background comes from the .status-* classes set by the script. */
+        #status {
+            margin: 1rem 0;
+            padding: 0.5rem;
+            border-radius: 4px;
+        }
+        /* Transcript output box. */
+        #transcription {
+            /* border-box keeps padding and border inside the 100% width so the
+               box does not overflow the column. */
+            box-sizing: border-box;
+            width: 100%;
+            min-height: 200px;
+            padding: 1rem;
+            border: 1px solid #ccc;
+            border-radius: 4px;
+            margin: 1rem 0;
+        }
+        button {
+            padding: 0.5rem 1rem;
+            font-size: 1rem;
+            cursor: pointer;
+            background: #0066ff;
+            color: white;
+            border: none;
+            border-radius: 4px;
+        }
+        button:disabled {
+            background: #cccccc;
+            /* Dark text: white on light grey is hard to read. */
+            color: #555555;
+            cursor: not-allowed;
+        }
+        /* Status colours: loading/recording, ready, error. */
+        .status-loading {
+            background: #fff3cd;
+        }
+        .status-ready {
+            background: #d4edda;
+        }
+        .status-error {
+            background: #f8d7da;
+        }
+    </style>
 </head>
 <body>
+    <!-- <main> marks the primary content; the status banner and transcript are
+         live regions so assistive technology announces their asynchronous updates. -->
+    <main class="container">
+        <h1>Speech Recognition Client</h1>
+        <div id="status" role="status">Loading model...</div>
+        <button id="startButton" type="button" disabled>Start Recording</button>
+        <div id="transcription" role="log" aria-label="Transcription"></div>
+    </main>
+    <script type="module">
+        import { pipeline } from 'https://cdn.jsdelivr.net/npm/@xenova/transformers@2.17.2/+esm';
+        let isRecording = false;
+        let model = null;
+        const startButton = document.getElementById('startButton');
+        const statusDiv = document.getElementById('status');
+        const transcriptionDiv = document.getElementById('transcription');
+        // Initialize the model
+        async function initializeModel() {
+            try {
+                statusDiv.textContent = 'Loading model...';
+                statusDiv.className = 'status-loading';
+                model = await pipeline('automatic-speech-recognition', 'Xenova/whisper-tiny');
+                statusDiv.textContent = 'Model ready! Click Start Recording to begin.';
+                statusDiv.className = 'status-ready';
+                startButton.disabled = false;
+            } catch (error) {
+                statusDiv.textContent = 'Error loading model: ' + error.message;
+                statusDiv.className = 'status-error';
+            }
+        }
+        // Handle recording
+        async function toggleRecording() {
+            if (!isRecording) {
+                try {
+                    const stream = await navigator.mediaDevices.getUserMedia({ audio: true });
+                    isRecording = true;
+                    startButton.textContent = 'Stop Recording';
+                    statusDiv.textContent = 'Recording...';
+                    statusDiv.className = 'status-loading';
+                    // Create processor and start processing audio
+                    const audioTrack = stream.getAudioTracks()[0];
+                    const processor = new MediaStreamTrackProcessor({ track: audioTrack });
+                    const transformer = new TransformStream({
+                        async transform(chunk, controller) {
+                            try {
+                                const result = await model(chunk.data);
+                                if (result && result.text) {
+                                    transcriptionDiv.textContent += ' ' + result.text;
+                                }
+                            } catch (error) {
+                                console.error('Error processing audio:', error);
+                            }
+                        }
+                    });
+                    await processor.readable.pipeTo(transformer.writable);
+                } catch (error) {
+                    statusDiv.textContent = 'Error accessing microphone: ' + error.message;
+                    statusDiv.className = 'status-error';
+                    isRecording = false;
+                }
+            } else {
+                // Stop recording
+                isRecording = false;
+                startButton.textContent = 'Start Recording';
+                statusDiv.textContent = 'Recording stopped. Click Start Recording to begin again.';
+                statusDiv.className = 'status-ready';
+            }
+        }
+        // Initialize the app
+        startButton.addEventListener('click', toggleRecording);
+        initializeModel();
+    </script>
+</body>
 </html>