File size: 17,610 Bytes
b32aebd
5d39bc0
 
 
 
 
 
 
b32aebd
5d39bc0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
b32aebd
5d39bc0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>LAHJA AI - Advanced Text-to-Speech</title>
    <script src="https://cdn.tailwindcss.com"></script>
    <link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css">
    <style>
        @import url('https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700&display=swap');
        
        body {
            font-family: 'Inter', sans-serif;
            background-color: #f8fafc;
        }
        
        .gradient-bg {
            background: linear-gradient(135deg, #6366f1 0%, #8b5cf6 50%, #d946ef 100%);
        }
        
        .textarea-shadow {
            box-shadow: 0 4px 6px -1px rgba(79, 70, 229, 0.1), 0 2px 4px -1px rgba(79, 70, 229, 0.06);
        }
        
        .waveform {
            height: 60px;
            background: linear-gradient(90deg, #6366f1, #8b5cf6, #d946ef);
            opacity: 0.7;
            position: relative;
            overflow: hidden;
        }
        
        .waveform::before {
            content: "";
            position: absolute;
            top: 0;
            left: 0;
            right: 0;
            bottom: 0;
            background: linear-gradient(
                90deg,
                transparent,
                rgba(255, 255, 255, 0.2),
                transparent
            );
            animation: wave 1.5s linear infinite;
        }
        
        @keyframes wave {
            0% {
                transform: translateX(-100%);
            }
            100% {
                transform: translateX(100%);
            }
        }
        
        .audio-player {
            transition: all 0.3s ease;
        }
        
        .audio-player:hover {
            transform: translateY(-2px);
            box-shadow: 0 10px 15px -3px rgba(0, 0, 0, 0.1), 0 4px 6px -2px rgba(0, 0, 0, 0.05);
        }
    </style>
</head>
<body>
    <div class="min-h-screen flex flex-col">
        <!-- Header -->
        <header class="gradient-bg text-white py-6 shadow-lg">
            <div class="container mx-auto px-4">
                <div class="flex justify-between items-center">
                    <div class="flex items-center space-x-2">
                        <i class="fas fa-wave-square text-2xl"></i>
                        <h1 class="text-2xl font-bold">LAHJA AI</h1>
                    </div>
                    <div class="hidden md:flex items-center space-x-4">
                        <span class="text-sm font-medium bg-white/20 px-3 py-1 rounded-full">VITS Architecture</span>
                        <span class="text-sm font-medium bg-white/20 px-3 py-1 rounded-full">Transformers</span>
                    </div>
                </div>
                <p class="mt-2 text-sm opacity-80 max-w-2xl">
                    Advanced AI-powered text-to-speech with accent-aware synthesis using cutting-edge VITS architecture and transformer models.
                </p>
            </div>
        </header>

        <!-- Main Content -->
        <main class="flex-grow container mx-auto px-4 py-8">
            <div class="max-w-4xl mx-auto">
                <div class="bg-white rounded-xl shadow-lg overflow-hidden">
                    <!-- Input Section -->
                    <div class="p-6 border-b border-gray-100">
                        <h2 class="text-xl font-semibold text-gray-800 mb-4">Text Input</h2>
                        <div class="relative">
                            <!-- The visible "Text Input" heading is not linked to the field, so aria-label gives it an accessible name -->
                            <textarea 
                                id="textInput" 
                                aria-label="Text to convert to speech"
                                class="w-full h-48 px-4 py-3 border border-gray-200 rounded-lg textarea-shadow focus:ring-2 focus:ring-indigo-500 focus:border-indigo-500 outline-none transition duration-200 resize-none" 
                                placeholder="Enter the text you want to convert to speech..."
                            ></textarea>
                            <div class="absolute bottom-3 right-3 flex items-center space-x-2">
                                <span id="charCount" class="text-xs text-gray-500">0 characters</span>
                                <!-- Icon-only control: aria-label supplies the accessible name, the icon itself is decorative -->
                                <button id="clearBtn" type="button" aria-label="Clear text" class="text-gray-400 hover:text-gray-600 transition">
                                    <i class="fas fa-times" aria-hidden="true"></i>
                                </button>
                            </div>
                        </div>
                        
                        <div class="mt-6 flex flex-col sm:flex-row justify-between items-center space-y-4 sm:space-y-0">
                            <div class="flex items-center space-x-4">
                                <div class="flex items-center">
                                    <label for="voiceSelect" class="mr-2 text-sm font-medium text-gray-700">Voice:</label>
                                    <select id="voiceSelect" class="border border-gray-200 rounded-md px-3 py-1 text-sm focus:ring-indigo-500 focus:border-indigo-500 outline-none">
                                        <option value="us">American English</option>
                                        <option value="uk">British English</option>
                                        <option value="au">Australian English</option>
                                        <option value="in">Indian English</option>
                                    </select>
                                </div>
                                <div class="flex items-center">
                                    <label for="speedSelect" class="mr-2 text-sm font-medium text-gray-700">Speed:</label>
                                    <select id="speedSelect" class="border border-gray-200 rounded-md px-3 py-1 text-sm focus:ring-indigo-500 focus:border-indigo-500 outline-none">
                                        <option value="0.8">Slow</option>
                                        <option value="1.0" selected>Normal</option>
                                        <option value="1.2">Fast</option>
                                    </select>
                                </div>
                            </div>
                            
                            <button id="generateBtn" class="gradient-bg hover:opacity-90 text-white font-medium py-2 px-6 rounded-lg shadow-md transition duration-200 flex items-center">
                                <i class="fas fa-play-circle mr-2"></i>
                                Generate Voice
                            </button>
                        </div>
                    </div>
                    
                    <!-- Output Section -->
                    <div class="p-6">
                        <h2 class="text-xl font-semibold text-gray-800 mb-4">Generated Audio</h2>
                        
                        <!-- Loading State -->
                        <div id="loadingState" class="hidden">
                            <div class="flex flex-col items-center justify-center py-8">
                                <div class="waveform w-full rounded-lg mb-4"></div>
                                <p class="text-gray-600 font-medium">Processing your request with LAHJA AI...</p>
                                <p class="text-sm text-gray-500 mt-1">This may take a few moments</p>
                            </div>
                        </div>
                        
                        <!-- Audio Player -->
                        <div id="audioPlayerContainer" class="hidden">
                            <div class="audio-player bg-gradient-to-r from-indigo-50 to-purple-50 rounded-xl p-4 border border-gray-200">
                                <div class="flex items-center justify-between mb-3">
                                    <div class="flex items-center space-x-3">
                                        <i class="fas fa-headphones text-indigo-600 text-xl"></i>
                                        <div>
                                            <h3 class="font-medium text-gray-800">Generated Speech</h3>
                                            <p class="text-xs text-gray-500" id="audioInfo">American English • Normal speed</p>
                                        </div>
                                    </div>
                                    <!-- Icon-only control: aria-label supplies the accessible name, the icon itself is decorative -->
                                    <button id="downloadBtn" type="button" aria-label="Download audio" class="text-indigo-600 hover:text-indigo-800 transition">
                                        <i class="fas fa-download" aria-hidden="true"></i>
                                    </button>
                                </div>
                                <audio id="audioPlayer" controls class="w-full"></audio>
                            </div>
                        </div>
                        
                        <!-- Empty State -->
                        <div id="emptyState" class="flex flex-col items-center justify-center py-12 text-center">
                            <i class="fas fa-comment-dots text-4xl text-gray-300 mb-4"></i>
                            <h3 class="text-lg font-medium text-gray-700">No audio generated yet</h3>
                            <p class="text-gray-500 max-w-md mt-1">Enter some text above and click "Generate Voice" to create your speech.</p>
                        </div>
                    </div>
                </div>
                
                <!-- Features Section -->
                <div class="mt-12 grid grid-cols-1 md:grid-cols-3 gap-6">
                    <div class="bg-white p-6 rounded-xl shadow-sm border border-gray-100">
                        <div class="text-indigo-600 mb-3">
                            <i class="fas fa-microchip text-2xl"></i>
                        </div>
                        <h3 class="font-semibold text-lg mb-2">VITS Architecture</h3>
                        <p class="text-gray-600 text-sm">
                            Our advanced VITS model synthesizes realistic audio waveforms directly from text with exceptional clarity and naturalness.
                        </p>
                    </div>
                    <div class="bg-white p-6 rounded-xl shadow-sm border border-gray-100">
                        <div class="text-purple-600 mb-3">
                            <i class="fas fa-language text-2xl"></i>
                        </div>
                        <h3 class="font-semibold text-lg mb-2">Accent-Aware</h3>
                        <p class="text-gray-600 text-sm">
                            Captures local vocal characteristics and intonation patterns for authentic regional speech synthesis.
                        </p>
                    </div>
                    <div class="bg-white p-6 rounded-xl shadow-sm border border-gray-100">
                        <div class="text-pink-600 mb-3">
                            <i class="fas fa-brain text-2xl"></i>
                        </div>
                        <h3 class="font-semibold text-lg mb-2">Transformer Models</h3>
                        <p class="text-gray-600 text-sm">
                            Deep linguistic analysis enables context-aware speech generation that reflects natural human expression.
                        </p>
                    </div>
                </div>
            </div>
        </main>

        <!-- Footer -->
        <footer class="bg-gray-50 py-6 border-t border-gray-200">
            <div class="container mx-auto px-4 text-center">
                <p class="text-gray-500 text-sm">
                    &copy; 2023 LAHJA AI. Advanced text-to-speech powered by VITS architecture and transformer models.
                </p>
            </div>
        </footer>
    </div>

    <script>
        document.addEventListener('DOMContentLoaded', function() {
            // Cache a reference to every element this script reads or updates.
            const byId = (id) => document.getElementById(id);

            // Text entry controls
            const textInput = byId('textInput');
            const charCount = byId('charCount');
            const clearBtn = byId('clearBtn');

            // Synthesis options and trigger
            const voiceSelect = byId('voiceSelect');
            const speedSelect = byId('speedSelect');
            const generateBtn = byId('generateBtn');

            // Output panel views (loading / player / empty)
            const loadingState = byId('loadingState');
            const audioPlayerContainer = byId('audioPlayerContainer');
            const emptyState = byId('emptyState');

            // Player widgets
            const audioPlayer = byId('audioPlayer');
            const audioInfo = byId('audioInfo');
            const downloadBtn = byId('downloadBtn');
            
            // Update character count
            //
            // Keeps the counter label in sync with the textarea and shows the
            // clear button only while there is text to clear.
            textInput.addEventListener('input', function() {
                const count = textInput.value.length;

                // Singular for exactly one character ("1 character"), plural otherwise
                const unit = count === 1 ? 'character' : 'characters';
                charCount.textContent = `${count} ${unit}`;

                // `invisible` is forced on when the field is empty and off otherwise
                clearBtn.classList.toggle('invisible', count === 0);
            });
            
            // Empty the textarea and put the counter and clear button back
            // into their "no text" state.
            clearBtn.addEventListener('click', () => {
                clearBtn.classList.add('invisible');
                charCount.textContent = '0 characters';
                textInput.value = '';
            });
            
            // Validate the entered text, switch the output panel to its loading
            // view and start the (simulated) synthesis request.
            generateBtn.addEventListener('click', () => {
                const trimmedText = textInput.value.trim();

                // Guard: nothing to synthesize
                if (trimmedText === '') {
                    alert('Please enter some text to convert to speech.');
                    return;
                }

                // Only the loading view stays visible while the request runs
                emptyState.classList.add('hidden');
                audioPlayerContainer.classList.add('hidden');
                loadingState.classList.remove('hidden');

                // Simulated request (a real app would use fetch or axios here)
                simulateAPICall(trimmedText, voiceSelect.value, speedSelect.value);
            });
            
            // Download audio
            //
            // Saves the clip currently loaded in the player by clicking a
            // temporary anchor. Browsers only honor the `download` attribute for
            // same-origin, blob: and data: URLs; for any other URL the click is
            // a plain navigation, so the link targets a new tab to avoid
            // replacing this page (and losing the user's text).
            downloadBtn.addEventListener('click', function() {
                const audioUrl = audioPlayer.src;
                if (!audioUrl) {
                    // No source has been set on the player yet
                    return;
                }

                const link = document.createElement('a');
                link.href = audioUrl;
                link.download = `lahja-ai-voice-${Date.now()}.mp3`;
                link.target = '_blank';
                link.rel = 'noopener';

                // The anchor only needs to be in the document for the click
                document.body.appendChild(link);
                link.click();
                document.body.removeChild(link);
            });
            
            /**
             * Simulates the text-to-speech API call (replace with an actual API call in production).
             *
             * After a fixed 2 second delay it updates the audio info line from the
             * selected voice and speed, points the audio player at a placeholder
             * MP3, swaps the loading view for the player and then tries to start
             * playback.
             *
             * @param {string} text - Text to synthesize; this simulation only logs it.
             * @param {string} voice - Voice option value ('us', 'uk', 'au' or 'in').
             * @param {string} speed - Speed option value ('0.8', '1.0' or '1.2').
             */
            function simulateAPICall(text, voice, speed) {
                console.log(`Making API call with text: "${text}", voice: ${voice}, speed: ${speed}`);
                
                // Simulate network delay
                setTimeout(() => {
                    // This is a simulation - in a real app, you would:
                    // 1. Make a POST request to your API endpoint
                    // 2. Handle the response with the audio URL
                    // 3. Set the audio player source
                    
                    // Display labels keyed by the <select> option values
                    const voiceLabels = {
                        'us': 'American English',
                        'uk': 'British English',
                        'au': 'Australian English',
                        'in': 'Indian English'
                    };
                    
                    const speedLabels = {
                        '0.8': 'Slow',
                        '1.0': 'Normal',
                        '1.2': 'Fast'
                    };
                    
                    // Update audio info, separating voice and speed with the same
                    // bullet the initial markup uses ("American English • Normal speed")
                    audioInfo.textContent = `${voiceLabels[voice]} • ${speedLabels[speed]} speed`;
                    
                    // Set audio source (in a real app, this would come from the API response)
                    audioPlayer.src = 'https://www.soundhelix.com/examples/mp3/SoundHelix-Song-1.mp3';
                    
                    // Hide loading, show audio player
                    loadingState.classList.add('hidden');
                    audioPlayerContainer.classList.remove('hidden');
                    
                    // Play audio automatically; a rejected play() (e.g. blocked
                    // autoplay) is logged instead of surfacing as an unhandled rejection
                    setTimeout(() => {
                        audioPlayer.play().catch(e => console.log('Autoplay prevented:', e));
                    }, 300);
                    
                }, 2000);
            }
            
            // Fire one synthetic input event so the counter and clear button
            // reflect whatever the textarea holds when the page loads.
            const initialInputEvent = new Event('input');
            textInput.dispatchEvent(initialInputEvent);
        });
    </script>
<p style="border-radius: 8px; text-align: center; font-size: 12px; color: #fff; margin-top: 16px;position: fixed; left: 8px; bottom: 8px; z-index: 10; background: rgba(0, 0, 0, 0.8); padding: 4px 8px;">Made with <img src="https://enzostvs-deepsite.hf.space/logo.svg" alt="DeepSite Logo" style="width: 16px; height: 16px; vertical-align: middle;display:inline-block;margin-right:3px;filter:brightness(0) invert(1);"><a href="https://enzostvs-deepsite.hf.space" style="color: #fff;text-decoration: underline;" target="_blank" >DeepSite</a> - 🧬 <a href="https://enzostvs-deepsite.hf.space?remix=wasmdashai/mywap" style="color: #fff;text-decoration: underline;" target="_blank" >Remix</a></p></body>
</html>