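<!doctype html>
<!-- Hosting-page status text captured during extraction (not part of the document): "Spaces: Running / Running" -->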
<html lang="en"> | |
<head> | |
<!-- Document metadata: encoding first, then viewport, title and description -->
<meta charset="UTF-8">
<meta name="viewport" content="width=device-width, initial-scale=1.0">
<title>LAHJA AI - Advanced Text-to-Speech</title>
<meta name="description" content="LAHJA AI: accent-aware text-to-speech built on the VITS architecture and transformer models.">
<!-- Open connections early to the hosts that serve the Inter font requested by the stylesheet's @import -->
<link rel="preconnect" href="https://fonts.googleapis.com">
<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
<!-- Tailwind Play CDN: generates utility classes in the browser at runtime -->
<script src="https://cdn.tailwindcss.com"></script>
<!-- Font Awesome 6.4.0 supplies the "fas fa-*" icon classes used throughout the page -->
<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/6.4.0/css/all.min.css">
<style>
  /* Inter is the page typeface; @import must stay ahead of every other rule. */
  @import url('https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700&display=swap');

  body {
    font-family: 'Inter', sans-serif;
    background-color: #f8fafc;
  }

  /* Indigo -> violet -> fuchsia brand gradient (header and primary button). */
  .gradient-bg {
    background: linear-gradient(135deg, #6366f1 0%, #8b5cf6 50%, #d946ef 100%);
  }

  /* Soft indigo-tinted shadow under the text input. */
  .textarea-shadow {
    box-shadow: 0 4px 6px -1px rgba(79, 70, 229, 0.1), 0 2px 4px -1px rgba(79, 70, 229, 0.06);
  }

  /* Loading placeholder: a gradient bar with a light band sweeping across it. */
  .waveform {
    height: 60px;
    background: linear-gradient(90deg, #6366f1, #8b5cf6, #d946ef);
    opacity: 0.7;
    position: relative;
    overflow: hidden; /* clips the sweeping band while it is translated outside the bar */
  }

  .waveform::before {
    content: "";
    position: absolute;
    top: 0;
    left: 0;
    right: 0;
    bottom: 0;
    background: linear-gradient(
      90deg,
      transparent,
      rgba(255, 255, 255, 0.2),
      transparent
    );
    animation: wave 1.5s linear infinite;
  }

  /* Moves the band from fully left of the bar to fully right of it. */
  @keyframes wave {
    0% {
      transform: translateX(-100%);
    }
    100% {
      transform: translateX(100%);
    }
  }

  /* Audio card lifts slightly and gains a deeper shadow on hover. */
  .audio-player {
    transition: all 0.3s ease;
  }

  .audio-player:hover {
    transform: translateY(-2px);
    box-shadow: 0 10px 15px -3px rgba(0, 0, 0, 0.1), 0 4px 6px -2px rgba(0, 0, 0, 0.05);
  }

  /* Honour the OS "reduce motion" preference: no endless sweep, no hover lift. */
  @media (prefers-reduced-motion: reduce) {
    .waveform::before {
      animation: none;
    }
    .audio-player {
      transition: none;
    }
    .audio-player:hover {
      transform: none;
    }
  }
</style>
</head> | |
<body> | |
<div class="min-h-screen flex flex-col"> | |
<!-- Header: brand mark, technology badges (shown from the md breakpoint up) and tagline -->
<header class="gradient-bg text-white py-6 shadow-lg">
  <div class="container mx-auto px-4">
    <div class="flex justify-between items-center">
      <div class="flex items-center space-x-2">
        <!-- Decorative icon: hidden from assistive technology, the heading carries the name -->
        <i class="fas fa-wave-square text-2xl" aria-hidden="true"></i>
        <h1 class="text-2xl font-bold">LAHJA AI</h1>
      </div>
      <div class="hidden md:flex items-center space-x-4">
        <span class="text-sm font-medium bg-white/20 px-3 py-1 rounded-full">VITS Architecture</span>
        <span class="text-sm font-medium bg-white/20 px-3 py-1 rounded-full">Transformers</span>
      </div>
    </div>
    <p class="mt-2 text-sm opacity-80 max-w-2xl">
      Advanced AI-powered text-to-speech with accent-aware synthesis using cutting-edge VITS architecture and transformer models.
    </p>
  </div>
</header>
<!-- Main Content --> | |
<main class="flex-grow container mx-auto px-4 py-8"> | |
<div class="max-w-4xl mx-auto"> | |
<div class="bg-white rounded-xl shadow-lg overflow-hidden"> | |
<!-- Input Section: text area with live character count, voice/speed pickers and the generate action -->
<div class="p-6 border-b border-gray-100">
  <!-- The heading text doubles as the textarea's label; a placeholder alone is not an accessible name -->
  <h2 class="text-xl font-semibold text-gray-800 mb-4"><label for="textInput">Text Input</label></h2>
  <div class="relative">
    <textarea
      id="textInput"
      class="w-full h-48 px-4 py-3 border border-gray-200 rounded-lg textarea-shadow focus:ring-2 focus:ring-indigo-500 focus:border-indigo-500 outline-none transition duration-200 resize-none"
      placeholder="Enter the text you want to convert to speech..."
    ></textarea>
    <!-- Overlay pinned to the textarea's bottom-right corner; the page script updates #charCount and toggles #clearBtn -->
    <div class="absolute bottom-3 right-3 flex items-center space-x-2">
      <span id="charCount" class="text-xs text-gray-500">0 characters</span>
      <!-- Icon-only button: aria-label supplies the accessible name -->
      <button id="clearBtn" type="button" class="text-gray-400 hover:text-gray-600 transition" aria-label="Clear text">
        <i class="fas fa-times" aria-hidden="true"></i>
      </button>
    </div>
  </div>
  <div class="mt-6 flex flex-col sm:flex-row justify-between items-center space-y-4 sm:space-y-0">
    <div class="flex items-center space-x-4">
      <div class="flex items-center">
        <label for="voiceSelect" class="mr-2 text-sm font-medium text-gray-700">Voice:</label>
        <!-- Option values are the keys the page script maps to display labels -->
        <select id="voiceSelect" class="border border-gray-200 rounded-md px-3 py-1 text-sm focus:ring-indigo-500 focus:border-indigo-500 outline-none">
          <option value="us">American English</option>
          <option value="uk">British English</option>
          <option value="au">Australian English</option>
          <option value="in">Indian English</option>
        </select>
      </div>
      <div class="flex items-center">
        <label for="speedSelect" class="mr-2 text-sm font-medium text-gray-700">Speed:</label>
        <select id="speedSelect" class="border border-gray-200 rounded-md px-3 py-1 text-sm focus:ring-indigo-500 focus:border-indigo-500 outline-none">
          <option value="0.8">Slow</option>
          <option value="1.0" selected>Normal</option>
          <option value="1.2">Fast</option>
        </select>
      </div>
    </div>
    <!-- Explicit type="button": this is an in-page action, never a form submit -->
    <button id="generateBtn" type="button" class="gradient-bg hover:opacity-90 text-white font-medium py-2 px-6 rounded-lg shadow-md transition duration-200 flex items-center">
      <i class="fas fa-play-circle mr-2" aria-hidden="true"></i>
      Generate Voice
    </button>
  </div>
</div>
<!-- Output Section: the page script shows one of three panels (loading, audio player, empty state) via the "hidden" class -->
<div class="p-6">
  <h2 class="text-xl font-semibold text-gray-800 mb-4">Generated Audio</h2>

  <!-- Loading State: hidden until a generation request starts -->
  <div id="loadingState" class="hidden">
    <div class="flex flex-col items-center justify-center py-8">
      <div class="waveform w-full rounded-lg mb-4"></div>
      <p class="text-gray-600 font-medium">Processing your request with LAHJA AI...</p>
      <p class="text-sm text-gray-500 mt-1">This may take a few moments</p>
    </div>
  </div>

  <!-- Audio Player: hidden until audio is available -->
  <div id="audioPlayerContainer" class="hidden">
    <div class="audio-player bg-gradient-to-r from-indigo-50 to-purple-50 rounded-xl p-4 border border-gray-200">
      <div class="flex items-center justify-between mb-3">
        <div class="flex items-center space-x-3">
          <i class="fas fa-headphones text-indigo-600 text-xl" aria-hidden="true"></i>
          <div>
            <h3 class="font-medium text-gray-800">Generated Speech</h3>
            <!-- Text is overwritten by the page script with the chosen voice and speed -->
            <p class="text-xs text-gray-500" id="audioInfo">American English • Normal speed</p>
          </div>
        </div>
        <!-- Icon-only button: aria-label supplies the accessible name -->
        <button id="downloadBtn" type="button" class="text-indigo-600 hover:text-indigo-800 transition" aria-label="Download audio">
          <i class="fas fa-download" aria-hidden="true"></i>
        </button>
      </div>
      <!-- Source is assigned by the page script -->
      <audio id="audioPlayer" controls class="w-full"></audio>
    </div>
  </div>

  <!-- Empty State: the only panel visible on first load -->
  <div id="emptyState" class="flex flex-col items-center justify-center py-12 text-center">
    <i class="fas fa-comment-dots text-4xl text-gray-300 mb-4" aria-hidden="true"></i>
    <h3 class="text-lg font-medium text-gray-700">No audio generated yet</h3>
    <p class="text-gray-500 max-w-md mt-1">Enter some text above and click "Generate Voice" to create your speech.</p>
  </div>
</div>
</div> | |
<!-- Features Section: three cards, one column on small screens and three columns from the md breakpoint up -->
<div class="mt-12 grid grid-cols-1 md:grid-cols-3 gap-6">
  <div class="bg-white p-6 rounded-xl shadow-sm border border-gray-100">
    <!-- Icons in these cards are decorative, so they are hidden from assistive technology -->
    <div class="text-indigo-600 mb-3">
      <i class="fas fa-microchip text-2xl" aria-hidden="true"></i>
    </div>
    <h3 class="font-semibold text-lg mb-2">VITS Architecture</h3>
    <p class="text-gray-600 text-sm">
      Our advanced VITS model synthesizes realistic audio waveforms directly from text with exceptional clarity and naturalness.
    </p>
  </div>
  <div class="bg-white p-6 rounded-xl shadow-sm border border-gray-100">
    <div class="text-purple-600 mb-3">
      <i class="fas fa-language text-2xl" aria-hidden="true"></i>
    </div>
    <h3 class="font-semibold text-lg mb-2">Accent-Aware</h3>
    <p class="text-gray-600 text-sm">
      Captures local vocal characteristics and intonation patterns for authentic regional speech synthesis.
    </p>
  </div>
  <div class="bg-white p-6 rounded-xl shadow-sm border border-gray-100">
    <div class="text-pink-600 mb-3">
      <i class="fas fa-brain text-2xl" aria-hidden="true"></i>
    </div>
    <h3 class="font-semibold text-lg mb-2">Transformer Models</h3>
    <p class="text-gray-600 text-sm">
      Deep linguistic analysis enables context-aware speech generation that reflects natural human expression.
    </p>
  </div>
</div>
</div> | |
</main> | |
<!-- Footer: centred copyright / attribution line -->
<footer class="bg-gray-50 py-6 border-t border-gray-200">
  <div class="container mx-auto px-4 text-center">
    <p class="text-gray-500 text-sm">
      © 2023 LAHJA AI. Advanced text-to-speech powered by VITS architecture and transformer models.
    </p>
  </div>
</footer>
</div> | |
<script>
  /*
   * Page controller for the text-to-speech demo.
   *
   * Wires the text area, the voice/speed pickers and the Generate / Clear /
   * Download buttons to the three output panels (loading, player, empty).
   * No backend is called: simulateAPICall() waits on a timer and then loads a
   * fixed placeholder MP3 into the audio element.
   */
  document.addEventListener('DOMContentLoaded', function () {
    // DOM Elements
    const textInput = document.getElementById('textInput');
    const charCount = document.getElementById('charCount');
    const clearBtn = document.getElementById('clearBtn');
    const generateBtn = document.getElementById('generateBtn');
    const voiceSelect = document.getElementById('voiceSelect');
    const speedSelect = document.getElementById('speedSelect');
    const loadingState = document.getElementById('loadingState');
    const audioPlayerContainer = document.getElementById('audioPlayerContainer');
    const emptyState = document.getElementById('emptyState');
    const audioPlayer = document.getElementById('audioPlayer');
    const downloadBtn = document.getElementById('downloadBtn');
    const audioInfo = document.getElementById('audioInfo');

    // Display labels keyed by the <option> values of the two pickers
    const VOICE_LABELS = {
      'us': 'American English',
      'uk': 'British English',
      'au': 'Australian English',
      'in': 'Indian English'
    };
    const SPEED_LABELS = {
      '0.8': 'Slow',
      '1.0': 'Normal',
      '1.2': 'Fast'
    };

    const SIMULATED_LATENCY_MS = 2000; // stand-in for the network round trip
    const AUTOPLAY_DELAY_MS = 300;     // pause between revealing the player and starting playback

    // Handle of the pending delayed play() call, so a new request can cancel it
    let autoplayTimer = null;

    /**
     * Sync the counter text and the clear button with the textarea content.
     * The clear button is only shown when there is something to clear.
     */
    function refreshCharCount() {
      const count = textInput.value.length;
      // Singular form for exactly one character
      charCount.textContent = `${count} ${count === 1 ? 'character' : 'characters'}`;
      clearBtn.classList.toggle('invisible', count === 0);
    }

    /**
     * Enter or leave the "request in flight" state.
     * While busy, the Generate button is disabled so that repeated clicks
     * cannot stack several pending timers, and the loading panel is shown.
     *
     * @param {boolean} isGenerating true while a request is pending
     */
    function setGenerating(isGenerating) {
      generateBtn.disabled = isGenerating;
      generateBtn.classList.toggle('opacity-50', isGenerating);
      generateBtn.classList.toggle('cursor-not-allowed', isGenerating);
      loadingState.classList.toggle('hidden', !isGenerating);
    }

    // Update character count
    textInput.addEventListener('input', refreshCharCount);

    // Clear text input
    clearBtn.addEventListener('click', function () {
      textInput.value = '';
      refreshCharCount();
      // The button becomes invisible after clearing, so hand focus back to the text area
      textInput.focus();
    });

    // Generate voice
    generateBtn.addEventListener('click', function () {
      const text = textInput.value.trim();
      if (!text) {
        alert('Please enter some text to convert to speech.');
        return;
      }

      // Cancel a delayed autoplay from the previous result and stop its audio;
      // otherwise the old clip would keep sounding while its player is hidden.
      clearTimeout(autoplayTimer);
      audioPlayer.pause();

      // Show loading state
      setGenerating(true);
      audioPlayerContainer.classList.add('hidden');
      emptyState.classList.add('hidden');

      // Simulate API call (in a real app, this would be a fetch or axios call)
      simulateAPICall(text, voiceSelect.value, speedSelect.value);
    });

    // Download audio
    downloadBtn.addEventListener('click', function () {
      if (!audioPlayer.src) {
        return; // nothing has been generated yet
      }
      const a = document.createElement('a');
      a.href = audioPlayer.src;
      a.download = `lahja-ai-voice-${Date.now()}.mp3`;
      // Browsers ignore `download` for cross-origin URLs and navigate instead.
      // Opening in a new tab keeps this page (and the typed text) intact then.
      a.target = '_blank';
      a.rel = 'noopener';
      document.body.appendChild(a);
      a.click();
      document.body.removeChild(a);
    });

    /**
     * Simulate the speech-generation request (replace with an actual API call in production).
     *
     * After SIMULATED_LATENCY_MS it updates the info line, points the audio
     * element at a placeholder MP3, swaps the loading panel for the player and,
     * shortly afterwards, attempts to start playback.
     *
     * @param {string} text  text to synthesize (only logged by the simulation)
     * @param {string} voice value of the selected voice option
     * @param {string} speed value of the selected speed option
     */
    function simulateAPICall(text, voice, speed) {
      console.log(`Making API call with text: "${text}", voice: ${voice}, speed: ${speed}`);

      // Simulate network delay
      setTimeout(() => {
        // In a real app, you would:
        // 1. Make a POST request to your API endpoint
        // 2. Handle the response with the audio URL
        // 3. Set the audio player source

        // Update audio info; fall back to the raw value if it has no label
        const voiceLabel = VOICE_LABELS[voice] || voice;
        const speedLabel = SPEED_LABELS[speed] || speed;
        audioInfo.textContent = `${voiceLabel} • ${speedLabel} speed`;

        // Set audio source (in a real app, this would come from the API response)
        audioPlayer.src = 'https://www.soundhelix.com/examples/mp3/SoundHelix-Song-1.mp3';

        // Hide loading, show audio player, re-enable the Generate button
        setGenerating(false);
        audioPlayerContainer.classList.remove('hidden');

        // Play audio automatically; browsers may reject play() under their autoplay policy
        autoplayTimer = setTimeout(() => {
          audioPlayer.play().catch(e => console.log('Autoplay prevented:', e));
        }, AUTOPLAY_DELAY_MS);
      }, SIMULATED_LATENCY_MS);
    }

    // Initialize counter and clear-button visibility for whatever the textarea holds on load
    refreshCharCount();
  });
</script>
<!-- "Made with DeepSite" attribution badge, fixed to the bottom-left corner of the viewport -->
<p style="border-radius: 8px; text-align: center; font-size: 12px; color: #fff; margin-top: 16px;position: fixed; left: 8px; bottom: 8px; z-index: 10; background: rgba(0, 0, 0, 0.8); padding: 4px 8px;">
  Made with
  <!-- width/height attributes reserve the logo's space before it loads; links opened in a new tab get rel="noopener" -->
  <img src="https://enzostvs-deepsite.hf.space/logo.svg" alt="DeepSite Logo" width="16" height="16" style="width: 16px; height: 16px; vertical-align: middle;display:inline-block;margin-right:3px;filter:brightness(0) invert(1);"><a href="https://enzostvs-deepsite.hf.space" style="color: #fff;text-decoration: underline;" target="_blank" rel="noopener">DeepSite</a>
  - 🧬
  <a href="https://enzostvs-deepsite.hf.space?remix=wasmdashai/mywap" style="color: #fff;text-decoration: underline;" target="_blank" rel="noopener">Remix</a>
</p>
</body>
</html> |