insta-maker-2

Sleeping

App Files Files Community

hivecorp committed on Mar 19

Commit

4c25f4a

verified ·

1 Parent(s): 9ecdae1

Update app.py

Browse files

Files changed (1) hide show

app.py +52 -8

app.py CHANGED Viewed

@@ -13,7 +13,6 @@ import hashlib
 import json
 from pathlib import Path
 from tqdm.asyncio import tqdm
-import ssml.builder as ssml
 class TimingManager:
     def __init__(self):
@@ -206,17 +205,62 @@ class AudioCache:
         cache_file = self.cache_dir / f"{cache_key}.wav"
         audio.export(str(cache_file), format="wav")
 class SpeechEnhancer:
     @staticmethod
     def add_speech_marks(text: str) -> str:
         """Add SSML marks for better speech control"""
-        speech = ssml.Speech()
-        # Add prosody and breaks for natural speech
-        speech.prosody(rate="medium", pitch="medium", volume="medium")
-        for sentence in text.split('. '):
-            speech.p(sentence.strip())
-            speech.break_("medium")
-        return str(speech)
     @staticmethod
     def enhance_timing(segment: Segment) -> Segment:

 import json
 from pathlib import Path
 from tqdm.asyncio import tqdm
 class TimingManager:
     def __init__(self):
         cache_file = self.cache_dir / f"{cache_key}.wav"
         audio.export(str(cache_file), format="wav")
class SSMLBuilder:
    """Fluent builder that assembles an SSML ``<speak>`` document.

    Each ``add_*`` method appends one serialized fragment to ``content`` and
    returns the builder so calls can be chained. ``str(builder)`` wraps the
    fragments, in insertion order, in the XML declaration and ``<speak>``
    root element.

    Text and attribute values are XML-escaped before being stored, so input
    containing ``&``, ``<``, ``>`` or ``"`` cannot produce a malformed
    document or inject markup.
    """

    def __init__(self):
        # Already-serialized SSML fragments, in output order.
        self.content = []

    @staticmethod
    def _escape(value: str, *, attribute: bool = False) -> str:
        """Return *value* escaped for use as XML text or an attribute value."""
        # Imported locally so the class does not depend on a module-level
        # import being present in the file.
        from xml.sax.saxutils import escape

        # Attribute values are always wrapped in double quotes below, so the
        # double quote must be escaped as well.
        return escape(value, {'"': "&quot;"} if attribute else {})

    def add_text(self, text: str) -> "SSMLBuilder":
        """Append *text* as escaped character data and return the builder."""
        self.content.append(self._escape(text))
        return self

    def add_break(self, strength: str = "medium") -> "SSMLBuilder":
        """Append a ``<break>`` element with the given *strength*."""
        strength_attr = self._escape(strength, attribute=True)
        self.content.append(f'<break strength="{strength_attr}"/>')
        return self

    def add_prosody(
        self, text: str, rate: str = "medium", pitch: str = "medium"
    ) -> "SSMLBuilder":
        """Append *text* wrapped in ``<prosody>`` with *rate* and *pitch*."""
        rate_attr = self._escape(rate, attribute=True)
        pitch_attr = self._escape(pitch, attribute=True)
        self.content.append(
            f'<prosody rate="{rate_attr}" pitch="{pitch_attr}">'
            f'{self._escape(text)}</prosody>'
        )
        return self

    def add_sentence(self, text: str) -> "SSMLBuilder":
        """Append *text* wrapped in an ``<s>`` (sentence) element."""
        self.content.append(f'<s>{self._escape(text)}</s>')
        return self

    def __str__(self) -> str:
        """Serialize the accumulated fragments as a complete SSML document."""
        return (
            '<?xml version="1.0"?>'
            '<speak version="1.0" xmlns="http://www.w3.org/2001/10/synthesis">'
            f'{"".join(self.content)}'
            '</speak>'
        )
 class SpeechEnhancer:
     @staticmethod
     def add_speech_marks(text: str) -> str:
         """Add SSML marks for better speech control"""
+        ssml = SSMLBuilder()
+        # Split text and add appropriate SSML tags
+        sentences = text.split('. ')
+        for i, sentence in enumerate(sentences):
+            sentence = sentence.strip()
+            if not sentence:
+                continue
+            ssml.add_sentence(sentence)
+            # Add appropriate breaks between sentences
+            if i < len(sentences) - 1:
+                ssml.add_break("strong")
+            # Add breaks at commas
+            if ',' in sentence:
+                parts = sentence.split(',')
+                for part in parts[:-1]:
+                    ssml.add_break("medium")
+        return str(ssml)
     @staticmethod
     def enhance_timing(segment: Segment) -> Segment: