whisper-large-v3-1-1

Runtime error

App Files Files Community

danielwm994 committed on Oct 16, 2024

Commit

2490630

verified ·

1 Parent(s): be67183

Update app.py

Browse files

Files changed (1) hide show

app.py +32 -7

app.py CHANGED Viewed

@@ -8,6 +8,8 @@ from transformers.pipelines.audio_utils import ffmpeg_read
 import tempfile
 import os
 MODEL_NAME = "openai/whisper-large-v3"
 BATCH_SIZE = 8
@@ -25,8 +27,6 @@ pipe = pipeline(
 @spaces.GPU
-import re
 def transcribe(inputs, task):
     if inputs is None:
         raise gr.Error("No audio file submitted! Please upload or record an audio file before submitting your request.")
@@ -65,8 +65,6 @@ def transcribe(inputs, task):
     return " ".join(final_text), timestamp_str
 def _return_yt_html_embed(yt_url):
     video_id = yt_url.split("?v=")[-1]
     HTML_str = (
@@ -75,6 +73,7 @@ def _return_yt_html_embed(yt_url):
     )
     return HTML_str
 def download_yt_audio(yt_url, filename):
     info_loader = youtube_dl.YoutubeDL()
@@ -106,6 +105,7 @@ def download_yt_audio(yt_url, filename):
         except youtube_dl.utils.ExtractorError as err:
             raise gr.Error(str(err))
 @spaces.GPU
 def yt_transcribe(yt_url, task, max_filesize=75.0):
     html_embed_str = _return_yt_html_embed(yt_url)
@@ -123,9 +123,34 @@ def yt_transcribe(yt_url, task, max_filesize=75.0):
     text = result["text"]
     timestamps = result["chunks"]
-    timestamp_str = "\n".join([f"[{chunk['timestamp']}] {chunk['text']}" for chunk in timestamps])
-    return html_embed_str, text, timestamp_str
 demo = gr.Blocks()

 import tempfile
 import os
+import re
+import time
 MODEL_NAME = "openai/whisper-large-v3"
 BATCH_SIZE = 8
 @spaces.GPU
 def transcribe(inputs, task):
     if inputs is None:
         raise gr.Error("No audio file submitted! Please upload or record an audio file before submitting your request.")
     return " ".join(final_text), timestamp_str
 def _return_yt_html_embed(yt_url):
     video_id = yt_url.split("?v=")[-1]
     HTML_str = (
     )
     return HTML_str
 def download_yt_audio(yt_url, filename):
     info_loader = youtube_dl.YoutubeDL()
         except youtube_dl.utils.ExtractorError as err:
             raise gr.Error(str(err))
 @spaces.GPU
 def yt_transcribe(yt_url, task, max_filesize=75.0):
     html_embed_str = _return_yt_html_embed(yt_url)
     text = result["text"]
     timestamps = result["chunks"]
+    # List for storing the texts with the correct separators
+    final_text = []
+    timestamp_str = ""
+    current_chunk = []
+    current_timestamp = None
+    for chunk in timestamps:
+        # Text of the current chunk
+        chunk_text = chunk["text"]
+        chunk_timestamp = chunk["timestamp"]
+        # Check whether the text ends with a period, exclamation mark, or question mark
+        if re.search(r'[.!?]$', chunk_text):
+            current_chunk.append(chunk_text)
+            final_text.append(" ".join(current_chunk))
+            timestamp_str += f"[{chunk_timestamp}] " + " ".join(current_chunk) + "\n"
+            current_chunk = []
+        else:
+            # If the text is not finished yet, accumulate it in the current chunk
+            current_chunk.append(chunk_text)
+    # If unfinished chunks remain (e.g. the last piece of text does not end with punctuation)
+    if current_chunk:
+        final_text.append(" ".join(current_chunk))
+        timestamp_str += f"[{chunk_timestamp}] " + " ".join(current_chunk) + "\n"
+    return html_embed_str, " ".join(final_text), timestamp_str
 demo = gr.Blocks()