Spaces:

EduTechTeam
/

Speech2MSummary

Running

App Files Files Community

John Liao committed on Aug 3, 2024

Commit

5cfb839

verified ·

1 Parent(s): e8e93a8

Update app.py

Browse files

Files changed (1) hide show

app.py +38 -2

app.py CHANGED Viewed

@@ -1,5 +1,7 @@
 import subprocess
 import sys
 try:
     import openai
@@ -25,6 +27,40 @@ def openai_api(prompt, key):
       )
   return completion.choices[0].message.content
 def setup_gradio_interface():
     with gr.Blocks() as demo:
           gr.Markdown("音頻轉文字，並擷取重點")
@@ -37,12 +73,12 @@ def setup_gradio_interface():
                   with gr.Row():
                           content = gr.Textbox(label="第五步：檢視轉譯逐字稿", value="轉譯逐字稿")
                           submit2_button = gr.Button("第六步：開始重點摘錄")
-                          summary = gr.Textbox(label="第七步：輸出重點摘錄", value="重點摘錄")
                           file_output2_txt = gr.File(label="第八步：下載重點摘錄(Optional)")
           def transcribe_and_download(file, key):
                   if file is not None:
-                          txt_content = transcribe(file,key)
                           txt_path = "transcribe.txt"
                           with open(txt_path, "w") as txt_file:
                               txt_file.write(txt_content)

 import subprocess
 import sys
+import os
+from pydub import AudioSegment
 try:
     import openai
       )
   return completion.choices[0].message.content
+def transcribe_large_audio(filename, key, segment_length_ms = 30 * 60 *1000):
+    def get_file_size_in_mb(file_path):
+        return os.path.getsize(file_path) / (1024 * 1024)
+    def split_audio_file(file_path, segment_length_ms = 30 * 60 *1000):
+        audio = AudioSegment.from_file(filename, format="mp3")
+        segment_filenames = []
+        for i in range(0, len(audio), segment_length_ms):
+            end = min(i + segment_length_ms, len(audio))
+            segment = audio[i:end]
+            segment_filename = f"{file_path}_part{len(segment_filenames) + 1}.mp3"
+            segment.export(segment_filename, format="mp3", bitrate="36k")
+            segment_filenames.append(segment_filename)
+        return segment_filenames
+    openai.api_key = key
+    transcript_txt = ""
+    if get_file_size_in_mb(filename) > 25:
+        # Split the audio file if it exceeds the chunk size
+        audio_chunks = split_audio_file(filename)
+        print(audio_chunks)
+        # Process each chunk separately
+        for chunk_filename in audio_chunks:
+            print(chunk_filename)
+            transcript_txt += transcribe(chunk_filename, key)
+            # Remove the temporary chunk file
+            os.remove(chunk_filename)
+    else:
+        transcript_txt = transcribe(filename, key)
+    return transcript_txt
 def setup_gradio_interface():
     with gr.Blocks() as demo:
           gr.Markdown("音頻轉文字，並擷取重點")
                   with gr.Row():
                           content = gr.Textbox(label="第五步：檢視轉譯逐字稿", value="轉譯逐字稿")
                           submit2_button = gr.Button("第六步：開始重點摘錄")
+                          summary = gr.Textbox(label="第七步：輸出重點摘錄(Markdown格式)", value="重點摘錄")
                           file_output2_txt = gr.File(label="第八步：下載重點摘錄(Optional)")
           def transcribe_and_download(file, key):
                   if file is not None:
+                          txt_content = transcribe_large_audio(file,key)
                           txt_path = "transcribe.txt"
                           with open(txt_path, "w") as txt_file:
                               txt_file.write(txt_content)