Spaces:

Merlintxu
/

audio-transcription-app

Sleeping

Merlintxu committed 22 days ago

Commit

0bab575

•

1 Parent(s): f88c1d0

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,5 +1,7 @@
 import gradio as gr
 from transformers import pipeline
 import requests
 import os
@@ -16,6 +18,21 @@ def download_from_url(url):
                 f.write(chunk)
     return local_filename
 # Función para procesar el archivo o la URL
 def transcribe_audio(file=None, url=None):
     try:
@@ -27,10 +44,16 @@ def transcribe_audio(file=None, url=None):
         else:
             return "No se ha proporcionado un archivo ni un enlace."
-        # Realiza la transcripción
-        result = asr_pipeline(file_path)
-        transcription = result['text']
-        return transcription
     except Exception as e:
         return f"Error durante la transcripción: {str(e)}"

 import gradio as gr
 from transformers import pipeline
+import librosa
+import soundfile as sf
 import requests
 import os
                 f.write(chunk)
     return local_filename
+# Función para dividir un archivo de audio en fragmentos de tamaño manejable
+def split_audio(file_path, segment_duration=30):
+    y, sr = librosa.load(file_path, sr=None)
+    total_duration = librosa.get_duration(y=y, sr=sr)
+    segments = []
+    for start in range(0, int(total_duration), segment_duration):
+        end = min(start + segment_duration, int(total_duration))
+        segment = y[start * sr: end * sr]
+        segment_path = f"{file_path}_segment_{start}-{end}.wav"
+        sf.write(segment_path, segment, sr)
+        segments.append(segment_path)
+    return segments
 # Función para procesar el archivo o la URL
 def transcribe_audio(file=None, url=None):
     try:
         else:
             return "No se ha proporcionado un archivo ni un enlace."
+        # Dividir el archivo en segmentos de 30 segundos
+        segments = split_audio(file_path)
+        # Transcribir cada segmento y concatenar los resultados
+        transcriptions = []
+        for segment in segments:
+            result = asr_pipeline(segment, return_timestamps=True)
+            transcriptions.append(result['text'])
+        return " ".join(transcriptions)
     except Exception as e:
         return f"Error durante la transcripción: {str(e)}"