import gradio as gr
from faster_whisper import WhisperModel
from pydub import AudioSegment
import os
import tempfile
from transformers import pipeline

# Set up the transcription model
model = WhisperModel("ivrit-ai/faster-whisper-v2-d4")

# Set up the summarization pipeline
summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
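# Note: facebook/bart-large-cnn is an English summarization model (CNN/DailyMail),
# so summary quality on Hebrew transcripts may be limited.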

def transcribe_and_summarize(file_path):
    try:
        # If the file is a video, convert it to audio first
        if file_path.endswith((".mp4", ".mov", ".avi", ".mkv")):
            audio_file = convert_video_to_audio(file_path)
        else:
            audio_file = file_path

        # Transcribe the audio
        segments, _ = model.transcribe(audio_file, language="he")
        transcript = " ".join([segment.text for segment in segments])

        # Summarize the transcript
        summary = summarizer(transcript, max_length=50, min_length=25, do_sample=False)[0]["summary_text"]
        # Delete the temporary audio file if one was created (video input)
        if audio_file != file_path:
            os.remove(audio_file)

        return transcript, summary

    except Exception as e:
        return f"ืฉื’ื™ืื” ื‘ืขื™ื‘ื•ื“ ื”ืงื•ื‘ืฅ: {str(e)}", ""

def convert_video_to_audio(video_file):
    # Create a temporary audio file and export the extracted audio track to it
    with tempfile.NamedTemporaryFile(suffix=".wav", delete=False) as tmp:
        temp_audio = tmp.name
    audio = AudioSegment.from_file(video_file)
    audio.export(temp_audio, format="wav")
    return temp_audio
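
# Optional sketch (not part of the original script): facebook/bart-large-cnn accepts
# roughly 1024 input tokens, so a full lecture transcript may exceed its limit. A
# hypothetical chunked variant could look like this; summarize_long_transcript and
# chunk_chars are assumed names/values, not taken from the original code.
def summarize_long_transcript(text, chunk_chars=3000):
    # Split the transcript into fixed-size character chunks (a rough token proxy)
    chunks = [text[i:i + chunk_chars] for i in range(0, len(text), chunk_chars)]
    # Summarize each chunk separately, then join the partial summaries
    partial_summaries = [
        summarizer(chunk, max_length=50, min_length=25, do_sample=False)[0]["summary_text"]
        for chunk in chunks
    ]
    return " ".join(partial_summaries)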

# Set up the Gradio interface
interface = gr.Interface(
    fn=transcribe_and_summarize,
    inputs=gr.File(type="filepath"),  # gr.File accepts video uploads as well as audio
    outputs=[
        gr.Textbox(label="ืชืžืœื•ืœ"),
        gr.Textbox(label="ืกื™ื›ื•ื")
    ],
    title="ืžืžื™ืจ ืื•ื“ื™ื•/ื•ื™ื“ืื• ืœืชืžืœื•ืœ ื•ืกื™ื›ื•ื",
    description="ื”ืขืœื” ืงื•ื‘ืฅ ืื•ื“ื™ื• ืื• ื•ื™ื“ืื• ืฉืœ ืžืจืฆื” ื•ืงื‘ืœ ืชืžืœื•ืœ ืžืœื ื•ืกื™ื›ื•ื ืงืฆืจ ืฉืœ ื”ืชื•ื›ืŸ."
)

if __name__ == "__main__":
    interface.launch()
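
# Example usage (assumed, for local testing without the UI); "lecture.mp4" is a
# placeholder path, not a file shipped with this project:
#   transcript, summary = transcribe_and_summarize("lecture.mp4")
#   print(summary)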