import gradio as gr
from transformers import pipeline
from pydub import AudioSegment
import os
import tempfile

# יצירת pipeline לתמלול ולסיכום
transcriber = pipeline("automatic-speech-recognition", model="openai/whisper-base")
summarizer = pipeline("summarization", model="facebook/bart-large-cnn")

def summarize_audio_or_video(file_path):
    try:
        # בדיקה אם הקובץ הוא וידאו והמרת וידאו לאודיו במידת הצורך
        if file_path.endswith((".mp4", ".mov", ".avi", ".mkv")):
            audio_file = convert_video_to_audio(file_path)
        else:
            audio_file = file_path

        # תמלול האודיו
        transcript = transcriber(audio_file)["text"]

        # יצירת סיכום של התמלול
        summary = summarizer(transcript, max_length=50, min_length=25, do_sample=False)[0]["summary_text"]
        
        # מחיקת קובץ האודיו במידת הצורך (אם היה וידאו)
        if audio_file != file_path:
            os.remove(audio_file)

        return summary

    except Exception as e:
        return f"שגיאה בעיבוד הקובץ: {str(e)}"

def convert_video_to_audio(video_file):
    # יצירת קובץ אודיו זמני
    temp_audio = tempfile.mktemp(suffix=".wav")
    video = AudioSegment.from_file(video_file)
    video.export(temp_audio, format="wav")
    return temp_audio

# הגדרת ממשק Gradio
interface = gr.Interface(
    fn=summarize_audio_or_video,
    inputs=gr.Audio(type="filepath"),  # מתאים לאודיו ווידאו
    outputs="text",
    title="ממיר אודיו/וידאו לסיכום",
    description="העלה קובץ אודיו או וידאו של מרצה וקבל סיכום קצר של התוכן."
)

if __name__ == "__main__":
    interface.launch()