video-ffmpeg

Sleeping

App Files Community

Tim13ekd committed 6 days ago

Commit

b6a8e09

verified ·

1 Parent(s): 0b567d9

Update app.py

Browse files

Files changed (1) hide show

app.py +13 -18

app.py CHANGED Viewed

@@ -20,25 +20,22 @@ def save_temp_audio(audio_file):
     """
     Speichert die hochgeladene Datei sicher mit korrekter Endung in einem temporären Verzeichnis.
     """
-    # Wenn audio_file ein NamedString (Byte-Inhalt) ist
-    if isinstance(audio_file, str):  # Gradio gibt es als NamedString zurück, wenn es sich um einen String handelt
-        # Hier können wir die Datei als binären Inhalt behandeln
         ext = Path(audio_file).suffix
         if ext.lower() not in allowed_audios:
             ext = ".mp3"  # Standard, falls Endung fehlt
         temp_audio = Path(tempfile.mkdtemp()) / f"input{ext}"
         with open(temp_audio, "wb") as f:
-            f.write(audio_file.encode())  # Binäre Datei schreiben
         return temp_audio
-    elif hasattr(audio_file, 'name'):  # Wenn es sich um eine echte Datei handelt
         ext = Path(audio_file.name).suffix
         if ext.lower() not in allowed_audios:
-            ext = ".mp3"  # Standard, falls Endung fehlt
         temp_audio = Path(tempfile.mkdtemp()) / f"input{ext}"
-        audio_file.seek(0)  # Setzt den Zeiger zurück
         with open(temp_audio, "wb") as f:
-            shutil.copyfileobj(audio_file, f)  # Kopiere den Inhalt der Datei
         return temp_audio
     else:
         raise ValueError("Das übergebene Audio ist kein gültiges Dateiformat oder NamedString.")
@@ -66,7 +63,7 @@ def transcribe_audio(audio_file):
     }
     try:
         response = requests.post(API_URL, json=payload)
-        response.raise_for_status()  # Dies wird eine Ausnahme werfen, wenn die Antwort ein Fehler ist
     except requests.RequestException as e:
         return None, f"❌ API Fehler: {e}"
@@ -74,7 +71,7 @@ def transcribe_audio(audio_file):
     text = result['choices'][0]['message']['content']
     return text
-def generate_slideshow_with_audio(images, audio_file, duration_per_image=3, y_pos=0.5, fade_duration=0.7, font_size=60):
     if not images:
         return None, "❌ Keine Bilder ausgewählt"
@@ -82,7 +79,6 @@ def generate_slideshow_with_audio(images, audio_file, duration_per_image=3, y_po
     temp_dir = tempfile.mkdtemp()
     clips = []
-    # Transkription, falls Audio vorhanden
     if audio_file:
         transcript, err = transcribe_audio(audio_file)
         if err:
@@ -100,9 +96,8 @@ def generate_slideshow_with_audio(images, audio_file, duration_per_image=3, y_po
         texts = [""] * len(images)
         temp_audio_file = None
-    # Einzelne Clips erstellen
     for i, img_path in enumerate(images):
-        img_path = Path(img_path.name)  # Hier muss .name verwendet werden, da Gradio temporäre Dateien liefert
         clip_path = Path(temp_dir) / f"clip_{i}.mp4"
         text = texts[i] if i < len(texts) else ""
@@ -113,8 +108,7 @@ def generate_slideshow_with_audio(images, audio_file, duration_per_image=3, y_po
         )
         if text:
-            # Escape problematischer Zeichen für FFmpeg
-            safe_text = shlex.quote(text)  # Sichere Textverarbeitung
             drawtext_filter = (
                 f",drawtext=text={safe_text}:fontcolor=white:fontsize={font_size}:borderw=2:"
                 f"x=(w-text_w)/2:y=(h-text_h)*{y_pos}:"
@@ -160,7 +154,6 @@ def generate_slideshow_with_audio(images, audio_file, duration_per_image=3, y_po
     except subprocess.CalledProcessError as e:
         return None, f"❌ FFmpeg Concat Fehler:\n{e.stderr}"
-    # Audio hinzufügen, falls vorhanden
     if temp_audio_file:
         final_output = Path(temp_dir) / f"slideshow_audio_{uuid.uuid4().hex}.mp4"
         cmd_audio = [
@@ -194,13 +187,15 @@ with gr.Blocks() as demo:
     fade_input = gr.Number(value=0.7, label="Fade Dauer in Sekunden", precision=1)
     ypos_input = gr.Slider(minimum=0.0, maximum=0.9, step=0.01, value=0.5, label="Y-Position für alle Texte (0=oben, 0.5=mitte, 0.9=unten)")
     font_size_input = gr.Number(value=60, label="Textgröße (px)")
     out_video = gr.Video(interactive=False, label="Generiertes Video")
     status = gr.Textbox(interactive=False, label="Status")
     btn = gr.Button("Video erstellen")
     btn.click(
         fn=generate_slideshow_with_audio,
-        inputs=[img_input, audio_input, duration_input, ypos_input, fade_input, font_size_input],
         outputs=[out_video, status]
     )

     """
     Speichert die hochgeladene Datei sicher mit korrekter Endung in einem temporären Verzeichnis.
     """
+    if isinstance(audio_file, str):
         ext = Path(audio_file).suffix
         if ext.lower() not in allowed_audios:
             ext = ".mp3"  # Standard, falls Endung fehlt
         temp_audio = Path(tempfile.mkdtemp()) / f"input{ext}"
         with open(temp_audio, "wb") as f:
+            f.write(audio_file.encode())
         return temp_audio
+    elif hasattr(audio_file, 'name'):
         ext = Path(audio_file.name).suffix
         if ext.lower() not in allowed_audios:
+            ext = ".mp3"
         temp_audio = Path(tempfile.mkdtemp()) / f"input{ext}"
+        audio_file.seek(0)
         with open(temp_audio, "wb") as f:
+            shutil.copyfileobj(audio_file, f)
         return temp_audio
     else:
         raise ValueError("Das übergebene Audio ist kein gültiges Dateiformat oder NamedString.")
     }
     try:
         response = requests.post(API_URL, json=payload)
+        response.raise_for_status()
     except requests.RequestException as e:
         return None, f"❌ API Fehler: {e}"
     text = result['choices'][0]['message']['content']
     return text
+def generate_slideshow_with_audio(images, audio_file, duration_per_image=3, y_pos=0.5, fade_duration=0.7, font_size=60, speed=1.0):
     if not images:
         return None, "❌ Keine Bilder ausgewählt"
     temp_dir = tempfile.mkdtemp()
     clips = []
     if audio_file:
         transcript, err = transcribe_audio(audio_file)
         if err:
         texts = [""] * len(images)
         temp_audio_file = None
     for i, img_path in enumerate(images):
+        img_path = Path(img_path.name)  # Gradio liefert temporäre Dateipfade
         clip_path = Path(temp_dir) / f"clip_{i}.mp4"
         text = texts[i] if i < len(texts) else ""
         )
         if text:
+            safe_text = shlex.quote(text)
             drawtext_filter = (
                 f",drawtext=text={safe_text}:fontcolor=white:fontsize={font_size}:borderw=2:"
                 f"x=(w-text_w)/2:y=(h-text_h)*{y_pos}:"
     except subprocess.CalledProcessError as e:
         return None, f"❌ FFmpeg Concat Fehler:\n{e.stderr}"
     if temp_audio_file:
         final_output = Path(temp_dir) / f"slideshow_audio_{uuid.uuid4().hex}.mp4"
         cmd_audio = [
     fade_input = gr.Number(value=0.7, label="Fade Dauer in Sekunden", precision=1)
     ypos_input = gr.Slider(minimum=0.0, maximum=0.9, step=0.01, value=0.5, label="Y-Position für alle Texte (0=oben, 0.5=mitte, 0.9=unten)")
     font_size_input = gr.Number(value=60, label="Textgröße (px)")
+    speed_input = gr.Slider(minimum=0.1, maximum=3.0, value=1.0, label="Geschwindigkeit der Texteinblendung")
     out_video = gr.Video(interactive=False, label="Generiertes Video")
     status = gr.Textbox(interactive=False, label="Status")
     btn = gr.Button("Video erstellen")
     btn.click(
         fn=generate_slideshow_with_audio,
+        inputs=[img_input, audio_input, duration_input, ypos_input, fade_input, font_size_input, speed_input],
         outputs=[out_video, status]
     )