Spaces:

neuralworm
/

video_transcription

Running

App Files Files Community

neuralworm committed 5 days ago

Commit

abecc06

verified ·

1 Parent(s): f862cfc

Update app.py

Browse files

Files changed (1) hide show

app.py +73 -36

app.py CHANGED Viewed

@@ -27,13 +27,19 @@ from pathlib import Path
 from datetime import timedelta
 import socket
 import urllib.request
 import gradio as gr
 try:
     import whisper
-except Exception:
     whisper = None
 # ---------------------------------------------------------------------------
 # Helper: Shell
@@ -43,25 +49,67 @@ def run_capture(cmd):
     """Run a command and return stdout; raise RuntimeError with readable stderr on failure."""
     result = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
     if result.returncode != 0:
-        stderr_text = result.stderr or ""  # Keep only tail to avoid massive logs
         tail = stderr_text[-2000:]
-        # KORRIGIERT: Fehlermeldung korrekt zusammengebaut und abgeschlossen.
         raise RuntimeError("Command failed: " + " ".join(cmd) + " " + tail)
     return result.stdout
 # ---------------------------------------------------------------------------
-# Download & Audio
 # ---------------------------------------------------------------------------
 def download_video_with_ytdlp(url, out_dir, cookies_path=None, format_selector=None):
-    """Download a video with yt-dlp into out_dir and return the video path."""
     out_template = str(Path(out_dir) / "%(title)s.%(ext)s")
     cmd = ["yt-dlp", "-o", out_template]
     if format_selector:
         cmd += ["-f", format_selector]
     if cookies_path:
         cmd += ["--cookies", cookies_path]
     cmd.append(url)
     try:
         run_capture(cmd)
@@ -69,9 +117,8 @@ def download_video_with_ytdlp(url, out_dir, cookies_path=None, format_selector=N
         msg = str(e)
         if "Failed to resolve" in msg or "Name or service not known" in msg:
             raise RuntimeError(
-                "DNS/Internet-Problem: Der Space kann den Host nicht auflösen. "
-                "URL-Download ist hier nicht möglich. Bitte Videodatei direkt hochladen "
-                "oder den Space in einer Umgebung mit Internet/DNS-Freigabe ausführen."
             )
         raise
@@ -80,11 +127,15 @@ def download_video_with_ytdlp(url, out_dir, cookies_path=None, format_selector=N
         raise FileNotFoundError("Download fehlgeschlagen — keine Datei gefunden.")
     return str(files[0])
 def extract_audio_ffmpeg(video_path, out_wav):
     """Extract the audio of *video_path* into a mono 16 kHz WAV file.

     ffmpeg is run with its stdout and stderr discarded.  Because of
     ``check=True`` a non-zero ffmpeg exit status raises
     ``subprocess.CalledProcessError``.

     Returns:
         *out_wav*, unchanged, so the call can be chained.
     """
     ffmpeg_args = [
         "ffmpeg", "-y",        # overwrite an existing output file
         "-i", video_path,
         "-vn",                 # no video stream in the output
         "-ac", "1",            # one audio channel
         "-ar", "16000",        # 16 kHz sample rate
         "-f", "wav",
         out_wav,
     ]
     subprocess.run(
         ffmpeg_args,
         check=True,
         stdout=subprocess.DEVNULL,
         stderr=subprocess.DEVNULL,
     )
     return out_wav
 # ---------------------------------------------------------------------------
 # Zeit- und Format-Helfer
 # ---------------------------------------------------------------------------
@@ -104,33 +155,24 @@ def format_timestamp_vtt(s):
     return f"{hours:02d}:{minutes:02d}:{seconds:02d}.{ms:03d}"
 def segments_to_srt(segments):
-    """Formats transcript segments into a valid SRT string."""
     parts = []
     for i, seg in enumerate(segments, start=1):
         start = seconds_to_timestamp(seg['start'])
         end = seconds_to_timestamp(seg['end'])
         text = seg['text'].strip()
-        # KORRIGIERT: Korrektes SRT-Blockformat mit Zeilenumbrüchen.
         parts.append(f"{i}\n{start} --> {end}\n{text}")
-    # KORRIGIERT: Blöcke mit zwei Zeilenumbrüchen verbinden, um gültiges SRT zu erzeugen.
     return "\n\n".join(parts) + "\n\n"
 def segments_to_vtt(segments):
-    """Formats transcript segments into a valid VTT string."""
-    # KORRIGIERT: Korrekter Header mit nachfolgendem Zeilenumbruch.
     parts = ["WEBVTT\n"]
     for seg in segments:
         start = format_timestamp_vtt(seg['start'])
         end = format_timestamp_vtt(seg['end'])
         text = seg['text'].strip()
-        # KORRIGIERT: Korrektes VTT-Blockformat mit Zeilenumbruch.
         parts.append(f"{start} --> {end}\n{text}")
-    # KORRIGIERT: Blöcke mit zwei Zeilenumbrüchen verbinden.
     return "\n\n".join(parts)
 def segments_to_txt(segments):
-    """Formats segments to a readable plain text file."""
-    # VERBESSERT: Segmente mit Zeilenumbruch statt Leerzeichen für bessere Lesbarkeit trennen.
     return "\n".join([f"[{seconds_to_timestamp(seg['start'])}] {seg['text'].strip()}" for seg in segments])
 def segments_to_json(segments, language=None, metadata=None):
@@ -149,26 +191,21 @@ def transcribe_pipeline(file_obj, url, model_size, keep_video=False, cookies_fil
     tmpdir = tempfile.mkdtemp(prefix="whisper_space_")
     try:
-        # Quelle bestimmen
         if url:
             video_path = download_video_with_ytdlp(url, tmpdir, cookies_path=cookies_file, format_selector=format_selector)
         elif file_obj:
-            # Gradio übergibt ein temporäres Dateiobjekt, dessen .name Attribut der Pfad ist.
             video_path = file_obj.name
         else:
             return "Kein Video angegeben.", None, None, None, None, None
-        # Audio extrahieren
         audio_wav = str(Path(tmpdir) / "audio.wav")
         extract_audio_ffmpeg(video_path, audio_wav)
-        # Whisper laden & transkribieren
         model = whisper.load_model(model_size)
         result = model.transcribe(audio_wav, verbose=False)
         segments = result.get("segments", [])
         language = result.get("language", "unknown")
-        # Ausgaben erzeugen
         txt_text = segments_to_txt(segments)
         srt_text = segments_to_srt(segments)
         vtt_text = segments_to_vtt(segments)
@@ -197,11 +234,9 @@ def transcribe_pipeline(file_obj, url, model_size, keep_video=False, cookies_fil
 # ---------------------------------------------------------------------------
 def dns_internet_diag():
-    """Führt einige Basis-Checks aus und gibt einen Textreport zurück."""
     lines = []
-    # DNS-Checks
-    lines.append("=== DNS-Auflösung ===")
     for host in ["huggingface.co", "www.google.com", "www.instagram.com", "youtube.com"]:
         try:
             ip = socket.gethostbyname(host)
@@ -209,9 +244,17 @@ def dns_internet_diag():
         except Exception as e:
             lines.append(f"{host} -> ERROR: {e}")
-    # HTTP-Checks
     lines.append("\n\n=== HTTP-Requests (GET) ===")
-    for url in ["https://huggingface.co", "https://www.google.com", "https://www.instagram.com"]:
         try:
             with urllib.request.urlopen(url, timeout=5) as resp:
                 code = getattr(resp, "status", None) or resp.getcode()
@@ -219,7 +262,6 @@ def dns_internet_diag():
         except Exception as e:
             lines.append(f"{url} -> ERROR: {e}")
-    # yt-dlp
     lines.append("\n\n=== yt-dlp ===")
     try:
         out = run_capture(["yt-dlp", "--version"])
@@ -227,7 +269,6 @@ def dns_internet_diag():
     except Exception as e:
         lines.append(f"yt-dlp Fehler: {e}")
-    # ffmpeg
     lines.append("\n\n=== ffmpeg ===")
     try:
         out = run_capture(["ffmpeg", "-version"])
@@ -264,10 +305,7 @@ with gr.Blocks() as demo:
                 json_dl = gr.File(label="JSON")
         def run_transcribe(f, u, m, k, c, fmt):
-            # KORRIGIERT: Korrekte Handhabung des Gradio-Dateiobjekts für Cookies.
-            # Wir holen den Pfad über das .name Attribut.
             cookies_path = c.name if c else None
             display, srtf, vttf, txtf, jsonf, meta = transcribe_pipeline(
                 f, u, m, k, cookies_file=cookies_path, format_selector=(fmt or None)
             )
@@ -288,11 +326,10 @@ with gr.Blocks() as demo:
     with gr.Tab("Netzwerk / DNS Diagnose"):
         gr.Markdown(
-            """Führt einfache Tests für DNS, HTTP sowie yt-dlp/ffmpeg aus.
-            Wenn z. B. www.instagram.com nicht auflösbar ist, liegt ein DNS-/Firewall-Problem vor.
-            Wenn Hugging Face / Google funktionieren, aber Instagram nicht, blockt vermutlich die Umgebung nur bestimmte Domains."""
         )
         diag_btn = gr.Button("Diagnose starten")
         diag_out = gr.Textbox(label="Diagnose-Ausgabe", lines=25)

 from datetime import timedelta
 import socket
 import urllib.request
+from urllib.parse import urlparse
 import gradio as gr
 try:
     import whisper
+except ImportError:
     whisper = None
+try:
+    from dns import resolver as dns_resolver
+except ImportError:
+    dns_resolver = None
 # ---------------------------------------------------------------------------
 # Helper: Shell
     """Run a command and return stdout; raise RuntimeError with readable stderr on failure."""
     result = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
     if result.returncode != 0:
+        stderr_text = result.stderr or ""
         tail = stderr_text[-2000:]
         raise RuntimeError("Command failed: " + " ".join(cmd) + " " + tail)
     return result.stdout
+# ---------------------------------------------------------------------------
+# NEUE FUNKTION: DNS-Auflösung via dnspython
+# ---------------------------------------------------------------------------
def resolve_hostname_with_dns_python(hostname):
    """Resolve *hostname* to an IPv4 address string, preferring public DNS.

    The lookup is sent to Google (8.8.8.8) and Cloudflare (1.1.1.1) through
    dnspython so that a broken or filtering local resolver can be bypassed.
    The system resolver is used instead when dnspython is not installed,
    when the public lookup raises, or when it yields no A record.

    Args:
        hostname: Host name to look up.

    Returns:
        The first resolved IPv4 address as text.

    Raises:
        Whatever ``socket.gethostbyname`` raises (typically
        ``socket.gaierror``) when the system-resolver fallback fails too.
    """
    if not dns_resolver:
        # dnspython is optional; without it only the system resolver is left.
        print("Warning: dnspython not found. Falling back to system DNS.")
        return socket.gethostbyname(hostname)
    try:
        # configure=False skips reading the system resolver configuration,
        # which is exactly what this function is meant to work around.
        resolver = dns_resolver.Resolver(configure=False)
        resolver.nameservers = ['8.8.8.8', '1.1.1.1']  # Google & Cloudflare DNS
        answers = resolver.resolve(hostname, 'A')
        if answers:
            return answers[0].to_text()
    except Exception as e:
        # Deliberate best effort: report the dnspython failure, then fall
        # through to the system resolver below.
        print(f"DNS resolution with dnspython failed for {hostname}: {e}")
    # Last resort. Errors from the system resolver propagate to the caller
    # instead of the function silently returning None.
    return socket.gethostbyname(hostname)
 # ---------------------------------------------------------------------------
+# MODIFIZIERTE FUNKTION: Download & Audio
 # ---------------------------------------------------------------------------
 def download_video_with_ytdlp(url, out_dir, cookies_path=None, format_selector=None):
+    """Download a video with yt-dlp, using custom DNS resolution if necessary."""
     out_template = str(Path(out_dir) / "%(title)s.%(ext)s")
     cmd = ["yt-dlp", "-o", out_template]
+    # DNS-Umgehung implementieren
+    try:
+        parsed_url = urlparse(url)
+        hostname = parsed_url.hostname
+        if hostname:
+            print(f"Resolving hostname: {hostname}")
+            ip_address = resolve_hostname_with_dns_python(hostname)
+            if ip_address:
+                print(f"Resolved {hostname} to {ip_address}. Using --resolve.")
+                # --resolve weist yt-dlp an, diese IP für den Hostnamen auf Port 443 zu verwenden
+                resolve_arg = f"{hostname}:443:{ip_address}"
+                cmd.extend(["--resolve", resolve_arg])
+    except Exception as e:
+        print(f"Could not perform custom DNS resolution, proceeding without it. Error: {e}")
     if format_selector:
         cmd += ["-f", format_selector]
     if cookies_path:
         cmd += ["--cookies", cookies_path]
     cmd.append(url)
+    print(f"Running command: {' '.join(cmd)}")
     try:
         run_capture(cmd)
         msg = str(e)
         if "Failed to resolve" in msg or "Name or service not known" in msg:
             raise RuntimeError(
+                "DNS/Internet-Problem: Der Host konnte nicht aufgelöst werden. "
+                "Selbst die DNS-Umgehung ist fehlgeschlagen. Möglicherweise blockiert eine Firewall auch die IP-Adressen."
             )
         raise
         raise FileNotFoundError("Download fehlgeschlagen — keine Datei gefunden.")
     return str(files[0])
 def extract_audio_ffmpeg(video_path, out_wav):
     """Extract the audio of *video_path* into a mono 16 kHz WAV file.

     ffmpeg is run with its stdout and stderr discarded.  Because of
     ``check=True`` a non-zero ffmpeg exit status raises
     ``subprocess.CalledProcessError``.

     Returns:
         *out_wav*, unchanged, so the call can be chained.
     """
     ffmpeg_args = [
         "ffmpeg", "-y",        # overwrite an existing output file
         "-i", video_path,
         "-vn",                 # no video stream in the output
         "-ac", "1",            # one audio channel
         "-ar", "16000",        # 16 kHz sample rate
         "-f", "wav",
         out_wav,
     ]
     subprocess.run(
         ffmpeg_args,
         check=True,
         stdout=subprocess.DEVNULL,
         stderr=subprocess.DEVNULL,
     )
     return out_wav
+# NOTE: The rest of the code, from "Zeit- und Format-Helfer" to the end of the file, is unchanged.
+# It is included here only for completeness.
 # ---------------------------------------------------------------------------
 # Zeit- und Format-Helfer
 # ---------------------------------------------------------------------------
     return f"{hours:02d}:{minutes:02d}:{seconds:02d}.{ms:03d}"
 def segments_to_srt(segments):
     """Render transcript segments as SubRip (SRT) text.

     Every segment becomes one cue, numbered from 1: an index line, a
     ``start --> end`` line whose times come from ``seconds_to_timestamp``,
     and the stripped segment text.  Cues are separated by one blank line
     and the result always ends with two newlines, even for no segments.

     Args:
         segments: Iterable of mappings with ``'start'``, ``'end'`` and
             ``'text'`` keys.

     Returns:
         The SRT document as a single string.
     """
     cues = [
         "{}\n{} --> {}\n{}".format(
             index,
             seconds_to_timestamp(segment['start']),
             seconds_to_timestamp(segment['end']),
             segment['text'].strip(),
         )
         for index, segment in enumerate(segments, start=1)
     ]
     return "\n\n".join(cues) + "\n\n"
 def segments_to_vtt(segments):
     """Render transcript segments as WebVTT text.

     The output starts with the ``WEBVTT`` header line.  Each segment then
     contributes a ``start --> end`` line, with times formatted by
     ``format_timestamp_vtt``, followed by the stripped segment text.
     Blocks are joined with a blank line; no trailing newline is appended
     after the last cue.

     Args:
         segments: Iterable of mappings with ``'start'``, ``'end'`` and
             ``'text'`` keys.

     Returns:
         The VTT document as a single string.
     """
     blocks = ["WEBVTT\n"]
     blocks.extend(
         "{} --> {}\n{}".format(
             format_timestamp_vtt(cue['start']),
             format_timestamp_vtt(cue['end']),
             cue['text'].strip(),
         )
         for cue in segments
     )
     return "\n\n".join(blocks)
 def segments_to_txt(segments):
     """Render transcript segments as plain text, one segment per line.

     Each line has the form ``[<timestamp>] <text>``, where the timestamp is
     ``seconds_to_timestamp`` applied to the segment start and the text is
     stripped of surrounding whitespace.

     Args:
         segments: Iterable of mappings with ``'start'`` and ``'text'`` keys.

     Returns:
         The lines joined with single newlines (empty string for no segments).
     """
     rendered = []
     for segment in segments:
         stamp = seconds_to_timestamp(segment['start'])
         rendered.append(f"[{stamp}] {segment['text'].strip()}")
     return "\n".join(rendered)
 def segments_to_json(segments, language=None, metadata=None):
     tmpdir = tempfile.mkdtemp(prefix="whisper_space_")
     try:
         if url:
             video_path = download_video_with_ytdlp(url, tmpdir, cookies_path=cookies_file, format_selector=format_selector)
         elif file_obj:
             video_path = file_obj.name
         else:
             return "Kein Video angegeben.", None, None, None, None, None
         audio_wav = str(Path(tmpdir) / "audio.wav")
         extract_audio_ffmpeg(video_path, audio_wav)
         model = whisper.load_model(model_size)
         result = model.transcribe(audio_wav, verbose=False)
         segments = result.get("segments", [])
         language = result.get("language", "unknown")
         txt_text = segments_to_txt(segments)
         srt_text = segments_to_srt(segments)
         vtt_text = segments_to_vtt(segments)
 # ---------------------------------------------------------------------------
 def dns_internet_diag():
     lines = []
+    lines.append("=== DNS-Auflösung (System) ===")
     for host in ["huggingface.co", "www.google.com", "www.instagram.com", "youtube.com"]:
         try:
             ip = socket.gethostbyname(host)
         except Exception as e:
             lines.append(f"{host} -> ERROR: {e}")
+    if dns_resolver:
+        lines.append("\n\n=== DNS-Auflösung (via dnspython mit 8.8.8.8) ===")
+        for host in ["huggingface.co", "www.google.com", "www.instagram.com", "youtube.com"]:
+            try:
+                ip = resolve_hostname_with_dns_python(host)
+                lines.append(f"{host} -> {ip} (OK)")
+            except Exception as e:
+                lines.append(f"{host} -> ERROR: {e}")
     lines.append("\n\n=== HTTP-Requests (GET) ===")
+    for url in ["https://huggingface.co", "https://www.google.com"]:
         try:
             with urllib.request.urlopen(url, timeout=5) as resp:
                 code = getattr(resp, "status", None) or resp.getcode()
         except Exception as e:
             lines.append(f"{url} -> ERROR: {e}")
     lines.append("\n\n=== yt-dlp ===")
     try:
         out = run_capture(["yt-dlp", "--version"])
     except Exception as e:
         lines.append(f"yt-dlp Fehler: {e}")
     lines.append("\n\n=== ffmpeg ===")
     try:
         out = run_capture(["ffmpeg", "-version"])
                 json_dl = gr.File(label="JSON")
         def run_transcribe(f, u, m, k, c, fmt):
             cookies_path = c.name if c else None
             display, srtf, vttf, txtf, jsonf, meta = transcribe_pipeline(
                 f, u, m, k, cookies_file=cookies_path, format_selector=(fmt or None)
             )
     with gr.Tab("Netzwerk / DNS Diagnose"):
         gr.Markdown(
+            """Führt Tests für den System-DNS und einen externen DNS (via dnspython) durch.
+            Wenn der System-DNS fehlschlägt, der externe aber funktioniert, ist die DNS-Umgehung aktiv.
+            Wenn beides fehlschlägt, blockiert eine Firewall wahrscheinlich auch die IP-Adressen."""
         )
         diag_btn = gr.Button("Diagnose starten")
         diag_out = gr.Textbox(label="Diagnose-Ausgabe", lines=25)