neuralworm committed
Commit 64ad029 · 1 Parent(s): b3585ba
Files changed (1)
  1. app.py +43 -27
app.py CHANGED
@@ -9,56 +9,85 @@ from cognitive_mapping_probe.auto_experiment import run_auto_suite, get_curated_
 from cognitive_mapping_probe.prompts import RESONANCE_PROMPTS
 from cognitive_mapping_probe.utils import dbg
 
+# --- UI Theme ---
 theme = gr.themes.Soft(primary_hue="indigo", secondary_hue="blue").set(body_background_fill="#f0f4f9", block_background_fill="white")
 
+# --- Helper functions ---
+
 def cleanup_memory():
-    """A central function for cleaning up memory after a run."""
+    """A central function for cleaning up VRAM and Python memory."""
     dbg("Cleaning up memory...")
     gc.collect()
     if torch.cuda.is_available():
         torch.cuda.empty_cache()
     dbg("Memory cleanup complete.")
 
+# --- Wrappers for Gradio functionality ---
+
 def run_single_analysis_display(*args, progress=gr.Progress(track_tqdm=True)):
     """Wrapper for a single manual experiment."""
     try:
+        # Run the analysis
         results = run_seismic_analysis(*args, progress_callback=progress)
         stats = results.get("stats", {})
         deltas = results.get("state_deltas", [])
+
+        # Prepare the outputs
         df = pd.DataFrame({"Internal Step": range(len(deltas)), "State Change (Delta)": deltas})
         stats_md = f"### Statistical Signature\n- **Mean Delta:** {stats.get('mean_delta', 0):.4f}\n- **Std Dev Delta:** {stats.get('std_delta', 0):.4f}\n- **Max Delta:** {stats.get('max_delta', 0):.4f}\n"
 
-        cleanup_memory()
         return f"{results.get('verdict', 'Error')}\n\n{stats_md}", df, results
     except Exception:
-        cleanup_memory()
         return f"### ❌ Analysis Failed\n```\n{traceback.format_exc()}\n```", pd.DataFrame(), {}
+    finally:
+        # Make sure memory is cleaned up in every case
+        cleanup_memory()
+
+# Define the plot parameters in one central place for consistency
+PLOT_PARAMS = {
+    "x": "Step",
+    "y": "Delta",
+    "color": "Experiment",
+    "title": "Comparative Cognitive Dynamics",
+    "color_legend_title": "Experiment Runs",
+    "color_legend_position": "bottom",
+    "show_label": True,
+    "height": 400,
+    "interactive": True
+}
 
 def run_auto_suite_display(model_id, num_steps, seed, experiment_name, progress=gr.Progress(track_tqdm=True)):
-    """Wrapper for the automated experiment suite with visualization."""
+    """
+    Wrapper for the automated experiment suite.
+    Returns a new `gr.LinePlot` instance to fix the state-leak bug.
+    """
     try:
         summary_df, plot_df, all_results = run_auto_suite(model_id, int(num_steps), int(seed), experiment_name, progress)
 
-        # DEBUG output to check the DataFrame structure
-        dbg("Plot DataFrame Head:\n", plot_df.head())
-        dbg("Plot DataFrame Dtypes:\n", plot_df.dtypes)
+        dbg("Plot DataFrame Head for Auto-Suite:\n", plot_df.head())
 
-        cleanup_memory()
-        return summary_df, plot_df, all_results
+        # SCIENTIFIC CORRECTION: build a completely new plot component
+        # with the new data. This forces Gradio to discard the old state.
+        new_plot = gr.LinePlot(value=plot_df, **PLOT_PARAMS)
+
+        return summary_df, new_plot, all_results
     except Exception:
+        # On failure, return empty but correctly typed components
+        empty_plot = gr.LinePlot(value=pd.DataFrame(), **PLOT_PARAMS)
+        return pd.DataFrame(), empty_plot, f"### ❌ Auto-Experiment Failed\n```\n{traceback.format_exc()}\n```"
+    finally:
         cleanup_memory()
-        return pd.DataFrame(), pd.DataFrame(), f"### ❌ Auto-Experiment Failed\n```\n{traceback.format_exc()}\n```"
+
+# --- Gradio UI definition ---
 
 with gr.Blocks(theme=theme, title="Cognitive Seismograph 2.3") as demo:
-    gr.Markdown("# 🧠 Cognitive Seismograph 2.3: Machine Psychology")
+    gr.Markdown("# 🧠 Cognitive Seismograph 2.3: Advanced Experiment Suite")
 
     with gr.Tabs():
         with gr.TabItem("🔬 Manual Single Run"):
-            # ... (this tab is unchanged) ...
             gr.Markdown("Run a single experiment with manual parameters to explore hypotheses.")
             with gr.Row(variant='panel'):
                 with gr.Column(scale=1):
-                    # ... (parameters unchanged) ...
                     gr.Markdown("### 1. General Parameters")
                     manual_model_id = gr.Textbox(value="google/gemma-3-1b-it", label="Model ID")
                     manual_prompt_type = gr.Radio(choices=list(RESONANCE_PROMPTS.keys()), value="resonance_prompt", label="Prompt Type")
@@ -85,7 +114,6 @@ with gr.Blocks(theme=theme, title="Cognitive Seismograph 2.3") as demo:
             gr.Markdown("Run a predefined, curated series of experiments and visualize the results comparatively.")
             with gr.Row(variant='panel'):
                 with gr.Column(scale=1):
-                    # ... (parameters unchanged) ...
                     gr.Markdown("### Auto-Experiment Parameters")
                     auto_model_id = gr.Textbox(value="google/gemma-3-1b-it", label="Model ID")
                     auto_num_steps = gr.Slider(50, 1000, 300, step=10, label="Steps per Run")
@@ -94,19 +122,7 @@ with gr.Blocks(theme=theme, title="Cognitive Seismograph 2.3") as demo:
                     auto_run_btn = gr.Button("Run Curated Auto-Experiment", variant="primary")
                 with gr.Column(scale=2):
                     gr.Markdown("### Suite Results Summary")
-                    # FINAL FIX: we define the column names explicitly
-                    # to remove any ambiguity for Gradio.
-                    auto_plot_output = gr.LinePlot(
-                        x="Step",
-                        y="Delta",
-                        color="Experiment",
-                        title="Comparative Cognitive Dynamics",
-                        color_legend_title="Experiment Runs",
-                        color_legend_position="bottom",
-                        show_label=True,
-                        height=400,
-                        interactive=True
-                    )
+                    auto_plot_output = gr.LinePlot(**PLOT_PARAMS)
                     auto_summary_df = gr.DataFrame(label="Comparative Statistical Signature", wrap=True)
                     with gr.Accordion("Raw JSON for all runs", open=False):
                         auto_raw_json = gr.JSON()
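
The main behavioural change in this commit is that `cleanup_memory()` now runs in a `finally` block instead of being called separately in the success and error paths. A minimal, self-contained sketch of why that ordering is safe (a hypothetical `handler`, not the app's code):

```python
import gc

import torch


def cleanup_memory():
    """Free collected Python objects and, if a GPU is present, cached CUDA memory."""
    gc.collect()
    if torch.cuda.is_available():
        torch.cuda.empty_cache()


def handler(fail: bool) -> str:
    try:
        if fail:
            raise RuntimeError("simulated failure")
        return "ok"
    except Exception as exc:
        return f"failed: {exc}"
    finally:
        # Executes after the return value of either branch has been computed,
        # so cleanup happens exactly once per call, on success and on error.
        cleanup_memory()


print(handler(False))  # ok
print(handler(True))   # failed: simulated failure
```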
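For context, the "Statistical Signature" markdown in `run_single_analysis_display` only formats values computed elsewhere; `run_seismic_analysis` is not part of this diff. A hypothetical sketch of the three quantities the UI expects, using random stand-in deltas:

```python
import numpy as np

# Stand-in for results["state_deltas"]; the real values come from run_seismic_analysis.
deltas = np.abs(np.random.default_rng(0).normal(size=300))

stats = {
    "mean_delta": float(np.mean(deltas)),
    "std_delta": float(np.std(deltas)),
    "max_delta": float(np.max(deltas)),
}
stats_md = (
    "### Statistical Signature\n"
    f"- **Mean Delta:** {stats['mean_delta']:.4f}\n"
    f"- **Std Dev Delta:** {stats['std_delta']:.4f}\n"
    f"- **Max Delta:** {stats['max_delta']:.4f}\n"
)
print(stats_md)
```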
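The plot fix rests on two assumptions the hunks only hint at: `run_auto_suite` returns `plot_df` in long format with the columns named in `PLOT_PARAMS` ("Step", "Delta", "Experiment"), and the button's click handler lists the plot component among its outputs so the freshly built `gr.LinePlot` replaces the stale one (the event wiring is outside the shown hunks). A standalone sketch of that pattern with dummy data and a reduced parameter set, assuming Gradio 4.x component-return updates:

```python
import gradio as gr
import numpy as np
import pandas as pd

# Reduced parameter set; the app's PLOT_PARAMS also sets legend options.
PLOT_PARAMS = {"x": "Step", "y": "Delta", "color": "Experiment",
               "title": "Comparative Cognitive Dynamics", "height": 400}


def fake_auto_suite():
    # Stand-in for run_auto_suite(): two dummy runs stacked in long format.
    frames = []
    for seed, name in enumerate(("run_A", "run_B")):
        deltas = np.abs(np.random.default_rng(seed).normal(size=50))
        frames.append(pd.DataFrame({"Step": range(len(deltas)),
                                    "Delta": deltas,
                                    "Experiment": name}))
    plot_df = pd.concat(frames, ignore_index=True)
    # Returning a new component instance forces Gradio to drop the old plot state.
    return gr.LinePlot(value=plot_df, **PLOT_PARAMS)


with gr.Blocks() as demo:
    run_btn = gr.Button("Run")
    plot = gr.LinePlot(**PLOT_PARAMS)
    run_btn.click(fn=fake_auto_suite, inputs=None, outputs=plot)

if __name__ == "__main__":
    demo.launch()
```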