Spaces:

neuralworm
/

cognitive_mapping_probe

Sleeping

App Files Community

neuralworm committed 17 days ago

Commit

5028f2b

1 Parent(s): 8049238

fix graphs?

Browse files

Files changed (2) hide show

app.py +6 -5
cognitive_mapping_probe/auto_experiment.py +23 -15

app.py CHANGED Viewed

@@ -28,9 +28,7 @@ def run_single_analysis_display(*args, progress=gr.Progress(track_tqdm=True)):
         df = pd.DataFrame({"Internal Step": range(len(deltas)), "State Change (Delta)": deltas})
         stats_md = f"### Statistical Signature\n- **Mean Delta:** {stats.get('mean_delta', 0):.4f}\n- **Std Dev Delta:** {stats.get('std_delta', 0):.4f}\n- **Max Delta:** {stats.get('max_delta', 0):.4f}\n"
-        # WICHTIG: Speicher aufräumen, BEVOR die Ergebnisse an Gradio zurückgegeben werden.
         cleanup_memory()
         return f"{results.get('verdict', 'Error')}\n\n{stats_md}", df, results
     except Exception:
         cleanup_memory()
@@ -40,10 +38,7 @@ def run_auto_suite_display(model_id, num_steps, seed, experiment_name, progress=
     """Wrapper für die automatisierte Experiment-Suite mit Visualisierung."""
     try:
         summary_df, plot_df, all_results = run_auto_suite(model_id, int(num_steps), int(seed), experiment_name, progress)
-        # WICHTIG: Speicher auch hier aufräumen.
         cleanup_memory()
         return summary_df, plot_df, all_results
     except Exception:
         cleanup_memory()
@@ -54,9 +49,11 @@ with gr.Blocks(theme=theme, title="Cognitive Seismograph 2.2") as demo:
     with gr.Tabs():
         with gr.TabItem("🔬 Manual Single Run"):
             gr.Markdown("Führe ein einzelnes Experiment mit manuellen Parametern durch, um Hypothesen zu explorieren.")
             with gr.Row(variant='panel'):
                 with gr.Column(scale=1):
                     gr.Markdown("### 1. General Parameters")
                     manual_model_id = gr.Textbox(value="google/gemma-3-1b-it", label="Model ID")
                     manual_prompt_type = gr.Radio(choices=list(RESONANCE_PROMPTS.keys()), value="resonance_prompt", label="Prompt Type")
@@ -83,6 +80,7 @@ with gr.Blocks(theme=theme, title="Cognitive Seismograph 2.2") as demo:
             gr.Markdown("Führe eine vordefinierte, kuratierte Reihe von Experimenten durch und visualisiere die Ergebnisse vergleichend.")
             with gr.Row(variant='panel'):
                 with gr.Column(scale=1):
                     gr.Markdown("### Auto-Experiment Parameters")
                     auto_model_id = gr.Textbox(value="google/gemma-3-1b-it", label="Model ID")
                     auto_num_steps = gr.Slider(50, 1000, 300, step=10, label="Steps per Run")
@@ -91,9 +89,12 @@ with gr.Blocks(theme=theme, title="Cognitive Seismograph 2.2") as demo:
                     auto_run_btn = gr.Button("Run Curated Auto-Experiment", variant="primary")
                 with gr.Column(scale=2):
                     gr.Markdown("### Suite Results Summary")
                     auto_plot_output = gr.LinePlot(
                         x="Step", y="Delta", color="Experiment",
                         title="Comparative Cognitive Dynamics",
                         show_label=True, height=400, interactive=True
                     )
                     auto_summary_df = gr.DataFrame(label="Comparative Statistical Signature", wrap=True)

         df = pd.DataFrame({"Internal Step": range(len(deltas)), "State Change (Delta)": deltas})
         stats_md = f"### Statistical Signature\n- **Mean Delta:** {stats.get('mean_delta', 0):.4f}\n- **Std Dev Delta:** {stats.get('std_delta', 0):.4f}\n- **Max Delta:** {stats.get('max_delta', 0):.4f}\n"
         cleanup_memory()
         return f"{results.get('verdict', 'Error')}\n\n{stats_md}", df, results
     except Exception:
         cleanup_memory()
     """Wrapper für die automatisierte Experiment-Suite mit Visualisierung."""
     try:
         summary_df, plot_df, all_results = run_auto_suite(model_id, int(num_steps), int(seed), experiment_name, progress)
         cleanup_memory()
         return summary_df, plot_df, all_results
     except Exception:
         cleanup_memory()
     with gr.Tabs():
         with gr.TabItem("🔬 Manual Single Run"):
+            # ... (Dieser Tab bleibt unverändert) ...
             gr.Markdown("Führe ein einzelnes Experiment mit manuellen Parametern durch, um Hypothesen zu explorieren.")
             with gr.Row(variant='panel'):
                 with gr.Column(scale=1):
+                    # ... (Parameter unverändert) ...
                     gr.Markdown("### 1. General Parameters")
                     manual_model_id = gr.Textbox(value="google/gemma-3-1b-it", label="Model ID")
                     manual_prompt_type = gr.Radio(choices=list(RESONANCE_PROMPTS.keys()), value="resonance_prompt", label="Prompt Type")
             gr.Markdown("Führe eine vordefinierte, kuratierte Reihe von Experimenten durch und visualisiere die Ergebnisse vergleichend.")
             with gr.Row(variant='panel'):
                 with gr.Column(scale=1):
+                    # ... (Parameter unverändert) ...
                     gr.Markdown("### Auto-Experiment Parameters")
                     auto_model_id = gr.Textbox(value="google/gemma-3-1b-it", label="Model ID")
                     auto_num_steps = gr.Slider(50, 1000, 300, step=10, label="Steps per Run")
                     auto_run_btn = gr.Button("Run Curated Auto-Experiment", variant="primary")
                 with gr.Column(scale=2):
                     gr.Markdown("### Suite Results Summary")
+                    # KORREKTUR: Explizite Legenden-Parameter hinzugefügt
                     auto_plot_output = gr.LinePlot(
                         x="Step", y="Delta", color="Experiment",
                         title="Comparative Cognitive Dynamics",
+                        color_legend_title="Experiment Runs",
+                        color_legend_position="bottom",
                         show_label=True, height=400, interactive=True
                     )
                     auto_summary_df = gr.DataFrame(label="Comparative Statistical Signature", wrap=True)

cognitive_mapping_probe/auto_experiment.py CHANGED Viewed

@@ -52,6 +52,7 @@ def run_auto_suite(
 ) -> Tuple[pd.DataFrame, pd.DataFrame, Dict]:
     """
     Führt eine vollständige, kuratierte Experiment-Suite aus.
     """
     all_experiments = get_curated_experiments()
     protocol = all_experiments.get(experiment_name)
@@ -62,38 +63,45 @@ def run_auto_suite(
     summary_data = []
     plot_data_frames = []
-    # Lade das Modell einmal zu Beginn der Suite
-    llm = get_or_load_model(model_id, seed)
     total_runs = len(protocol)
     for i, run_spec in enumerate(protocol):
         label = run_spec["label"]
         dbg(f"--- Running Auto-Experiment: '{label}' ({i+1}/{total_runs}) ---")
         results = run_seismic_analysis(
-            model_id=model_id, prompt_type=run_spec["prompt_type"],
-            seed=seed, num_steps=num_steps,
-            concept_to_inject=run_spec["concept"], injection_strength=run_spec["strength"],
             progress_callback=progress_callback,
-            llm_instance=llm # Wiederverwende die geladene LLM-Instanz
         )
         all_results[label] = results
         stats = results.get("stats", {})
-        summary_data.append({ "Experiment": label, "Mean Delta": stats.get("mean_delta"), "Std Dev Delta": stats.get("std_delta"), "Max Delta": stats.get("max_delta"), })
         deltas = results.get("state_deltas", [])
-        df = pd.DataFrame({ "Step": range(len(deltas)), "Delta": deltas, "Experiment": f"{i}: {label}" })
         plot_data_frames.append(df)
     summary_df = pd.DataFrame(summary_data)
     plot_df = pd.concat(plot_data_frames, ignore_index=True) if plot_data_frames else pd.DataFrame()
-    # WICHTIG: Explizites Aufräumen am Ende der gesamten Suite
-    del llm
-    gc.collect()
-    if torch.cuda.is_available():
-        torch.cuda.empty_cache()
     return summary_df, plot_df, all_results

 ) -> Tuple[pd.DataFrame, pd.DataFrame, Dict]:
     """
     Führt eine vollständige, kuratierte Experiment-Suite aus.
+    KORRIGIERT: Lädt das Modell für jeden Lauf neu, um statistische Unabhängigkeit zu garantieren.
     """
     all_experiments = get_curated_experiments()
     protocol = all_experiments.get(experiment_name)
     summary_data = []
     plot_data_frames = []
     total_runs = len(protocol)
     for i, run_spec in enumerate(protocol):
         label = run_spec["label"]
         dbg(f"--- Running Auto-Experiment: '{label}' ({i+1}/{total_runs}) ---")
+        # WISSENSCHAFTLICHE KORREKTUR: Rufe den Orchestrator so auf, dass er das Modell
+        # für jeden Lauf frisch lädt. `llm_instance=None` ist der Default.
+        # Dies ist der einzige Weg, um garantierte statistische Unabhängigkeit zu gewährleisten.
         results = run_seismic_analysis(
+            model_id=model_id,
+            prompt_type=run_spec["prompt_type"],
+            seed=seed, # Der Seed wird bei jedem Lauf neu gesetzt
+            num_steps=num_steps,
+            concept_to_inject=run_spec["concept"],
+            injection_strength=run_spec["strength"],
             progress_callback=progress_callback,
+            llm_instance=None
         )
         all_results[label] = results
         stats = results.get("stats", {})
+        summary_data.append({
+            "Experiment": label,
+            "Mean Delta": stats.get("mean_delta"),
+            "Std Dev Delta": stats.get("std_delta"),
+            "Max Delta": stats.get("max_delta"),
+        })
         deltas = results.get("state_deltas", [])
+        df = pd.DataFrame({
+            "Step": range(len(deltas)),
+            "Delta": deltas,
+            "Experiment": label # Gradio kann mit String-Labels umgehen, der frühere Fix war unnötig
+        })
         plot_data_frames.append(df)
     summary_df = pd.DataFrame(summary_data)
     plot_df = pd.concat(plot_data_frames, ignore_index=True) if plot_data_frames else pd.DataFrame()
     return summary_df, plot_df, all_results