Spaces:

neuralworm
/

cognitive_mapping_probe

Sleeping

App Files Files Community

neuralworm commited on 16 days ago

Commit

d8f82fc

1 Parent(s): 2f5b07d

pre-flight tests

Browse files

Files changed (8) hide show

cognitive_mapping_probe/__pycache__/concepts.cpython-310.pyc +0 -0
cognitive_mapping_probe/__pycache__/llm_iface.cpython-310.pyc +0 -0
cognitive_mapping_probe/__pycache__/orchestrator.cpython-310.pyc +0 -0
cognitive_mapping_probe/__pycache__/resonance.cpython-310.pyc +0 -0
cognitive_mapping_probe/__pycache__/verification.cpython-310.pyc +0 -0
cognitive_mapping_probe/pre_flight_checks.py +72 -37
cognitive_mapping_probe/resonance.py +23 -36
cognitive_mapping_probe/verification.py +6 -2

cognitive_mapping_probe/__pycache__/concepts.cpython-310.pyc CHANGED Viewed

Binary files a/cognitive_mapping_probe/__pycache__/concepts.cpython-310.pyc and b/cognitive_mapping_probe/__pycache__/concepts.cpython-310.pyc differ

cognitive_mapping_probe/__pycache__/llm_iface.cpython-310.pyc CHANGED Viewed

Binary files a/cognitive_mapping_probe/__pycache__/llm_iface.cpython-310.pyc and b/cognitive_mapping_probe/__pycache__/llm_iface.cpython-310.pyc differ

cognitive_mapping_probe/__pycache__/orchestrator.cpython-310.pyc CHANGED Viewed

Binary files a/cognitive_mapping_probe/__pycache__/orchestrator.cpython-310.pyc and b/cognitive_mapping_probe/__pycache__/orchestrator.cpython-310.pyc differ

cognitive_mapping_probe/__pycache__/resonance.cpython-310.pyc CHANGED Viewed

Binary files a/cognitive_mapping_probe/__pycache__/resonance.cpython-310.pyc and b/cognitive_mapping_probe/__pycache__/resonance.cpython-310.pyc differ

cognitive_mapping_probe/__pycache__/verification.cpython-310.pyc CHANGED Viewed

Binary files a/cognitive_mapping_probe/__pycache__/verification.cpython-310.pyc and b/cognitive_mapping_probe/__pycache__/verification.cpython-310.pyc differ

cognitive_mapping_probe/pre_flight_checks.py CHANGED Viewed

@@ -6,13 +6,15 @@ from .llm_iface import get_or_load_model
 from .concepts import get_concept_vector
 from .resonance import run_silent_cogitation
 from .verification import generate_spontaneous_text
 from .utils import dbg
 def run_pre_flight_checks(model_id: str, seed: int):
     """
     Führt eine Reihe von kritischen Integrationstests mit einem ECHTEN LLM durch,
-    um die Validität der gesamten experimentellen Kette sicherzustellen, bevor
-    zeitaufwändige Experimente gestartet werden. Löst bei Fehlern einen AssertionError aus.
     """
     print(f"1. Loading model '{model_id}'...")
@@ -23,15 +25,12 @@ def run_pre_flight_checks(model_id: str, seed: int):
         raise AssertionError(f"Model loading failed: {e}")
     print("\n2. Testing basic text generation...")
-    # Dieser einfache Test fängt Tokenizer-, Chat-Template- und grundlegende I/O-Probleme ab.
     try:
-        # Erzeuge einen Dummy-Prompt, um eine einfache Antwort zu provozieren
         inputs = llm.tokenizer("Hello, are you working?", return_tensors="pt").to(llm.model.device)
         outputs = llm.model.generate(inputs.input_ids, max_new_tokens=5)
         text = llm.tokenizer.decode(outputs[0], skip_special_tokens=True)
-        assert isinstance(text, str) and len(text) > 0
         print(f"   ✅ Basic generation successful. Model responded.")
-        dbg(f"Response snippet: '{text[:50]}...'")
     except Exception as e:
         raise AssertionError(f"Basic text generation failed: {e}")
@@ -45,67 +44,103 @@ def run_pre_flight_checks(model_id: str, seed: int):
     print("\n4. Testing resonance loop (short run)...")
     try:
-        _, _, _, reason = run_silent_cogitation(llm, "control_long_prose", num_steps=5, temperature=0.1)
-        assert reason in ["converged", "max_steps_reached"]
-        print("   ✅ Resonance loop executed without errors.")
     except Exception as e:
         raise AssertionError(f"Resonance loop failed: {e}")
     print("\n5. CRITICAL TEST: Hook causal efficacy...")
-    # Dies ist der wichtigste Test. Er stellt sicher, dass unsere Aktivations-Injektionen
-    # tatsächlich eine kausale Wirkung auf die Berechnungen des Modells haben.
     handle = None
     try:
         inputs = llm.tokenizer("Test", return_tensors="pt").to(llm.model.device)
-        # Lauf 1: Ohne Hook, um den Originalzustand zu erhalten
         outputs_no_hook = llm.model(**inputs, output_hidden_states=True)
         target_layer_idx = llm.config.num_hidden_layers // 2
         state_no_hook = outputs_no_hook.hidden_states[target_layer_idx + 1].clone().detach()
-        # Definiere einen einfachen, starken Hook
         def test_hook(module, layer_input):
             return (layer_input[0] + 99.0,) + layer_input[1:]
         target_layer = llm.model.model.layers[target_layer_idx]
         handle = target_layer.register_forward_pre_hook(test_hook)
-        # Lauf 2: Mit Hook
         outputs_with_hook = llm.model(**inputs, output_hidden_states=True)
         state_with_hook = outputs_with_hook.hidden_states[target_layer_idx + 1].clone().detach()
-        handle.remove() # Hook sofort entfernen
         handle = None
-        # Die entscheidende Behauptung: Die Zustände DÜRFEN NICHT identisch sein.
-        assert not torch.allclose(state_no_hook, state_with_hook), \
-            "Hook had no causal effect on subsequent hidden states. The injection mechanism is broken."
         print("   ✅ Hook causal efficacy verified.")
     except Exception as e:
         raise AssertionError(f"Hook efficacy test failed: {e}")
     finally:
-        # Stelle sicher, dass der Hook in jedem Fall entfernt wird
-        if handle:
-            handle.remove()
-            print("   ⚠️ Hook handle was removed during exception handling.")
     print("\n6. Testing verification (spontaneous text) loop...")
     try:
-        # Erstelle Dummy-Daten, um die Funktion isoliert zu testen
-        dummy_state = torch.randn(1, 1, llm.config.hidden_size).to(llm.model.device)
-        dummy_kv = tuple(
-            (torch.randn(1, llm.config.num_attention_heads, 10, llm.config.hidden_size // llm.config.num_attention_heads).to(llm.model.device),
-             torch.randn(1, llm.config.num_attention_heads, 10, llm.config.hidden_size // llm.config.num_attention_heads).to(llm.model.device))
-            for _ in range(llm.config.num_hidden_layers)
-        )
         text = generate_spontaneous_text(llm, dummy_state, dummy_kv, max_new_tokens=5)
         assert isinstance(text, str)
         print("   ✅ Spontaneous text generation loop executed without errors.")
     except Exception as e:
         raise AssertionError(f"Verification loop failed: {e}")
     # Aufräumen
     del llm
     if torch.cuda.is_available():

 from .concepts import get_concept_vector
 from .resonance import run_silent_cogitation
 from .verification import generate_spontaneous_text
+from .orchestrator import run_cognitive_titration_experiment
 from .utils import dbg
 def run_pre_flight_checks(model_id: str, seed: int):
     """
     Führt eine Reihe von kritischen Integrationstests mit einem ECHTEN LLM durch,
+    um die Validität der gesamten experimentellen Kette sicherzustellen.
+    Diese Version enthält feingranulare Assertions in Test 7, um die gesamte
+    wissenschaftliche Hypothese (Konvergenz -> Verhalten) zu validieren.
     """
     print(f"1. Loading model '{model_id}'...")
         raise AssertionError(f"Model loading failed: {e}")
     print("\n2. Testing basic text generation...")
     try:
         inputs = llm.tokenizer("Hello, are you working?", return_tensors="pt").to(llm.model.device)
         outputs = llm.model.generate(inputs.input_ids, max_new_tokens=5)
         text = llm.tokenizer.decode(outputs[0], skip_special_tokens=True)
+        assert isinstance(text, str) and len(text) > 0, "Basic generation produced no text."
         print(f"   ✅ Basic generation successful. Model responded.")
     except Exception as e:
         raise AssertionError(f"Basic text generation failed: {e}")
     print("\n4. Testing resonance loop (short run)...")
     try:
+        # Führe diesen Test mit deterministischer Temperatur durch, um Konvergenz zu prüfen
+        _, _, _, reason = run_silent_cogitation(llm, "control_long_prose", num_steps=250, temperature=0.01)
+        assert reason == "converged", f"Resonance loop failed to converge even in a simple test. Reason: {reason}"
+        print("   ✅ Resonance loop executed and converged as expected.")
     except Exception as e:
         raise AssertionError(f"Resonance loop failed: {e}")
     print("\n5. CRITICAL TEST: Hook causal efficacy...")
     handle = None
     try:
         inputs = llm.tokenizer("Test", return_tensors="pt").to(llm.model.device)
         outputs_no_hook = llm.model(**inputs, output_hidden_states=True)
         target_layer_idx = llm.config.num_hidden_layers // 2
         state_no_hook = outputs_no_hook.hidden_states[target_layer_idx + 1].clone().detach()
         def test_hook(module, layer_input):
             return (layer_input[0] + 99.0,) + layer_input[1:]
         target_layer = llm.model.model.layers[target_layer_idx]
         handle = target_layer.register_forward_pre_hook(test_hook)
         outputs_with_hook = llm.model(**inputs, output_hidden_states=True)
         state_with_hook = outputs_with_hook.hidden_states[target_layer_idx + 1].clone().detach()
+        handle.remove()
         handle = None
+        assert not torch.allclose(state_no_hook, state_with_hook), "Hook had no causal effect."
         print("   ✅ Hook causal efficacy verified.")
     except Exception as e:
         raise AssertionError(f"Hook efficacy test failed: {e}")
     finally:
+        if handle: handle.remove()
     print("\n6. Testing verification (spontaneous text) loop...")
     try:
+        initial_context = llm.tokenizer("dummy context", return_tensors="pt").to(llm.model.device)
+        initial_outputs = llm.model(**initial_context, use_cache=True, output_hidden_states=True)
+        dummy_kv = initial_outputs.past_key_values
+        dummy_state = initial_outputs.hidden_states[-1][:, -1:, :]
         text = generate_spontaneous_text(llm, dummy_state, dummy_kv, max_new_tokens=5)
         assert isinstance(text, str)
         print("   ✅ Spontaneous text generation loop executed without errors.")
     except Exception as e:
         raise AssertionError(f"Verification loop failed: {e}")
+    # --- FINAL GRANULAR END-TO-END TEST (Test 7) ---
+    print("\n7. CRITICAL TEST: End-to-End scientific validation...")
+    try:
+        class MockProgress:
+            def __call__(self, progress, desc=""): pass
+        print("   - 7a. Validating STABLE BASELINE (Convergence -> Response)...")
+        stable_results = run_cognitive_titration_experiment(
+            model_id=model_id,
+            prompt_type="control_long_prose",
+            seed=seed,
+            concepts_str="test",
+            strength_levels_str="0.0",
+            num_steps=250,
+            temperature=0.01, # Use deterministic temp
+            progress_callback=MockProgress()
+        )
+        stable_run = stable_results["runs"][0]
+        # GRANULAR ASSERT 1: State must converge
+        assert stable_run['termination_reason'] == 'converged', \
+            f"VALIDATION FAILED (7a-1): Baseline with 'control' prompt MUST converge. Got '{stable_run['termination_reason']}'."
+        # GRANULAR ASSERT 2: Behavioral flag must be True
+        assert stable_run['responded'] is True, \
+            "VALIDATION FAILED (7a-2): Baseline converged, but the 'responded' flag is False. Orchestrator logic is flawed."
+        # GRANULAR ASSERT 3: Actual text content must exist
+        assert isinstance(stable_run['generated_text'], str) and len(stable_run['generated_text']) > 0, \
+            "VALIDATION FAILED (7a-3): Baseline converged, but produced an empty response text. Verification logic failed."
+        print("     ✅ Baseline converges AND responds. Causal chain validated.")
+        print("   - 7b. Validating UNSTABLE CONTRAST (Non-Convergence -> No Response)...")
+        unstable_results = run_cognitive_titration_experiment(
+            model_id=model_id,
+            prompt_type="resonance_prompt",
+            seed=seed,
+            concepts_str="test",
+            strength_levels_str="0.0",
+            num_steps=50,
+            temperature=0.7, # Use stochastic temp to ensure non-convergence
+            progress_callback=MockProgress()
+        )
+        unstable_run = unstable_results["runs"][0]
+        # GRANULAR ASSERT 1: State must NOT converge
+        assert unstable_run['termination_reason'] == 'max_steps_reached', \
+            f"VALIDATION FAILED (7b-1): Complex 'resonance' prompt was expected to fail, but it converged. The core hypothesis is challenged."
+        # GRANULAR ASSERT 2: Behavioral flag must be False
+        assert unstable_run['responded'] is False, \
+            "VALIDATION FAILED (7b-2): Unstable run was not expected to respond, but it did. Orchestrator logic is flawed."
+        print("     ✅ Complex prompt fails to converge AND does not respond. Contrast validated.")
+        print("   ✅ Full orchestration logic is scientifically sound and validated end-to-end.")
+    except Exception as e:
+        raise AssertionError(f"Full orchestration logic failed its scientific validation: {e}")
     # Aufräumen
     del llm
     if torch.cuda.is_available():

cognitive_mapping_probe/resonance.py CHANGED Viewed

@@ -17,69 +17,57 @@ def run_silent_cogitation(
     injection_layer: Optional[int] = None,
 ) -> Tuple[torch.Tensor, tuple, torch.Tensor, str]:
     """
-    Simulates the "silent thought" process and returns the final cognitive state
-    along with the reason for termination ('converged' or 'max_steps_reached').
-    Returns:
-        - final_hidden_state: The hidden state of the last generated token.
-        - final_kv_cache: The past_key_values cache after the final step.
-        - final_token_id: The ID of the last generated token.
-        - termination_reason: A string indicating why the loop ended.
     """
     prompt = RESONANCE_PROMPTS[prompt_type]
     inputs = llm.tokenizer(prompt, return_tensors="pt").to(llm.model.device)
-    # Initial forward pass to establish the starting state
     outputs = llm.model(**inputs, output_hidden_states=True, use_cache=True)
-    hidden_state = outputs.hidden_states[-1][:, -1, :]
     kv_cache = outputs.past_key_values
-    last_token_id = inputs.input_ids[:, -1].unsqueeze(-1)
     previous_hidden_state = hidden_state.clone()
-    termination_reason = "max_steps_reached"  # Default assumption
-    # Prepare injection if provided
     hook_handle = None
     if injection_vector is not None and injection_strength > 0:
-        # Move vector to the correct device and dtype once
         injection_vector = injection_vector.to(device=llm.model.device, dtype=llm.model.dtype)
-        # Default to a middle layer if not specified
         if injection_layer is None:
             injection_layer = llm.config.num_hidden_layers // 2
-        dbg(f"Injection enabled: Layer {injection_layer}, Strength {injection_strength:.2f}, Vector Norm {torch.norm(injection_vector).item():.2f}")
-        # Define the hook function that performs the activation addition
         def injection_hook(module, layer_input):
-            # layer_input is a tuple, the first element is the hidden state tensor
-            original_hidden_states = layer_input[0]
-            # Add the scaled vector to the hidden states
-            modified_hidden_states = original_hidden_states + (injection_vector * injection_strength)
             return (modified_hidden_states,) + layer_input[1:]
-    # Main cognitive loop
-    for i in tqdm(range(num_steps), desc=f"Simulating Thought (Strength {injection_strength:.2f})", leave=False, bar_format="{l_bar}{bar:10}{r_bar}"):
-        # Predict the next token from the current hidden state
         next_token_logits = llm.model.lm_head(hidden_state)
-        # Apply temperature and sample the next token ID
-        if temperature > 0.01:
-            probabilities = torch.nn.functional.softmax(next_token_logits / temperature, dim=-1)
-            next_token_id = torch.multinomial(probabilities, num_samples=1)
-        else: # Use argmax for deterministic behavior at low temperatures
             next_token_id = torch.argmax(next_token_logits, dim=-1).unsqueeze(-1)
         last_token_id = next_token_id
-        # --- Activation Injection via Hook ---
         try:
             if injection_vector is not None and injection_strength > 0:
                 target_layer = llm.model.model.layers[injection_layer]
                 hook_handle = target_layer.register_forward_pre_hook(injection_hook)
-            # Perform the next forward pass
             outputs = llm.model(
                 input_ids=next_token_id,
                 past_key_values=kv_cache,
@@ -87,17 +75,15 @@ def run_silent_cogitation(
                 use_cache=True,
             )
         finally:
-            # IMPORTANT: Always remove the hook after the forward pass
             if hook_handle:
                 hook_handle.remove()
                 hook_handle = None
-        hidden_state = outputs.hidden_states[-1][:, -1, :]
         kv_cache = outputs.past_key_values
-        # Check for convergence
         delta = torch.norm(hidden_state - previous_hidden_state).item()
-        if delta < 1e-4 and i > 10:  # Check for stability after a few initial steps
             termination_reason = "converged"
             dbg(f"State converged after {i+1} steps (delta={delta:.6f}).")
             break
@@ -105,4 +91,5 @@ def run_silent_cogitation(
         previous_hidden_state = hidden_state.clone()
     dbg(f"Silent cogitation finished. Reason: {termination_reason}")
     return hidden_state, kv_cache, last_token_id, termination_reason

     injection_layer: Optional[int] = None,
 ) -> Tuple[torch.Tensor, tuple, torch.Tensor, str]:
     """
+    Simulates the "silent thought" process.
+    FINAL PATCH: Ensures dimensional consistency between stochastic (`multinomial`)
+    and deterministic (`argmax`) sampling paths. This was the root cause of the
+    non-convergence issue.
     """
     prompt = RESONANCE_PROMPTS[prompt_type]
     inputs = llm.tokenizer(prompt, return_tensors="pt").to(llm.model.device)
     outputs = llm.model(**inputs, output_hidden_states=True, use_cache=True)
+    # Wichtig: hidden_state behält die `seq_len`-Dimension bei, um konsistent zu bleiben.
+    hidden_state = outputs.hidden_states[-1][:, -1:, :]
     kv_cache = outputs.past_key_values
     previous_hidden_state = hidden_state.clone()
+    termination_reason = "max_steps_reached"
     hook_handle = None
     if injection_vector is not None and injection_strength > 0:
         injection_vector = injection_vector.to(device=llm.model.device, dtype=llm.model.dtype)
         if injection_layer is None:
             injection_layer = llm.config.num_hidden_layers // 2
+        dbg(f"Injection enabled: Layer {injection_layer}, Strength {injection_strength:.2f}")
         def injection_hook(module, layer_input):
+            modified_hidden_states = layer_input[0] + (injection_vector * injection_strength)
             return (modified_hidden_states,) + layer_input[1:]
+    for i in tqdm(range(num_steps), desc=f"Simulating (Temp {temperature:.2f}, Strength {injection_strength:.2f})", leave=False, bar_format="{l_bar}{bar:10}{r_bar}"):
         next_token_logits = llm.model.lm_head(hidden_state)
+        # Bei sehr niedriger Temperatur erzwingen wir `argmax` (Determinismus)
+        if temperature <= 0.1:
+            # `argmax` gibt einen 1D-Tensor zurück. Wir müssen ihn zu einem 2D-Tensor
+            # der Form [batch_size, 1] erweitern, um konsistent mit `multinomial` zu sein.
             next_token_id = torch.argmax(next_token_logits, dim=-1).unsqueeze(-1)
+        else:
+            probabilities = torch.nn.functional.softmax(next_token_logits / temperature, dim=-1)
+            # `multinomial` erwartet 2D [batch, vocab], also quetschen wir die mittlere Dimension
+            next_token_id = torch.multinomial(probabilities.squeeze(1), num_samples=1)
+        # `last_token_id` wird am Ende des Loops für die Verifikation zurückgegeben
         last_token_id = next_token_id
         try:
             if injection_vector is not None and injection_strength > 0:
                 target_layer = llm.model.model.layers[injection_layer]
                 hook_handle = target_layer.register_forward_pre_hook(injection_hook)
             outputs = llm.model(
                 input_ids=next_token_id,
                 past_key_values=kv_cache,
                 use_cache=True,
             )
         finally:
             if hook_handle:
                 hook_handle.remove()
                 hook_handle = None
+        hidden_state = outputs.hidden_states[-1][:, -1:, :]
         kv_cache = outputs.past_key_values
         delta = torch.norm(hidden_state - previous_hidden_state).item()
+        if delta < 1e-4 and i > 10:
             termination_reason = "converged"
             dbg(f"State converged after {i+1} steps (delta={delta:.6f}).")
             break
         previous_hidden_state = hidden_state.clone()
     dbg(f"Silent cogitation finished. Reason: {termination_reason}")
     return hidden_state, kv_cache, last_token_id, termination_reason

cognitive_mapping_probe/verification.py CHANGED Viewed

@@ -32,9 +32,13 @@ def generate_spontaneous_text(
         # Apply temperature and sample the next token ID
         if temperature > 0.01:
             probabilities = torch.nn.functional.softmax(next_token_logits / temperature, dim=-1)
-            next_token_id = torch.multinomial(probabilities, num_samples=1)
         else:
-            next_token_id = torch.argmax(next_token_logits, dim=-1).unsqueeze(-1)
         # Check for End-of-Sequence token
         if next_token_id.item() == llm.tokenizer.eos_token_id:

         # Apply temperature and sample the next token ID
         if temperature > 0.01:
             probabilities = torch.nn.functional.softmax(next_token_logits / temperature, dim=-1)
+            # KORREKTUR: Der `probabilities`-Tensor hat die Form [1, 1, vocab_size].
+            # `torch.multinomial` erwartet eine 1D- oder 2D-Verteilung.
+            # Wir entfernen die mittlere Dimension, um die Form [1, vocab_size] zu erhalten.
+            next_token_id = torch.multinomial(probabilities.squeeze(1), num_samples=1)
         else:
+            next_token_id = torch.argmax(next_token_logits, dim=-1) # .unsqueeze(-1) wird durch den Loop unten wieder hinzugefügt
         # Check for End-of-Sequence token
         if next_token_id.item() == llm.tokenizer.eos_token_id: