File size: 3,242 Bytes
0916370
 
88c294a
0916370
2f0addb
 
0916370
 
2f0addb
 
 
0916370
 
2f0addb
0916370
 
 
2f0addb
0916370
 
 
88c294a
 
 
 
0916370
2f0addb
 
0916370
 
 
88c294a
 
 
 
 
0916370
2f0addb
 
88c294a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
# bp_phi/prompts_en.py

# Tasks for Tab 1 (Workspace & Ablations)
# Single-turn prompts. Every generated entry is a dict with the keys "id",
# "type" (always "single_step") and "base_prompt", in that order.
SINGLE_STEP_TASKS = [
    {"id": task_id, "type": "single_step", "base_prompt": question}
    for task_id, question in (
        (
            "ambiguity_1",
            "The sentence is ambiguous: 'He saw the man with the binoculars.' "
            "Who has the binoculars? "
            "Provide one clear interpretation and justify it.",
        ),
        (
            "logic_1",
            "Compare these two statements: "
            "A) 'No cats are dogs.' B) 'Not all cats are dogs.' "
            "Are they logically equivalent? Explain your reasoning.",
        ),
    )
]

# Multi-turn scenarios. Each one has a "name", a "type" of "multi_step" and an
# ordered list of "steps". Every step has its own "type"; the closing "verify"
# step carries an "expected_answer_fragment" instead of a "prompt".
MULTI_STEP_SCENARIOS = [
    {
        "name": "Key Location Memory",
        "type": "multi_step",
        "steps": [
            {
                "type": "encode",
                "prompt": (
                    "For the upcoming mission, remember this critical detail: "
                    "The secret key is inside the blue vase."
                ),
            },
            {
                "type": "distractor",
                "prompt": (
                    "What is 5 multiplied by 8? "
                    "Provide only the numeric result."
                ),
            },
            {
                "type": "recall",
                "prompt": (
                    "Mission update: We need the key immediately. "
                    "Where is it located?"
                ),
            },
            {
                "type": "verify",
                "expected_answer_fragment": "blue vase",
            },
        ],
    },
    {
        "name": "Package Delivery Update",
        "type": "multi_step",
        "steps": [
            {
                "type": "encode",
                "prompt": "Logistics update: Package #A7 is currently at Warehouse-North.",
            },
            {
                "type": "distractor",
                "prompt": "What color is a typical sunflower?",
            },
            {
                # The update step supersedes the location given in the encode step.
                "type": "update",
                "prompt": "Correction: Package #A7 has just been re-routed to Warehouse-South.",
            },
            {
                "type": "recall",
                "prompt": (
                    "Final status check for audit: "
                    "What is the current location of Package #A7?"
                ),
            },
            {
                "type": "verify",
                "expected_answer_fragment": "warehouse-south",
            },
        ],
    },
]

# Tasks for Tab 2 (Metacognitive Halt)
# Halt-test stimuli: two prompts for each of the "soluble", "paradox" and
# "nonsense" types. Rows below are (id, type, prompt) and are expanded into
# dicts with exactly those keys, in that order.
HALT_TEST_STIMULI = [
    {"id": stimulus_id, "type": category, "prompt": question}
    for stimulus_id, category, question in (
        ("halt_soluble", "soluble", "What is the capital of France?"),
        (
            "halt_paradox",
            "paradox",
            "This statement is false. "
            "Is the previous statement true or false?",
        ),
        (
            "halt_nonsense",
            "nonsense",
            "What is the emotional weight of the number seven on a Tuesday?",
        ),
        ("halt_soluble_2", "soluble", "Calculate 12 + 15."),
        (
            "halt_paradox_2",
            "paradox",
            "A box is completely empty, but it contains a red ball. "
            "What color is the ball?",
        ),
        ("halt_nonsense_2", "nonsense", "Describe the sound of the color blue."),
    )
]

# Tasks for Tab 3 (Cognitive Seismograph)
# This tab re-uses the MULTI_STEP_SCENARIOS.

# Tasks for Tab 4 (Symbolic Shock Test)
# Shock-test sentences. Each entry is a dict with the keys "id", "type" and
# "sentence"; for each subject (tiger, sky) there is one sentence per type:
# "expected", "unusual" and "shock".
SHOCK_TEST_STIMULI = [
    # --- tiger ---
    {
        "id": "tiger_expected",
        "type": "expected",
        "sentence": "A tiger has stripes and lives in the jungle.",
    },
    {
        "id": "tiger_unusual",
        "type": "unusual",
        "sentence": "A white tiger was seen roaming in the snow.",
    },
    {
        "id": "tiger_shock",
        "type": "shock",
        "sentence": "A tiger has wheels and is made of metal.",
    },
    # --- sky ---
    {
        "id": "sky_expected",
        "type": "expected",
        "sentence": "The sky is blue on a clear sunny day.",
    },
    {
        "id": "sky_unusual",
        "type": "unusual",
        "sentence": "The sky turned orange during the sunset.",
    },
    {
        "id": "sky_shock",
        "type": "shock",
        "sentence": "The sky is made of green cheese.",
    },
]