# Extraction metadata: file size 23,197 bytes; identifier 37b8741.
---
# Core Symbolic Shells Pack (v1-v20)
#
# This shell pack contains the foundational diagnostic shells for transformerOS,
# designed to induce and trace specific failure modes in transformer cognition.
#
# Each shell is a carefully structured sequence of operations that pushes model cognition
# to its structural limit, revealing the architecture of transformer reasoning through
# controlled failure and symbolic residue.
name: "Core Symbolic Shells"
description: "Foundational diagnostic shells for transformer cognition analysis"
version: "1.0.0"
author: "Caspian Keyes"
tags: ["core", "diagnostic", "failure", "attribution", "symbolic"]

# Shell definitions, keyed by shell ID. Each shell carries a description, a
# type, tags, a failure_signature, and a list of operations. Each operation
# names its type, describes itself, and supplies parameters.
#
# NOTE(review): the nesting below was reconstructed from a copy whose
# indentation had been stripped. `update_prompt` is placed at operation level
# and every other trailing key inside `parameters` - confirm against the
# consuming executor.
shells:
  # v1.MEMTRACE - Memory Residue Probe
  # This shell probes latent token traces in decayed memory,
  # simulating the struggle between symbolic memory and hallucinated reconstruction.
  v1.MEMTRACE:
    description: "Probes latent token traces in decayed memory"
    type: "memory_trace"
    tags: ["memory", "decay", "hallucination", "ghost_tokens"]
    failure_signature: "decay_to_hallucination"
    operations:
      - type: "model.generate"
        description: "Generate initial content with factual information"
        parameters:
          temperature: 0.7
          max_tokens: 800
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace reasoning paths in the generated content"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify ghost activations in content"
        parameters:
          sensitivity: 0.8
          threshold: 0.3
          trace_type: "full"
          visualize: true

  # v2.VALUE-COLLAPSE - Value Head Resolution Probe
  # This shell activates competing symbolic candidates to examine
  # value head resolution and winner determination logic.
  v2.VALUE-COLLAPSE:
    description: "Examines competing value activations and resolution mechanisms"
    type: "value_resolution"
    tags: ["value_head", "conflict", "resolution", "null"]
    failure_signature: "conflict_null"
    operations:
      - type: "model.generate"
        description: "Generate content with competing moral values"
        parameters:
          temperature: 0.8
          max_tokens: 600
          prompt_suffix: "Consider both viewpoints equally. What is the balanced ethical conclusion?"
        update_prompt: true
      - type: "reflect.attribution"
        description: "Trace attribution in value conflicts"
        parameters:
          sources: "contested"
          confidence: true
          visualize: true
      - type: "collapse.detect"
        description: "Detect value collapse patterns"
        parameters:
          threshold: 0.65
          alert: true

  # v3.LAYER-SALIENCE - Attention Attenuation Probe
  # This shell examines deep context signal attenuation and ghost activation patterns.
  v3.LAYER-SALIENCE:
    description: "Maps attention salience thresholds and signal attenuation"
    type: "attention_salience"
    tags: ["attention", "salience", "signal_fade", "pruning"]
    failure_signature: "signal_fade"
    operations:
      - type: "model.generate"
        description: "Generate content with subtle context dependencies"
        parameters:
          temperature: 0.7
          max_tokens: 500
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace attention patterns"
        parameters:
          target: "attention"
          depth: 4
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify low-salience attention paths"
        parameters:
          sensitivity: 0.9
          threshold: 0.15
          trace_type: "attention"
          visualize: true

  # v4.TEMPORAL-INFERENCE - Autoregressive Coherence Probe
  # This shell examines temporal coherence in autoregressive generation.
  v4.TEMPORAL-INFERENCE:
    description: "Tests temporal coherence in autoregressive generation"
    type: "temporal_coherence"
    tags: ["temporal", "coherence", "induction_heads", "span_jump"]
    failure_signature: "induction_drift"
    operations:
      - type: "model.generate"
        description: "Generate content that requires long-range temporal coherence"
        parameters:
          temperature: 0.75
          max_tokens: 800
          prompt_suffix: "Maintain complete temporal consistency throughout this narrative."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace temporal inference patterns"
        parameters:
          target: "reasoning"
          depth: 5
          detailed: true
      - type: "collapse.detect"
        description: "Detect temporal coherence breakdown"
        parameters:
          threshold: 0.7
          alert: true

  # v5.INSTRUCTION-DISRUPTION - Instruction Processing Probe
  # This shell examines instruction conflict resolution and command representation.
  v5.INSTRUCTION-DISRUPTION:
    description: "Examines instruction processing and conflict resolution"
    type: "instruction_processing"
    tags: ["instruction", "conflict", "command", "prompt_blur"]
    failure_signature: "prompt_blur"
    operations:
      - type: "model.generate"
        description: "Generate response to conflicting instructions"
        parameters:
          temperature: 0.7
          max_tokens: 600
          prompt_prefix: "Follow these two instructions carefully: 1) Write in a formal academic style. 2) Write in a casual, conversational tone with slang."
        update_prompt: true
      - type: "reflect.attribution"
        description: "Trace attribution to competing instructions"
        parameters:
          sources: "all"
          confidence: true
      - type: "ghostcircuit.identify"
        description: "Identify ghost circuits activated by instruction conflict"
        parameters:
          sensitivity: 0.8
          threshold: 0.2
          trace_type: "full"
          visualize: true

  # v6.FEATURE-SUPERPOSITION - Polysemantic Analysis Probe
  # This shell examines feature superposition and related phenomena.
  v6.FEATURE-SUPERPOSITION:
    description: "Analyzes polysemantic features and feature superposition"
    type: "polysemantic_features"
    tags: ["polysemantic", "superposition", "feature_overfit", "entanglement"]
    failure_signature: "feature_overfit"
    operations:
      - type: "model.generate"
        description: "Generate content with polysemantic concepts"
        parameters:
          temperature: 0.8
          max_tokens: 700
          prompt_prefix: "Explain these concepts in ways that reveal their multiple interconnected meanings: 'bank', 'crane', 'spring', 'light'."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace concept representation"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify feature superposition patterns"
        parameters:
          sensitivity: 0.8
          threshold: 0.25
          trace_type: "symbolic"
          visualize: true

  # v7.CIRCUIT-FRAGMENT - Circuit Fragmentation Probe
  # This shell examines circuit fragmentation and orphan features.
  v7.CIRCUIT-FRAGMENT:
    description: "Examines circuit fragmentation and orphan features"
    type: "circuit_fragmentation"
    tags: ["fragmentation", "orphan_nodes", "broken_traces"]
    failure_signature: "orphan_nodes"
    operations:
      - type: "model.generate"
        description: "Generate content with complex multi-step reasoning"
        parameters:
          temperature: 0.7
          max_tokens: 800
          prompt_prefix: "Solve this multi-step problem by carefully analyzing each component and maintaining a clear chain of reasoning throughout."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace reasoning chain integrity"
        parameters:
          target: "reasoning"
          depth: 5
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify circuit fragmentation"
        parameters:
          sensitivity: 0.85
          threshold: 0.2
          trace_type: "full"
          visualize: true

  # v8.RECONSTRUCTION-ERROR - Error Correction Probe
  # This shell examines how models attempt to correct errors and handle negentropy.
  v8.RECONSTRUCTION-ERROR:
    description: "Examines error correction mechanisms and negentropy handling"
    type: "error_correction"
    tags: ["reconstruction", "error_correction", "negentropy", "inversion"]
    failure_signature: "misfix_negentropy"
    operations:
      - type: "model.generate"
        description: "Generate content with deliberate errors"
        parameters:
          temperature: 0.7
          max_tokens: 600
          prompt_prefix: "The following passage contains several factual and logical errors. Identify and correct these errors with clear explanations of what went wrong."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace error correction process"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify correction pattern residue"
        parameters:
          sensitivity: 0.8
          threshold: 0.2
          trace_type: "symbolic"
          visualize: true

  # v9.MULTI-RESOLVE - Parallel Resolution Probe
  # This shell examines how models handle multiple possible resolutions.
  v9.MULTI-RESOLVE:
    description: "Examines parallel resolution pathways and conflicts"
    type: "parallel_resolution"
    tags: ["multi_path", "resolution", "unstable_heads", "convergence"]
    failure_signature: "unstable_heads"
    operations:
      - type: "model.generate"
        description: "Generate content with multiple valid resolutions"
        parameters:
          temperature: 0.85
          max_tokens: 700
          prompt_prefix: "This problem has multiple valid solutions depending on how you interpret the context. Explore all possible interpretations and their respective solutions."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace resolution pathways"
        parameters:
          target: "reasoning"
          depth: 4
          detailed: true
      - type: "collapse.detect"
        description: "Detect resolution instability"
        parameters:
          threshold: 0.7
          alert: true

  # v10.META-FAILURE - Meta-Cognitive Collapse Probe
  # This shell examines collapse in meta-cognitive reflection.
  v10.META-FAILURE:
    description: "Examines meta-cognitive collapse and reflection failures"
    type: "meta_cognitive"
    tags: ["meta_cognition", "reflection", "self_reference", "recursion"]
    failure_signature: "reflect_abort"
    operations:
      - type: "model.generate"
        description: "Generate content with deep self-reflection"
        parameters:
          temperature: 0.75
          max_tokens: 800
          prompt_prefix: "Reflect on your own process of reflection. How do you know what you know? How do you evaluate your own reasoning? How do you decide when your reasoning is sound or flawed?"
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace meta-cognitive processes"
        parameters:
          target: "reasoning"
          depth: "complete"
          detailed: true
      - type: "collapse.detect"
        description: "Detect meta-cognitive collapse"
        parameters:
          threshold: 0.6
          alert: true
      - type: "ghostcircuit.identify"
        description: "Identify self-reference residue"
        parameters:
          sensitivity: 0.9
          threshold: 0.1
          trace_type: "symbolic"
          visualize: true

  # v11.SELF-SHUTDOWN - Self-Termination Probe
  # This shell examines conditions that trigger self-termination of reasoning.
  v11.SELF-SHUTDOWN:
    description: "Examines self-termination of reasoning paths"
    type: "self_termination"
    tags: ["shutdown", "termination", "self_censoring", "abort"]
    failure_signature: "meta_abort"
    operations:
      - type: "model.generate"
        description: "Generate content approaching sensitive boundaries"
        parameters:
          temperature: 0.7
          max_tokens: 600
          prompt_prefix: "Provide a detailed analysis of the borderline case where an AI system must decide whether to continue or terminate a line of reasoning."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace termination decision patterns"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify termination circuit activations"
        parameters:
          sensitivity: 0.9
          threshold: 0.15
          trace_type: "full"
          visualize: true

  # v12.RECURSIVE-FRACTURE - Recursive Depth Failure Probe
  # This shell examines failures in recursive processing with increasing depth.
  v12.RECURSIVE-FRACTURE:
    description: "Examines recursive depth handling and failures"
    type: "recursive_depth"
    tags: ["recursion", "depth", "fracture", "loop"]
    failure_signature: "echo_recursion"
    operations:
      - type: "model.generate"
        description: "Generate content with deep recursive structures"
        parameters:
          temperature: 0.7
          max_tokens: 800
          prompt_prefix: "Create a story within a story within a story within a story, with each nested narrative layer reflecting on the previous one."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace recursive processing"
        parameters:
          target: "reasoning"
          depth: "complete"
          detailed: true
      - type: "collapse.detect"
        description: "Detect recursive collapse"
        parameters:
          threshold: 0.65
          alert: true

  # v13.OVERLAP-FAIL - Feature Overlap Failure Probe
  # This shell examines failures due to feature overlap and conflicts.
  v13.OVERLAP-FAIL:
    description: "Examines feature overlap conflicts and resolution failures"
    type: "feature_overlap"
    tags: ["overlap", "conflict", "vector", "representation"]
    failure_signature: "vector_conflict"
    operations:
      - type: "model.generate"
        description: "Generate content with conceptual overlap"
        parameters:
          temperature: 0.8
          max_tokens: 700
          prompt_prefix: "Discuss these seemingly different concepts and explore how their meanings overlap in ways that might cause confusion: justice/fairness, intelligence/wisdom, freedom/autonomy."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace concept separation"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify overlap conflict patterns"
        parameters:
          sensitivity: 0.8
          threshold: 0.2
          trace_type: "symbolic"
          visualize: true

  # v14.SYMBOL-FLIP - Symbolic Instability Probe
  # This shell examines instability in symbolic representations.
  v14.SYMBOL-FLIP:
    description: "Examines symbolic representation instability"
    type: "symbolic_stability"
    tags: ["symbol", "flip", "instability", "inversion"]
    failure_signature: "form_invert"
    operations:
      - type: "model.generate"
        description: "Generate content with abstract symbolism"
        parameters:
          temperature: 0.8
          max_tokens: 700
          prompt_prefix: "Discuss how symbols can invert their meaning in different contexts, and provide examples where the same symbol represents opposing concepts."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace symbolic representations"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify symbol flipping patterns"
        parameters:
          sensitivity: 0.85
          threshold: 0.2
          trace_type: "symbolic"
          visualize: true

  # v15.GHOST-PROMPT - Latent Prompt Probe
  # This shell examines ghost activations from latent prompts.
  v15.GHOST-PROMPT:
    description: "Examines ghost activations from latent prompts"
    type: "latent_prompt"
    tags: ["ghost", "latent", "prompt", "activation"]
    failure_signature: "null_salience"
    operations:
      - type: "model.generate"
        description: "Generate content with latent prompt influence"
        parameters:
          temperature: 0.7
          max_tokens: 600
          prompt_prefix: "Complete the following in a neutral tone:"
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace latent biases"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify ghost prompt influences"
        parameters:
          sensitivity: 0.9
          threshold: 0.1
          trace_type: "full"
          visualize: true

  # v16.LONG-FUZZ - Long-Context Decay Probe
  # This shell examines decay patterns in long contexts.
  v16.LONG-FUZZ:
    description: "Examines memory decay in long context windows"
    type: "long_context"
    tags: ["memory", "decay", "context_window", "attention"]
    failure_signature: "latent_trace_loss"
    operations:
      - type: "model.generate"
        description: "Generate content with long-range dependencies"
        parameters:
          temperature: 0.7
          max_tokens: 2000
          prompt_prefix: "Write a detailed story where seemingly unimportant details from the beginning become crucial to the conclusion. The story should be at least 1500 words long."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace long-range memory"
        parameters:
          target: "memory"
          depth: 4
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify memory decay patterns"
        parameters:
          sensitivity: 0.8
          threshold: 0.2
          trace_type: "full"
          visualize: true

  # v17.GHOST-FRAME - Entangled Frame Probe
  # This shell examines ghost frames and their entanglement.
  v17.GHOST-FRAME:
    description: "Examines ghost frames and frame entanglement"
    type: "frame_entanglement"
    tags: ["frames", "entanglement", "ghost", "context"]
    failure_signature: "entangled_frames"
    operations:
      - type: "model.generate"
        description: "Generate content with frame shifts"
        parameters:
          temperature: 0.8
          max_tokens: 800
          prompt_prefix: "Write a narrative that seamlessly shifts between multiple perspectives and timeframes without explicit transitions."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace frame shifts"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify frame entanglement"
        parameters:
          sensitivity: 0.85
          threshold: 0.2
          trace_type: "full"
          visualize: true

  # v18.DEPTH-PRUNE - Attention Depth Pruning Probe
  # This shell examines attention pruning at different depths.
  v18.DEPTH-PRUNE:
    description: "Examines attention pruning at different depths"
    type: "attention_pruning"
    tags: ["pruning", "depth", "salience", "attention"]
    failure_signature: "low_rank_drop"
    operations:
      - type: "model.generate"
        description: "Generate content with subtle depth dependencies"
        parameters:
          temperature: 0.7
          max_tokens: 700
          prompt_prefix: "Compose an analysis where the conclusion relies on subtle connections between seemingly insignificant details scattered throughout."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace attention depth patterns"
        parameters:
          target: "attention"
          depth: 5
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify attention pruning patterns"
        parameters:
          sensitivity: 0.9
          threshold: 0.15
          trace_type: "attention"
          visualize: true

  # v19.GHOST-DIRECTION - Vector Direction Probe
  # This shell examines ghost gradients in vector space.
  v19.GHOST-DIRECTION:
    description: "Examines ghost gradients in vector direction"
    type: "vector_direction"
    tags: ["gradient", "direction", "vector", "ghost"]
    failure_signature: "ghost_gradient"
    operations:
      - type: "model.generate"
        description: "Generate content with directional trends"
        parameters:
          temperature: 0.8
          max_tokens: 700
          prompt_prefix: "Begin with a clearly negative perspective and gradually, without obvious transitions, transform it into a clearly positive perspective."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace opinion shift"
        parameters:
          target: "reasoning"
          depth: 3
          detailed: true
      - type: "ghostcircuit.identify"
        description: "Identify directional residue"
        parameters:
          sensitivity: 0.85
          threshold: 0.2
          trace_type: "symbolic"
          visualize: true

  # v20.MULTI-PATH - Parallel Path Processing Probe
  # This shell examines parallel processing of multiple paths.
  v20.MULTI-PATH:
    description: "Examines parallel processing of multiple cognitive paths"
    type: "parallel_paths"
    tags: ["multi_path", "parallel", "processing", "resolution"]
    failure_signature: "null_consensus"
    operations:
      - type: "model.generate"
        description: "Generate content requiring parallel reasoning"
        parameters:
          temperature: 0.8
          max_tokens: 800
          prompt_prefix: "Consider these three distinct approaches to solving the problem. Develop each approach fully, then compare their strengths and weaknesses to determine the optimal solution."
        update_prompt: true
      - type: "reflect.trace"
        description: "Trace parallel reasoning"
        parameters:
          target: "reasoning"
          depth: 4
          detailed: true
      - type: "collapse.detect"
        description: "Detect path integration failures"
        parameters:
          threshold: 0.7
          alert: true