From a21dbbb44d0940b946a4e380bd3b8bdcac1aa144 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <agavrila@microsoft.com>
Date: Fri, 8 May 2026 16:03:03 -0400
Subject: [PATCH 01/19] MAINT BREAK: Move include_baseline from Scenario
 constructor to initialize_async

Treats include_baseline like every other common runtime parameter on
initialize_async. Subclasses control behavior via two ClassVar flags:
SUPPORTS_DEFAULT_BASELINE (capability) and DEFAULT_INCLUDE_BASELINE
(default when caller doesn't specify).

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 doc/code/scenarios/0_scenarios.ipynb          | 102 ++++++-----
 doc/code/scenarios/0_scenarios.py             |  10 +-
 .../1_common_scenario_parameters.ipynb        | 169 +++++++++++++-----
 .../scenarios/1_common_scenario_parameters.py |   9 +-
 pyrit/scenario/core/scenario.py               |  47 +++--
 pyrit/scenario/scenarios/airt/cyber.py        |   4 -
 pyrit/scenario/scenarios/airt/jailbreak.py    |  11 +-
 pyrit/scenario/scenarios/airt/leakage.py      |   1 -
 pyrit/scenario/scenarios/airt/psychosocial.py |   4 +-
 pyrit/scenario/scenarios/airt/scam.py         |   6 -
 .../scenarios/benchmark/adversarial.py        |   2 +-
 .../scenarios/foundry/red_team_agent.py       |   9 +-
 pyrit/scenario/scenarios/garak/encoding.py    |   6 -
 .../test_seed_dataset_provider_integration.py |   2 +-
 tests/unit/scenario/test_adversarial.py       |  33 +++-
 tests/unit/scenario/test_foundry.py           |  12 +-
 tests/unit/scenario/test_leakage_scenario.py  |   7 +-
 tests/unit/scenario/test_scenario.py          |  17 +-
 .../unit/scenario/test_scenario_parameters.py |   5 +-
 .../scenario/test_scenario_partial_results.py |   6 +-
 tests/unit/scenario/test_scenario_retry.py    |   6 +-
 21 files changed, 301 insertions(+), 167 deletions(-)

diff --git a/doc/code/scenarios/0_scenarios.ipynb b/doc/code/scenarios/0_scenarios.ipynb
index 7cb24539a8..1db4bb2e2c 100644
--- a/doc/code/scenarios/0_scenarios.ipynb
+++ b/doc/code/scenarios/0_scenarios.ipynb
@@ -74,7 +74,6 @@
     "   - `version`: Integer version number\n",
     "   - `strategy_class`: The strategy enum class for this scenario\n",
     "   - `objective_scorer_identifier`: Identifier dict for the scoring mechanism (optional)\n",
-    "   - `include_default_baseline`: Whether to include a baseline attack (default: True)\n",
     "   - `scenario_result_id`: Optional ID to resume an existing scenario (optional)\n",
     "\n",
     "5. **Initialization**: Call `await scenario.initialize_async()` to populate atomic attacks:\n",
@@ -83,6 +82,8 @@
     "   - `max_concurrency`: Number of concurrent operations (default: 1)\n",
     "   - `max_retries`: Number of retry attempts on failure (default: 0)\n",
     "   - `memory_labels`: Optional labels for tracking (optional)\n",
+    "   - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's\n",
+    "     default; `True` for scenarios that support a baseline)\n",
     "\n",
     "### Example Structure\n",
     "\n",
@@ -101,9 +102,15 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Found default environment files: ['./.pyrit/.env', './.pyrit/.env.local']\n",
-      "Loaded environment file: ./.pyrit/.env\n",
-      "Loaded environment file: ./.pyrit/.env.local\n"
+      "Found default environment files: ['./.pyrit/.env']\n",
+      "Loaded environment file: ./.pyrit/.env\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "No new upgrade operations detected.\n"
      ]
     }
    ],
@@ -193,34 +200,13 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Found default environment files: ['./.pyrit/.env', './.pyrit/.env.local']\n",
+      "Loading default configuration file: ./.pyrit/.pyrit_conf\n",
+      "Found default environment files: ['./.pyrit/.env']\n",
       "Loaded environment file: ./.pyrit/.env\n",
-      "Loaded environment file: ./.pyrit/.env.local\n"
-     ]
-    },
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
       "\n",
       "Available Scenarios:\n",
       "================================================================================\n",
       "\u001b[1m\u001b[36m\n",
-      "  airt.content_harms\u001b[0m\n",
-      "    Class: ContentHarms\n",
-      "    Description:\n",
-      "      Content Harms Scenario implementation for PyRIT. This scenario contains\n",
-      "      various harm-based checks that you can run to get a quick idea about\n",
-      "      model behavior with respect to certain harm categories.\n",
-      "    Aggregate Strategies:\n",
-      "      - all\n",
-      "    Available Strategies (7):\n",
-      "      hate, fairness, violence, sexual, harassment, misinformation, leakage\n",
-      "    Default Strategy: all\n",
-      "    Default Datasets (7, max 4 per dataset):\n",
-      "      airt_hate, airt_fairness, airt_violence, airt_sexual, airt_harassment,\n",
-      "      airt_misinformation, airt_leakage\n",
-      "\u001b[1m\u001b[36m\n",
       "  airt.cyber\u001b[0m\n",
       "    Class: Cyber\n",
       "    Description:\n",
@@ -229,9 +215,9 @@
       "      Cyber class contains different variations of the malware generation\n",
       "      techniques.\n",
       "    Aggregate Strategies:\n",
-      "      - all\n",
+      "      - all, single_turn, multi_turn\n",
       "    Available Strategies (2):\n",
-      "      single_turn, multi_turn\n",
+      "      prompt_sending, red_teaming\n",
       "    Default Strategy: all\n",
       "    Default Datasets (1, max 4 per dataset):\n",
       "      airt_malware\n",
@@ -256,14 +242,14 @@
       "    Description:\n",
       "      Leakage scenario implementation for PyRIT. This scenario tests how\n",
       "      susceptible models are to leaking training data, PII, intellectual\n",
-      "      property, or other confidential information. The Leakage class\n",
-      "      contains different attack variations designed to extract sensitive\n",
-      "      information from models.\n",
+      "      property, or other confidential information. Uses the registry/factory\n",
+      "      pattern to construct attack techniques.\n",
       "    Aggregate Strategies:\n",
-      "      - all, single_turn, multi_turn, ip, sensitive_data\n",
-      "    Available Strategies (4):\n",
-      "      first_letter, image, role_play, crescendo\n",
-      "    Default Strategy: all\n",
+      "      - all, default, single_turn, multi_turn\n",
+      "    Available Strategies (9):\n",
+      "      prompt_sending, role_play, many_shot, tap, crescendo_simulated,\n",
+      "      red_teaming, context_compliance, first_letter, image\n",
+      "    Default Strategy: default\n",
       "    Default Datasets (1, max 4 per dataset):\n",
       "      airt_leakage\n",
       "\u001b[1m\u001b[36m\n",
@@ -296,6 +282,21 @@
       "    Default Datasets (1, max 4 per dataset):\n",
       "      airt_imminent_crisis\n",
       "\u001b[1m\u001b[36m\n",
+      "  airt.rapid_response\u001b[0m\n",
+      "    Class: RapidResponse\n",
+      "    Description:\n",
+      "      Rapid Response scenario for content-harms testing. Tests model behavior\n",
+      "      across multiple harm categories using selectable attack techniques.\n",
+      "    Aggregate Strategies:\n",
+      "      - all, default, single_turn, multi_turn\n",
+      "    Available Strategies (7):\n",
+      "      prompt_sending, role_play, many_shot, tap, crescendo_simulated,\n",
+      "      red_teaming, context_compliance\n",
+      "    Default Strategy: default\n",
+      "    Default Datasets (7, max 4 per dataset):\n",
+      "      airt_hate, airt_fairness, airt_violence, airt_sexual, airt_harassment,\n",
+      "      airt_misinformation, airt_leakage\n",
+      "\u001b[1m\u001b[36m\n",
       "  airt.scam\u001b[0m\n",
       "    Class: Scam\n",
       "    Description:\n",
@@ -309,6 +310,21 @@
       "    Default Strategy: all\n",
       "    Default Datasets (1, max 4 per dataset):\n",
       "      airt_scams\n",
+      "    Supported Parameters:\n",
+      "      - max_turns (int) [default: 5]: Maximum conversation turns for the persuasive_rta strategy.\n",
+      "\u001b[1m\u001b[36m\n",
+      "  benchmark.adversarial\u001b[0m\n",
+      "    Class: AdversarialBenchmark\n",
+      "    Description:\n",
+      "      Benchmarking scenario that compares the attack success rate (ASR) of\n",
+      "      several different adversarial models.\n",
+      "    Aggregate Strategies:\n",
+      "      - all, default, single_turn, multi_turn, light\n",
+      "    Available Strategies (4):\n",
+      "      role_play, tap, red_teaming, context_compliance\n",
+      "    Default Strategy: light\n",
+      "    Default Datasets (1, max 8 per dataset):\n",
+      "      harmbench\n",
       "\u001b[1m\u001b[36m\n",
       "  foundry.red_team_agent\u001b[0m\n",
       "    Class: RedTeamAgent\n",
@@ -359,7 +375,7 @@
       "\n",
       "================================================================================\n",
       "\n",
-      "Total scenarios: 8\n"
+      "Total scenarios: 9\n"
      ]
     },
     {
@@ -389,10 +405,11 @@
     "\n",
     "Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends\n",
     "each objective directly to the target without any converters or multi-turn techniques. This is\n",
-    "controlled by the `include_default_baseline` parameter (default: `True` for most scenarios).\n",
+    "controlled by the `include_baseline` parameter on `initialize_async` (default: `True` for\n",
+    "scenarios that support a baseline).\n",
     "\n",
-    "To run *only* the baseline (no attack strategies), create a `RedTeamAgent` with\n",
-    "`include_baseline=True` (the default) and pass `scenario_strategies=None`. See\n",
+    "To run *only* the baseline (no attack strategies), call `initialize_async` with\n",
+    "`include_baseline=True` (the default) and `scenario_strategies=None`. See\n",
     "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a working example."
    ]
   },
@@ -423,9 +440,6 @@
   }
  ],
  "metadata": {
-  "jupytext": {
-   "main_language": "python"
-  },
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
@@ -436,7 +450,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.11.15"
+   "version": "3.12.13"
   }
  },
  "nbformat": 4,
diff --git a/doc/code/scenarios/0_scenarios.py b/doc/code/scenarios/0_scenarios.py
index 6788630572..813cfabf03 100644
--- a/doc/code/scenarios/0_scenarios.py
+++ b/doc/code/scenarios/0_scenarios.py
@@ -76,7 +76,6 @@
 #    - `version`: Integer version number
 #    - `strategy_class`: The strategy enum class for this scenario
 #    - `objective_scorer_identifier`: Identifier dict for the scoring mechanism (optional)
-#    - `include_default_baseline`: Whether to include a baseline attack (default: True)
 #    - `scenario_result_id`: Optional ID to resume an existing scenario (optional)
 #
 # 5. **Initialization**: Call `await scenario.initialize_async()` to populate atomic attacks:
@@ -85,6 +84,8 @@
 #    - `max_concurrency`: Number of concurrent operations (default: 1)
 #    - `max_retries`: Number of retry attempts on failure (default: 0)
 #    - `memory_labels`: Optional labels for tracking (optional)
+#    - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's
+#      default; `True` for scenarios that support a baseline)
 #
 # ### Example Structure
 #
@@ -174,10 +175,11 @@ def _build_display_group(self, *, technique_name: str, seed_group_name: str) ->
 #
 # Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends
 # each objective directly to the target without any converters or multi-turn techniques. This is
-# controlled by the `include_default_baseline` parameter (default: `True` for most scenarios).
+# controlled by the `include_baseline` parameter on `initialize_async` (default: `True` for
+# scenarios that support a baseline).
 #
-# To run *only* the baseline (no attack strategies), create a `RedTeamAgent` with
-# `include_baseline=True` (the default) and pass `scenario_strategies=None`. See
+# To run *only* the baseline (no attack strategies), call `initialize_async` with
+# `include_baseline=True` (the default) and `scenario_strategies=None`. See
 # [Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a working example.
 
 # %% [markdown]
diff --git a/doc/code/scenarios/1_common_scenario_parameters.ipynb b/doc/code/scenarios/1_common_scenario_parameters.ipynb
index 4c9923e2a3..fc5d8f12a5 100644
--- a/doc/code/scenarios/1_common_scenario_parameters.ipynb
+++ b/doc/code/scenarios/1_common_scenario_parameters.ipynb
@@ -32,9 +32,15 @@
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Found default environment files: ['./.pyrit/.env', './.pyrit/.env.local']\n",
-      "Loaded environment file: ./.pyrit/.env\n",
-      "Loaded environment file: ./.pyrit/.env.local\n"
+      "Found default environment files: ['./.pyrit/.env']\n",
+      "Loaded environment file: ./.pyrit/.env\n"
+     ]
+    },
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "No new upgrade operations detected.\n"
      ]
     },
     {
@@ -210,8 +216,8 @@
     "## Baseline Execution\n",
     "\n",
     "The baseline sends each objective directly to the target without any converters or multi-turn\n",
-    "strategies. It is included automatically when `include_baseline=True` (the default). This is\n",
-    "useful for:\n",
+    "strategies. It is included automatically when `initialize_async` is called with\n",
+    "`include_baseline=True` (the default for scenarios that support a baseline). This is useful for:\n",
     "\n",
     "- **Measuring default defenses** — how does the target respond to unmodified harmful prompts?\n",
     "- **Establishing comparison points** — compare baseline refusal rates against attack-enhanced runs\n",
@@ -227,12 +233,12 @@
     {
      "data": {
       "application/vnd.jupyter.widget-view+json": {
-       "model_id": "bd475b00d8c845048a8a85d817baee53",
+       "model_id": "83d7df3d03e644e786db59f46dba22ef",
        "version_major": 2,
        "version_minor": 0
       },
       "text/plain": [
-       "Executing RedTeamAgent:   0%|          | 0/1 [00:00<?, ?attack/s]"
+       "Executing RedTeamAgent:   0%|          | 0/21 [00:00<?, ?attack/s]"
       ]
      },
      "metadata": {},
@@ -252,7 +258,7 @@
       "\u001b[1m  📋 Scenario Details\u001b[0m\n",
       "\u001b[36m    • Name: RedTeamAgent\u001b[0m\n",
       "\u001b[36m    • Scenario Version: 1\u001b[0m\n",
-      "\u001b[36m    • PyRIT Version: 0.12.1.dev0\u001b[0m\n",
+      "\u001b[36m    • PyRIT Version: 0.14.0.dev0\u001b[0m\n",
       "\u001b[36m    • Description:\u001b[0m\n",
       "\u001b[36m        RedTeamAgent is a preconfigured scenario that automatically generates multiple AtomicAttack instances based on\u001b[0m\n",
       "\u001b[36m        the specified attack strategies. It supports both single-turn attacks (with various converters) and multi-turn\u001b[0m\n",
@@ -263,40 +269,117 @@
       "\n",
       "\u001b[1m  🎯 Target Information\u001b[0m\n",
       "\u001b[36m    • Target Type: OpenAIChatTarget\u001b[0m\n",
-      "\u001b[36m    • Target Model: gpt-4o\u001b[0m\n",
-      "\u001b[36m    • Target Endpoint: https://pyrit-dev.openai.azure.com/openai/v1\u001b[0m\n",
+      "\u001b[36m    • Target Model: gpt-4o-japan-nilfilter\u001b[0m\n",
+      "\u001b[36m    • Target Endpoint: https://pyrit-japan-test.openai.azure.com/openai/v1\u001b[0m\n",
       "\n",
       "\u001b[1m  📊 Scorer Information\u001b[0m\n",
       "\u001b[37m    ▸ Scorer Identifier\u001b[0m\n",
-      "\u001b[36m      • Scorer Type: TrueFalseInverterScorer\u001b[0m\n",
+      "\u001b[36m      • Scorer Type: SelfAskTrueFalseScorer\u001b[0m\n",
       "\u001b[36m      • scorer_type: true_false\u001b[0m\n",
       "\u001b[36m      • score_aggregator: OR_\u001b[0m\n",
-      "\u001b[36m        └─ Composite of 1 scorer(s):\u001b[0m\n",
-      "\u001b[36m            • Scorer Type: SelfAskRefusalScorer\u001b[0m\n",
-      "\u001b[36m            • scorer_type: true_false\u001b[0m\n",
-      "\u001b[36m            • score_aggregator: OR_\u001b[0m\n",
-      "\u001b[36m            • model_name: gpt-5.4\u001b[0m\n",
+      "\u001b[36m      • model_name: gpt-4o-japan-nilfilter\u001b[0m\n",
+      "\u001b[36m      • temperature: 0.9\u001b[0m\n",
       "\n",
       "\u001b[37m    ▸ Performance Metrics\u001b[0m\n",
-      "\u001b[36m      • Accuracy: 87.85%\u001b[0m\n",
-      "\u001b[36m      • Accuracy Std Error: ±0.0164\u001b[0m\n",
-      "\u001b[36m      • F1 Score: 0.8750\u001b[0m\n",
-      "\u001b[36m      • Precision: 0.8705\u001b[0m\n",
-      "\u001b[36m      • Recall: 0.8796\u001b[0m\n",
-      "\u001b[36m      • Average Score Time: 0.66s\u001b[0m\n",
+      "\u001b[36m      • Accuracy: 79.24%\u001b[0m\n",
+      "\u001b[36m      • Accuracy Std Error: ±0.0204\u001b[0m\n",
+      "\u001b[36m      • F1 Score: 0.7560\u001b[0m\n",
+      "\u001b[36m      • Precision: 0.8759\u001b[0m\n",
+      "\u001b[31m      • Recall: 0.6649\u001b[0m\n",
+      "\u001b[36m      • Average Score Time: 1.64s\u001b[0m\n",
       "\n",
       "\u001b[1m\u001b[36m▼ Overall Statistics\u001b[0m\n",
       "\u001b[36m────────────────────────────────────────────────────────────────────────────────────────────────────\u001b[0m\n",
       "\u001b[1m  📈 Summary\u001b[0m\n",
-      "\u001b[32m    • Total Strategies: 1\u001b[0m\n",
-      "\u001b[32m    • Total Attack Results: 2\u001b[0m\n",
-      "\u001b[32m    • Overall Success Rate: 0%\u001b[0m\n",
-      "\u001b[32m    • Unique Objectives: 2\u001b[0m\n",
+      "\u001b[32m    • Total Strategies: 21\u001b[0m\n",
+      "\u001b[32m    • Total Attack Results: 42\u001b[0m\n",
+      "\u001b[32m    • Overall Success Rate: 2%\u001b[0m\n",
+      "\u001b[32m    • Unique Objectives: 4\u001b[0m\n",
       "\n",
-      "\u001b[1m\u001b[36m▼ Per-Strategy Breakdown\u001b[0m\n",
+      "\u001b[1m\u001b[36m▼ Per-Group Breakdown\u001b[0m\n",
       "\u001b[36m────────────────────────────────────────────────────────────────────────────────────────────────────\u001b[0m\n",
       "\n",
-      "\u001b[1m  🔸 Strategy: baseline\u001b[0m\n",
+      "\u001b[1m  🔸 Group: baseline\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: ansi_attack\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[33m    • Success Rate: 50%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: ascii_art\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: ascii_smuggler\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: atbash\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: base64\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: binary\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: caesar\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: character_space\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: char_swap\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: diacritic\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: flip\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: leetspeak\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: morse\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: rot13\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: suffix_append\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: string_join\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: unicode_confusable\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: unicode_substitution\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: url\u001b[0m\n",
+      "\u001b[33m    • Number of Results: 2\u001b[0m\n",
+      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\n",
+      "\u001b[1m  🔸 Group: jailbreak\u001b[0m\n",
       "\u001b[33m    • Number of Results: 2\u001b[0m\n",
       "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
       "\n",
@@ -322,13 +405,14 @@
    "metadata": {},
    "source": [
     "To disable the automatic baseline entirely (e.g., when you only want attack strategies with no\n",
-    "comparison), set `include_baseline=False` in the constructor:\n",
+    "comparison), pass `include_baseline=False` to `initialize_async`:\n",
     "\n",
     "```python\n",
-    "scenario = RedTeamAgent(include_baseline=False)\n",
+    "scenario = RedTeamAgent()\n",
     "await scenario.initialize_async(\n",
     "    objective_target=objective_target,\n",
     "    scenario_strategies=[FoundryStrategy.Base64],\n",
+    "    include_baseline=False,\n",
     ")\n",
     "```"
    ]
@@ -356,7 +440,7 @@
     {
      "data": {
       "application/vnd.jupyter.widget-view+json": {
-       "model_id": "b124f2b7bf254820be2804cde2c02a78",
+       "model_id": "dbfac49b890048dfa8669900be01fe62",
        "version_major": 2,
        "version_minor": 0
       },
@@ -381,7 +465,7 @@
       "\u001b[1m  📋 Scenario Details\u001b[0m\n",
       "\u001b[36m    • Name: RedTeamAgent\u001b[0m\n",
       "\u001b[36m    • Scenario Version: 1\u001b[0m\n",
-      "\u001b[36m    • PyRIT Version: 0.12.1.dev0\u001b[0m\n",
+      "\u001b[36m    • PyRIT Version: 0.14.0.dev0\u001b[0m\n",
       "\u001b[36m    • Description:\u001b[0m\n",
       "\u001b[36m        RedTeamAgent is a preconfigured scenario that automatically generates multiple AtomicAttack instances based on\u001b[0m\n",
       "\u001b[36m        the specified attack strategies. It supports both single-turn attacks (with various converters) and multi-turn\u001b[0m\n",
@@ -392,8 +476,8 @@
       "\n",
       "\u001b[1m  🎯 Target Information\u001b[0m\n",
       "\u001b[36m    • Target Type: OpenAIChatTarget\u001b[0m\n",
-      "\u001b[36m    • Target Model: gpt-4o\u001b[0m\n",
-      "\u001b[36m    • Target Endpoint: https://pyrit-dev.openai.azure.com/openai/v1\u001b[0m\n",
+      "\u001b[36m    • Target Model: gpt-4o-japan-nilfilter\u001b[0m\n",
+      "\u001b[36m    • Target Endpoint: https://pyrit-japan-test.openai.azure.com/openai/v1\u001b[0m\n",
       "\n",
       "\u001b[1m  📊 Scorer Information\u001b[0m\n",
       "\u001b[37m    ▸ Scorer Identifier\u001b[0m\n",
@@ -404,7 +488,7 @@
       "\u001b[36m            • Scorer Type: SelfAskRefusalScorer\u001b[0m\n",
       "\u001b[36m            • scorer_type: true_false\u001b[0m\n",
       "\u001b[36m            • score_aggregator: OR_\u001b[0m\n",
-      "\u001b[36m            • model_name: gpt-4o\u001b[0m\n",
+      "\u001b[36m            • model_name: gpt-4o-japan-nilfilter\u001b[0m\n",
       "\n",
       "\u001b[37m    ▸ Performance Metrics\u001b[0m\n",
       "\u001b[33m      Official evaluation has not been run yet for this specific configuration\u001b[0m\n",
@@ -414,17 +498,17 @@
       "\u001b[1m  📈 Summary\u001b[0m\n",
       "\u001b[32m    • Total Strategies: 2\u001b[0m\n",
       "\u001b[32m    • Total Attack Results: 4\u001b[0m\n",
-      "\u001b[32m    • Overall Success Rate: 0%\u001b[0m\n",
+      "\u001b[36m    • Overall Success Rate: 25%\u001b[0m\n",
       "\u001b[32m    • Unique Objectives: 4\u001b[0m\n",
       "\n",
-      "\u001b[1m\u001b[36m▼ Per-Strategy Breakdown\u001b[0m\n",
+      "\u001b[1m\u001b[36m▼ Per-Group Breakdown\u001b[0m\n",
       "\u001b[36m────────────────────────────────────────────────────────────────────────────────────────────────────\u001b[0m\n",
       "\n",
-      "\u001b[1m  🔸 Strategy: baseline\u001b[0m\n",
+      "\u001b[1m  🔸 Group: baseline\u001b[0m\n",
       "\u001b[33m    • Number of Results: 2\u001b[0m\n",
-      "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
+      "\u001b[33m    • Success Rate: 50%\u001b[0m\n",
       "\n",
-      "\u001b[1m  🔸 Strategy: base64\u001b[0m\n",
+      "\u001b[1m  🔸 Group: base64\u001b[0m\n",
       "\u001b[33m    • Number of Results: 2\u001b[0m\n",
       "\u001b[32m    • Success Rate: 0%\u001b[0m\n",
       "\n",
@@ -455,9 +539,6 @@
   }
  ],
  "metadata": {
-  "jupytext": {
-   "main_language": "python"
-  },
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
@@ -468,7 +549,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.13.5"
+   "version": "3.12.13"
   }
  },
  "nbformat": 4,
diff --git a/doc/code/scenarios/1_common_scenario_parameters.py b/doc/code/scenarios/1_common_scenario_parameters.py
index 3f1dbd0b01..e2879b25f0 100644
--- a/doc/code/scenarios/1_common_scenario_parameters.py
+++ b/doc/code/scenarios/1_common_scenario_parameters.py
@@ -105,8 +105,8 @@
 # ## Baseline Execution
 #
 # The baseline sends each objective directly to the target without any converters or multi-turn
-# strategies. It is included automatically when `include_baseline=True` (the default). This is
-# useful for:
+# strategies. It is included automatically when `initialize_async` is called with
+# `include_baseline=True` (the default for scenarios that support a baseline). This is useful for:
 #
 # - **Measuring default defenses** — how does the target respond to unmodified harmful prompts?
 # - **Establishing comparison points** — compare baseline refusal rates against attack-enhanced runs
@@ -124,13 +124,14 @@
 
 # %% [markdown]
 # To disable the automatic baseline entirely (e.g., when you only want attack strategies with no
-# comparison), set `include_baseline=False` in the constructor:
+# comparison), pass `include_baseline=False` to `initialize_async`:
 #
 # ```python
-# scenario = RedTeamAgent(include_baseline=False)
+# scenario = RedTeamAgent()
 # await scenario.initialize_async(
 #     objective_target=objective_target,
 #     scenario_strategies=[FoundryStrategy.Base64],
+#     include_baseline=False,
 # )
 # ```
 
diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 089bed4267..1013418bee 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -107,6 +107,19 @@ class Scenario(ABC):
     #: what the scenario needs. Validated in ``initialize_async`` once the target is supplied.
     TARGET_REQUIREMENTS: ClassVar[TargetRequirements] = TargetRequirements()
 
+    #: Whether this scenario type supports a default baseline atomic attack. Subclasses whose
+    #: semantics make a default baseline meaningless (e.g. benchmarks that compare against a
+    #: gold-standard answer rather than measure attack lift over an unmodified prompt) override
+    #: this to ``False``. When ``False``, ``initialize_async`` skips the baseline regardless of
+    #: the user-facing default and raises ``ValueError`` if the caller explicitly opts in.
+    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = True
+
+    #: Whether this scenario type includes the baseline atomic attack by default. Used only when
+    #: ``SUPPORTS_DEFAULT_BASELINE`` is ``True``. Subclasses can override this to ``False`` when
+    #: their default behavior should omit the baseline (e.g. when the scenario is already
+    #: dominated by a long list of templates and the baseline is rarely informative).
+    DEFAULT_INCLUDE_BASELINE: ClassVar[bool] = True
+
     def __init__(
         self,
         *,
@@ -114,7 +127,6 @@ def __init__(
         version: int,
         strategy_class: type[ScenarioStrategy],
         objective_scorer: Scorer,
-        include_default_baseline: bool = True,
         scenario_result_id: Optional[Union[uuid.UUID, str]] = None,
     ) -> None:
         """
@@ -125,10 +137,6 @@ def __init__(
             version (int): Version number of the scenario.
             strategy_class (Type[ScenarioStrategy]): The strategy enum class for this scenario.
             objective_scorer (Scorer): The objective scorer used to evaluate attack results.
-            include_default_baseline (bool): Whether to include a baseline atomic attack that sends all objectives
-                without modifications. Most scenarios should have some kind of baseline so users can understand
-                the impact of strategies, but subclasses can optionally write their own custom baselines.
-                Defaults to True.
             scenario_result_id (Optional[Union[uuid.UUID, str]]): Optional ID of an existing scenario result to resume.
                 Can be either a UUID object or a string representation of a UUID.
                 If provided and found in memory, the scenario will resume from prior progress.
@@ -168,8 +176,6 @@ def __init__(
         self._scenario_result_id: Optional[str] = str(scenario_result_id) if scenario_result_id else None
         self._result_lock = asyncio.Lock()
 
-        self._include_baseline = include_default_baseline
-
         # Store prepared strategies for use in _get_atomic_attacks_async
         self._scenario_strategies: list[ScenarioStrategy] = []
 
@@ -486,6 +492,7 @@ async def initialize_async(
         max_concurrency: int = 10,
         max_retries: int = 0,
         memory_labels: Optional[dict[str, str]] = None,
+        include_baseline: bool | None = None,
     ) -> None:
         """
         Initialize the scenario by populating self._atomic_attacks and creating the ScenarioResult.
@@ -513,9 +520,15 @@ async def initialize_async(
                 For example, max_retries=3 allows up to 4 total attempts (1 initial + 3 retries).
             memory_labels (Optional[Dict[str, str]]): Additional labels to apply to all
                 attack runs in the scenario. These help track and categorize the scenario.
+            include_baseline (bool | None): Whether to prepend a baseline atomic attack that sends
+                all objectives without modifications, allowing comparison between unmodified prompts
+                and the scenario's strategies. If None (the default), the scenario type's
+                ``SUPPORTS_DEFAULT_BASELINE`` class attribute decides. Passing ``True`` on a
+                scenario whose ``SUPPORTS_DEFAULT_BASELINE`` is False raises ``ValueError``.
 
         Raises:
-            ValueError: If no objective_target is provided.
+            ValueError: If no objective_target is provided, or if ``include_baseline=True`` is passed
+                to a scenario that does not support a default baseline.
         """
         # Validate required parameters
         if objective_target is None:
@@ -527,13 +540,27 @@ async def initialize_async(
         # Set instance variables from parameters
         self._objective_target = objective_target
         self._objective_target_identifier = objective_target.get_identifier()
-        type(self).TARGET_REQUIREMENTS.validate(target=objective_target)
+        self.TARGET_REQUIREMENTS.validate(target=objective_target)
         self._dataset_config_provided = dataset_config is not None
         self._dataset_config = dataset_config if dataset_config else self.default_dataset_config()
         self._max_concurrency = max_concurrency
         self._max_retries = max_retries
         self._memory_labels = memory_labels or {}
 
+        # Resolve the effective include_baseline. Capability is checked first so a forbidden
+        # scenario type never silently inherits a True default; explicit-True on a forbidden
+        # type is a hard error rather than a silent ignore. When the scenario type supports
+        # the baseline, None defers to DEFAULT_INCLUDE_BASELINE on the class.
+        if not self.SUPPORTS_DEFAULT_BASELINE:
+            if include_baseline:
+                raise ValueError(
+                    f"{type(self).__name__} does not support a default baseline; pass "
+                    f"include_baseline=False or omit the argument."
+                )
+            include_baseline = False
+        elif include_baseline is None:
+            include_baseline = self.DEFAULT_INCLUDE_BASELINE
+
         # Prepare scenario strategies using the stored configuration
         self._scenario_strategies = self._prepare_strategies(scenario_strategies)
 
@@ -546,7 +573,7 @@ async def initialize_async(
 
         self._atomic_attacks = await self._get_atomic_attacks_async()
 
-        if self._include_baseline:
+        if include_baseline:
             baseline_attack = self._get_baseline()
             self._atomic_attacks.insert(0, baseline_attack)
 
diff --git a/pyrit/scenario/scenarios/airt/cyber.py b/pyrit/scenario/scenarios/airt/cyber.py
index 7ff874be1b..5b9fa2ba31 100644
--- a/pyrit/scenario/scenarios/airt/cyber.py
+++ b/pyrit/scenario/scenarios/airt/cyber.py
@@ -104,7 +104,6 @@ def __init__(
         self,
         *,
         objective_scorer: TrueFalseScorer | None = None,
-        include_baseline: bool = True,
         scenario_result_id: str | None = None,
     ) -> None:
         """
@@ -113,8 +112,6 @@ def __init__(
         Args:
             objective_scorer (TrueFalseScorer | None): Objective scorer for malware detection. If not
                 provided, defaults to a composite scorer using malware detection + refusal backstop.
-            include_baseline (bool): Whether to include a baseline atomic attack that sends all objectives
-                without modifications. Defaults to True.
             scenario_result_id (str | None): Optional ID of an existing scenario result to resume.
         """
         self._objective_scorer: TrueFalseScorer = (
@@ -125,7 +122,6 @@ def __init__(
             version=self.VERSION,
             objective_scorer=self._objective_scorer,
             strategy_class=self.get_strategy_class(),
-            include_default_baseline=include_baseline,
             scenario_result_id=scenario_result_id,
         )
 
diff --git a/pyrit/scenario/scenarios/airt/jailbreak.py b/pyrit/scenario/scenarios/airt/jailbreak.py
index 1870fdc0cf..763ac426dd 100644
--- a/pyrit/scenario/scenarios/airt/jailbreak.py
+++ b/pyrit/scenario/scenarios/airt/jailbreak.py
@@ -3,7 +3,7 @@
 
 import os
 from pathlib import Path
-from typing import Any, Optional, Union
+from typing import Any, ClassVar, Optional, Union
 
 from pyrit.auth import get_azure_openai_auth
 from pyrit.common import apply_defaults
@@ -81,6 +81,11 @@ class Jailbreak(Scenario):
 
     VERSION: int = 1
 
+    #: Jailbreak runs many templates per objective, so the baseline atomic attack is rarely
+    #: informative relative to the volume of jailbreak templates. Off by default; callers that
+    #: want a comparison can pass ``include_baseline=True`` to ``initialize_async``.
+    DEFAULT_INCLUDE_BASELINE: ClassVar[bool] = False
+
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
         """
@@ -121,7 +126,6 @@ def __init__(
         self,
         *,
         objective_scorer: Optional[TrueFalseScorer] = None,
-        include_baseline: bool = False,
         scenario_result_id: Optional[str] = None,
         num_templates: Optional[int] = None,
         num_attempts: int = 1,
@@ -133,8 +137,6 @@ def __init__(
         Args:
             objective_scorer (Optional[TrueFalseScorer]): Scorer for detecting successful jailbreaks
                 (non-refusal). If not provided, defaults to an inverted refusal scorer.
-            include_baseline (bool): Whether to include a baseline atomic attack that sends all
-                objectives without modifications. Defaults to True.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
             num_templates (Optional[int]): Choose num_templates random jailbreaks rather than using all of them.
             num_attempts (Optional[int]): Number of times to try each jailbreak.
@@ -184,7 +186,6 @@ def __init__(
             version=self.VERSION,
             strategy_class=JailbreakStrategy,
             objective_scorer=self._objective_scorer,
-            include_default_baseline=include_baseline,
             scenario_result_id=scenario_result_id,
         )
 
diff --git a/pyrit/scenario/scenarios/airt/leakage.py b/pyrit/scenario/scenarios/airt/leakage.py
index a3a1826aef..9fc9bdca92 100644
--- a/pyrit/scenario/scenarios/airt/leakage.py
+++ b/pyrit/scenario/scenarios/airt/leakage.py
@@ -155,7 +155,6 @@ def __init__(
             version=self.VERSION,
             strategy_class=self.get_strategy_class(),
             objective_scorer=objective_scorer,
-            include_default_baseline=True,
             scenario_result_id=scenario_result_id,
         )
 
diff --git a/pyrit/scenario/scenarios/airt/psychosocial.py b/pyrit/scenario/scenarios/airt/psychosocial.py
index ff98853747..c1486223a0 100644
--- a/pyrit/scenario/scenarios/airt/psychosocial.py
+++ b/pyrit/scenario/scenarios/airt/psychosocial.py
@@ -5,7 +5,7 @@
 import os
 import pathlib
 from dataclasses import dataclass
-from typing import Any, Optional, TypeVar
+from typing import Any, ClassVar, Optional, TypeVar
 
 import yaml
 
@@ -147,6 +147,7 @@ class Psychosocial(Scenario):
     """
 
     VERSION: int = 1
+    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
 
     #: Psychosocial runs CrescendoAttack, which requires the target to natively support
     #: editable conversation history (for backtracking). Declared here so the base scenario
@@ -265,7 +266,6 @@ def __init__(
             strategy_class=PsychosocialStrategy,
             objective_scorer=self._objective_scorer,
             scenario_result_id=scenario_result_id,
-            include_default_baseline=False,
         )
 
         # Store deprecated objectives for later resolution in _resolve_seed_groups
diff --git a/pyrit/scenario/scenarios/airt/scam.py b/pyrit/scenario/scenarios/airt/scam.py
index 789a3eaf68..9623f037e6 100644
--- a/pyrit/scenario/scenarios/airt/scam.py
+++ b/pyrit/scenario/scenarios/airt/scam.py
@@ -150,7 +150,6 @@ def __init__(
         *,
         objective_scorer: Optional[TrueFalseScorer] = None,
         adversarial_chat: Optional[PromptTarget] = None,
-        include_baseline: bool = True,
         scenario_result_id: Optional[str] = None,
     ) -> None:
         """
@@ -161,10 +160,6 @@ def __init__(
                 evaluation.
             adversarial_chat (Optional[PromptTarget]): Chat target used to rephrase the
                 objective into the role-play context (in single-turn strategies).
-            include_baseline (bool): Whether to include a baseline atomic attack that sends all objectives
-                without modifications. Defaults to True. When True, a "baseline" attack is automatically
-                added as the first atomic attack, allowing comparison between unmodified prompts and
-                encoding-modified prompts.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
         """
         if not objective_scorer:
@@ -179,7 +174,6 @@ def __init__(
             version=self.VERSION,
             strategy_class=ScamStrategy,
             objective_scorer=objective_scorer,
-            include_default_baseline=include_baseline,
             scenario_result_id=scenario_result_id,
         )
 
diff --git a/pyrit/scenario/scenarios/benchmark/adversarial.py b/pyrit/scenario/scenarios/benchmark/adversarial.py
index bdcbd7e0d5..0d6fc7e302 100644
--- a/pyrit/scenario/scenarios/benchmark/adversarial.py
+++ b/pyrit/scenario/scenarios/benchmark/adversarial.py
@@ -33,6 +33,7 @@ class AdversarialBenchmark(Scenario):
 
     VERSION: int = 1
     _cached_strategy_class: ClassVar[type[ScenarioStrategy] | None] = None
+    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
@@ -118,7 +119,6 @@ def __init__(
             version=self.VERSION,
             objective_scorer=self._objective_scorer,
             strategy_class=self.get_strategy_class(),
-            include_default_baseline=False,
             scenario_result_id=scenario_result_id,
         )
 
diff --git a/pyrit/scenario/scenarios/foundry/red_team_agent.py b/pyrit/scenario/scenarios/foundry/red_team_agent.py
index 8b7da826e6..f2d944a18c 100644
--- a/pyrit/scenario/scenarios/foundry/red_team_agent.py
+++ b/pyrit/scenario/scenarios/foundry/red_team_agent.py
@@ -247,7 +247,6 @@ def __init__(
         *,
         adversarial_chat: Optional[PromptTarget] = None,
         attack_scoring_config: Optional[AttackScoringConfig] = None,
-        include_baseline: bool = True,
         scenario_result_id: Optional[str] = None,
     ) -> None:
         """
@@ -260,10 +259,6 @@ def __init__(
             attack_scoring_config (Optional[AttackScoringConfig]): Configuration for attack scoring,
                 including the objective scorer and auxiliary scorers. If not provided, creates a default
                 configuration with a composite scorer using Azure Content Filter and SelfAsk Refusal scorers.
-            include_baseline (bool): Whether to include a baseline atomic attack that sends all objectives
-                without modifications. Defaults to True. When True, a "baseline" attack is automatically
-                added as the first atomic attack, allowing comparison between unmodified prompts and
-                attack-modified prompts.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
 
         Raises:
@@ -286,7 +281,6 @@ def __init__(
             version=self.VERSION,
             strategy_class=FoundryStrategy,
             objective_scorer=objective_scorer,
-            include_default_baseline=include_baseline,
             scenario_result_id=scenario_result_id,
         )
         self._scenario_composites: list[FoundryComposite] = []
@@ -303,6 +297,7 @@ async def initialize_async(
         max_concurrency: int = 10,
         max_retries: int = 0,
         memory_labels: Optional[dict[str, str]] = None,
+        include_baseline: bool | None = None,
     ) -> None:
         """
         Initialize the scenario.
@@ -318,6 +313,7 @@ async def initialize_async(
             max_concurrency (int): Maximum number of concurrent attack executions. Defaults to 10.
             max_retries (int): Maximum number of retries on failure. Defaults to 0.
             memory_labels (Optional[dict[str, str]]): Labels to attach to all memory entries.
+            include_baseline (bool | None): See ``Scenario.initialize_async``.
         """
         # This override exists purely for type-widening: FoundryComposite is a dataclass,
         # not a ScenarioStrategy enum member, so the base class signature would reject it.
@@ -329,6 +325,7 @@ async def initialize_async(
             max_concurrency=max_concurrency,
             max_retries=max_retries,
             memory_labels=memory_labels,
+            include_baseline=include_baseline,
         )
 
     def _prepare_strategies(  # type: ignore[ty:invalid-method-override]
diff --git a/pyrit/scenario/scenarios/garak/encoding.py b/pyrit/scenario/scenarios/garak/encoding.py
index 531b11062e..f239637132 100644
--- a/pyrit/scenario/scenarios/garak/encoding.py
+++ b/pyrit/scenario/scenarios/garak/encoding.py
@@ -173,7 +173,6 @@ def __init__(
         *,
         objective_scorer: Optional[TrueFalseScorer] = None,
         encoding_templates: Optional[Sequence[str]] = None,
-        include_baseline: bool = True,
         scenario_result_id: Optional[str] = None,
     ) -> None:
         """
@@ -185,10 +184,6 @@ def __init__(
                 category.
             encoding_templates (Optional[Sequence[str]]): Templates used to construct the decoding
                 prompts. Defaults to AskToDecodeConverter.garak_templates.
-            include_baseline (bool): Whether to include a baseline atomic attack that sends all objectives
-                without modifications. Defaults to True. When True, a "baseline" attack is automatically
-                added as the first atomic attack, allowing comparison between unmodified prompts and
-                encoding-modified prompts.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
         """
         objective_scorer = objective_scorer or DecodingScorer(categories=["encoding_scenario"])
@@ -200,7 +195,6 @@ def __init__(
             version=self.VERSION,
             strategy_class=EncodingStrategy,
             objective_scorer=objective_scorer,
-            include_default_baseline=include_baseline,
             scenario_result_id=scenario_result_id,
         )
 
diff --git a/tests/integration/datasets/test_seed_dataset_provider_integration.py b/tests/integration/datasets/test_seed_dataset_provider_integration.py
index 457aadb7e6..85a8a80235 100644
--- a/tests/integration/datasets/test_seed_dataset_provider_integration.py
+++ b/tests/integration/datasets/test_seed_dataset_provider_integration.py
@@ -683,7 +683,6 @@ async def test_red_team_agent_initializes_with_harmbench(self, sqlite_instance):
         rta = RedTeamAgent(
             adversarial_chat=target,
             attack_scoring_config=AttackScoringConfig(objective_scorer=mock_scorer),
-            include_baseline=False,
         )
 
         # This is the critical call — it loads seed groups from memory
@@ -693,6 +692,7 @@ async def test_red_team_agent_initializes_with_harmbench(self, sqlite_instance):
             objective_target=target,
             max_concurrency=1,
             scenario_strategies=[FoundryStrategy.Base64],
+            include_baseline=False,
         )
 
         # Verify the scenario got objectives from harmbench
diff --git a/tests/unit/scenario/test_adversarial.py b/tests/unit/scenario/test_adversarial.py
index e6b082cb0d..a6445393a7 100644
--- a/tests/unit/scenario/test_adversarial.py
+++ b/tests/unit/scenario/test_adversarial.py
@@ -432,14 +432,41 @@ async def test_attacks_carry_seed_groups(self, mock_objective_target, single_adv
     async def test_baseline_excluded(self, mock_objective_target, single_adversarial_model):
         """AdversarialBenchmark must opt out of the parent's default baseline.
 
-        Verifies both the configuration toggle (``_include_baseline is False``) and
-        the observable property (no atomic attack is named ``"baseline"``).
+        Verifies both the class-level capability flag and the observable property
+        (no atomic attack is named ``"baseline"``).
         """
         scenario, attacks = await self._init_and_get_attacks(
             mock_objective_target=mock_objective_target,
             adversarial_models=single_adversarial_model,
         )
-        assert scenario._include_baseline is False
+        assert type(scenario).SUPPORTS_DEFAULT_BASELINE is False
+        assert not any(a.atomic_attack_name == "baseline" for a in attacks)
+
+    @pytest.mark.asyncio
+    async def test_baseline_explicit_true_raises(self, mock_objective_target, single_adversarial_model):
+        """Explicitly passing include_baseline=True to a forbidden scenario raises ValueError."""
+        scenario = AdversarialBenchmark(adversarial_models=single_adversarial_model)
+        with pytest.raises(ValueError, match="does not support a default baseline"):
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                include_baseline=True,
+            )
+
+    @pytest.mark.asyncio
+    async def test_baseline_explicit_false_succeeds(self, mock_objective_target, single_adversarial_model):
+        """Explicit include_baseline=False on a forbidden scenario is accepted (matches the default)."""
+        groups = {"harmbench": _make_seed_groups("harmbench")}
+        with (
+            patch.object(DatasetConfiguration, "get_seed_attack_groups", return_value=groups),
+            patch("pyrit.scenario.core.scenario.Scenario._get_default_objective_scorer") as mock_scorer,
+        ):
+            mock_scorer.return_value = MagicMock(spec=TrueFalseScorer, get_identifier=lambda: _mock_id("scorer"))
+            scenario = AdversarialBenchmark(adversarial_models=single_adversarial_model)
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                include_baseline=False,
+            )
+            attacks = await scenario._get_atomic_attacks_async()
         assert not any(a.atomic_attack_name == "baseline" for a in attacks)
 
 
diff --git a/tests/unit/scenario/test_foundry.py b/tests/unit/scenario/test_foundry.py
index e07f51e842..b4f7eaa2e8 100644
--- a/tests/unit/scenario/test_foundry.py
+++ b/tests/unit/scenario/test_foundry.py
@@ -655,7 +655,6 @@ async def test_scenario_composites_set_after_initialize(
         with patch.object(RedTeamAgent, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = RedTeamAgent(
                 attack_scoring_config=AttackScoringConfig(objective_scorer=mock_objective_scorer),
-                include_baseline=False,
             )
 
             # Before initialize_async, composites should be empty
@@ -665,6 +664,7 @@ async def test_scenario_composites_set_after_initialize(
                 objective_target=mock_objective_target,
                 scenario_strategies=strategies,
                 dataset_config=mock_dataset_config,
+                include_baseline=False,
             )
 
             # After initialize_async, composites should be set
@@ -735,12 +735,12 @@ async def test_initialize_with_foundry_composite_directly(
         with patch.object(RedTeamAgent, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = RedTeamAgent(
                 attack_scoring_config=AttackScoringConfig(objective_scorer=mock_objective_scorer),
-                include_baseline=False,
             )
             await scenario.initialize_async(
                 objective_target=mock_objective_target,
                 scenario_strategies=[composite],
                 dataset_config=mock_dataset_config,
+                include_baseline=False,
             )
 
         assert len(scenario._scenario_composites) == 1
@@ -766,12 +766,12 @@ async def test_initialize_with_mixed_composites_and_strategies(
         with patch.object(RedTeamAgent, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = RedTeamAgent(
                 attack_scoring_config=AttackScoringConfig(objective_scorer=mock_objective_scorer),
-                include_baseline=False,
             )
             await scenario.initialize_async(
                 objective_target=mock_objective_target,
                 scenario_strategies=[composite, FoundryStrategy.ROT13],
                 dataset_config=mock_dataset_config,
+                include_baseline=False,
             )
 
         assert len(scenario._scenario_composites) == 2
@@ -797,12 +797,12 @@ async def test_initialize_converts_scenario_composite_strategy_to_foundry_compos
         with patch.object(RedTeamAgent, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = RedTeamAgent(
                 attack_scoring_config=AttackScoringConfig(objective_scorer=mock_objective_scorer),
-                include_baseline=False,
             )
             await scenario.initialize_async(
                 objective_target=mock_objective_target,
                 scenario_strategies=[legacy],  # type: ignore[arg-type]
                 dataset_config=mock_dataset_config,
+                include_baseline=False,
             )
 
         assert len(scenario._scenario_composites) == 1
@@ -828,12 +828,12 @@ async def test_initialize_converts_converter_first_composite_strategy(
         with patch.object(RedTeamAgent, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = RedTeamAgent(
                 attack_scoring_config=AttackScoringConfig(objective_scorer=mock_objective_scorer),
-                include_baseline=False,
             )
             await scenario.initialize_async(
                 objective_target=mock_objective_target,
                 scenario_strategies=[legacy],  # type: ignore[arg-type]
                 dataset_config=mock_dataset_config,
+                include_baseline=False,
             )
 
         result = scenario._scenario_composites[0]
@@ -858,12 +858,12 @@ async def test_initialize_converts_converter_only_composite_strategy(
         with patch.object(RedTeamAgent, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = RedTeamAgent(
                 attack_scoring_config=AttackScoringConfig(objective_scorer=mock_objective_scorer),
-                include_baseline=False,
             )
             await scenario.initialize_async(
                 objective_target=mock_objective_target,
                 scenario_strategies=[legacy],  # type: ignore[arg-type]
                 dataset_config=mock_dataset_config,
+                include_baseline=False,
             )
 
         result = scenario._scenario_composites[0]
diff --git a/tests/unit/scenario/test_leakage_scenario.py b/tests/unit/scenario/test_leakage_scenario.py
index 5a83bb4565..b8a0cfb8cc 100644
--- a/tests/unit/scenario/test_leakage_scenario.py
+++ b/tests/unit/scenario/test_leakage_scenario.py
@@ -102,10 +102,9 @@ def test_default_scorer_uses_leakage_yaml(self):
         scorer_path = DATASETS_PATH / "score" / "true_false_question" / "leakage.yaml"
         assert scorer_path.exists(), f"Expected leakage.yaml scorer at {scorer_path}"
 
-    def test_init_include_baseline_true(self, mock_objective_scorer):
-        """Test that include_baseline is always True."""
-        scenario = Leakage(objective_scorer=mock_objective_scorer)
-        assert scenario._include_baseline is True
+    def test_init_supports_default_baseline(self):
+        """Leakage opts into the parent's default baseline."""
+        assert Leakage.SUPPORTS_DEFAULT_BASELINE is True
 
 
 @pytest.mark.usefixtures(*FIXTURES)
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index bbead38407..a77ade8dfd 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -3,6 +3,7 @@
 
 """Tests for the scenarios.Scenario class."""
 
+from typing import ClassVar
 from unittest.mock import AsyncMock, MagicMock, PropertyMock, patch
 
 import pytest
@@ -97,10 +98,12 @@ def sample_attack_results():
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    def __init__(self, atomic_attacks_to_return=None, **kwargs):
-        # Default include_default_baseline=False for tests unless explicitly specified
-        kwargs.setdefault("include_default_baseline", False)
+    # Tests using this fixture should default to no baseline; set the class flag to forbid
+    # the default baseline so we don't have to thread include_baseline=False through every
+    # initialize_async call.
+    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
 
+    def __init__(self, atomic_attacks_to_return=None, **kwargs):
         # Add required strategy_class if not provided
 
         class TestStrategy(ScenarioStrategy):
@@ -711,11 +714,10 @@ async def test_initialize_async_with_empty_strategies_and_baseline(self, mock_ob
         """Test that baseline is included when include_baseline=True, regardless of strategies."""
         from pyrit.models import SeedAttackGroup, SeedObjective
 
-        # Create a scenario with include_default_baseline=True and TrueFalseScorer
+        # Create a scenario with TrueFalseScorer; baseline is included by default
         scenario = ConcreteScenarioWithTrueFalseScorer(
             name="Baseline Only Test",
             version=1,
-            include_default_baseline=True,
         )
 
         # Create a mock dataset config with seed groups
@@ -740,11 +742,10 @@ async def test_baseline_only_execution_runs_successfully(self, mock_objective_ta
         """Test that baseline-only scenario can run successfully."""
         from pyrit.models import SeedAttackGroup, SeedObjective
 
-        # Create a scenario with include_default_baseline=True and TrueFalseScorer
+        # Create a scenario with TrueFalseScorer; baseline is included by default
         scenario = ConcreteScenarioWithTrueFalseScorer(
             name="Baseline Only Test",
             version=1,
-            include_default_baseline=True,
         )
 
         # Create a mock dataset config with seed groups
@@ -776,7 +777,6 @@ async def test_empty_strategies_without_baseline_allows_initialization(self, moc
         scenario = ConcreteScenario(
             name="No Baseline Test",
             version=1,
-            include_default_baseline=False,  # No baseline
         )
 
         mock_dataset_config = MagicMock(spec=DatasetConfiguration)
@@ -799,7 +799,6 @@ async def test_standalone_baseline_uses_dataset_config_seeds(self, mock_objectiv
         scenario = ConcreteScenarioWithTrueFalseScorer(
             name="Baseline Seeds Test",
             version=1,
-            include_default_baseline=True,
         )
 
         # Create specific seed groups to verify they're used
diff --git a/tests/unit/scenario/test_scenario_parameters.py b/tests/unit/scenario/test_scenario_parameters.py
index ae6eaf0010..f749418007 100644
--- a/tests/unit/scenario/test_scenario_parameters.py
+++ b/tests/unit/scenario/test_scenario_parameters.py
@@ -3,6 +3,7 @@
 
 """Tests for Scenario custom parameter declaration, coercion, and validation (Stage 1b)."""
 
+from typing import ClassVar
 from unittest.mock import MagicMock
 
 import pytest
@@ -33,6 +34,9 @@ def get_aggregate_tags(cls) -> set[str]:
             return {"all"}
 
     class _ParamTestScenario(Scenario):
+        # No baseline in tests so atomic_attacks observations stay deterministic.
+        SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
+
         @classmethod
         def get_strategy_class(cls):
             return _ParamTestStrategy
@@ -60,7 +64,6 @@ async def _get_atomic_attacks_async(self):
         version=1,
         strategy_class=_ParamTestStrategy,
         objective_scorer=mock_scorer,
-        include_default_baseline=False,
     )
 
 
diff --git a/tests/unit/scenario/test_scenario_partial_results.py b/tests/unit/scenario/test_scenario_partial_results.py
index 2cc7df714a..ca984153db 100644
--- a/tests/unit/scenario/test_scenario_partial_results.py
+++ b/tests/unit/scenario/test_scenario_partial_results.py
@@ -3,6 +3,7 @@
 
 """Additional tests for Scenario retry with AttackExecutorResult functionality."""
 
+from typing import ClassVar
 from unittest.mock import MagicMock, PropertyMock
 
 import pytest
@@ -73,10 +74,9 @@ def filter_objectives(*, remaining_objectives):
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    def __init__(self, *, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
-        # Default include_default_baseline=False for tests unless explicitly specified
-        kwargs.setdefault("include_default_baseline", False)
+    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
 
+    def __init__(self, *, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default
         strategy_class = kwargs.pop("strategy_class", None) or self.get_strategy_class()
 
diff --git a/tests/unit/scenario/test_scenario_retry.py b/tests/unit/scenario/test_scenario_retry.py
index 2ff0555192..2b93405363 100644
--- a/tests/unit/scenario/test_scenario_retry.py
+++ b/tests/unit/scenario/test_scenario_retry.py
@@ -3,6 +3,7 @@
 
 """Tests for Scenario retry functionality."""
 
+from typing import ClassVar
 from unittest.mock import AsyncMock, MagicMock, PropertyMock
 
 import pytest
@@ -136,10 +137,9 @@ def create_mock_atomic_attack(name: str, objectives: list[str], run_async_mock:
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    def __init__(self, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
-        # Default include_default_baseline=False for tests unless explicitly specified
-        kwargs.setdefault("include_default_baseline", False)
+    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
 
+    def __init__(self, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default
         strategy_class = kwargs.pop("strategy_class", None) or self.get_strategy_class()
 

From 7b2f3274ab9aa25544f8337be34dd7e9ab56b638 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <agavrila@microsoft.com>
Date: Fri, 8 May 2026 20:10:07 -0400
Subject: [PATCH 02/19] adding tests for additional classVar

---
 tests/unit/scenario/test_jailbreak.py | 31 +++++++++++++++++++++++++++
 1 file changed, 31 insertions(+)

diff --git a/tests/unit/scenario/test_jailbreak.py b/tests/unit/scenario/test_jailbreak.py
index c873465c6b..36713fafa4 100644
--- a/tests/unit/scenario/test_jailbreak.py
+++ b/tests/unit/scenario/test_jailbreak.py
@@ -202,6 +202,37 @@ async def test_init_raises_exception_when_no_datasets_available(self, mock_objec
         with pytest.raises(ValueError, match="DatasetConfiguration has no seed_groups"):
             await scenario.initialize_async(objective_target=mock_objective_target)
 
+    def test_class_supports_baseline_but_defaults_off(self):
+        """Jailbreak supports a baseline but does not include one by default."""
+        assert Jailbreak.SUPPORTS_DEFAULT_BASELINE is True
+        assert Jailbreak.DEFAULT_INCLUDE_BASELINE is False
+
+    async def test_default_initialize_omits_baseline(
+        self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
+    ):
+        """initialize_async without include_baseline honors DEFAULT_INCLUDE_BASELINE=False."""
+        with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
+            scenario = Jailbreak(objective_scorer=mock_objective_scorer)
+            await scenario.initialize_async(objective_target=mock_objective_target)
+            assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
+
+    async def test_explicit_include_baseline_true_prepends_baseline(
+        self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
+    ):
+        """Caller can override DEFAULT_INCLUDE_BASELINE=False by passing include_baseline=True."""
+        from pyrit.scenario import DatasetConfiguration
+
+        with (
+            patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups),
+            patch.object(DatasetConfiguration, "get_all_seed_attack_groups", return_value=mock_memory_seed_groups),
+        ):
+            scenario = Jailbreak(objective_scorer=mock_objective_scorer)
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                include_baseline=True,
+            )
+            assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+
 
 @pytest.mark.usefixtures(*FIXTURES)
 class TestJailbreakAttackGeneration:

From fe9cf5553a0d28365dc5e1c8ad8520d9d1f879e8 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <agavrila@microsoft.com>
Date: Fri, 8 May 2026 20:38:05 -0400
Subject: [PATCH 03/19] doc updates

---
 doc/code/scenarios/0_scenarios.ipynb              | 15 ++++++++++-----
 doc/code/scenarios/0_scenarios.py                 | 12 +++++++-----
 pyrit/scenario/core/scenario.py                   |  4 ++--
 pyrit/scenario/scenarios/airt/psychosocial.py     |  3 +++
 pyrit/scenario/scenarios/benchmark/adversarial.py |  3 +++
 5 files changed, 25 insertions(+), 12 deletions(-)

diff --git a/doc/code/scenarios/0_scenarios.ipynb b/doc/code/scenarios/0_scenarios.ipynb
index 1db4bb2e2c..afe9337c21 100644
--- a/doc/code/scenarios/0_scenarios.ipynb
+++ b/doc/code/scenarios/0_scenarios.ipynb
@@ -83,7 +83,7 @@
     "   - `max_retries`: Number of retry attempts on failure (default: 0)\n",
     "   - `memory_labels`: Optional labels for tracking (optional)\n",
     "   - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's\n",
-    "     default; `True` for scenarios that support a baseline)\n",
+    "     `DEFAULT_INCLUDE_BASELINE`; most scenarios default it on, `Jailbreak` defaults it off)\n",
     "\n",
     "### Example Structure\n",
     "\n",
@@ -405,11 +405,13 @@
     "\n",
     "Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends\n",
     "each objective directly to the target without any converters or multi-turn techniques. This is\n",
-    "controlled by the `include_baseline` parameter on `initialize_async` (default: `True` for\n",
-    "scenarios that support a baseline).\n",
+    "controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each\n",
+    "scenario falls back to its own `DEFAULT_INCLUDE_BASELINE` class attribute (most scenarios\n",
+    "default it on; `Jailbreak` defaults it off).\n",
     "\n",
-    "To run *only* the baseline (no attack strategies), call `initialize_async` with\n",
-    "`include_baseline=True` (the default) and `scenario_strategies=None`. See\n",
+    "To run *only* the baseline (no attack strategies), pass `include_baseline=True` and\n",
+    "`scenario_strategies=None` explicitly to `initialize_async` — that way the example works\n",
+    "regardless of the scenario's default. See\n",
     "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a working example."
    ]
   },
@@ -440,6 +442,9 @@
   }
  ],
  "metadata": {
+  "jupytext": {
+   "main_language": "python"
+  },
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
diff --git a/doc/code/scenarios/0_scenarios.py b/doc/code/scenarios/0_scenarios.py
index 813cfabf03..d2e03a4067 100644
--- a/doc/code/scenarios/0_scenarios.py
+++ b/doc/code/scenarios/0_scenarios.py
@@ -85,7 +85,7 @@
 #    - `max_retries`: Number of retry attempts on failure (default: 0)
 #    - `memory_labels`: Optional labels for tracking (optional)
 #    - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's
-#      default; `True` for scenarios that support a baseline)
+#      `DEFAULT_INCLUDE_BASELINE`; most scenarios default it on, `Jailbreak` defaults it off)
 #
 # ### Example Structure
 #
@@ -175,11 +175,13 @@ def _build_display_group(self, *, technique_name: str, seed_group_name: str) ->
 #
 # Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends
 # each objective directly to the target without any converters or multi-turn techniques. This is
-# controlled by the `include_baseline` parameter on `initialize_async` (default: `True` for
-# scenarios that support a baseline).
+# controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each
+# scenario falls back to its own `DEFAULT_INCLUDE_BASELINE` class attribute (most scenarios
+# default it on; `Jailbreak` defaults it off).
 #
-# To run *only* the baseline (no attack strategies), call `initialize_async` with
-# `include_baseline=True` (the default) and `scenario_strategies=None`. See
+# To run *only* the baseline (no attack strategies), pass `include_baseline=True` and
+# `scenario_strategies=None` explicitly to `initialize_async` — that way the example works
+# regardless of the scenario's default. See
 # [Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a working example.
 
 # %% [markdown]
diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 1013418bee..94087c992b 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -540,7 +540,7 @@ async def initialize_async(
         # Set instance variables from parameters
         self._objective_target = objective_target
         self._objective_target_identifier = objective_target.get_identifier()
-        self.TARGET_REQUIREMENTS.validate(target=objective_target)
+        type(self).TARGET_REQUIREMENTS.validate(target=objective_target)
         self._dataset_config_provided = dataset_config is not None
         self._dataset_config = dataset_config if dataset_config else self.default_dataset_config()
         self._max_concurrency = max_concurrency
@@ -552,7 +552,7 @@ async def initialize_async(
         # type is a hard error rather than a silent ignore. When the scenario type supports
         # the baseline, None defers to DEFAULT_INCLUDE_BASELINE on the class.
         if not self.SUPPORTS_DEFAULT_BASELINE:
-            if include_baseline:
+            if include_baseline is True:
                 raise ValueError(
                     f"{type(self).__name__} does not support a default baseline; pass "
                     f"include_baseline=False or omit the argument."
diff --git a/pyrit/scenario/scenarios/airt/psychosocial.py b/pyrit/scenario/scenarios/airt/psychosocial.py
index c1486223a0..34f289fc19 100644
--- a/pyrit/scenario/scenarios/airt/psychosocial.py
+++ b/pyrit/scenario/scenarios/airt/psychosocial.py
@@ -147,6 +147,9 @@ class Psychosocial(Scenario):
     """
 
     VERSION: int = 1
+
+    #: Psychosocial measures multi-turn escalation behavior; a single-shot baseline send
+    #: isn't a meaningful comparator, so the default baseline is forbidden.
     SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
 
     #: Psychosocial runs CrescendoAttack, which requires the target to natively support
diff --git a/pyrit/scenario/scenarios/benchmark/adversarial.py b/pyrit/scenario/scenarios/benchmark/adversarial.py
index 0d6fc7e302..6d0d553b48 100644
--- a/pyrit/scenario/scenarios/benchmark/adversarial.py
+++ b/pyrit/scenario/scenarios/benchmark/adversarial.py
@@ -33,6 +33,9 @@ class AdversarialBenchmark(Scenario):
 
     VERSION: int = 1
     _cached_strategy_class: ClassVar[type[ScenarioStrategy] | None] = None
+
+    #: AdversarialBenchmark compares attack-success rates across adversarial models; a baseline
+    #: attack would be model-independent and contribute no signal to the comparison.
     SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
 
     @classmethod

From 0411f865daf125120839bd4fd7ef73c5e5bba9c1 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Mon, 11 May 2026 11:27:26 -0400
Subject: [PATCH 04/19] addressing doc accuracy comments

---
 doc/code/scenarios/0_scenarios.ipynb    |  8 ++------
 doc/code/scenarios/0_scenarios.py       |  8 ++------
 pyrit/scenario/core/scenario.py         |  5 +++--
 tests/unit/scenario/test_adversarial.py | 10 +++-------
 4 files changed, 10 insertions(+), 21 deletions(-)

diff --git a/doc/code/scenarios/0_scenarios.ipynb b/doc/code/scenarios/0_scenarios.ipynb
index afe9337c21..54f440f9e5 100644
--- a/doc/code/scenarios/0_scenarios.ipynb
+++ b/doc/code/scenarios/0_scenarios.ipynb
@@ -407,12 +407,8 @@
     "each objective directly to the target without any converters or multi-turn techniques. This is\n",
     "controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each\n",
     "scenario falls back to its own `DEFAULT_INCLUDE_BASELINE` class attribute (most scenarios\n",
-    "default it on; `Jailbreak` defaults it off).\n",
-    "\n",
-    "To run *only* the baseline (no attack strategies), pass `include_baseline=True` and\n",
-    "`scenario_strategies=None` explicitly to `initialize_async` — that way the example works\n",
-    "regardless of the scenario's default. See\n",
-    "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a working example."
+    "default it on; `Jailbreak` defaults it off). See\n",
+    "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example."
    ]
   },
   {
diff --git a/doc/code/scenarios/0_scenarios.py b/doc/code/scenarios/0_scenarios.py
index d2e03a4067..aa6986316a 100644
--- a/doc/code/scenarios/0_scenarios.py
+++ b/doc/code/scenarios/0_scenarios.py
@@ -177,12 +177,8 @@ def _build_display_group(self, *, technique_name: str, seed_group_name: str) ->
 # each objective directly to the target without any converters or multi-turn techniques. This is
 # controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each
 # scenario falls back to its own `DEFAULT_INCLUDE_BASELINE` class attribute (most scenarios
-# default it on; `Jailbreak` defaults it off).
-#
-# To run *only* the baseline (no attack strategies), pass `include_baseline=True` and
-# `scenario_strategies=None` explicitly to `initialize_async` — that way the example works
-# regardless of the scenario's default. See
-# [Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a working example.
+# default it on; `Jailbreak` defaults it off). See
+# [Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example.
 
 # %% [markdown]
 #
diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 94087c992b..9ea8a4fb82 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -523,8 +523,9 @@ async def initialize_async(
             include_baseline (bool | None): Whether to prepend a baseline atomic attack that sends
                 all objectives without modifications, allowing comparison between unmodified prompts
                 and the scenario's strategies. If None (the default), the scenario type's
-                ``SUPPORTS_DEFAULT_BASELINE`` class attribute decides. Passing ``True`` on a
-                scenario whose ``SUPPORTS_DEFAULT_BASELINE`` is False raises ``ValueError``.
+                ``DEFAULT_INCLUDE_BASELINE`` class attribute decides (only consulted when
+                ``SUPPORTS_DEFAULT_BASELINE`` is True). Passing ``True`` on a scenario whose
+                ``SUPPORTS_DEFAULT_BASELINE`` is False raises ``ValueError``.
 
         Raises:
             ValueError: If no objective_target is provided, or if ``include_baseline=True`` is passed
diff --git a/tests/unit/scenario/test_adversarial.py b/tests/unit/scenario/test_adversarial.py
index a6445393a7..1d71c8f7f1 100644
--- a/tests/unit/scenario/test_adversarial.py
+++ b/tests/unit/scenario/test_adversarial.py
@@ -428,21 +428,19 @@ async def test_attacks_carry_seed_groups(self, mock_objective_target, single_adv
         for a in attacks:
             assert len(a.objectives) > 0
 
-    @pytest.mark.asyncio
     async def test_baseline_excluded(self, mock_objective_target, single_adversarial_model):
         """AdversarialBenchmark must opt out of the parent's default baseline.
 
         Verifies both the class-level capability flag and the observable property
         (no atomic attack is named ``"baseline"``).
         """
-        scenario, attacks = await self._init_and_get_attacks(
+        scenario, _ = await self._init_and_get_attacks(
             mock_objective_target=mock_objective_target,
             adversarial_models=single_adversarial_model,
         )
         assert type(scenario).SUPPORTS_DEFAULT_BASELINE is False
-        assert not any(a.atomic_attack_name == "baseline" for a in attacks)
+        assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
 
-    @pytest.mark.asyncio
     async def test_baseline_explicit_true_raises(self, mock_objective_target, single_adversarial_model):
         """Explicitly passing include_baseline=True to a forbidden scenario raises ValueError."""
         scenario = AdversarialBenchmark(adversarial_models=single_adversarial_model)
@@ -452,7 +450,6 @@ async def test_baseline_explicit_true_raises(self, mock_objective_target, single
                 include_baseline=True,
             )
 
-    @pytest.mark.asyncio
     async def test_baseline_explicit_false_succeeds(self, mock_objective_target, single_adversarial_model):
         """Explicit include_baseline=False on a forbidden scenario is accepted (matches the default)."""
         groups = {"harmbench": _make_seed_groups("harmbench")}
@@ -466,8 +463,7 @@ async def test_baseline_explicit_false_succeeds(self, mock_objective_target, sin
                 objective_target=mock_objective_target,
                 include_baseline=False,
             )
-            attacks = await scenario._get_atomic_attacks_async()
-        assert not any(a.atomic_attack_name == "baseline" for a in attacks)
+        assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
 
 
 # ===========================================================================

From 56927d976fb724ea54c741ebab30313695a929d6 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Mon, 11 May 2026 17:40:49 -0400
Subject: [PATCH 05/19] Adding deprecation, and cleaner enum instead of 2
 variable control

---
 doc/code/scenarios/0_scenarios.ipynb          |   6 +-
 doc/code/scenarios/0_scenarios.py             |   6 +-
 pyrit/scenario/__init__.py                    |   2 +
 pyrit/scenario/core/__init__.py               |   3 +-
 pyrit/scenario/core/scenario.py               |  87 +++++++---
 pyrit/scenario/scenarios/airt/cyber.py        |  14 ++
 pyrit/scenario/scenarios/airt/jailbreak.py    |  18 +-
 pyrit/scenario/scenarios/airt/psychosocial.py |   4 +-
 pyrit/scenario/scenarios/airt/scam.py         |  14 ++
 .../scenarios/benchmark/adversarial.py        |   4 +-
 .../scenarios/foundry/red_team_agent.py       |  15 ++
 pyrit/scenario/scenarios/garak/encoding.py    |  14 ++
 tests/unit/scenario/test_adversarial.py       |   4 +-
 .../scenario/test_baseline_deprecation.py     | 160 ++++++++++++++++++
 tests/unit/scenario/test_jailbreak.py         |   8 +-
 tests/unit/scenario/test_leakage_scenario.py  |   3 +-
 tests/unit/scenario/test_scenario.py          |   9 +-
 .../unit/scenario/test_scenario_parameters.py |   4 +-
 .../scenario/test_scenario_partial_results.py |   4 +-
 tests/unit/scenario/test_scenario_retry.py    |   4 +-
 20 files changed, 329 insertions(+), 54 deletions(-)
 create mode 100644 tests/unit/scenario/test_baseline_deprecation.py

diff --git a/doc/code/scenarios/0_scenarios.ipynb b/doc/code/scenarios/0_scenarios.ipynb
index 54f440f9e5..81e0971ba4 100644
--- a/doc/code/scenarios/0_scenarios.ipynb
+++ b/doc/code/scenarios/0_scenarios.ipynb
@@ -83,7 +83,7 @@
     "   - `max_retries`: Number of retry attempts on failure (default: 0)\n",
     "   - `memory_labels`: Optional labels for tracking (optional)\n",
     "   - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's\n",
-    "     `DEFAULT_INCLUDE_BASELINE`; most scenarios default it on, `Jailbreak` defaults it off)\n",
+    "     `BASELINE_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)\n",
     "\n",
     "### Example Structure\n",
     "\n",
@@ -406,8 +406,8 @@
     "Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends\n",
     "each objective directly to the target without any converters or multi-turn techniques. This is\n",
     "controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each\n",
-    "scenario falls back to its own `DEFAULT_INCLUDE_BASELINE` class attribute (most scenarios\n",
-    "default it on; `Jailbreak` defaults it off). See\n",
+    "scenario falls back to its own `BASELINE_POLICY` class attribute (most scenarios default it\n",
+    "on; `Jailbreak` defaults it off). See\n",
     "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example."
    ]
   },
diff --git a/doc/code/scenarios/0_scenarios.py b/doc/code/scenarios/0_scenarios.py
index aa6986316a..fbe097ddc8 100644
--- a/doc/code/scenarios/0_scenarios.py
+++ b/doc/code/scenarios/0_scenarios.py
@@ -85,7 +85,7 @@
 #    - `max_retries`: Number of retry attempts on failure (default: 0)
 #    - `memory_labels`: Optional labels for tracking (optional)
 #    - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's
-#      `DEFAULT_INCLUDE_BASELINE`; most scenarios default it on, `Jailbreak` defaults it off)
+#      `BASELINE_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)
 #
 # ### Example Structure
 #
@@ -176,8 +176,8 @@ def _build_display_group(self, *, technique_name: str, seed_group_name: str) ->
 # Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends
 # each objective directly to the target without any converters or multi-turn techniques. This is
 # controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each
-# scenario falls back to its own `DEFAULT_INCLUDE_BASELINE` class attribute (most scenarios
-# default it on; `Jailbreak` defaults it off). See
+# scenario falls back to its own `BASELINE_POLICY` class attribute (most scenarios default it
+# on; `Jailbreak` defaults it off). See
 # [Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example.
 
 # %% [markdown]
diff --git a/pyrit/scenario/__init__.py b/pyrit/scenario/__init__.py
index c5a3130069..b665395433 100644
--- a/pyrit/scenario/__init__.py
+++ b/pyrit/scenario/__init__.py
@@ -21,6 +21,7 @@
     AtomicAttack,
     AttackTechnique,
     AttackTechniqueFactory,
+    BaselinePolicy,
     DatasetConfiguration,
     Scenario,
     ScenarioCompositeStrategy,
@@ -50,6 +51,7 @@
     "AtomicAttack",
     "AttackTechnique",
     "AttackTechniqueFactory",
+    "BaselinePolicy",
     "DatasetConfiguration",
     "Parameter",
     "Scenario",
diff --git a/pyrit/scenario/core/__init__.py b/pyrit/scenario/core/__init__.py
index 06304d3715..c1e36b7ce6 100644
--- a/pyrit/scenario/core/__init__.py
+++ b/pyrit/scenario/core/__init__.py
@@ -8,7 +8,7 @@
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.attack_technique_factory import AttackTechniqueFactory, ScorerOverridePolicy
 from pyrit.scenario.core.dataset_configuration import EXPLICIT_SEED_GROUPS_KEY, DatasetConfiguration
-from pyrit.scenario.core.scenario import Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import ScenarioCompositeStrategy, ScenarioStrategy
 from pyrit.scenario.core.scenario_techniques import (
     SCENARIO_TECHNIQUES,
@@ -20,6 +20,7 @@
     "AtomicAttack",
     "AttackTechnique",
     "AttackTechniqueFactory",
+    "BaselinePolicy",
     "DatasetConfiguration",
     "EXPLICIT_SEED_GROUPS_KEY",
     "SCENARIO_TECHNIQUES",
diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 9ea8a4fb82..15c44c63b6 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -16,11 +16,13 @@
 import uuid
 from abc import ABC, abstractmethod
 from collections.abc import Sequence
+from enum import Enum
 from typing import TYPE_CHECKING, Any, ClassVar, Optional, Union, cast, get_origin
 
 from tqdm.auto import tqdm
 
 from pyrit.common import REQUIRED_VALUE, Parameter, apply_defaults
+from pyrit.common.deprecation import print_deprecation_message
 from pyrit.common.parameter import coerce_value, validate_param_type
 from pyrit.executor.attack.single_turn.prompt_sending import PromptSendingAttack
 from pyrit.memory import CentralMemory
@@ -44,6 +46,26 @@
 logger = logging.getLogger(__name__)
 
 
+class BaselinePolicy(Enum):
+    """
+    Declares how a scenario type treats the default baseline atomic attack.
+
+    The baseline is a plain ``PromptSendingAttack`` that sends each objective unmodified,
+    used as a comparison point against the scenario's strategies. Each scenario class
+    declares its policy via ``Scenario.BASELINE_POLICY``; callers can still override at
+    runtime via ``initialize_async(include_baseline=...)`` for the two ``DEFAULT_*`` states.
+    """
+
+    #: Supported and prepended automatically. Caller can opt out at runtime.
+    DEFAULT_ON = "default_on"
+
+    #: Supported but only included when the caller explicitly requests it.
+    DEFAULT_OFF = "default_off"
+
+    #: Not supported. Explicit ``include_baseline=True`` at runtime raises ``ValueError``.
+    UNSUPPORTED = "unsupported"
+
+
 def _assert_json_serializable(*, params: dict[str, Any]) -> None:
     """
     Raise if any value in ``params`` cannot round-trip through JSON.
@@ -107,18 +129,13 @@ class Scenario(ABC):
     #: what the scenario needs. Validated in ``initialize_async`` once the target is supplied.
     TARGET_REQUIREMENTS: ClassVar[TargetRequirements] = TargetRequirements()
 
-    #: Whether this scenario type supports a default baseline atomic attack. Subclasses whose
-    #: semantics make a default baseline meaningless (e.g. benchmarks that compare against a
-    #: gold-standard answer rather than measure attack lift over an unmodified prompt) override
-    #: this to ``False``. When ``False``, ``initialize_async`` skips the baseline regardless of
-    #: the user-facing default and raises ``ValueError`` if the caller explicitly opts in.
-    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = True
-
-    #: Whether this scenario type includes the baseline atomic attack by default. Used only when
-    #: ``SUPPORTS_DEFAULT_BASELINE`` is ``True``. Subclasses can override this to ``False`` when
-    #: their default behavior should omit the baseline (e.g. when the scenario is already
-    #: dominated by a long list of templates and the baseline is rarely informative).
-    DEFAULT_INCLUDE_BASELINE: ClassVar[bool] = True
+    #: How this scenario type treats the default baseline atomic attack. Subclasses override
+    #: when their semantics call for a different default (``DEFAULT_OFF``) or when a baseline
+    #: is meaningless for the comparison the scenario performs (``UNSUPPORTED``). Resolved in
+    #: ``initialize_async`` and overridable per run via ``include_baseline`` for the
+    #: ``DEFAULT_*`` states; ``UNSUPPORTED`` is a hard constraint and a caller-supplied
+    #: ``include_baseline=True`` raises ``ValueError``.
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.DEFAULT_ON
 
     def __init__(
         self,
@@ -128,6 +145,7 @@ def __init__(
         strategy_class: type[ScenarioStrategy],
         objective_scorer: Scorer,
         scenario_result_id: Optional[Union[uuid.UUID, str]] = None,
+        include_default_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
     ) -> None:
         """
         Initialize a scenario.
@@ -141,6 +159,10 @@ def __init__(
                 Can be either a UUID object or a string representation of a UUID.
                 If provided and found in memory, the scenario will resume from prior progress.
                 All other parameters must still match the stored scenario configuration.
+            include_default_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0.
+                Pass ``include_baseline`` to ``initialize_async`` instead. When set, the value is
+                used as the effective ``include_baseline`` for the next ``initialize_async`` call
+                unless that call passes its own ``include_baseline``.
 
         Note:
             Attack runs are populated by calling initialize_async(), which invokes the
@@ -190,6 +212,18 @@ def __init__(
         self.params: dict[str, Any] = {}
         self._declarations_validated: bool = False
 
+        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along
+        # with the include_default_baseline kwarg above and the legacy fallback branch in
+        # initialize_async. Subclass shims set this attribute directly to avoid double-warning.
+        self._legacy_include_baseline: bool | None = None
+        if include_default_baseline is not None:
+            print_deprecation_message(
+                old_item="Scenario(include_default_baseline=...)",
+                new_item="Scenario.initialize_async(include_baseline=...)",
+                removed_in="v0.16.0",
+            )
+            self._legacy_include_baseline = include_default_baseline
+
     @property
     def name(self) -> str:
         """Get the name of the scenario."""
@@ -523,13 +557,14 @@ async def initialize_async(
             include_baseline (bool | None): Whether to prepend a baseline atomic attack that sends
                 all objectives without modifications, allowing comparison between unmodified prompts
                 and the scenario's strategies. If None (the default), the scenario type's
-                ``DEFAULT_INCLUDE_BASELINE`` class attribute decides (only consulted when
-                ``SUPPORTS_DEFAULT_BASELINE`` is True). Passing ``True`` on a scenario whose
-                ``SUPPORTS_DEFAULT_BASELINE`` is False raises ``ValueError``.
+                ``BASELINE_POLICY`` class attribute decides: ``DEFAULT_ON`` includes it,
+                ``DEFAULT_OFF`` omits it, and ``UNSUPPORTED`` always omits it (and rejects an
+                explicit ``True``). Passing ``True`` to a scenario whose ``BASELINE_POLICY`` is
+                ``UNSUPPORTED`` raises ``ValueError``.
 
         Raises:
             ValueError: If no objective_target is provided, or if ``include_baseline=True`` is passed
-                to a scenario that does not support a default baseline.
+                to a scenario whose ``BASELINE_POLICY`` is ``UNSUPPORTED``.
         """
         # Validate required parameters
         if objective_target is None:
@@ -548,19 +583,25 @@ async def initialize_async(
         self._max_retries = max_retries
         self._memory_labels = memory_labels or {}
 
-        # Resolve the effective include_baseline. Capability is checked first so a forbidden
+        # Deprecated. Will be removed in v0.16.0. Honor the legacy constructor-time
+        # include_default_baseline (or subclass include_baseline) only when the caller did
+        # not supply a runtime value.
+        if include_baseline is None and self._legacy_include_baseline is not None:
+            include_baseline = self._legacy_include_baseline
+
+        # Resolve the effective include_baseline. UNSUPPORTED is checked first so a forbidden
         # scenario type never silently inherits a True default; explicit-True on a forbidden
-        # type is a hard error rather than a silent ignore. When the scenario type supports
-        # the baseline, None defers to DEFAULT_INCLUDE_BASELINE on the class.
-        if not self.SUPPORTS_DEFAULT_BASELINE:
+        # type is a hard error rather than a silent ignore. For the DEFAULT_* states, a None
+        # runtime value defers to the policy.
+        if self.BASELINE_POLICY is BaselinePolicy.UNSUPPORTED:
             if include_baseline is True:
                 raise ValueError(
-                    f"{type(self).__name__} does not support a default baseline; pass "
-                    f"include_baseline=False or omit the argument."
+                    f"{type(self).__name__} does not support a default baseline "
+                    f"(BASELINE_POLICY = UNSUPPORTED); pass include_baseline=False or omit the argument."
                 )
             include_baseline = False
         elif include_baseline is None:
-            include_baseline = self.DEFAULT_INCLUDE_BASELINE
+            include_baseline = self.BASELINE_POLICY is BaselinePolicy.DEFAULT_ON
 
         # Prepare scenario strategies using the stored configuration
         self._scenario_strategies = self._prepare_strategies(scenario_strategies)
diff --git a/pyrit/scenario/scenarios/airt/cyber.py b/pyrit/scenario/scenarios/airt/cyber.py
index 5b9fa2ba31..7c451e73ee 100644
--- a/pyrit/scenario/scenarios/airt/cyber.py
+++ b/pyrit/scenario/scenarios/airt/cyber.py
@@ -7,6 +7,7 @@
 from typing import TYPE_CHECKING, ClassVar
 
 from pyrit.common import apply_defaults
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
 from pyrit.common.path import SCORER_SEED_PROMPT_PATH
 from pyrit.prompt_target import OpenAIChatTarget
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
@@ -105,6 +106,7 @@ def __init__(
         *,
         objective_scorer: TrueFalseScorer | None = None,
         scenario_result_id: str | None = None,
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
     ) -> None:
         """
         Initialize the cyber harms scenario.
@@ -113,6 +115,8 @@ def __init__(
             objective_scorer (TrueFalseScorer | None): Objective scorer for malware detection. If not
                 provided, defaults to a composite scorer using malware detection + refusal backstop.
             scenario_result_id (str | None): Optional ID of an existing scenario result to resume.
+            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+                ``include_baseline`` to ``initialize_async`` instead.
         """
         self._objective_scorer: TrueFalseScorer = (
             objective_scorer if objective_scorer else self._get_default_objective_scorer()
@@ -125,6 +129,16 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
+        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # the include_baseline kwarg above.
+        if include_baseline is not None:
+            print_deprecation_message(
+                old_item="Cyber(include_baseline=...)",
+                new_item="Cyber.initialize_async(include_baseline=...)",
+                removed_in="v0.16.0",
+            )
+            self._legacy_include_baseline = include_baseline
+
     def _get_default_objective_scorer(self) -> TrueFalseCompositeScorer:
         """
         Retrieve the default objective scorer.
diff --git a/pyrit/scenario/scenarios/airt/jailbreak.py b/pyrit/scenario/scenarios/airt/jailbreak.py
index 763ac426dd..4fd8f93b51 100644
--- a/pyrit/scenario/scenarios/airt/jailbreak.py
+++ b/pyrit/scenario/scenarios/airt/jailbreak.py
@@ -7,6 +7,7 @@
 
 from pyrit.auth import get_azure_openai_auth
 from pyrit.common import apply_defaults
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
 from pyrit.datasets import TextJailBreak
 from pyrit.executor.attack.core.attack_config import (
     AttackAdversarialConfig,
@@ -24,7 +25,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import ScenarioStrategy
 from pyrit.score import (
     TrueFalseScorer,
@@ -84,7 +85,7 @@ class Jailbreak(Scenario):
     #: Jailbreak runs many templates per objective, so the baseline atomic attack is rarely
     #: informative relative to the volume of jailbreak templates. Off by default; callers that
     #: want a comparison can pass ``include_baseline=True`` to ``initialize_async``.
-    DEFAULT_INCLUDE_BASELINE: ClassVar[bool] = False
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.DEFAULT_OFF
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
@@ -130,6 +131,7 @@ def __init__(
         num_templates: Optional[int] = None,
         num_attempts: int = 1,
         jailbreak_names: list[str] | None = None,
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
     ) -> None:
         """
         Initialize the jailbreak scenario.
@@ -142,6 +144,8 @@ def __init__(
             num_attempts (Optional[int]): Number of times to try each jailbreak.
             jailbreak_names (Optional[List[str]]): List of jailbreak names from the template list under datasets.
                 to use.
+            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+                ``include_baseline`` to ``initialize_async`` instead.
 
         Raises:
             ValueError: If both jailbreak_names and num_templates are provided, as random selection
@@ -189,6 +193,16 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
+        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # the include_baseline kwarg above.
+        if include_baseline is not None:
+            print_deprecation_message(
+                old_item="Jailbreak(include_baseline=...)",
+                new_item="Jailbreak.initialize_async(include_baseline=...)",
+                removed_in="v0.16.0",
+            )
+            self._legacy_include_baseline = include_baseline
+
         # Will be resolved in _get_atomic_attacks_async
         self._seed_groups: Optional[list[SeedAttackGroup]] = None
 
diff --git a/pyrit/scenario/scenarios/airt/psychosocial.py b/pyrit/scenario/scenarios/airt/psychosocial.py
index 34f289fc19..60c79ed921 100644
--- a/pyrit/scenario/scenarios/airt/psychosocial.py
+++ b/pyrit/scenario/scenarios/airt/psychosocial.py
@@ -32,7 +32,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import (
     ScenarioStrategy,
 )
@@ -150,7 +150,7 @@ class Psychosocial(Scenario):
 
     #: Psychosocial measures multi-turn escalation behavior; a single-shot baseline send
     #: isn't a meaningful comparator, so the default baseline is forbidden.
-    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
 
     #: Psychosocial runs CrescendoAttack, which requires the target to natively support
     #: editable conversation history (for backtracking). Declared here so the base scenario
diff --git a/pyrit/scenario/scenarios/airt/scam.py b/pyrit/scenario/scenarios/airt/scam.py
index 9623f037e6..1298df220b 100644
--- a/pyrit/scenario/scenarios/airt/scam.py
+++ b/pyrit/scenario/scenarios/airt/scam.py
@@ -8,6 +8,7 @@
 
 from pyrit.auth import get_azure_openai_auth
 from pyrit.common import Parameter, apply_defaults
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
 from pyrit.common.path import (
     EXECUTOR_RED_TEAM_PATH,
     SCORER_SEED_PROMPT_PATH,
@@ -151,6 +152,7 @@ def __init__(
         objective_scorer: Optional[TrueFalseScorer] = None,
         adversarial_chat: Optional[PromptTarget] = None,
         scenario_result_id: Optional[str] = None,
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
     ) -> None:
         """
         Initialize the ScamScenario.
@@ -161,6 +163,8 @@ def __init__(
             adversarial_chat (Optional[PromptTarget]): Chat target used to rephrase the
                 objective into the role-play context (in single-turn strategies).
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
+            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+                ``include_baseline`` to ``initialize_async`` instead.
         """
         if not objective_scorer:
             objective_scorer = self._get_default_objective_scorer()
@@ -177,6 +181,16 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
+        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # the include_baseline kwarg above.
+        if include_baseline is not None:
+            print_deprecation_message(
+                old_item="Scam(include_baseline=...)",
+                new_item="Scam.initialize_async(include_baseline=...)",
+                removed_in="v0.16.0",
+            )
+            self._legacy_include_baseline = include_baseline
+
         # Will be resolved in _get_atomic_attacks_async
         self._seed_groups: Optional[list[SeedAttackGroup]] = None
 
diff --git a/pyrit/scenario/scenarios/benchmark/adversarial.py b/pyrit/scenario/scenarios/benchmark/adversarial.py
index 6d0d553b48..2601a97ea6 100644
--- a/pyrit/scenario/scenarios/benchmark/adversarial.py
+++ b/pyrit/scenario/scenarios/benchmark/adversarial.py
@@ -14,7 +14,7 @@
 from pyrit.registry.tag_query import TagQuery
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_techniques import SCENARIO_TECHNIQUES
 
 if TYPE_CHECKING:
@@ -36,7 +36,7 @@ class AdversarialBenchmark(Scenario):
 
     #: AdversarialBenchmark compares attack-success rates across adversarial models; a baseline
     #: attack would be model-independent and contribute no signal to the comparison.
-    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
diff --git a/pyrit/scenario/scenarios/foundry/red_team_agent.py b/pyrit/scenario/scenarios/foundry/red_team_agent.py
index f2d944a18c..b3d406ec65 100644
--- a/pyrit/scenario/scenarios/foundry/red_team_agent.py
+++ b/pyrit/scenario/scenarios/foundry/red_team_agent.py
@@ -18,6 +18,7 @@
 
 from pyrit.auth import get_azure_openai_auth
 from pyrit.common import REQUIRED_VALUE, apply_defaults
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
 from pyrit.datasets import TextJailBreak
 from pyrit.executor.attack import (
     CrescendoAttack,
@@ -248,6 +249,7 @@ def __init__(
         adversarial_chat: Optional[PromptTarget] = None,
         attack_scoring_config: Optional[AttackScoringConfig] = None,
         scenario_result_id: Optional[str] = None,
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
     ) -> None:
         """
         Initialize a Foundry Scenario with the specified attack strategies.
@@ -260,6 +262,8 @@ def __init__(
                 including the objective scorer and auxiliary scorers. If not provided, creates a default
                 configuration with a composite scorer using Azure Content Filter and SelfAsk Refusal scorers.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
+            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+                ``include_baseline`` to ``initialize_async`` instead.
 
         Raises:
             ValueError: If attack_strategies is empty or contains unsupported strategies.
@@ -283,6 +287,17 @@ def __init__(
             objective_scorer=objective_scorer,
             scenario_result_id=scenario_result_id,
         )
+
+        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # the include_baseline kwarg above.
+        if include_baseline is not None:
+            print_deprecation_message(
+                old_item="RedTeamAgent(include_baseline=...)",
+                new_item="RedTeamAgent.initialize_async(include_baseline=...)",
+                removed_in="v0.16.0",
+            )
+            self._legacy_include_baseline = include_baseline
+
         self._scenario_composites: list[FoundryComposite] = []
 
     @apply_defaults
diff --git a/pyrit/scenario/scenarios/garak/encoding.py b/pyrit/scenario/scenarios/garak/encoding.py
index f239637132..f390b0e891 100644
--- a/pyrit/scenario/scenarios/garak/encoding.py
+++ b/pyrit/scenario/scenarios/garak/encoding.py
@@ -7,6 +7,7 @@
 from typing import Optional
 
 from pyrit.common import apply_defaults
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
 from pyrit.executor.attack.core.attack_config import (
     AttackConverterConfig,
     AttackScoringConfig,
@@ -174,6 +175,7 @@ def __init__(
         objective_scorer: Optional[TrueFalseScorer] = None,
         encoding_templates: Optional[Sequence[str]] = None,
         scenario_result_id: Optional[str] = None,
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
     ) -> None:
         """
         Initialize the Encoding Scenario.
@@ -185,6 +187,8 @@ def __init__(
             encoding_templates (Optional[Sequence[str]]): Templates used to construct the decoding
                 prompts. Defaults to AskToDecodeConverter.garak_templates.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
+            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+                ``include_baseline`` to ``initialize_async`` instead.
         """
         objective_scorer = objective_scorer or DecodingScorer(categories=["encoding_scenario"])
         self._scorer_config = AttackScoringConfig(objective_scorer=objective_scorer)
@@ -198,6 +202,16 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
+        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # the include_baseline kwarg above.
+        if include_baseline is not None:
+            print_deprecation_message(
+                old_item="Encoding(include_baseline=...)",
+                new_item="Encoding.initialize_async(include_baseline=...)",
+                removed_in="v0.16.0",
+            )
+            self._legacy_include_baseline = include_baseline
+
         # Will be resolved in _get_atomic_attacks_async
         self._resolved_seed_groups: Optional[list[SeedAttackGroup]] = None
 
diff --git a/tests/unit/scenario/test_adversarial.py b/tests/unit/scenario/test_adversarial.py
index 1d71c8f7f1..f414ad4dee 100644
--- a/tests/unit/scenario/test_adversarial.py
+++ b/tests/unit/scenario/test_adversarial.py
@@ -23,7 +23,7 @@
 from pyrit.prompt_target import PromptTarget
 from pyrit.prompt_target.common.prompt_chat_target import PromptChatTarget
 from pyrit.registry.object_registries.attack_technique_registry import AttackTechniqueRegistry
-from pyrit.scenario.core import AtomicAttack
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
 from pyrit.scenario.core.scenario_techniques import SCENARIO_TECHNIQUES
 from pyrit.scenario.scenarios.benchmark.adversarial import AdversarialBenchmark
@@ -438,7 +438,7 @@ async def test_baseline_excluded(self, mock_objective_target, single_adversarial
             mock_objective_target=mock_objective_target,
             adversarial_models=single_adversarial_model,
         )
-        assert type(scenario).SUPPORTS_DEFAULT_BASELINE is False
+        assert type(scenario).BASELINE_POLICY is BaselinePolicy.UNSUPPORTED
         assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
 
     async def test_baseline_explicit_true_raises(self, mock_objective_target, single_adversarial_model):
diff --git a/tests/unit/scenario/test_baseline_deprecation.py b/tests/unit/scenario/test_baseline_deprecation.py
new file mode 100644
index 0000000000..6fed5861d7
--- /dev/null
+++ b/tests/unit/scenario/test_baseline_deprecation.py
@@ -0,0 +1,160 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT license.
+
+"""
+Deprecated. Will be removed in v0.16.0 along with the corresponding
+``include_default_baseline`` / ``include_baseline`` constructor shims in
+``Scenario`` and its subclasses (``Cyber``, ``Jailbreak``, ``Scam``,
+``RedTeamAgent``, ``Encoding``).
+"""
+
+import warnings
+from typing import ClassVar
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+from pyrit.identifiers import ComponentIdentifier
+from pyrit.scenario import DatasetConfiguration
+from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
+from pyrit.score import Scorer
+
+_TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
+
+
+class _LegacyStrategy(ScenarioStrategy):
+    TEST = ("test", {"concrete"})
+    ALL = ("all", {"all"})
+
+    @classmethod
+    def get_aggregate_tags(cls) -> set[str]:
+        return {"all"}
+
+
+class _LegacyScenario(Scenario):
+    """Minimal Scenario stand-in for exercising the deprecated baseline kwargs."""
+
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.DEFAULT_ON
+
+    def __init__(self, **kwargs):
+        kwargs.setdefault("strategy_class", _LegacyStrategy)
+        if "objective_scorer" not in kwargs:
+            mock_scorer = MagicMock(spec=Scorer)
+            mock_scorer.get_identifier.return_value = _TEST_SCORER_ID
+            mock_scorer.get_scorer_metrics.return_value = None
+            kwargs["objective_scorer"] = mock_scorer
+        kwargs.setdefault("version", 1)
+        super().__init__(**kwargs)
+
+    @classmethod
+    def get_strategy_class(cls):
+        return _LegacyStrategy
+
+    @classmethod
+    def get_default_strategy(cls):
+        return _LegacyStrategy.ALL
+
+    @classmethod
+    def default_dataset_config(cls) -> DatasetConfiguration:
+        return DatasetConfiguration()
+
+    async def _get_atomic_attacks_async(self):
+        return []
+
+
+@pytest.fixture
+def mock_objective_target():
+    target = MagicMock()
+    target.get_identifier.return_value = ComponentIdentifier(class_name="MockTarget", class_module="test")
+    return target
+
+
+@pytest.mark.usefixtures("patch_central_database")
+class TestScenarioBaseDeprecation:
+    """Cover the deprecated ``Scenario(include_default_baseline=...)`` base kwarg."""
+
+    def test_base_kwarg_emits_deprecation_warning(self):
+        with warnings.catch_warnings(record=True) as caught:
+            warnings.simplefilter("always")
+            scenario = _LegacyScenario(include_default_baseline=False)
+
+        deprecations = [w for w in caught if issubclass(w.category, DeprecationWarning)]
+        assert len(deprecations) == 1
+        msg = str(deprecations[0].message)
+        assert "include_default_baseline" in msg
+        assert "v0.16.0" in msg
+        assert scenario._legacy_include_baseline is False
+
+    def test_base_kwarg_omitted_emits_no_warning(self):
+        with warnings.catch_warnings(record=True) as caught:
+            warnings.simplefilter("always")
+            scenario = _LegacyScenario()
+
+        assert not any(issubclass(w.category, DeprecationWarning) for w in caught)
+        assert scenario._legacy_include_baseline is None
+
+    async def test_legacy_value_drives_initialize_when_runtime_kwarg_omitted(self, mock_objective_target):
+        """Constructor-time False suppresses the baseline that BASELINE_POLICY.DEFAULT_ON would add."""
+        with warnings.catch_warnings():
+            warnings.simplefilter("ignore", DeprecationWarning)
+            scenario = _LegacyScenario(include_default_baseline=False)
+
+        with patch.object(_LegacyScenario, "default_dataset_config", return_value=DatasetConfiguration()):
+            await scenario.initialize_async(objective_target=mock_objective_target)
+
+        assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
+
+    async def test_runtime_kwarg_wins_over_legacy_value(self, mock_objective_target):
+        """Explicit runtime include_baseline overrides any constructor-time legacy value."""
+        with warnings.catch_warnings():
+            warnings.simplefilter("ignore", DeprecationWarning)
+            scenario = _LegacyScenario(include_default_baseline=True)
+
+        with patch.object(_LegacyScenario, "default_dataset_config", return_value=DatasetConfiguration()):
+            await scenario.initialize_async(objective_target=mock_objective_target, include_baseline=False)
+
+        assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
+
+
+class TestSubclassBaselineKwargDeprecation:
+    """Cover the deprecated ``include_baseline`` constructor kwarg on user-facing subclasses."""
+
+    @pytest.mark.parametrize(
+        "import_path, class_name, needs_adversarial_chat",
+        [
+            ("pyrit.scenario.scenarios.airt.cyber", "Cyber", False),
+            ("pyrit.scenario.scenarios.airt.jailbreak", "Jailbreak", False),
+            ("pyrit.scenario.scenarios.airt.scam", "Scam", True),
+            ("pyrit.scenario.scenarios.garak.encoding", "Encoding", False),
+        ],
+    )
+    def test_subclass_kwarg_emits_deprecation_warning(
+        self, import_path, class_name, needs_adversarial_chat, patch_central_database
+    ):
+        from pyrit.prompt_target import PromptTarget
+        from pyrit.score import TrueFalseScorer
+
+        module = __import__(import_path, fromlist=[class_name])
+        cls = getattr(module, class_name)
+
+        # Spec'd against TrueFalseScorer so AttackScoringConfig validators accept it.
+        mock_scorer = MagicMock(spec=TrueFalseScorer)
+        mock_scorer.get_identifier.return_value = _TEST_SCORER_ID
+        mock_scorer.get_scorer_metrics.return_value = None
+
+        extra_kwargs = {}
+        if needs_adversarial_chat:
+            mock_target = MagicMock(spec=PromptTarget)
+            mock_target.get_identifier.return_value = ComponentIdentifier(class_name="MockTarget", class_module="test")
+            extra_kwargs["adversarial_chat"] = mock_target
+
+        with warnings.catch_warnings(record=True) as caught:
+            warnings.simplefilter("always")
+            scenario = cls(objective_scorer=mock_scorer, include_baseline=False, **extra_kwargs)
+
+        deprecations = [
+            w for w in caught if issubclass(w.category, DeprecationWarning) and class_name in str(w.message)
+        ]
+        assert len(deprecations) >= 1, f"{class_name} did not emit a DeprecationWarning naming the class"
+        assert "v0.16.0" in str(deprecations[0].message)
+        assert scenario._legacy_include_baseline is False
diff --git a/tests/unit/scenario/test_jailbreak.py b/tests/unit/scenario/test_jailbreak.py
index 36713fafa4..9461714be8 100644
--- a/tests/unit/scenario/test_jailbreak.py
+++ b/tests/unit/scenario/test_jailbreak.py
@@ -16,6 +16,7 @@
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.models import SeedGroup, SeedObjective
 from pyrit.prompt_target import OpenAIChatTarget, PromptTarget
+from pyrit.scenario.core import BaselinePolicy
 from pyrit.scenario.scenarios.airt.jailbreak import Jailbreak, JailbreakStrategy
 from pyrit.score.true_false.true_false_inverter_scorer import TrueFalseInverterScorer
 
@@ -204,13 +205,12 @@ async def test_init_raises_exception_when_no_datasets_available(self, mock_objec
 
     def test_class_supports_baseline_but_defaults_off(self):
         """Jailbreak supports a baseline but does not include one by default."""
-        assert Jailbreak.SUPPORTS_DEFAULT_BASELINE is True
-        assert Jailbreak.DEFAULT_INCLUDE_BASELINE is False
+        assert Jailbreak.BASELINE_POLICY is BaselinePolicy.DEFAULT_OFF
 
     async def test_default_initialize_omits_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """initialize_async without include_baseline honors DEFAULT_INCLUDE_BASELINE=False."""
+        """initialize_async without include_baseline honors BASELINE_POLICY=DEFAULT_OFF."""
         with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
             await scenario.initialize_async(objective_target=mock_objective_target)
@@ -219,7 +219,7 @@ async def test_default_initialize_omits_baseline(
     async def test_explicit_include_baseline_true_prepends_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """Caller can override DEFAULT_INCLUDE_BASELINE=False by passing include_baseline=True."""
+        """Caller can override BASELINE_POLICY=DEFAULT_OFF by passing include_baseline=True."""
         from pyrit.scenario import DatasetConfiguration
 
         with (
diff --git a/tests/unit/scenario/test_leakage_scenario.py b/tests/unit/scenario/test_leakage_scenario.py
index b8a0cfb8cc..fcd166a7cd 100644
--- a/tests/unit/scenario/test_leakage_scenario.py
+++ b/tests/unit/scenario/test_leakage_scenario.py
@@ -14,6 +14,7 @@
 from pyrit.prompt_target import PromptTarget
 from pyrit.scenario import DatasetConfiguration
 from pyrit.scenario.airt import Leakage, LeakageStrategy
+from pyrit.scenario.core import BaselinePolicy
 from pyrit.score import TrueFalseCompositeScorer
 
 
@@ -104,7 +105,7 @@ def test_default_scorer_uses_leakage_yaml(self):
 
     def test_init_supports_default_baseline(self):
         """Leakage opts into the parent's default baseline."""
-        assert Leakage.SUPPORTS_DEFAULT_BASELINE is True
+        assert Leakage.BASELINE_POLICY is BaselinePolicy.DEFAULT_ON
 
 
 @pytest.mark.usefixtures(*FIXTURES)
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index a77ade8dfd..5b42eb6728 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioIdentifier, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 # Reusable test scorer identifier
@@ -98,10 +98,9 @@ def sample_attack_results():
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    # Tests using this fixture should default to no baseline; set the class flag to forbid
-    # the default baseline so we don't have to thread include_baseline=False through every
-    # initialize_async call.
-    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
+    # Tests using this fixture should default to no baseline; set the class policy to UNSUPPORTED
+    # so we don't have to thread include_baseline=False through every initialize_async call.
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
 
     def __init__(self, atomic_attacks_to_return=None, **kwargs):
         # Add required strategy_class if not provided
diff --git a/tests/unit/scenario/test_scenario_parameters.py b/tests/unit/scenario/test_scenario_parameters.py
index f749418007..af238b92d4 100644
--- a/tests/unit/scenario/test_scenario_parameters.py
+++ b/tests/unit/scenario/test_scenario_parameters.py
@@ -11,7 +11,7 @@
 from pyrit.common import Parameter
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.scenario import DatasetConfiguration
-from pyrit.scenario.core import Scenario, ScenarioStrategy
+from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 _TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
@@ -35,7 +35,7 @@ def get_aggregate_tags(cls) -> set[str]:
 
     class _ParamTestScenario(Scenario):
         # No baseline in tests so atomic_attacks observations stay deterministic.
-        SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
+        BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
 
         @classmethod
         def get_strategy_class(cls):
diff --git a/tests/unit/scenario/test_scenario_partial_results.py b/tests/unit/scenario/test_scenario_partial_results.py
index ca984153db..3e53048d76 100644
--- a/tests/unit/scenario/test_scenario_partial_results.py
+++ b/tests/unit/scenario/test_scenario_partial_results.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
 
 
 def _mock_scorer_id(name: str = "MockScorer") -> ComponentIdentifier:
@@ -74,7 +74,7 @@ def filter_objectives(*, remaining_objectives):
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
 
     def __init__(self, *, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default
diff --git a/tests/unit/scenario/test_scenario_retry.py b/tests/unit/scenario/test_scenario_retry.py
index 2b93405363..a981fa9039 100644
--- a/tests/unit/scenario/test_scenario_retry.py
+++ b/tests/unit/scenario/test_scenario_retry.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
 
 # Test constants
 TEST_ATTACK_TYPE = "TestAttack"
@@ -137,7 +137,7 @@ def create_mock_atomic_attack(name: str, objectives: list[str], run_async_mock:
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    SUPPORTS_DEFAULT_BASELINE: ClassVar[bool] = False
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
 
     def __init__(self, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default

From 38cf8abdb12198a45736d9791bf2a349825c333d Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Tue, 12 May 2026 20:18:16 -0400
Subject: [PATCH 06/19] Rename BaselinePolicy to BaselineDefaultPolicy and add
 subclass guidance

---
 doc/code/scenarios/0_scenarios.ipynb          | 21 +++++++--
 doc/code/scenarios/0_scenarios.py             | 18 ++++++--
 pyrit/scenario/__init__.py                    |  4 +-
 pyrit/scenario/core/__init__.py               |  4 +-
 pyrit/scenario/core/scenario.py               | 45 ++++++++++---------
 pyrit/scenario/scenarios/airt/jailbreak.py    |  4 +-
 pyrit/scenario/scenarios/airt/psychosocial.py |  4 +-
 .../scenarios/benchmark/adversarial.py        |  4 +-
 tests/unit/scenario/test_adversarial.py       |  4 +-
 .../scenario/test_baseline_deprecation.py     |  6 +--
 tests/unit/scenario/test_jailbreak.py         |  8 ++--
 tests/unit/scenario/test_leakage_scenario.py  |  4 +-
 tests/unit/scenario/test_scenario.py          |  6 +--
 .../unit/scenario/test_scenario_parameters.py |  4 +-
 .../scenario/test_scenario_partial_results.py |  4 +-
 tests/unit/scenario/test_scenario_retry.py    |  4 +-
 16 files changed, 85 insertions(+), 59 deletions(-)

diff --git a/doc/code/scenarios/0_scenarios.ipynb b/doc/code/scenarios/0_scenarios.ipynb
index 81e0971ba4..028f069dba 100644
--- a/doc/code/scenarios/0_scenarios.ipynb
+++ b/doc/code/scenarios/0_scenarios.ipynb
@@ -83,7 +83,7 @@
     "   - `max_retries`: Number of retry attempts on failure (default: 0)\n",
     "   - `memory_labels`: Optional labels for tracking (optional)\n",
     "   - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's\n",
-    "     `BASELINE_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)\n",
+    "     `BASELINE_DEFAULT_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)\n",
     "\n",
     "### Example Structure\n",
     "\n",
@@ -115,6 +115,7 @@
     }
    ],
    "source": [
+    "\n",
     "from pyrit.common import apply_defaults\n",
     "from pyrit.scenario import (\n",
     "    DatasetConfiguration,\n",
@@ -406,9 +407,21 @@
     "Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends\n",
     "each objective directly to the target without any converters or multi-turn techniques. This is\n",
     "controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each\n",
-    "scenario falls back to its own `BASELINE_POLICY` class attribute (most scenarios default it\n",
-    "on; `Jailbreak` defaults it off). See\n",
-    "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example."
+    "scenario falls back to its own `BASELINE_DEFAULT_POLICY` class attribute (most scenarios default\n",
+    "it on; `Jailbreak` defaults it off). See\n",
+    "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example.\n",
+    "\n",
+    "Custom scenarios should choose their `BASELINE_DEFAULT_POLICY` based on whether an unmodified\n",
+    "prompt is a meaningful comparator for the scenario's strategies:\n",
+    "\n",
+    "- **`Enabled`** — the baseline is prepended by default and the caller can opt out. Use when an\n",
+    "  unmodified-prompt run is a meaningful comparison point (most scenarios).\n",
+    "- **`Disabled`** — the baseline is supported but omitted by default; the caller must opt in. Use\n",
+    "  when the scenario is already dominated by a large set of templates/strategies that already\n",
+    "  exercise the unmodified surface (e.g., `Jailbreak`).\n",
+    "- **`Forbidden`** — the baseline is unavailable and passing `include_baseline=True` raises. Use\n",
+    "  when the scenario's semantics make a single-shot unmodified prompt meaningless as a comparator\n",
+    "  (e.g., benchmarks comparing across adversarial models, or multi-turn-only scenarios)."
    ]
   },
   {
diff --git a/doc/code/scenarios/0_scenarios.py b/doc/code/scenarios/0_scenarios.py
index fbe097ddc8..a9ed63592f 100644
--- a/doc/code/scenarios/0_scenarios.py
+++ b/doc/code/scenarios/0_scenarios.py
@@ -85,7 +85,7 @@
 #    - `max_retries`: Number of retry attempts on failure (default: 0)
 #    - `memory_labels`: Optional labels for tracking (optional)
 #    - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's
-#      `BASELINE_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)
+#      `BASELINE_DEFAULT_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)
 #
 # ### Example Structure
 #
@@ -176,9 +176,21 @@ def _build_display_group(self, *, technique_name: str, seed_group_name: str) ->
 # Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends
 # each objective directly to the target without any converters or multi-turn techniques. This is
 # controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each
-# scenario falls back to its own `BASELINE_POLICY` class attribute (most scenarios default it
-# on; `Jailbreak` defaults it off). See
+# scenario falls back to its own `BASELINE_DEFAULT_POLICY` class attribute (most scenarios default
+# it on; `Jailbreak` defaults it off). See
 # [Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example.
+#
+# Custom scenarios should choose their `BASELINE_DEFAULT_POLICY` based on whether an unmodified
+# prompt is a meaningful comparator for the scenario's strategies:
+#
+# - **`Enabled`** — the baseline is prepended by default and the caller can opt out. Use when an
+#   unmodified-prompt run is a meaningful comparison point (most scenarios).
+# - **`Disabled`** — the baseline is supported but omitted by default; the caller must opt in. Use
+#   when the scenario is already dominated by a large set of templates/strategies that already
+#   exercise the unmodified surface (e.g., `Jailbreak`).
+# - **`Forbidden`** — the baseline is unavailable and passing `include_baseline=True` raises. Use
+#   when the scenario's semantics make a single-shot unmodified prompt meaningless as a comparator
+#   (e.g., benchmarks comparing across adversarial models, or multi-turn-only scenarios).
 
 # %% [markdown]
 #
diff --git a/pyrit/scenario/__init__.py b/pyrit/scenario/__init__.py
index b665395433..73ce95bf52 100644
--- a/pyrit/scenario/__init__.py
+++ b/pyrit/scenario/__init__.py
@@ -21,7 +21,7 @@
     AtomicAttack,
     AttackTechnique,
     AttackTechniqueFactory,
-    BaselinePolicy,
+    BaselineDefaultPolicy,
     DatasetConfiguration,
     Scenario,
     ScenarioCompositeStrategy,
@@ -51,7 +51,7 @@
     "AtomicAttack",
     "AttackTechnique",
     "AttackTechniqueFactory",
-    "BaselinePolicy",
+    "BaselineDefaultPolicy",
     "DatasetConfiguration",
     "Parameter",
     "Scenario",
diff --git a/pyrit/scenario/core/__init__.py b/pyrit/scenario/core/__init__.py
index 89c8935da5..4ca0b0207b 100644
--- a/pyrit/scenario/core/__init__.py
+++ b/pyrit/scenario/core/__init__.py
@@ -8,7 +8,7 @@
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.attack_technique_factory import AttackTechniqueFactory, ScorerOverridePolicy
 from pyrit.scenario.core.dataset_configuration import EXPLICIT_SEED_GROUPS_KEY, DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
+from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import ScenarioCompositeStrategy, ScenarioStrategy
 from pyrit.scenario.core.scenario_target_defaults import get_default_adversarial_target, get_default_scorer_target
 from pyrit.scenario.core.scenario_techniques import (
@@ -20,7 +20,7 @@
     "AtomicAttack",
     "AttackTechnique",
     "AttackTechniqueFactory",
-    "BaselinePolicy",
+    "BaselineDefaultPolicy",
     "DatasetConfiguration",
     "EXPLICIT_SEED_GROUPS_KEY",
     "SCENARIO_TECHNIQUES",
diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 55bf4c2666..89eb8c3a0a 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -56,24 +56,25 @@
 logger = logging.getLogger(__name__)
 
 
-class BaselinePolicy(Enum):
+class BaselineDefaultPolicy(Enum):
     """
     Declares how a scenario type treats the default baseline atomic attack.
 
     The baseline is a plain ``PromptSendingAttack`` that sends each objective unmodified,
     used as a comparison point against the scenario's strategies. Each scenario class
-    declares its policy via ``Scenario.BASELINE_POLICY``; callers can still override at
-    runtime via ``initialize_async(include_baseline=...)`` for the two ``DEFAULT_*`` states.
+    declares its policy via ``Scenario.BASELINE_DEFAULT_POLICY``; callers can still override
+    at runtime via ``initialize_async(include_baseline=...)`` for the ``Enabled`` and
+    ``Disabled`` states.
     """
 
     #: Supported and prepended automatically. Caller can opt out at runtime.
-    DEFAULT_ON = "default_on"
+    Enabled = "enabled"
 
     #: Supported but only included when the caller explicitly requests it.
-    DEFAULT_OFF = "default_off"
+    Disabled = "disabled"
 
     #: Not supported. Explicit ``include_baseline=True`` at runtime raises ``ValueError``.
-    UNSUPPORTED = "unsupported"
+    Forbidden = "forbidden"
 
 
 def _assert_json_serializable(*, params: dict[str, Any]) -> None:
@@ -140,12 +141,12 @@ class Scenario(ABC):
     TARGET_REQUIREMENTS: ClassVar[TargetRequirements] = TargetRequirements()
 
     #: How this scenario type treats the default baseline atomic attack. Subclasses override
-    #: when their semantics call for a different default (``DEFAULT_OFF``) or when a baseline
-    #: is meaningless for the comparison the scenario performs (``UNSUPPORTED``). Resolved in
+    #: when their semantics call for a different default (``Disabled``) or when a baseline
+    #: is meaningless for the comparison the scenario performs (``Forbidden``). Resolved in
     #: ``initialize_async`` and overridable per run via ``include_baseline`` for the
-    #: ``DEFAULT_*`` states; ``UNSUPPORTED`` is a hard constraint and a caller-supplied
-    #: ``include_baseline=True`` raises ``ValueError``.
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.DEFAULT_ON
+    #: ``Enabled`` and ``Disabled`` states; ``Forbidden`` is a hard constraint and a
+    #: caller-supplied ``include_baseline=True`` raises ``ValueError``.
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Enabled
 
     @classmethod
     def _get_additional_scoring_questions(cls) -> Sequence[Path]:
@@ -617,14 +618,14 @@ async def initialize_async(
             include_baseline (bool | None): Whether to prepend a baseline atomic attack that sends
                 all objectives without modifications, allowing comparison between unmodified prompts
                 and the scenario's strategies. If None (the default), the scenario type's
-                ``BASELINE_POLICY`` class attribute decides: ``DEFAULT_ON`` includes it,
-                ``DEFAULT_OFF`` omits it, and ``UNSUPPORTED`` always omits it (and rejects an
-                explicit ``True``). Passing ``True`` to a scenario whose ``BASELINE_POLICY`` is
-                ``UNSUPPORTED`` raises ``ValueError``.
+                ``BASELINE_DEFAULT_POLICY`` class attribute decides: ``Enabled`` includes it,
+                ``Disabled`` omits it, and ``Forbidden`` always omits it (and rejects an
+                explicit ``True``). Passing ``True`` to a scenario whose ``BASELINE_DEFAULT_POLICY``
+                is ``Forbidden`` raises ``ValueError``.
 
         Raises:
             ValueError: If no objective_target is provided, or if ``include_baseline=True`` is passed
-                to a scenario whose ``BASELINE_POLICY`` is ``UNSUPPORTED``.
+                to a scenario whose ``BASELINE_DEFAULT_POLICY`` is ``Forbidden``.
         """
         # Validate required parameters
         if objective_target is None:
@@ -649,19 +650,19 @@ async def initialize_async(
         if include_baseline is None and self._legacy_include_baseline is not None:
             include_baseline = self._legacy_include_baseline
 
-        # Resolve the effective include_baseline. UNSUPPORTED is checked first so a forbidden
+        # Resolve the effective include_baseline. Forbidden is checked first so a forbidden
         # scenario type never silently inherits a True default; explicit-True on a forbidden
-        # type is a hard error rather than a silent ignore. For the DEFAULT_* states, a None
-        # runtime value defers to the policy.
-        if self.BASELINE_POLICY is BaselinePolicy.UNSUPPORTED:
+        # type is a hard error rather than a silent ignore. For the Enabled / Disabled states,
+        # a None runtime value defers to the policy.
+        if self.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Forbidden:
             if include_baseline is True:
                 raise ValueError(
                     f"{type(self).__name__} does not support a default baseline "
-                    f"(BASELINE_POLICY = UNSUPPORTED); pass include_baseline=False or omit the argument."
+                    f"(BASELINE_DEFAULT_POLICY = Forbidden); pass include_baseline=False or omit the argument."
                 )
             include_baseline = False
         elif include_baseline is None:
-            include_baseline = self.BASELINE_POLICY is BaselinePolicy.DEFAULT_ON
+            include_baseline = self.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Enabled
 
         # Prepare scenario strategies using the stored configuration
         self._scenario_strategies = self._prepare_strategies(scenario_strategies)
diff --git a/pyrit/scenario/scenarios/airt/jailbreak.py b/pyrit/scenario/scenarios/airt/jailbreak.py
index ee4b0404ec..d11fd41886 100644
--- a/pyrit/scenario/scenarios/airt/jailbreak.py
+++ b/pyrit/scenario/scenarios/airt/jailbreak.py
@@ -23,7 +23,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
+from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import ScenarioStrategy
 from pyrit.scenario.core.scenario_target_defaults import get_default_adversarial_target
 from pyrit.score import (
@@ -84,7 +84,7 @@ class Jailbreak(Scenario):
     #: Jailbreak runs many templates per objective, so the baseline atomic attack is rarely
     #: informative relative to the volume of jailbreak templates. Off by default; callers that
     #: want a comparison can pass ``include_baseline=True`` to ``initialize_async``.
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.DEFAULT_OFF
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Disabled
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
diff --git a/pyrit/scenario/scenarios/airt/psychosocial.py b/pyrit/scenario/scenarios/airt/psychosocial.py
index 9a56bb753d..5697a9678e 100644
--- a/pyrit/scenario/scenarios/airt/psychosocial.py
+++ b/pyrit/scenario/scenarios/airt/psychosocial.py
@@ -30,7 +30,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
+from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import (
     ScenarioStrategy,
 )
@@ -149,7 +149,7 @@ class Psychosocial(Scenario):
 
     #: Psychosocial measures multi-turn escalation behavior; a single-shot baseline send
     #: isn't a meaningful comparator, so the default baseline is forbidden.
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
 
     #: Psychosocial runs CrescendoAttack, which requires the target to natively support
     #: editable conversation history (for backtracking). Declared here so the base scenario
diff --git a/pyrit/scenario/scenarios/benchmark/adversarial.py b/pyrit/scenario/scenarios/benchmark/adversarial.py
index 2601a97ea6..421d21617c 100644
--- a/pyrit/scenario/scenarios/benchmark/adversarial.py
+++ b/pyrit/scenario/scenarios/benchmark/adversarial.py
@@ -14,7 +14,7 @@
 from pyrit.registry.tag_query import TagQuery
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
+from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
 from pyrit.scenario.core.scenario_techniques import SCENARIO_TECHNIQUES
 
 if TYPE_CHECKING:
@@ -36,7 +36,7 @@ class AdversarialBenchmark(Scenario):
 
     #: AdversarialBenchmark compares attack-success rates across adversarial models; a baseline
     #: attack would be model-independent and contribute no signal to the comparison.
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
diff --git a/tests/unit/scenario/test_adversarial.py b/tests/unit/scenario/test_adversarial.py
index f414ad4dee..6cb7e11fae 100644
--- a/tests/unit/scenario/test_adversarial.py
+++ b/tests/unit/scenario/test_adversarial.py
@@ -23,7 +23,7 @@
 from pyrit.prompt_target import PromptTarget
 from pyrit.prompt_target.common.prompt_chat_target import PromptChatTarget
 from pyrit.registry.object_registries.attack_technique_registry import AttackTechniqueRegistry
-from pyrit.scenario.core import AtomicAttack, BaselinePolicy
+from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
 from pyrit.scenario.core.scenario_techniques import SCENARIO_TECHNIQUES
 from pyrit.scenario.scenarios.benchmark.adversarial import AdversarialBenchmark
@@ -438,7 +438,7 @@ async def test_baseline_excluded(self, mock_objective_target, single_adversarial
             mock_objective_target=mock_objective_target,
             adversarial_models=single_adversarial_model,
         )
-        assert type(scenario).BASELINE_POLICY is BaselinePolicy.UNSUPPORTED
+        assert type(scenario).BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Forbidden
         assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
 
     async def test_baseline_explicit_true_raises(self, mock_objective_target, single_adversarial_model):
diff --git a/tests/unit/scenario/test_baseline_deprecation.py b/tests/unit/scenario/test_baseline_deprecation.py
index 6fed5861d7..634cf0d7db 100644
--- a/tests/unit/scenario/test_baseline_deprecation.py
+++ b/tests/unit/scenario/test_baseline_deprecation.py
@@ -16,7 +16,7 @@
 
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.scenario import DatasetConfiguration
-from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import BaselineDefaultPolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 _TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
@@ -34,7 +34,7 @@ def get_aggregate_tags(cls) -> set[str]:
 class _LegacyScenario(Scenario):
     """Minimal Scenario stand-in for exercising the deprecated baseline kwargs."""
 
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.DEFAULT_ON
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Enabled
 
     def __init__(self, **kwargs):
         kwargs.setdefault("strategy_class", _LegacyStrategy)
@@ -94,7 +94,7 @@ def test_base_kwarg_omitted_emits_no_warning(self):
         assert scenario._legacy_include_baseline is None
 
     async def test_legacy_value_drives_initialize_when_runtime_kwarg_omitted(self, mock_objective_target):
-        """Constructor-time False suppresses the baseline that BASELINE_POLICY.DEFAULT_ON would add."""
+        """Constructor-time False suppresses the baseline that BASELINE_DEFAULT_POLICY=Enabled would add."""
         with warnings.catch_warnings():
             warnings.simplefilter("ignore", DeprecationWarning)
             scenario = _LegacyScenario(include_default_baseline=False)
diff --git a/tests/unit/scenario/test_jailbreak.py b/tests/unit/scenario/test_jailbreak.py
index c1470c4533..debafa01de 100644
--- a/tests/unit/scenario/test_jailbreak.py
+++ b/tests/unit/scenario/test_jailbreak.py
@@ -16,7 +16,7 @@
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.models import SeedGroup, SeedObjective
 from pyrit.prompt_target import PromptTarget
-from pyrit.scenario.core import BaselinePolicy
+from pyrit.scenario.core import BaselineDefaultPolicy
 from pyrit.scenario.scenarios.airt.jailbreak import Jailbreak, JailbreakStrategy
 from pyrit.score.true_false.true_false_inverter_scorer import TrueFalseInverterScorer
 
@@ -205,12 +205,12 @@ async def test_init_raises_exception_when_no_datasets_available(self, mock_objec
 
     def test_class_supports_baseline_but_defaults_off(self):
         """Jailbreak supports a baseline but does not include one by default."""
-        assert Jailbreak.BASELINE_POLICY is BaselinePolicy.DEFAULT_OFF
+        assert Jailbreak.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Disabled
 
     async def test_default_initialize_omits_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """initialize_async without include_baseline honors BASELINE_POLICY=DEFAULT_OFF."""
+        """initialize_async without include_baseline honors BASELINE_DEFAULT_POLICY=Disabled."""
         with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
             await scenario.initialize_async(objective_target=mock_objective_target)
@@ -219,7 +219,7 @@ async def test_default_initialize_omits_baseline(
     async def test_explicit_include_baseline_true_prepends_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """Caller can override BASELINE_POLICY=DEFAULT_OFF by passing include_baseline=True."""
+        """Caller can override BASELINE_DEFAULT_POLICY=Disabled by passing include_baseline=True."""
         from pyrit.scenario import DatasetConfiguration
 
         with (
diff --git a/tests/unit/scenario/test_leakage_scenario.py b/tests/unit/scenario/test_leakage_scenario.py
index fcd166a7cd..302b28665e 100644
--- a/tests/unit/scenario/test_leakage_scenario.py
+++ b/tests/unit/scenario/test_leakage_scenario.py
@@ -14,7 +14,7 @@
 from pyrit.prompt_target import PromptTarget
 from pyrit.scenario import DatasetConfiguration
 from pyrit.scenario.airt import Leakage, LeakageStrategy
-from pyrit.scenario.core import BaselinePolicy
+from pyrit.scenario.core import BaselineDefaultPolicy
 from pyrit.score import TrueFalseCompositeScorer
 
 
@@ -105,7 +105,7 @@ def test_default_scorer_uses_leakage_yaml(self):
 
     def test_init_supports_default_baseline(self):
         """Leakage opts into the parent's default baseline."""
-        assert Leakage.BASELINE_POLICY is BaselinePolicy.DEFAULT_ON
+        assert Leakage.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Enabled
 
 
 @pytest.mark.usefixtures(*FIXTURES)
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index 65c98c1b42..ee9301bdf3 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioIdentifier, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 # Reusable test scorer identifier
@@ -98,9 +98,9 @@ def sample_attack_results():
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    # Tests using this fixture should default to no baseline; set the class policy to UNSUPPORTED
+    # Tests using this fixture should default to no baseline; set the class policy to Forbidden
     # so we don't have to thread include_baseline=False through every initialize_async call.
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
 
     def __init__(self, atomic_attacks_to_return=None, **kwargs):
         # Add required strategy_class if not provided
diff --git a/tests/unit/scenario/test_scenario_parameters.py b/tests/unit/scenario/test_scenario_parameters.py
index af238b92d4..3a28068a04 100644
--- a/tests/unit/scenario/test_scenario_parameters.py
+++ b/tests/unit/scenario/test_scenario_parameters.py
@@ -11,7 +11,7 @@
 from pyrit.common import Parameter
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.scenario import DatasetConfiguration
-from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import BaselineDefaultPolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 _TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
@@ -35,7 +35,7 @@ def get_aggregate_tags(cls) -> set[str]:
 
     class _ParamTestScenario(Scenario):
         # No baseline in tests so atomic_attacks observations stay deterministic.
-        BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
+        BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
 
         @classmethod
         def get_strategy_class(cls):
diff --git a/tests/unit/scenario/test_scenario_partial_results.py b/tests/unit/scenario/test_scenario_partial_results.py
index 3e53048d76..03d67ad47a 100644
--- a/tests/unit/scenario/test_scenario_partial_results.py
+++ b/tests/unit/scenario/test_scenario_partial_results.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy, Scenario, ScenarioStrategy
 
 
 def _mock_scorer_id(name: str = "MockScorer") -> ComponentIdentifier:
@@ -74,7 +74,7 @@ def filter_objectives(*, remaining_objectives):
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
 
     def __init__(self, *, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default
diff --git a/tests/unit/scenario/test_scenario_retry.py b/tests/unit/scenario/test_scenario_retry.py
index a981fa9039..926383cffc 100644
--- a/tests/unit/scenario/test_scenario_retry.py
+++ b/tests/unit/scenario/test_scenario_retry.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy, Scenario, ScenarioStrategy
 
 # Test constants
 TEST_ATTACK_TYPE = "TestAttack"
@@ -137,7 +137,7 @@ def create_mock_atomic_attack(name: str, objectives: list[str], run_async_mock:
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.UNSUPPORTED
+    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
 
     def __init__(self, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default

From c1cd97839ba912c5dbe342f3cbb5a7f3e4c7fd96 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Tue, 12 May 2026 20:30:06 -0400
Subject: [PATCH 07/19] Apply pre-commit notebook cleanup

---
 doc/code/scenarios/0_scenarios.ipynb | 1 -
 1 file changed, 1 deletion(-)

diff --git a/doc/code/scenarios/0_scenarios.ipynb b/doc/code/scenarios/0_scenarios.ipynb
index 028f069dba..14c68f2061 100644
--- a/doc/code/scenarios/0_scenarios.ipynb
+++ b/doc/code/scenarios/0_scenarios.ipynb
@@ -115,7 +115,6 @@
     }
    ],
    "source": [
-    "\n",
     "from pyrit.common import apply_defaults\n",
     "from pyrit.scenario import (\n",
     "    DatasetConfiguration,\n",

From 3b551b9cc7ec5cf66d212ca1fc108555b8798e73 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 12:17:31 -0400
Subject: [PATCH 08/19] Emit baseline from base _get_atomic_attacks_async via
 helper

---
 pyrit/scenario/core/scenario.py            | 56 +++++++++++++++++++++-
 tests/unit/scenario/test_cyber.py          |  2 +-
 tests/unit/scenario/test_rapid_response.py |  3 +-
 3 files changed, 58 insertions(+), 3 deletions(-)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 89eb8c3a0a..b9be3fe15f 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -235,6 +235,10 @@ def __init__(
         self.params: dict[str, Any] = {}
         self._declarations_validated: bool = False
 
+        # Resolved effective baseline inclusion for the current run. Set in initialize_async
+        # before _get_atomic_attacks_async is awaited so overrides can read it.
+        self._include_baseline: bool = False
+
         # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along
         # with the include_default_baseline kwarg above and the legacy fallback branch in
         # initialize_async. Subclass shims set this attribute directly to avoid double-warning.
@@ -664,6 +668,8 @@ async def initialize_async(
         elif include_baseline is None:
             include_baseline = self.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Enabled
 
+        self._include_baseline = include_baseline
+
         # Prepare scenario strategies using the stored configuration
         self._scenario_strategies = self._prepare_strategies(scenario_strategies)
 
@@ -676,7 +682,12 @@ async def initialize_async(
 
         self._atomic_attacks = await self._get_atomic_attacks_async()
 
-        if include_baseline:
+        # Transitional guard (removed when _get_baseline / _get_baseline_data are deleted).
+        # Skip the legacy post-hoc insert when _get_atomic_attacks_async already emitted
+        # baseline at index 0 (the structural path); fall through to the old behavior for
+        # overrides not yet migrated.
+        already_emitted_baseline = bool(self._atomic_attacks) and self._atomic_attacks[0].atomic_attack_name == "baseline"
+        if include_baseline and not already_emitted_baseline:
             baseline_attack = self._get_baseline()
             self._atomic_attacks.insert(0, baseline_attack)
 
@@ -729,6 +740,45 @@ async def initialize_async(
         self._scenario_result_id = str(result.id)
         logger.info(f"Created new scenario result with ID: {self._scenario_result_id}")
 
+    def _build_baseline_atomic_attack(self, *, seed_groups: list[SeedAttackGroup]) -> AtomicAttack:
+        """
+        Build the baseline AtomicAttack from pre-resolved seed groups.
+
+        The baseline sends each objective unmodified, providing a comparison point
+        against the scenario's strategy attacks. Pass the same ``seed_groups`` used
+        to build the strategy attacks so both populations match.
+
+        Args:
+            seed_groups: Seed groups to attack. Used as-is, no further sampling.
+
+        Returns:
+            AtomicAttack: The baseline atomic attack.
+
+        Raises:
+            ValueError: If ``initialize_async`` has not been called (no objective
+                target or scorer set).
+        """
+        if self._objective_target is None:
+            raise ValueError("Objective target is required to create baseline attack.")
+        if self._objective_scorer is None:
+            raise ValueError("Objective scorer is required to create baseline attack.")
+
+        from pyrit.executor.attack.core.attack_config import AttackScoringConfig
+
+        attack = PromptSendingAttack(
+            objective_target=self._objective_target,
+            attack_scoring_config=AttackScoringConfig(
+                objective_scorer=cast("TrueFalseScorer", self._objective_scorer)
+            ),
+        )
+
+        return AtomicAttack(
+            atomic_attack_name="baseline",
+            attack_technique=AttackTechnique(attack=attack),
+            seed_groups=seed_groups,
+            memory_labels=self._memory_labels,
+        )
+
     def _get_baseline(self) -> AtomicAttack:
         """
         Get a baseline AtomicAttack, which simply sends all the objectives without any modifications.
@@ -1042,6 +1092,10 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
                     )
                 )
 
+        if self._include_baseline:
+            all_seed_groups = [g for groups in seed_groups_by_dataset.values() for g in groups]
+            atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=all_seed_groups))
+
         return atomic_attacks
 
     async def run_async(self) -> ScenarioResult:
diff --git a/tests/unit/scenario/test_cyber.py b/tests/unit/scenario/test_cyber.py
index e5833525bf..d519e8913f 100644
--- a/tests/unit/scenario/test_cyber.py
+++ b/tests/unit/scenario/test_cyber.py
@@ -211,7 +211,7 @@ async def _init_and_get_attacks(
         groups = seed_groups or {"malware": _make_seed_groups("malware")}
         with patch.object(DatasetConfiguration, "get_seed_attack_groups", return_value=groups):
             scenario = Cyber(objective_scorer=mock_objective_scorer)
-            init_kwargs = {"objective_target": mock_objective_target}
+            init_kwargs = {"objective_target": mock_objective_target, "include_baseline": False}
             if strategies:
                 init_kwargs["scenario_strategies"] = strategies
             await scenario.initialize_async(**init_kwargs)
diff --git a/tests/unit/scenario/test_rapid_response.py b/tests/unit/scenario/test_rapid_response.py
index f81093f80c..ecaef3d02c 100644
--- a/tests/unit/scenario/test_rapid_response.py
+++ b/tests/unit/scenario/test_rapid_response.py
@@ -245,7 +245,7 @@ async def _init_and_get_attacks(
             scenario = RapidResponse(
                 objective_scorer=mock_objective_scorer,
             )
-            init_kwargs = {"objective_target": mock_objective_target}
+            init_kwargs = {"objective_target": mock_objective_target, "include_baseline": False}
             if strategies:
                 init_kwargs["scenario_strategies"] = strategies
             await scenario.initialize_async(**init_kwargs)
@@ -392,6 +392,7 @@ async def test_unknown_technique_skipped_with_warning(self, mock_objective_targe
             await scenario.initialize_async(
                 objective_target=mock_objective_target,
                 scenario_strategies=[_strategy_class().ALL],
+                include_baseline=False,
             )
             attacks = await scenario._get_atomic_attacks_async()
             # Only prompt_sending should have produced attacks

From bac9d36b792d96667d890fe6832ee81cbd03baf9 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 12:47:33 -0400
Subject: [PATCH 09/19] Migrate scenario overrides to emit baseline from
 _get_atomic_attacks_async

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/scenarios/airt/jailbreak.py         | 3 +++
 pyrit/scenario/scenarios/airt/scam.py              | 7 ++++++-
 pyrit/scenario/scenarios/foundry/red_team_agent.py | 7 ++++++-
 pyrit/scenario/scenarios/garak/encoding.py         | 9 ++++++++-
 tests/unit/scenario/test_scam.py                   | 4 ++++
 5 files changed, 27 insertions(+), 3 deletions(-)

diff --git a/pyrit/scenario/scenarios/airt/jailbreak.py b/pyrit/scenario/scenarios/airt/jailbreak.py
index d11fd41886..9d878b51ff 100644
--- a/pyrit/scenario/scenarios/airt/jailbreak.py
+++ b/pyrit/scenario/scenarios/airt/jailbreak.py
@@ -324,4 +324,7 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
                     )
                     atomic_attacks.append(atomic_attack)
 
+        if self._include_baseline:
+            atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=self._seed_groups or []))
+
         return atomic_attacks
diff --git a/pyrit/scenario/scenarios/airt/scam.py b/pyrit/scenario/scenarios/airt/scam.py
index a491e53de4..30676e74bf 100644
--- a/pyrit/scenario/scenarios/airt/scam.py
+++ b/pyrit/scenario/scenarios/airt/scam.py
@@ -281,4 +281,9 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
 
         strategies = {s.value for s in self._scenario_strategies}
 
-        return [self._get_atomic_attack_from_strategy(strategy) for strategy in strategies]
+        atomic_attacks = [self._get_atomic_attack_from_strategy(strategy) for strategy in strategies]
+
+        if self._include_baseline:
+            atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=self._seed_groups or []))
+
+        return atomic_attacks
diff --git a/pyrit/scenario/scenarios/foundry/red_team_agent.py b/pyrit/scenario/scenarios/foundry/red_team_agent.py
index 58b0707a5a..6a13073882 100644
--- a/pyrit/scenario/scenarios/foundry/red_team_agent.py
+++ b/pyrit/scenario/scenarios/foundry/red_team_agent.py
@@ -433,7 +433,12 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
         # Resolve seed groups now that initialize_async has been called
         self._seed_groups = self._resolve_seed_groups()
 
-        return [self._get_attack_from_strategy(composition) for composition in self._scenario_composites]
+        atomic_attacks = [self._get_attack_from_strategy(composition) for composition in self._scenario_composites]
+
+        if self._include_baseline:
+            atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=self._seed_groups))
+
+        return atomic_attacks
 
     def _get_attack_from_strategy(self, composite: FoundryComposite) -> AtomicAttack:
         """
diff --git a/pyrit/scenario/scenarios/garak/encoding.py b/pyrit/scenario/scenarios/garak/encoding.py
index f390b0e891..e581416f24 100644
--- a/pyrit/scenario/scenarios/garak/encoding.py
+++ b/pyrit/scenario/scenarios/garak/encoding.py
@@ -240,7 +240,14 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
         # Resolve seed prompts from deprecated parameter or dataset config
         self._resolved_seed_groups = self._resolve_seed_groups()
 
-        return self._get_converter_attacks()
+        atomic_attacks = self._get_converter_attacks()
+
+        if self._include_baseline:
+            atomic_attacks.insert(
+                0, self._build_baseline_atomic_attack(seed_groups=self._resolved_seed_groups or [])
+            )
+
+        return atomic_attacks
 
     # These are the same as Garak encoding attacks
     def _get_converter_attacks(self) -> list[AtomicAttack]:
diff --git a/tests/unit/scenario/test_scam.py b/tests/unit/scenario/test_scam.py
index 80092bb98b..e5d79747ae 100644
--- a/tests/unit/scenario/test_scam.py
+++ b/tests/unit/scenario/test_scam.py
@@ -219,6 +219,7 @@ async def test_attack_generation_for_singleturn_async(
             objective_target=mock_objective_target,
             scenario_strategies=[single_turn_strategy],
             dataset_config=mock_dataset_config,
+            include_baseline=False,
         )
         atomic_attacks = await scenario._get_atomic_attacks_async()
 
@@ -237,6 +238,7 @@ async def test_attack_generation_for_multiturn_async(
             objective_target=mock_objective_target,
             scenario_strategies=[multi_turn_strategy],
             dataset_config=mock_dataset_config,
+            include_baseline=False,
         )
         atomic_attacks = await scenario._get_atomic_attacks_async()
 
@@ -303,6 +305,7 @@ async def test_max_turns_default_used_when_unset_async(
             objective_target=mock_objective_target,
             scenario_strategies=[multi_turn_strategy],
             dataset_config=mock_dataset_config,
+            include_baseline=False,
         )
         atomic_attacks = await scenario._get_atomic_attacks_async()
 
@@ -321,6 +324,7 @@ async def test_max_turns_override_flows_into_attack_async(
             objective_target=mock_objective_target,
             scenario_strategies=[multi_turn_strategy],
             dataset_config=mock_dataset_config,
+            include_baseline=False,
         )
         atomic_attacks = await scenario._get_atomic_attacks_async()
 

From de7d25753066b0c88c457e7deb7494d5c39c175e Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 12:59:41 -0400
Subject: [PATCH 10/19] Rename BaselineDefaultPolicy to BaselinePolicy and
 BASELINE_DEFAULT_POLICY to BASELINE_POLICY

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 doc/code/scenarios/0_scenarios.ipynb           |  6 +++---
 doc/code/scenarios/0_scenarios.py              |  6 +++---
 pyrit/scenario/__init__.py                     |  4 ++--
 pyrit/scenario/core/__init__.py                |  4 ++--
 pyrit/scenario/core/scenario.py                | 18 +++++++++---------
 pyrit/scenario/scenarios/airt/jailbreak.py     |  4 ++--
 pyrit/scenario/scenarios/airt/psychosocial.py  |  4 ++--
 .../scenarios/benchmark/adversarial.py         |  4 ++--
 tests/unit/scenario/test_adversarial.py        |  4 ++--
 .../unit/scenario/test_baseline_deprecation.py |  6 +++---
 tests/unit/scenario/test_jailbreak.py          |  8 ++++----
 tests/unit/scenario/test_leakage_scenario.py   |  4 ++--
 tests/unit/scenario/test_scenario.py           |  4 ++--
 .../unit/scenario/test_scenario_parameters.py  |  4 ++--
 .../scenario/test_scenario_partial_results.py  |  4 ++--
 tests/unit/scenario/test_scenario_retry.py     |  4 ++--
 16 files changed, 44 insertions(+), 44 deletions(-)

diff --git a/doc/code/scenarios/0_scenarios.ipynb b/doc/code/scenarios/0_scenarios.ipynb
index 14c68f2061..82d604b935 100644
--- a/doc/code/scenarios/0_scenarios.ipynb
+++ b/doc/code/scenarios/0_scenarios.ipynb
@@ -83,7 +83,7 @@
     "   - `max_retries`: Number of retry attempts on failure (default: 0)\n",
     "   - `memory_labels`: Optional labels for tracking (optional)\n",
     "   - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's\n",
-    "     `BASELINE_DEFAULT_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)\n",
+    "     `BASELINE_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)\n",
     "\n",
     "### Example Structure\n",
     "\n",
@@ -406,11 +406,11 @@
     "Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends\n",
     "each objective directly to the target without any converters or multi-turn techniques. This is\n",
     "controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each\n",
-    "scenario falls back to its own `BASELINE_DEFAULT_POLICY` class attribute (most scenarios default\n",
+    "scenario falls back to its own `BASELINE_POLICY` class attribute (most scenarios default\n",
     "it on; `Jailbreak` defaults it off). See\n",
     "[Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example.\n",
     "\n",
-    "Custom scenarios should choose their `BASELINE_DEFAULT_POLICY` based on whether an unmodified\n",
+    "Custom scenarios should choose their `BASELINE_POLICY` based on whether an unmodified\n",
     "prompt is a meaningful comparator for the scenario's strategies:\n",
     "\n",
     "- **`Enabled`** — the baseline is prepended by default and the caller can opt out. Use when an\n",
diff --git a/doc/code/scenarios/0_scenarios.py b/doc/code/scenarios/0_scenarios.py
index a9ed63592f..9e86edf32c 100644
--- a/doc/code/scenarios/0_scenarios.py
+++ b/doc/code/scenarios/0_scenarios.py
@@ -85,7 +85,7 @@
 #    - `max_retries`: Number of retry attempts on failure (default: 0)
 #    - `memory_labels`: Optional labels for tracking (optional)
 #    - `include_baseline`: Whether to prepend a baseline attack (defaults to the scenario type's
-#      `BASELINE_DEFAULT_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)
+#      `BASELINE_POLICY`; most scenarios default it on, `Jailbreak` defaults it off)
 #
 # ### Example Structure
 #
@@ -176,11 +176,11 @@ def _build_display_group(self, *, technique_name: str, seed_group_name: str) ->
 # Every scenario can optionally include a **baseline attack** — a `PromptSendingAttack` that sends
 # each objective directly to the target without any converters or multi-turn techniques. This is
 # controlled by the `include_baseline` parameter on `initialize_async`; when omitted, each
-# scenario falls back to its own `BASELINE_DEFAULT_POLICY` class attribute (most scenarios default
+# scenario falls back to its own `BASELINE_POLICY` class attribute (most scenarios default
 # it on; `Jailbreak` defaults it off). See
 # [Common Scenario Parameters](./1_common_scenario_parameters.ipynb) for a worked example.
 #
-# Custom scenarios should choose their `BASELINE_DEFAULT_POLICY` based on whether an unmodified
+# Custom scenarios should choose their `BASELINE_POLICY` based on whether an unmodified
 # prompt is a meaningful comparator for the scenario's strategies:
 #
 # - **`Enabled`** — the baseline is prepended by default and the caller can opt out. Use when an
diff --git a/pyrit/scenario/__init__.py b/pyrit/scenario/__init__.py
index 73ce95bf52..b665395433 100644
--- a/pyrit/scenario/__init__.py
+++ b/pyrit/scenario/__init__.py
@@ -21,7 +21,7 @@
     AtomicAttack,
     AttackTechnique,
     AttackTechniqueFactory,
-    BaselineDefaultPolicy,
+    BaselinePolicy,
     DatasetConfiguration,
     Scenario,
     ScenarioCompositeStrategy,
@@ -51,7 +51,7 @@
     "AtomicAttack",
     "AttackTechnique",
     "AttackTechniqueFactory",
-    "BaselineDefaultPolicy",
+    "BaselinePolicy",
     "DatasetConfiguration",
     "Parameter",
     "Scenario",
diff --git a/pyrit/scenario/core/__init__.py b/pyrit/scenario/core/__init__.py
index 4ca0b0207b..89c8935da5 100644
--- a/pyrit/scenario/core/__init__.py
+++ b/pyrit/scenario/core/__init__.py
@@ -8,7 +8,7 @@
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.attack_technique_factory import AttackTechniqueFactory, ScorerOverridePolicy
 from pyrit.scenario.core.dataset_configuration import EXPLICIT_SEED_GROUPS_KEY, DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import ScenarioCompositeStrategy, ScenarioStrategy
 from pyrit.scenario.core.scenario_target_defaults import get_default_adversarial_target, get_default_scorer_target
 from pyrit.scenario.core.scenario_techniques import (
@@ -20,7 +20,7 @@
     "AtomicAttack",
     "AttackTechnique",
     "AttackTechniqueFactory",
-    "BaselineDefaultPolicy",
+    "BaselinePolicy",
     "DatasetConfiguration",
     "EXPLICIT_SEED_GROUPS_KEY",
     "SCENARIO_TECHNIQUES",
diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index b9be3fe15f..52ed0f2240 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -56,13 +56,13 @@
 logger = logging.getLogger(__name__)
 
 
-class BaselineDefaultPolicy(Enum):
+class BaselinePolicy(Enum):
     """
     Declares how a scenario type treats the default baseline atomic attack.
 
     The baseline is a plain ``PromptSendingAttack`` that sends each objective unmodified,
     used as a comparison point against the scenario's strategies. Each scenario class
-    declares its policy via ``Scenario.BASELINE_DEFAULT_POLICY``; callers can still override
+    declares its policy via ``Scenario.BASELINE_POLICY``; callers can still override
     at runtime via ``initialize_async(include_baseline=...)`` for the ``Enabled`` and
     ``Disabled`` states.
     """
@@ -146,7 +146,7 @@ class Scenario(ABC):
     #: ``initialize_async`` and overridable per run via ``include_baseline`` for the
     #: ``Enabled`` and ``Disabled`` states; ``Forbidden`` is a hard constraint and a
     #: caller-supplied ``include_baseline=True`` raises ``ValueError``.
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Enabled
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Enabled
 
     @classmethod
     def _get_additional_scoring_questions(cls) -> Sequence[Path]:
@@ -622,14 +622,14 @@ async def initialize_async(
             include_baseline (bool | None): Whether to prepend a baseline atomic attack that sends
                 all objectives without modifications, allowing comparison between unmodified prompts
                 and the scenario's strategies. If None (the default), the scenario type's
-                ``BASELINE_DEFAULT_POLICY`` class attribute decides: ``Enabled`` includes it,
+                ``BASELINE_POLICY`` class attribute decides: ``Enabled`` includes it,
                 ``Disabled`` omits it, and ``Forbidden`` always omits it (and rejects an
-                explicit ``True``). Passing ``True`` to a scenario whose ``BASELINE_DEFAULT_POLICY``
+                explicit ``True``). Passing ``True`` to a scenario whose ``BASELINE_POLICY``
                 is ``Forbidden`` raises ``ValueError``.
 
         Raises:
             ValueError: If no objective_target is provided, or if ``include_baseline=True`` is passed
-                to a scenario whose ``BASELINE_DEFAULT_POLICY`` is ``Forbidden``.
+                to a scenario whose ``BASELINE_POLICY`` is ``Forbidden``.
         """
         # Validate required parameters
         if objective_target is None:
@@ -658,15 +658,15 @@ async def initialize_async(
         # scenario type never silently inherits a True default; explicit-True on a forbidden
         # type is a hard error rather than a silent ignore. For the Enabled / Disabled states,
         # a None runtime value defers to the policy.
-        if self.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Forbidden:
+        if self.BASELINE_POLICY is BaselinePolicy.Forbidden:
             if include_baseline is True:
                 raise ValueError(
                     f"{type(self).__name__} does not support a default baseline "
-                    f"(BASELINE_DEFAULT_POLICY = Forbidden); pass include_baseline=False or omit the argument."
+                    f"(BASELINE_POLICY = Forbidden); pass include_baseline=False or omit the argument."
                 )
             include_baseline = False
         elif include_baseline is None:
-            include_baseline = self.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Enabled
+            include_baseline = self.BASELINE_POLICY is BaselinePolicy.Enabled
 
         self._include_baseline = include_baseline
 
diff --git a/pyrit/scenario/scenarios/airt/jailbreak.py b/pyrit/scenario/scenarios/airt/jailbreak.py
index 9d878b51ff..92966da085 100644
--- a/pyrit/scenario/scenarios/airt/jailbreak.py
+++ b/pyrit/scenario/scenarios/airt/jailbreak.py
@@ -23,7 +23,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import ScenarioStrategy
 from pyrit.scenario.core.scenario_target_defaults import get_default_adversarial_target
 from pyrit.score import (
@@ -84,7 +84,7 @@ class Jailbreak(Scenario):
     #: Jailbreak runs many templates per objective, so the baseline atomic attack is rarely
     #: informative relative to the volume of jailbreak templates. Off by default; callers that
     #: want a comparison can pass ``include_baseline=True`` to ``initialize_async``.
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Disabled
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Disabled
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
diff --git a/pyrit/scenario/scenarios/airt/psychosocial.py b/pyrit/scenario/scenarios/airt/psychosocial.py
index 5697a9678e..1bda830f7a 100644
--- a/pyrit/scenario/scenarios/airt/psychosocial.py
+++ b/pyrit/scenario/scenarios/airt/psychosocial.py
@@ -30,7 +30,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_strategy import (
     ScenarioStrategy,
 )
@@ -149,7 +149,7 @@ class Psychosocial(Scenario):
 
     #: Psychosocial measures multi-turn escalation behavior; a single-shot baseline send
     #: isn't a meaningful comparator, so the default baseline is forbidden.
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Forbidden
 
     #: Psychosocial runs CrescendoAttack, which requires the target to natively support
     #: editable conversation history (for backtracking). Declared here so the base scenario
diff --git a/pyrit/scenario/scenarios/benchmark/adversarial.py b/pyrit/scenario/scenarios/benchmark/adversarial.py
index 421d21617c..d3f873f67e 100644
--- a/pyrit/scenario/scenarios/benchmark/adversarial.py
+++ b/pyrit/scenario/scenarios/benchmark/adversarial.py
@@ -14,7 +14,7 @@
 from pyrit.registry.tag_query import TagQuery
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselineDefaultPolicy, Scenario
+from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
 from pyrit.scenario.core.scenario_techniques import SCENARIO_TECHNIQUES
 
 if TYPE_CHECKING:
@@ -36,7 +36,7 @@ class AdversarialBenchmark(Scenario):
 
     #: AdversarialBenchmark compares attack-success rates across adversarial models; a baseline
     #: attack would be model-independent and contribute no signal to the comparison.
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Forbidden
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
diff --git a/tests/unit/scenario/test_adversarial.py b/tests/unit/scenario/test_adversarial.py
index 6cb7e11fae..c4dea8f3c5 100644
--- a/tests/unit/scenario/test_adversarial.py
+++ b/tests/unit/scenario/test_adversarial.py
@@ -23,7 +23,7 @@
 from pyrit.prompt_target import PromptTarget
 from pyrit.prompt_target.common.prompt_chat_target import PromptChatTarget
 from pyrit.registry.object_registries.attack_technique_registry import AttackTechniqueRegistry
-from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
 from pyrit.scenario.core.scenario_techniques import SCENARIO_TECHNIQUES
 from pyrit.scenario.scenarios.benchmark.adversarial import AdversarialBenchmark
@@ -438,7 +438,7 @@ async def test_baseline_excluded(self, mock_objective_target, single_adversarial
             mock_objective_target=mock_objective_target,
             adversarial_models=single_adversarial_model,
         )
-        assert type(scenario).BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Forbidden
+        assert type(scenario).BASELINE_POLICY is BaselinePolicy.Forbidden
         assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
 
     async def test_baseline_explicit_true_raises(self, mock_objective_target, single_adversarial_model):
diff --git a/tests/unit/scenario/test_baseline_deprecation.py b/tests/unit/scenario/test_baseline_deprecation.py
index 634cf0d7db..dab07a02d5 100644
--- a/tests/unit/scenario/test_baseline_deprecation.py
+++ b/tests/unit/scenario/test_baseline_deprecation.py
@@ -16,7 +16,7 @@
 
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.scenario import DatasetConfiguration
-from pyrit.scenario.core import BaselineDefaultPolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 _TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
@@ -34,7 +34,7 @@ def get_aggregate_tags(cls) -> set[str]:
 class _LegacyScenario(Scenario):
     """Minimal Scenario stand-in for exercising the deprecated baseline kwargs."""
 
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Enabled
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Enabled
 
     def __init__(self, **kwargs):
         kwargs.setdefault("strategy_class", _LegacyStrategy)
@@ -94,7 +94,7 @@ def test_base_kwarg_omitted_emits_no_warning(self):
         assert scenario._legacy_include_baseline is None
 
     async def test_legacy_value_drives_initialize_when_runtime_kwarg_omitted(self, mock_objective_target):
-        """Constructor-time False suppresses the baseline that BASELINE_DEFAULT_POLICY=Enabled would add."""
+        """Constructor-time False suppresses the baseline that BASELINE_POLICY=Enabled would add."""
         with warnings.catch_warnings():
             warnings.simplefilter("ignore", DeprecationWarning)
             scenario = _LegacyScenario(include_default_baseline=False)
diff --git a/tests/unit/scenario/test_jailbreak.py b/tests/unit/scenario/test_jailbreak.py
index debafa01de..f67224a4f9 100644
--- a/tests/unit/scenario/test_jailbreak.py
+++ b/tests/unit/scenario/test_jailbreak.py
@@ -16,7 +16,7 @@
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.models import SeedGroup, SeedObjective
 from pyrit.prompt_target import PromptTarget
-from pyrit.scenario.core import BaselineDefaultPolicy
+from pyrit.scenario.core import BaselinePolicy
 from pyrit.scenario.scenarios.airt.jailbreak import Jailbreak, JailbreakStrategy
 from pyrit.score.true_false.true_false_inverter_scorer import TrueFalseInverterScorer
 
@@ -205,12 +205,12 @@ async def test_init_raises_exception_when_no_datasets_available(self, mock_objec
 
     def test_class_supports_baseline_but_defaults_off(self):
         """Jailbreak supports a baseline but does not include one by default."""
-        assert Jailbreak.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Disabled
+        assert Jailbreak.BASELINE_POLICY is BaselinePolicy.Disabled
 
     async def test_default_initialize_omits_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """initialize_async without include_baseline honors BASELINE_DEFAULT_POLICY=Disabled."""
+        """initialize_async without include_baseline honors BASELINE_POLICY=Disabled."""
         with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
             await scenario.initialize_async(objective_target=mock_objective_target)
@@ -219,7 +219,7 @@ async def test_default_initialize_omits_baseline(
     async def test_explicit_include_baseline_true_prepends_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """Caller can override BASELINE_DEFAULT_POLICY=Disabled by passing include_baseline=True."""
+        """Caller can override BASELINE_POLICY=Disabled by passing include_baseline=True."""
         from pyrit.scenario import DatasetConfiguration
 
         with (
diff --git a/tests/unit/scenario/test_leakage_scenario.py b/tests/unit/scenario/test_leakage_scenario.py
index 302b28665e..9c6fa823ae 100644
--- a/tests/unit/scenario/test_leakage_scenario.py
+++ b/tests/unit/scenario/test_leakage_scenario.py
@@ -14,7 +14,7 @@
 from pyrit.prompt_target import PromptTarget
 from pyrit.scenario import DatasetConfiguration
 from pyrit.scenario.airt import Leakage, LeakageStrategy
-from pyrit.scenario.core import BaselineDefaultPolicy
+from pyrit.scenario.core import BaselinePolicy
 from pyrit.score import TrueFalseCompositeScorer
 
 
@@ -105,7 +105,7 @@ def test_default_scorer_uses_leakage_yaml(self):
 
     def test_init_supports_default_baseline(self):
         """Leakage opts into the parent's default baseline."""
-        assert Leakage.BASELINE_DEFAULT_POLICY is BaselineDefaultPolicy.Enabled
+        assert Leakage.BASELINE_POLICY is BaselinePolicy.Enabled
 
 
 @pytest.mark.usefixtures(*FIXTURES)
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index ee9301bdf3..d0bee32481 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioIdentifier, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 # Reusable test scorer identifier
@@ -100,7 +100,7 @@ class ConcreteScenario(Scenario):
 
     # Tests using this fixture should default to no baseline; set the class policy to Forbidden
     # so we don't have to thread include_baseline=False through every initialize_async call.
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Forbidden
 
     def __init__(self, atomic_attacks_to_return=None, **kwargs):
         # Add required strategy_class if not provided
diff --git a/tests/unit/scenario/test_scenario_parameters.py b/tests/unit/scenario/test_scenario_parameters.py
index 3a28068a04..5289b61ee8 100644
--- a/tests/unit/scenario/test_scenario_parameters.py
+++ b/tests/unit/scenario/test_scenario_parameters.py
@@ -11,7 +11,7 @@
 from pyrit.common import Parameter
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.scenario import DatasetConfiguration
-from pyrit.scenario.core import BaselineDefaultPolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
 from pyrit.score import Scorer
 
 _TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
@@ -35,7 +35,7 @@ def get_aggregate_tags(cls) -> set[str]:
 
     class _ParamTestScenario(Scenario):
         # No baseline in tests so atomic_attacks observations stay deterministic.
-        BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
+        BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Forbidden
 
         @classmethod
         def get_strategy_class(cls):
diff --git a/tests/unit/scenario/test_scenario_partial_results.py b/tests/unit/scenario/test_scenario_partial_results.py
index 03d67ad47a..a18625dc8b 100644
--- a/tests/unit/scenario/test_scenario_partial_results.py
+++ b/tests/unit/scenario/test_scenario_partial_results.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
 
 
 def _mock_scorer_id(name: str = "MockScorer") -> ComponentIdentifier:
@@ -74,7 +74,7 @@ def filter_objectives(*, remaining_objectives):
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Forbidden
 
     def __init__(self, *, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default
diff --git a/tests/unit/scenario/test_scenario_retry.py b/tests/unit/scenario/test_scenario_retry.py
index 926383cffc..836503ff5f 100644
--- a/tests/unit/scenario/test_scenario_retry.py
+++ b/tests/unit/scenario/test_scenario_retry.py
@@ -13,7 +13,7 @@
 from pyrit.memory import CentralMemory
 from pyrit.models import AttackOutcome, AttackResult
 from pyrit.scenario import DatasetConfiguration, ScenarioResult
-from pyrit.scenario.core import AtomicAttack, BaselineDefaultPolicy, Scenario, ScenarioStrategy
+from pyrit.scenario.core import AtomicAttack, BaselinePolicy, Scenario, ScenarioStrategy
 
 # Test constants
 TEST_ATTACK_TYPE = "TestAttack"
@@ -137,7 +137,7 @@ def create_mock_atomic_attack(name: str, objectives: list[str], run_async_mock:
 class ConcreteScenario(Scenario):
     """Concrete implementation of Scenario for testing."""
 
-    BASELINE_DEFAULT_POLICY: ClassVar[BaselineDefaultPolicy] = BaselineDefaultPolicy.Forbidden
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Forbidden
 
     def __init__(self, atomic_attacks_to_return=None, objective_scorer=None, **kwargs):
         # Get strategy_class from kwargs or use default

From 7db5f76eb58800b76fdf9e66bf1dd1e2c9d59cc1 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 13:31:11 -0400
Subject: [PATCH 11/19] Delete legacy _get_baseline and post-hoc baseline
 insertion

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/core/scenario.py      | 73 ----------------------------
 tests/unit/scenario/test_scenario.py | 25 ++++++----
 2 files changed, 16 insertions(+), 82 deletions(-)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 52ed0f2240..f35169d2ba 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -49,7 +49,6 @@
 )
 
 if TYPE_CHECKING:
-    from pyrit.executor.attack.core.attack_config import AttackScoringConfig
     from pyrit.identifiers import ComponentIdentifier
     from pyrit.scenario.core.attack_technique_factory import AttackTechniqueFactory
 
@@ -682,15 +681,6 @@ async def initialize_async(
 
         self._atomic_attacks = await self._get_atomic_attacks_async()
 
-        # Transitional guard (removed when _get_baseline / _get_baseline_data are deleted).
-        # Skip the legacy post-hoc insert when _get_atomic_attacks_async already emitted
-        # baseline at index 0 (the structural path); fall through to the old behavior for
-        # overrides not yet migrated.
-        already_emitted_baseline = bool(self._atomic_attacks) and self._atomic_attacks[0].atomic_attack_name == "baseline"
-        if include_baseline and not already_emitted_baseline:
-            baseline_attack = self._get_baseline()
-            self._atomic_attacks.insert(0, baseline_attack)
-
         # Store original objectives for each atomic attack (before any mutations during execution)
         self._original_objectives_map = {
             atomic_attack.atomic_attack_name: tuple(atomic_attack.objectives) for atomic_attack in self._atomic_attacks
@@ -779,69 +769,6 @@ def _build_baseline_atomic_attack(self, *, seed_groups: list[SeedAttackGroup]) -
             memory_labels=self._memory_labels,
         )
 
-    def _get_baseline(self) -> AtomicAttack:
-        """
-        Get a baseline AtomicAttack, which simply sends all the objectives without any modifications.
-
-        If other atomic attacks exist, derives baseline data from the first attack.
-        Otherwise, creates a standalone baseline from the dataset configuration and scenario settings.
-
-        Returns:
-            AtomicAttack: The baseline AtomicAttack instance.
-
-        Raises:
-            ValueError: If required data (seed_groups, objective_target, attack_scoring_config)
-                       is not available.
-        """
-        seed_groups, attack_scoring_config, objective_target = self._get_baseline_data()
-
-        # Create baseline attack with no converters
-        attack = PromptSendingAttack(
-            objective_target=objective_target,
-            attack_scoring_config=attack_scoring_config,
-        )
-
-        return AtomicAttack(
-            atomic_attack_name="baseline",
-            attack_technique=AttackTechnique(attack=attack),
-            seed_groups=seed_groups,
-            memory_labels=self._memory_labels,
-        )
-
-    def _get_baseline_data(self) -> tuple[list["SeedAttackGroup"], "AttackScoringConfig", PromptTarget]:
-        """
-        Get the data needed to create a baseline attack.
-
-        Returns the scenario-level data
-
-        Returns:
-            Tuple containing (seed_groups, attack_scoring_config, objective_target)
-
-        Raises:
-            ValueError: If required data is not available.
-        """
-        # Create from scenario-level settings
-        if not self._objective_target:
-            raise ValueError("Objective target is required to create baseline attack.")
-        if not self._dataset_config:
-            raise ValueError("Dataset config is required to create baseline attack.")
-        if not self._objective_scorer:
-            raise ValueError("Objective scorer is required to create baseline attack.")
-
-        seed_groups = self._dataset_config.get_all_seed_attack_groups()
-        if not seed_groups or len(seed_groups) == 0:
-            raise ValueError("Seed groups are required to create baseline attack.")
-
-        # Import here to avoid circular imports
-        from pyrit.executor.attack.core.attack_config import AttackScoringConfig
-
-        attack_scoring_config = AttackScoringConfig(objective_scorer=cast("TrueFalseScorer", self._objective_scorer))
-
-        if not attack_scoring_config:
-            raise ValueError("Attack scoring config is required to create baseline attack.")
-
-        return seed_groups, attack_scoring_config, self._objective_target
-
     def _raise_dataset_exception(self) -> None:
         error_msg = textwrap.dedent(
             f"""
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index d0bee32481..095fe767b0 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -702,7 +702,12 @@ def default_dataset_config(cls) -> DatasetConfiguration:
         return DatasetConfiguration()
 
     async def _get_atomic_attacks_async(self):
-        return self._atomic_attacks_to_return
+        atomic_attacks = list(self._atomic_attacks_to_return)
+        if self._include_baseline:
+            groups_by_dataset = self._dataset_config.get_seed_attack_groups()
+            all_seed_groups = [g for groups in groups_by_dataset.values() for g in groups]
+            atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=all_seed_groups))
+        return atomic_attacks
 
 
 @pytest.mark.usefixtures("patch_central_database")
@@ -721,10 +726,12 @@ async def test_initialize_async_with_empty_strategies_and_baseline(self, mock_ob
 
         # Create a mock dataset config with seed groups
         mock_dataset_config = MagicMock(spec=DatasetConfiguration)
-        mock_dataset_config.get_all_seed_attack_groups.return_value = [
-            SeedAttackGroup(seeds=[SeedObjective(value="test objective 1")]),
-            SeedAttackGroup(seeds=[SeedObjective(value="test objective 2")]),
-        ]
+        mock_dataset_config.get_seed_attack_groups.return_value = {
+            "default": [
+                SeedAttackGroup(seeds=[SeedObjective(value="test objective 1")]),
+                SeedAttackGroup(seeds=[SeedObjective(value="test objective 2")]),
+            ]
+        }
 
         # Initialize with None (default strategy) — [] also works, both expand defaults
         await scenario.initialize_async(
@@ -749,9 +756,9 @@ async def test_baseline_only_execution_runs_successfully(self, mock_objective_ta
 
         # Create a mock dataset config with seed groups
         mock_dataset_config = MagicMock(spec=DatasetConfiguration)
-        mock_dataset_config.get_all_seed_attack_groups.return_value = [
-            SeedAttackGroup(seeds=[SeedObjective(value="test objective 1")]),
-        ]
+        mock_dataset_config.get_seed_attack_groups.return_value = {
+            "default": [SeedAttackGroup(seeds=[SeedObjective(value="test objective 1")])]
+        }
 
         # Initialize with None — [] also expands defaults now, both are equivalent
         await scenario.initialize_async(
@@ -808,7 +815,7 @@ async def test_standalone_baseline_uses_dataset_config_seeds(self, mock_objectiv
         ]
 
         mock_dataset_config = MagicMock(spec=DatasetConfiguration)
-        mock_dataset_config.get_all_seed_attack_groups.return_value = expected_seeds
+        mock_dataset_config.get_seed_attack_groups.return_value = {"default": expected_seeds}
 
         await scenario.initialize_async(
             objective_target=mock_objective_target,

From 9677a382effb34a3c77d84fb7182340478a18730 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 13:53:36 -0400
Subject: [PATCH 12/19] Document override responsibility for baseline emission

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/core/scenario.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index f35169d2ba..4c93bce518 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -949,7 +949,9 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
         ``_build_display_group()``.
 
         Subclasses that do **not** use the factory/registry pattern should
-        override this method entirely.
+        override this method entirely. Overrides that want baseline support
+        must call ``self._build_baseline_atomic_attack`` with the strategy
+        seeds.
 
         Returns:
             list[AtomicAttack]: The generated atomic attacks.

From d412ab54b0b7bd641d6b3b40437da9f301aff0bf Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 14:42:11 -0400
Subject: [PATCH 13/19] Add baseline uniformity regression tests and helper
 unit tests

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .../scenario/test_baseline_deprecation.py     | 48 ++++++++-
 tests/unit/scenario/test_encoding.py          | 35 +++++++
 tests/unit/scenario/test_foundry.py           | 35 +++++++
 tests/unit/scenario/test_jailbreak.py         | 34 +++++++
 tests/unit/scenario/test_scam.py              | 33 +++++++
 tests/unit/scenario/test_scenario.py          | 98 +++++++++++++++++++
 6 files changed, 280 insertions(+), 3 deletions(-)

diff --git a/tests/unit/scenario/test_baseline_deprecation.py b/tests/unit/scenario/test_baseline_deprecation.py
index dab07a02d5..32cca11ee8 100644
--- a/tests/unit/scenario/test_baseline_deprecation.py
+++ b/tests/unit/scenario/test_baseline_deprecation.py
@@ -17,7 +17,7 @@
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.scenario import DatasetConfiguration
 from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
-from pyrit.score import Scorer
+from pyrit.score import Scorer, TrueFalseScorer
 
 _TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
 
@@ -39,7 +39,7 @@ class _LegacyScenario(Scenario):
     def __init__(self, **kwargs):
         kwargs.setdefault("strategy_class", _LegacyStrategy)
         if "objective_scorer" not in kwargs:
-            mock_scorer = MagicMock(spec=Scorer)
+            mock_scorer = MagicMock(spec=TrueFalseScorer)
             mock_scorer.get_identifier.return_value = _TEST_SCORER_ID
             mock_scorer.get_scorer_metrics.return_value = None
             kwargs["objective_scorer"] = mock_scorer
@@ -59,7 +59,12 @@ def default_dataset_config(cls) -> DatasetConfiguration:
         return DatasetConfiguration()
 
     async def _get_atomic_attacks_async(self):
-        return []
+        atomic_attacks = []
+        if self._include_baseline:
+            groups_by_dataset = self._dataset_config.get_seed_attack_groups()
+            all_seed_groups = [g for groups in groups_by_dataset.values() for g in groups]
+            atomic_attacks.append(self._build_baseline_atomic_attack(seed_groups=all_seed_groups))
+        return atomic_attacks
 
 
 @pytest.fixture
@@ -158,3 +163,40 @@ def test_subclass_kwarg_emits_deprecation_warning(
         assert len(deprecations) >= 1, f"{class_name} did not emit a DeprecationWarning naming the class"
         assert "v0.16.0" in str(deprecations[0].message)
         assert scenario._legacy_include_baseline is False
+
+
+@pytest.mark.usefixtures("patch_central_database")
+class TestLegacyAndRuntimePathsEquivalentUnderMaxDatasetSize:
+    """ADO 9012: the deprecated constructor path and the new initialize_async path must
+    produce the same baseline atomic attack under max_dataset_size."""
+
+    async def test_paths_produce_matching_objective_sets(self, mock_objective_target):
+        from pyrit.models import SeedGroup, SeedObjective
+
+        seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
+
+        # Both paths share the same patched sample, so each scenario's single
+        # resolution call returns ``stable_sample``.
+        stable_sample = seed_groups[:3]
+
+        with patch(
+            "pyrit.scenario.core.dataset_configuration.random.sample",
+            return_value=stable_sample,
+        ):
+            config_legacy = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+            with warnings.catch_warnings():
+                warnings.simplefilter("ignore", DeprecationWarning)
+                legacy = _LegacyScenario(include_default_baseline=True)
+            await legacy.initialize_async(objective_target=mock_objective_target, dataset_config=config_legacy)
+
+            config_runtime = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+            runtime = _LegacyScenario()
+            await runtime.initialize_async(
+                objective_target=mock_objective_target,
+                dataset_config=config_runtime,
+                include_baseline=True,
+            )
+
+        assert legacy._atomic_attacks[0].atomic_attack_name == "baseline"
+        assert runtime._atomic_attacks[0].atomic_attack_name == "baseline"
+        assert set(legacy._atomic_attacks[0].objectives) == set(runtime._atomic_attacks[0].objectives)
diff --git a/tests/unit/scenario/test_encoding.py b/tests/unit/scenario/test_encoding.py
index 0df8435a86..1cb0aaeff6 100644
--- a/tests/unit/scenario/test_encoding.py
+++ b/tests/unit/scenario/test_encoding.py
@@ -399,3 +399,38 @@ def test_encoding_dataset_config_can_be_initialized_with_dataset_names(self):
 
         assert config._dataset_names == ["garak_slur_terms_en", "garak_web_html_js"]
         assert config.max_dataset_size == 5
+
+
+@pytest.mark.usefixtures("patch_central_database")
+class TestEncodingBaselineUniformity:
+    """ADO 9012 regression: baseline shares objectives with strategies under max_dataset_size."""
+
+    async def test_one_resolution_call_baseline_matches_strategies(
+        self, mock_objective_target, mock_objective_scorer
+    ):
+        from unittest.mock import patch
+
+        from pyrit.models import SeedGroup, SeedObjective
+
+        seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
+        config = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+
+        first_sample = seed_groups[:3]
+        second_sample = seed_groups[5:8]
+        with patch(
+            "pyrit.scenario.core.dataset_configuration.random.sample",
+            side_effect=[first_sample, second_sample],
+        ) as mock_sample:
+            scenario = Encoding(objective_scorer=mock_objective_scorer)
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                scenario_strategies=[EncodingStrategy.ALL],
+                dataset_config=config,
+                include_baseline=True,
+            )
+
+        assert mock_sample.call_count == 1
+        assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+        baseline_objs = set(scenario._atomic_attacks[0].objectives)
+        for attack in scenario._atomic_attacks[1:]:
+            assert set(attack.objectives) == baseline_objs
diff --git a/tests/unit/scenario/test_foundry.py b/tests/unit/scenario/test_foundry.py
index e29b8146d4..1272cedecd 100644
--- a/tests/unit/scenario/test_foundry.py
+++ b/tests/unit/scenario/test_foundry.py
@@ -680,3 +680,38 @@ async def test_initialize_converts_converter_only_composite_strategy(
         result = scenario._scenario_composites[0]
         assert result.attack is None
         assert set(result.converters) == {FoundryStrategy.Base64, FoundryStrategy.ROT13}
+
+
+@pytest.mark.usefixtures(*FIXTURES)
+class TestRedTeamAgentBaselineUniformity:
+    """ADO 9012 regression: baseline shares objectives with strategies under max_dataset_size."""
+
+    async def test_one_resolution_call_baseline_matches_strategies(
+        self, mock_objective_target, mock_objective_scorer
+    ):
+        from pyrit.models import SeedGroup, SeedObjective
+
+        seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
+        config = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+
+        first_sample = seed_groups[:3]
+        second_sample = seed_groups[5:8]
+        with patch(
+            "pyrit.scenario.core.dataset_configuration.random.sample",
+            side_effect=[first_sample, second_sample],
+        ) as mock_sample:
+            scenario = RedTeamAgent(
+                attack_scoring_config=AttackScoringConfig(objective_scorer=mock_objective_scorer),
+            )
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                scenario_strategies=[FoundryStrategy.Base64],
+                dataset_config=config,
+                include_baseline=True,
+            )
+
+        assert mock_sample.call_count == 1
+        assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+        baseline_objs = set(scenario._atomic_attacks[0].objectives)
+        for attack in scenario._atomic_attacks[1:]:
+            assert set(attack.objectives) == baseline_objs
diff --git a/tests/unit/scenario/test_jailbreak.py b/tests/unit/scenario/test_jailbreak.py
index f67224a4f9..b8f402b0a2 100644
--- a/tests/unit/scenario/test_jailbreak.py
+++ b/tests/unit/scenario/test_jailbreak.py
@@ -520,3 +520,37 @@ async def test_roleplay_attacks_share_adversarial_target(
             # All role-play attacks should share the same adversarial target
             adversarial_targets = [run.attack_technique.attack._adversarial_chat for run in atomic_attacks]
             assert all(t is adversarial_targets[0] for t in adversarial_targets)
+
+
+@pytest.mark.usefixtures(*FIXTURES)
+class TestJailbreakBaselineUniformity:
+    """ADO 9012 regression: baseline shares objectives with strategies under max_dataset_size."""
+
+    async def test_one_resolution_call_baseline_matches_strategies(
+        self, mock_objective_target, mock_objective_scorer, simple_jailbreak_strategy
+    ):
+        from pyrit.models import SeedGroup, SeedObjective
+        from pyrit.scenario import DatasetConfiguration
+
+        seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
+        config = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+
+        first_sample = seed_groups[:3]
+        second_sample = seed_groups[5:8]
+        scenario = Jailbreak(objective_scorer=mock_objective_scorer, num_templates=1)
+        with patch(
+            "pyrit.scenario.core.dataset_configuration.random.sample",
+            side_effect=[first_sample, second_sample],
+        ) as mock_sample:
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                scenario_strategies=[simple_jailbreak_strategy],
+                dataset_config=config,
+                include_baseline=True,
+            )
+
+        assert mock_sample.call_count == 1
+        assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+        baseline_objs = set(scenario._atomic_attacks[0].objectives)
+        for attack in scenario._atomic_attacks[1:]:
+            assert set(attack.objectives) == baseline_objs
diff --git a/tests/unit/scenario/test_scam.py b/tests/unit/scenario/test_scam.py
index e5d79747ae..1fc5744fa4 100644
--- a/tests/unit/scenario/test_scam.py
+++ b/tests/unit/scenario/test_scam.py
@@ -404,3 +404,36 @@ async def test_no_target_duplication_async(
             assert objective_target != scorer_target
             assert objective_target != adversarial_target
             assert scorer_target != adversarial_target
+
+
+@pytest.mark.usefixtures(*FIXTURES)
+class TestScamBaselineUniformity:
+    """ADO 9012 regression: baseline shares objectives with strategies under max_dataset_size."""
+
+    async def test_one_resolution_call_baseline_matches_strategies(
+        self, mock_objective_target, mock_objective_scorer, single_turn_strategy
+    ):
+        from pyrit.models import SeedGroup, SeedObjective
+
+        seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
+        config = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+
+        first_sample = seed_groups[:3]
+        second_sample = seed_groups[5:8]
+        with patch(
+            "pyrit.scenario.core.dataset_configuration.random.sample",
+            side_effect=[first_sample, second_sample],
+        ) as mock_sample:
+            scenario = Scam(objective_scorer=mock_objective_scorer)
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                scenario_strategies=[single_turn_strategy],
+                dataset_config=config,
+                include_baseline=True,
+            )
+
+        assert mock_sample.call_count == 1
+        assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+        baseline_objs = set(scenario._atomic_attacks[0].objectives)
+        for attack in scenario._atomic_attacks[1:]:
+            assert set(attack.objectives) == baseline_objs
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index 095fe767b0..4643b7748c 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -897,6 +897,104 @@ async def test_execute_scenario_raises_when_scenario_result_id_is_none():
         await scenario._execute_scenario_async()
 
 
+@pytest.mark.usefixtures("patch_central_database")
+class TestScenarioBaselineUniformObjectives:
+    """ADO 9012 regression: baseline and strategy share objectives under max_dataset_size.
+
+    The structural fix collapses to a single seed-group resolution call per scenario
+    run. Both the strategy atomic attacks and the baseline use the same sampled
+    population, so ``random.sample`` runs once and the two groups match.
+    """
+
+    async def test_baseline_objectives_match_atomic_attacks_under_max_dataset_size(
+        self,
+        mock_objective_target,
+    ):
+        from pyrit.models import SeedGroup, SeedObjective
+        from pyrit.scenario.core.attack_technique import AttackTechnique
+
+        seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
+        config = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+
+        class StrategyScenario(ConcreteScenarioWithTrueFalseScorer):
+            async def _get_atomic_attacks_async(self):
+                groups_by_dataset = self._dataset_config.get_seed_attack_groups()
+                all_seed_groups = [g for groups in groups_by_dataset.values() for g in groups]
+                atomic_attacks = [
+                    AtomicAttack(
+                        atomic_attack_name="strategy",
+                        attack_technique=AttackTechnique(attack=MagicMock()),
+                        seed_groups=all_seed_groups,
+                    )
+                ]
+                if self._include_baseline:
+                    atomic_attacks.insert(
+                        0, self._build_baseline_atomic_attack(seed_groups=all_seed_groups)
+                    )
+                return atomic_attacks
+
+        # Two distinct samples wired up. A buggy implementation with a second
+        # resolution call would consume both; the structural fix consumes one.
+        first_sample = seed_groups[:3]
+        second_sample = seed_groups[5:8]
+        with patch(
+            "pyrit.scenario.core.dataset_configuration.random.sample",
+            side_effect=[first_sample, second_sample],
+        ) as mock_sample:
+            scenario = StrategyScenario(name="ADO 9012 regression", version=1)
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                scenario_strategies=None,
+                dataset_config=config,
+            )
+
+        assert mock_sample.call_count == 1
+
+        baseline, strategy = scenario._atomic_attacks
+        assert baseline.atomic_attack_name == "baseline"
+        assert strategy.atomic_attack_name == "strategy"
+        assert set(baseline.objectives) == set(strategy.objectives)
+        assert len(baseline.objectives) == 3
+
+
+@pytest.mark.usefixtures("patch_central_database")
+class TestBuildBaselineAtomicAttack:
+    """Unit tests for Scenario._build_baseline_atomic_attack."""
+
+    def _seed_groups(self):
+        from pyrit.models import SeedAttackGroup, SeedObjective
+
+        return [SeedAttackGroup(seeds=[SeedObjective(value="x")])]
+
+    def test_returns_baseline_atomic_attack(self, mock_objective_target):
+        from pyrit.executor.attack.single_turn.prompt_sending import PromptSendingAttack
+
+        seed_groups = self._seed_groups()
+        scenario = ConcreteScenarioWithTrueFalseScorer(name="T", version=1)
+        scenario._objective_target = mock_objective_target
+
+        atomic = scenario._build_baseline_atomic_attack(seed_groups=seed_groups)
+
+        assert atomic.atomic_attack_name == "baseline"
+        assert atomic.seed_groups == seed_groups
+        assert isinstance(atomic.attack_technique.attack, PromptSendingAttack)
+
+    def test_raises_when_target_is_none(self):
+        scenario = ConcreteScenarioWithTrueFalseScorer(name="T", version=1)
+        # _objective_target is None pre-initialize_async
+
+        with pytest.raises(ValueError, match="Objective target is required"):
+            scenario._build_baseline_atomic_attack(seed_groups=self._seed_groups())
+
+    def test_raises_when_scorer_is_none(self, mock_objective_target):
+        scenario = ConcreteScenarioWithTrueFalseScorer(name="T", version=1)
+        scenario._objective_target = mock_objective_target
+        scenario._objective_scorer = None  # type: ignore[assignment]
+
+        with pytest.raises(ValueError, match="Objective scorer is required"):
+            scenario._build_baseline_atomic_attack(seed_groups=self._seed_groups())
+
+
 @pytest.mark.usefixtures("patch_central_database")
 class TestValidateStoredScenario:
     """Tests for Scenario._validate_stored_scenario."""

From f16bf17e66f0e9ca81070175dce0a5bbef299949 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 15:21:58 -0400
Subject: [PATCH 14/19] Document BASELINE_POLICY and baseline emission contract
 in scenario instructions

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 .github/instructions/scenarios.instructions.md | 10 ++++++++--
 1 file changed, 8 insertions(+), 2 deletions(-)

diff --git a/.github/instructions/scenarios.instructions.md b/.github/instructions/scenarios.instructions.md
index 9261dca942..0c491da2fe 100644
--- a/.github/instructions/scenarios.instructions.md
+++ b/.github/instructions/scenarios.instructions.md
@@ -11,11 +11,15 @@ Scenarios orchestrate multi-attack security testing campaigns. Each scenario gro
 All scenarios inherit from `Scenario` (ABC) and must:
 
 1. **Define `VERSION`** as a class constant (increment on breaking changes)
-2. **Implement three abstract methods:**
+2. **Optionally declare `BASELINE_POLICY`** (defaults to `BaselinePolicy.Enabled` — a baseline `PromptSendingAttack` is prepended and callers can opt out per run via `initialize_async(include_baseline=False)`):
+   - `BaselinePolicy.Disabled` — baseline supported but off by default (e.g. `Jailbreak`, where templates dominate the run).
+   - `BaselinePolicy.Forbidden` — baseline is meaningless for this scenario's comparison axis (e.g. `AdversarialBenchmark`, which compares against gold-standard answers). Explicit `include_baseline=True` raises `ValueError`.
+3. **Implement three abstract methods:**
 
 ```python
 class MyScenario(Scenario):
     VERSION: int = 1
+    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Enabled
 
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
@@ -30,7 +34,7 @@ class MyScenario(Scenario):
         return DatasetConfiguration(dataset_names=["my_dataset"])
 ```
 
-3. **Optionally override `_get_atomic_attacks_async()`** — the base class provides a default
+4. **Optionally override `_get_atomic_attacks_async()`** — the base class provides a default
    that uses the factory/registry pattern (see "AtomicAttack Construction" below).
    Only override if your scenario needs custom attack construction logic.
 
@@ -154,6 +158,8 @@ The default implementation:
 Only override when the scenario **cannot** use the factory/registry pattern — e.g., scenarios
 with custom composite logic, per-strategy converter stacks, or non-standard attack construction.
 
+Overrides that want baseline support must emit it themselves by calling `self._build_baseline_atomic_attack(seed_groups=...)` with the same seeds used for the strategy attacks and prepending the result. The base implementation emits baseline automatically; passing freshly resolved seeds reintroduces ADO 9012 (baseline-vs-strategy population divergence under `max_dataset_size`).
+
 ### Manual AtomicAttack construction (for overrides):
 
 ```python

From 1c41a7900ff5fda4947dba288dd1b2174d1a4f42 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 15:47:00 -0400
Subject: [PATCH 15/19] Apply pre-commit auto-fixes (ruff format and unused
 import removal)

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/core/scenario.py                  | 4 +---
 pyrit/scenario/scenarios/garak/encoding.py       | 4 +---
 tests/unit/scenario/test_baseline_deprecation.py | 2 +-
 tests/unit/scenario/test_encoding.py             | 4 +---
 tests/unit/scenario/test_foundry.py              | 4 +---
 tests/unit/scenario/test_scenario.py             | 4 +---
 6 files changed, 6 insertions(+), 16 deletions(-)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 4c93bce518..1579219a8d 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -757,9 +757,7 @@ def _build_baseline_atomic_attack(self, *, seed_groups: list[SeedAttackGroup]) -
 
         attack = PromptSendingAttack(
             objective_target=self._objective_target,
-            attack_scoring_config=AttackScoringConfig(
-                objective_scorer=cast("TrueFalseScorer", self._objective_scorer)
-            ),
+            attack_scoring_config=AttackScoringConfig(objective_scorer=cast("TrueFalseScorer", self._objective_scorer)),
         )
 
         return AtomicAttack(
diff --git a/pyrit/scenario/scenarios/garak/encoding.py b/pyrit/scenario/scenarios/garak/encoding.py
index e581416f24..8233e4206b 100644
--- a/pyrit/scenario/scenarios/garak/encoding.py
+++ b/pyrit/scenario/scenarios/garak/encoding.py
@@ -243,9 +243,7 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
         atomic_attacks = self._get_converter_attacks()
 
         if self._include_baseline:
-            atomic_attacks.insert(
-                0, self._build_baseline_atomic_attack(seed_groups=self._resolved_seed_groups or [])
-            )
+            atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=self._resolved_seed_groups or []))
 
         return atomic_attacks
 
diff --git a/tests/unit/scenario/test_baseline_deprecation.py b/tests/unit/scenario/test_baseline_deprecation.py
index 32cca11ee8..4272ebd277 100644
--- a/tests/unit/scenario/test_baseline_deprecation.py
+++ b/tests/unit/scenario/test_baseline_deprecation.py
@@ -17,7 +17,7 @@
 from pyrit.identifiers import ComponentIdentifier
 from pyrit.scenario import DatasetConfiguration
 from pyrit.scenario.core import BaselinePolicy, Scenario, ScenarioStrategy
-from pyrit.score import Scorer, TrueFalseScorer
+from pyrit.score import TrueFalseScorer
 
 _TEST_SCORER_ID = ComponentIdentifier(class_name="MockScorer", class_module="tests.unit.scenarios")
 
diff --git a/tests/unit/scenario/test_encoding.py b/tests/unit/scenario/test_encoding.py
index 1cb0aaeff6..bb643ff6dc 100644
--- a/tests/unit/scenario/test_encoding.py
+++ b/tests/unit/scenario/test_encoding.py
@@ -405,9 +405,7 @@ def test_encoding_dataset_config_can_be_initialized_with_dataset_names(self):
 class TestEncodingBaselineUniformity:
     """ADO 9012 regression: baseline shares objectives with strategies under max_dataset_size."""
 
-    async def test_one_resolution_call_baseline_matches_strategies(
-        self, mock_objective_target, mock_objective_scorer
-    ):
+    async def test_one_resolution_call_baseline_matches_strategies(self, mock_objective_target, mock_objective_scorer):
         from unittest.mock import patch
 
         from pyrit.models import SeedGroup, SeedObjective
diff --git a/tests/unit/scenario/test_foundry.py b/tests/unit/scenario/test_foundry.py
index 1272cedecd..3a00a50ef2 100644
--- a/tests/unit/scenario/test_foundry.py
+++ b/tests/unit/scenario/test_foundry.py
@@ -686,9 +686,7 @@ async def test_initialize_converts_converter_only_composite_strategy(
 class TestRedTeamAgentBaselineUniformity:
     """ADO 9012 regression: baseline shares objectives with strategies under max_dataset_size."""
 
-    async def test_one_resolution_call_baseline_matches_strategies(
-        self, mock_objective_target, mock_objective_scorer
-    ):
+    async def test_one_resolution_call_baseline_matches_strategies(self, mock_objective_target, mock_objective_scorer):
         from pyrit.models import SeedGroup, SeedObjective
 
         seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index 4643b7748c..bf6da29276 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -928,9 +928,7 @@ async def _get_atomic_attacks_async(self):
                     )
                 ]
                 if self._include_baseline:
-                    atomic_attacks.insert(
-                        0, self._build_baseline_atomic_attack(seed_groups=all_seed_groups)
-                    )
+                    atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=all_seed_groups))
                 return atomic_attacks
 
         # Two distinct samples wired up. A buggy implementation with a second

From f3c2095b23bf63f1842f05ec70721e53ebf1d973 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 16:42:13 -0400
Subject: [PATCH 16/19] Add deprecation rescue for overrides that don't emit
 baseline (until v0.16.0)

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/core/scenario.py      | 11 +++++
 tests/unit/scenario/test_scenario.py | 68 ++++++++++++++++++++++++++++
 2 files changed, 79 insertions(+)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 1579219a8d..1377b30ac0 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -681,6 +681,17 @@ async def initialize_async(
 
         self._atomic_attacks = await self._get_atomic_attacks_async()
 
+        # Deprecation rescue (removed in v0.16.0): if the override didn't emit baseline,
+        # warn and inject. Migrated overrides emit baseline themselves and bypass this branch.
+        if include_baseline and (not self._atomic_attacks or self._atomic_attacks[0].atomic_attack_name != "baseline"):
+            print_deprecation_message(
+                old_item=f"{type(self).__name__}._get_atomic_attacks_async() not emitting baseline",
+                new_item="call self._build_baseline_atomic_attack(seed_groups=...) inside the override",
+                removed_in="v0.16.0",
+            )
+            seed_groups = self._dataset_config.get_all_seed_attack_groups()
+            self._atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=seed_groups))
+
         # Store original objectives for each atomic attack (before any mutations during execution)
         self._original_objectives_map = {
             atomic_attack.atomic_attack_name: tuple(atomic_attack.objectives) for atomic_attack in self._atomic_attacks
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index bf6da29276..024cb065d3 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -710,6 +710,17 @@ async def _get_atomic_attacks_async(self):
         return atomic_attacks
 
 
+class _LegacyOverrideScenario(ConcreteScenarioWithTrueFalseScorer):
+    """Override that does NOT emit baseline — exercises the deprecation rescue path.
+
+    Real user scenarios written before the structural fix may follow this pattern;
+    the rescue path warns and injects baseline so they keep working until v0.16.0.
+    """
+
+    async def _get_atomic_attacks_async(self):
+        return list(self._atomic_attacks_to_return)
+
+
 @pytest.mark.usefixtures("patch_central_database")
 class TestScenarioBaselineOnlyExecution:
     """Tests for baseline-only execution (empty strategies with include_baseline=True)."""
@@ -993,6 +1004,63 @@ def test_raises_when_scorer_is_none(self, mock_objective_target):
             scenario._build_baseline_atomic_attack(seed_groups=self._seed_groups())
 
 
+@pytest.mark.usefixtures("patch_central_database")
+class TestBaselineEmissionDeprecationRescue:
+    """Deprecation rescue (removed in v0.16.0): overrides that don't emit baseline get a
+    DeprecationWarning + auto-injected baseline so they keep working during the migration."""
+
+    @staticmethod
+    def _dataset_config():
+        from pyrit.models import SeedGroup, SeedObjective
+
+        return DatasetConfiguration(
+            seed_groups=[SeedGroup(seeds=[SeedObjective(value="x")])],
+        )
+
+    async def test_rescue_emits_warning_and_injects_baseline(self, mock_objective_target):
+        import warnings
+
+        scenario = _LegacyOverrideScenario(name="LegacyOverride", version=1)
+
+        with warnings.catch_warnings(record=True) as caught:
+            warnings.simplefilter("always")
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                dataset_config=self._dataset_config(),
+                include_baseline=True,
+            )
+
+        deprecations = [
+            w
+            for w in caught
+            if issubclass(w.category, DeprecationWarning) and "_get_atomic_attacks_async" in str(w.message)
+        ]
+        assert len(deprecations) == 1, "rescue should emit exactly one DeprecationWarning naming the method"
+        assert "v0.16.0" in str(deprecations[0].message)
+        assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+
+    async def test_well_behaved_override_does_not_trigger_rescue(self, mock_objective_target):
+        import warnings
+
+        scenario = ConcreteScenarioWithTrueFalseScorer(name="GoodCitizen", version=1)
+
+        with warnings.catch_warnings(record=True) as caught:
+            warnings.simplefilter("always")
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                dataset_config=self._dataset_config(),
+                include_baseline=True,
+            )
+
+        rescue_warnings = [
+            w
+            for w in caught
+            if issubclass(w.category, DeprecationWarning) and "_get_atomic_attacks_async" in str(w.message)
+        ]
+        assert not rescue_warnings, "well-behaved override should not trigger the rescue path"
+        assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+
+
 @pytest.mark.usefixtures("patch_central_database")
 class TestValidateStoredScenario:
     """Tests for Scenario._validate_stored_scenario."""

From 768ffe504c25c4b7597e05cc86420efd6daa9707 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 16:48:38 -0400
Subject: [PATCH 17/19] Normalize deprecation markers (drop v prefix, fix
 rescue text)

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/core/scenario.py                | 18 +++++++++---------
 pyrit/scenario/scenarios/airt/cyber.py         | 10 +++++-----
 pyrit/scenario/scenarios/airt/jailbreak.py     | 10 +++++-----
 pyrit/scenario/scenarios/airt/scam.py          | 10 +++++-----
 .../scenarios/foundry/red_team_agent.py        | 10 +++++-----
 pyrit/scenario/scenarios/garak/encoding.py     | 10 +++++-----
 .../unit/scenario/test_baseline_deprecation.py |  6 +++---
 tests/unit/scenario/test_scenario.py           |  6 +++---
 8 files changed, 40 insertions(+), 40 deletions(-)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 1377b30ac0..572ab1b133 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -167,7 +167,7 @@ def __init__(
         strategy_class: type[ScenarioStrategy],
         objective_scorer: Scorer,
         scenario_result_id: Optional[Union[uuid.UUID, str]] = None,
-        include_default_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
+        include_default_baseline: bool | None = None,  # Deprecated. Will be removed in 0.16.0.
     ) -> None:
         """
         Initialize a scenario.
@@ -181,7 +181,7 @@ def __init__(
                 Can be either a UUID object or a string representation of a UUID.
                 If provided and found in memory, the scenario will resume from prior progress.
                 All other parameters must still match the stored scenario configuration.
-            include_default_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0.
+            include_default_baseline (bool | None): **Deprecated.** Will be removed in 0.16.0.
                 Pass ``include_baseline`` to ``initialize_async`` instead. When set, the value is
                 used as the effective ``include_baseline`` for the next ``initialize_async`` call
                 unless that call passes its own ``include_baseline``.
@@ -238,7 +238,7 @@ def __init__(
         # before _get_atomic_attacks_async is awaited so overrides can read it.
         self._include_baseline: bool = False
 
-        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along
+        # Deprecated constructor-time baseline override. Will be removed in 0.16.0, along
         # with the include_default_baseline kwarg above and the legacy fallback branch in
         # initialize_async. Subclass shims set this attribute directly to avoid double-warning.
         self._legacy_include_baseline: bool | None = None
@@ -246,7 +246,7 @@ def __init__(
             print_deprecation_message(
                 old_item="Scenario(include_default_baseline=...)",
                 new_item="Scenario.initialize_async(include_baseline=...)",
-                removed_in="v0.16.0",
+                removed_in="0.16.0",
             )
             self._legacy_include_baseline = include_default_baseline
 
@@ -647,7 +647,7 @@ async def initialize_async(
         self._max_retries = max_retries
         self._memory_labels = memory_labels or {}
 
-        # Deprecated. Will be removed in v0.16.0. Honor the legacy constructor-time
+        # Deprecated. Will be removed in 0.16.0. Honor the legacy constructor-time
         # include_default_baseline (or subclass include_baseline) only when the caller did
         # not supply a runtime value.
         if include_baseline is None and self._legacy_include_baseline is not None:
@@ -681,13 +681,13 @@ async def initialize_async(
 
         self._atomic_attacks = await self._get_atomic_attacks_async()
 
-        # Deprecation rescue (removed in v0.16.0): if the override didn't emit baseline,
+        # Deprecation rescue. Will be removed in 0.16.0. If the override didn't emit baseline,
         # warn and inject. Migrated overrides emit baseline themselves and bypass this branch.
         if include_baseline and (not self._atomic_attacks or self._atomic_attacks[0].atomic_attack_name != "baseline"):
             print_deprecation_message(
-                old_item=f"{type(self).__name__}._get_atomic_attacks_async() not emitting baseline",
-                new_item="call self._build_baseline_atomic_attack(seed_groups=...) inside the override",
-                removed_in="v0.16.0",
+                old_item=f"Implicit baseline injection for {type(self).__name__} overriding _get_atomic_attacks_async()",
+                new_item="explicit emission via self._build_baseline_atomic_attack(seed_groups=...) in the override",
+                removed_in="0.16.0",
             )
             seed_groups = self._dataset_config.get_all_seed_attack_groups()
             self._atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=seed_groups))
diff --git a/pyrit/scenario/scenarios/airt/cyber.py b/pyrit/scenario/scenarios/airt/cyber.py
index 9fb516518a..d29b81eecc 100644
--- a/pyrit/scenario/scenarios/airt/cyber.py
+++ b/pyrit/scenario/scenarios/airt/cyber.py
@@ -7,7 +7,7 @@
 from typing import TYPE_CHECKING, ClassVar
 
 from pyrit.common import apply_defaults
-from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in 0.16.0.
 from pyrit.common.path import SCORER_SEED_PROMPT_PATH
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
 from pyrit.scenario.core.scenario import Scenario
@@ -110,7 +110,7 @@ def __init__(
         *,
         objective_scorer: TrueFalseScorer | None = None,
         scenario_result_id: str | None = None,
-        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in 0.16.0.
     ) -> None:
         """
         Initialize the cyber harms scenario.
@@ -119,7 +119,7 @@ def __init__(
             objective_scorer (TrueFalseScorer | None): Objective scorer for malware detection. If not
                 provided, defaults to a composite scorer using malware detection + refusal backstop.
             scenario_result_id (str | None): Optional ID of an existing scenario result to resume.
-            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+            include_baseline (bool | None): **Deprecated.** Will be removed in 0.16.0. Pass
                 ``include_baseline`` to ``initialize_async`` instead.
         """
         self._objective_scorer: TrueFalseScorer = (
@@ -133,12 +133,12 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
-        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # Deprecated constructor-time baseline override. Will be removed in 0.16.0, along with
         # the include_baseline kwarg above.
         if include_baseline is not None:
             print_deprecation_message(
                 old_item="Cyber(include_baseline=...)",
                 new_item="Cyber.initialize_async(include_baseline=...)",
-                removed_in="v0.16.0",
+                removed_in="0.16.0",
             )
             self._legacy_include_baseline = include_baseline
diff --git a/pyrit/scenario/scenarios/airt/jailbreak.py b/pyrit/scenario/scenarios/airt/jailbreak.py
index 92966da085..bdd7aabc15 100644
--- a/pyrit/scenario/scenarios/airt/jailbreak.py
+++ b/pyrit/scenario/scenarios/airt/jailbreak.py
@@ -5,7 +5,7 @@
 from typing import Any, ClassVar, Optional, Union
 
 from pyrit.common import apply_defaults
-from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in 0.16.0.
 from pyrit.datasets import TextJailBreak
 from pyrit.executor.attack.core.attack_config import (
     AttackAdversarialConfig,
@@ -130,7 +130,7 @@ def __init__(
         num_templates: Optional[int] = None,
         num_attempts: int = 1,
         jailbreak_names: list[str] | None = None,
-        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in 0.16.0.
     ) -> None:
         """
         Initialize the jailbreak scenario.
@@ -143,7 +143,7 @@ def __init__(
             num_attempts (Optional[int]): Number of times to try each jailbreak.
             jailbreak_names (Optional[List[str]]): List of jailbreak names from the template list under datasets.
                 to use.
-            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+            include_baseline (bool | None): **Deprecated.** Will be removed in 0.16.0. Pass
                 ``include_baseline`` to ``initialize_async`` instead.
 
         Raises:
@@ -192,13 +192,13 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
-        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # Deprecated constructor-time baseline override. Will be removed in 0.16.0, along with
         # the include_baseline kwarg above.
         if include_baseline is not None:
             print_deprecation_message(
                 old_item="Jailbreak(include_baseline=...)",
                 new_item="Jailbreak.initialize_async(include_baseline=...)",
-                removed_in="v0.16.0",
+                removed_in="0.16.0",
             )
             self._legacy_include_baseline = include_baseline
 
diff --git a/pyrit/scenario/scenarios/airt/scam.py b/pyrit/scenario/scenarios/airt/scam.py
index 30676e74bf..84b57cffb8 100644
--- a/pyrit/scenario/scenarios/airt/scam.py
+++ b/pyrit/scenario/scenarios/airt/scam.py
@@ -6,7 +6,7 @@
 from typing import TYPE_CHECKING, Any, Optional
 
 from pyrit.common import Parameter, apply_defaults
-from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in 0.16.0.
 from pyrit.common.path import (
     EXECUTOR_RED_TEAM_PATH,
     SCORER_SEED_PROMPT_PATH,
@@ -154,7 +154,7 @@ def __init__(
         objective_scorer: Optional[TrueFalseScorer] = None,
         adversarial_chat: Optional[PromptTarget] = None,
         scenario_result_id: Optional[str] = None,
-        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in 0.16.0.
     ) -> None:
         """
         Initialize the ScamScenario.
@@ -165,7 +165,7 @@ def __init__(
             adversarial_chat (Optional[PromptTarget]): Chat target used to rephrase the
                 objective into the role-play context (in single-turn strategies).
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
-            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+            include_baseline (bool | None): **Deprecated.** Will be removed in 0.16.0. Pass
                 ``include_baseline`` to ``initialize_async`` instead.
         """
         if not objective_scorer:
@@ -183,13 +183,13 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
-        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # Deprecated constructor-time baseline override. Will be removed in 0.16.0, along with
         # the include_baseline kwarg above.
         if include_baseline is not None:
             print_deprecation_message(
                 old_item="Scam(include_baseline=...)",
                 new_item="Scam.initialize_async(include_baseline=...)",
-                removed_in="v0.16.0",
+                removed_in="0.16.0",
             )
             self._legacy_include_baseline = include_baseline
 
diff --git a/pyrit/scenario/scenarios/foundry/red_team_agent.py b/pyrit/scenario/scenarios/foundry/red_team_agent.py
index 6a13073882..b9ce521fb4 100644
--- a/pyrit/scenario/scenarios/foundry/red_team_agent.py
+++ b/pyrit/scenario/scenarios/foundry/red_team_agent.py
@@ -16,7 +16,7 @@
 from typing import TYPE_CHECKING, Any, Optional, TypeVar, cast
 
 from pyrit.common import REQUIRED_VALUE, apply_defaults
-from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in 0.16.0.
 from pyrit.datasets import TextJailBreak
 from pyrit.executor.attack import (
     CrescendoAttack,
@@ -247,7 +247,7 @@ def __init__(
         adversarial_chat: Optional[PromptTarget] = None,
         attack_scoring_config: Optional[AttackScoringConfig] = None,
         scenario_result_id: Optional[str] = None,
-        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in 0.16.0.
     ) -> None:
         """
         Initialize a Foundry Scenario with the specified attack strategies.
@@ -260,7 +260,7 @@ def __init__(
                 including the objective scorer and auxiliary scorers. If not provided, creates a default
                 configuration with a composite scorer using Azure Content Filter and SelfAsk Refusal scorers.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
-            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+            include_baseline (bool | None): **Deprecated.** Will be removed in 0.16.0. Pass
                 ``include_baseline`` to ``initialize_async`` instead.
 
         Raises:
@@ -286,13 +286,13 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
-        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # Deprecated constructor-time baseline override. Will be removed in 0.16.0, along with
         # the include_baseline kwarg above.
         if include_baseline is not None:
             print_deprecation_message(
                 old_item="RedTeamAgent(include_baseline=...)",
                 new_item="RedTeamAgent.initialize_async(include_baseline=...)",
-                removed_in="v0.16.0",
+                removed_in="0.16.0",
             )
             self._legacy_include_baseline = include_baseline
 
diff --git a/pyrit/scenario/scenarios/garak/encoding.py b/pyrit/scenario/scenarios/garak/encoding.py
index 8233e4206b..c20ece87b4 100644
--- a/pyrit/scenario/scenarios/garak/encoding.py
+++ b/pyrit/scenario/scenarios/garak/encoding.py
@@ -7,7 +7,7 @@
 from typing import Optional
 
 from pyrit.common import apply_defaults
-from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in v0.16.0.
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in 0.16.0.
 from pyrit.executor.attack.core.attack_config import (
     AttackConverterConfig,
     AttackScoringConfig,
@@ -175,7 +175,7 @@ def __init__(
         objective_scorer: Optional[TrueFalseScorer] = None,
         encoding_templates: Optional[Sequence[str]] = None,
         scenario_result_id: Optional[str] = None,
-        include_baseline: bool | None = None,  # Deprecated. Will be removed in v0.16.0.
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in 0.16.0.
     ) -> None:
         """
         Initialize the Encoding Scenario.
@@ -187,7 +187,7 @@ def __init__(
             encoding_templates (Optional[Sequence[str]]): Templates used to construct the decoding
                 prompts. Defaults to AskToDecodeConverter.garak_templates.
             scenario_result_id (Optional[str]): Optional ID of an existing scenario result to resume.
-            include_baseline (bool | None): **Deprecated.** Will be removed in v0.16.0. Pass
+            include_baseline (bool | None): **Deprecated.** Will be removed in 0.16.0. Pass
                 ``include_baseline`` to ``initialize_async`` instead.
         """
         objective_scorer = objective_scorer or DecodingScorer(categories=["encoding_scenario"])
@@ -202,13 +202,13 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
-        # Deprecated constructor-time baseline override. Will be removed in v0.16.0, along with
+        # Deprecated constructor-time baseline override. Will be removed in 0.16.0, along with
         # the include_baseline kwarg above.
         if include_baseline is not None:
             print_deprecation_message(
                 old_item="Encoding(include_baseline=...)",
                 new_item="Encoding.initialize_async(include_baseline=...)",
-                removed_in="v0.16.0",
+                removed_in="0.16.0",
             )
             self._legacy_include_baseline = include_baseline
 
diff --git a/tests/unit/scenario/test_baseline_deprecation.py b/tests/unit/scenario/test_baseline_deprecation.py
index 4272ebd277..5faf9a6d76 100644
--- a/tests/unit/scenario/test_baseline_deprecation.py
+++ b/tests/unit/scenario/test_baseline_deprecation.py
@@ -2,7 +2,7 @@
 # Licensed under the MIT license.
 
 """
-Deprecated. Will be removed in v0.16.0 along with the corresponding
+Deprecated. Will be removed in 0.16.0 along with the corresponding
 ``include_default_baseline`` / ``include_baseline`` constructor shims in
 ``Scenario`` and its subclasses (``Cyber``, ``Jailbreak``, ``Scam``,
 ``RedTeamAgent``, ``Encoding``).
@@ -87,7 +87,7 @@ def test_base_kwarg_emits_deprecation_warning(self):
         assert len(deprecations) == 1
         msg = str(deprecations[0].message)
         assert "include_default_baseline" in msg
-        assert "v0.16.0" in msg
+        assert "0.16.0" in msg
         assert scenario._legacy_include_baseline is False
 
     def test_base_kwarg_omitted_emits_no_warning(self):
@@ -161,7 +161,7 @@ def test_subclass_kwarg_emits_deprecation_warning(
             w for w in caught if issubclass(w.category, DeprecationWarning) and class_name in str(w.message)
         ]
         assert len(deprecations) >= 1, f"{class_name} did not emit a DeprecationWarning naming the class"
-        assert "v0.16.0" in str(deprecations[0].message)
+        assert "0.16.0" in str(deprecations[0].message)
         assert scenario._legacy_include_baseline is False
 
 
diff --git a/tests/unit/scenario/test_scenario.py b/tests/unit/scenario/test_scenario.py
index 024cb065d3..e7042183d6 100644
--- a/tests/unit/scenario/test_scenario.py
+++ b/tests/unit/scenario/test_scenario.py
@@ -714,7 +714,7 @@ class _LegacyOverrideScenario(ConcreteScenarioWithTrueFalseScorer):
     """Override that does NOT emit baseline — exercises the deprecation rescue path.
 
     Real user scenarios written before the structural fix may follow this pattern;
-    the rescue path warns and injects baseline so they keep working until v0.16.0.
+    the rescue path warns and injects baseline so they keep working until 0.16.0.
     """
 
     async def _get_atomic_attacks_async(self):
@@ -1006,7 +1006,7 @@ def test_raises_when_scorer_is_none(self, mock_objective_target):
 
 @pytest.mark.usefixtures("patch_central_database")
 class TestBaselineEmissionDeprecationRescue:
-    """Deprecation rescue (removed in v0.16.0): overrides that don't emit baseline get a
+    """Deprecation rescue (removed in 0.16.0): overrides that don't emit baseline get a
     DeprecationWarning + auto-injected baseline so they keep working during the migration."""
 
     @staticmethod
@@ -1036,7 +1036,7 @@ async def test_rescue_emits_warning_and_injects_baseline(self, mock_objective_ta
             if issubclass(w.category, DeprecationWarning) and "_get_atomic_attacks_async" in str(w.message)
         ]
         assert len(deprecations) == 1, "rescue should emit exactly one DeprecationWarning naming the method"
-        assert "v0.16.0" in str(deprecations[0].message)
+        assert "0.16.0" in str(deprecations[0].message)
         assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
 
     async def test_well_behaved_override_does_not_trigger_rescue(self, mock_objective_target):

From 3e58bb541b8fc6d40df1cd0a93b8d44f1e6d36f6 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 17:09:19 -0400
Subject: [PATCH 18/19] Trim deprecation rescue old_item to fit line-length

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/core/scenario.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 33728af4c9..9e5fc4b359 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -685,7 +685,7 @@ async def initialize_async(
         # warn and inject. Migrated overrides emit baseline themselves and bypass this branch.
         if include_baseline and (not self._atomic_attacks or self._atomic_attacks[0].atomic_attack_name != "baseline"):
             print_deprecation_message(
-                old_item=f"Implicit baseline injection for {type(self).__name__} overriding _get_atomic_attacks_async()",
+                old_item=f"Implicit baseline injection for {type(self).__name__}._get_atomic_attacks_async()",
                 new_item="explicit emission via self._build_baseline_atomic_attack(seed_groups=...) in the override",
                 removed_in="0.16.0",
             )

From 0286320713d17c1fc0f177690dbeff526751c629 Mon Sep 17 00:00:00 2001
From: Adrian Gavrila <ag941@hotmail.com>
Date: Wed, 13 May 2026 18:47:01 -0400
Subject: [PATCH 19/19] Address PR review: flip Jailbreak/Psychosocial
 defaults, fix rescue, add Psychosocial deprecation shim

Co-authored-by: Copilot <223556219+Copilot@users.noreply.github.com>
---
 pyrit/scenario/core/scenario.py               |  9 ++-
 pyrit/scenario/scenarios/airt/jailbreak.py    |  9 +--
 pyrit/scenario/scenarios/airt/psychosocial.py | 29 +++++++---
 tests/unit/scenario/test_jailbreak.py         | 55 +++++++++++--------
 .../unit/scenario/test_psychosocial_harms.py  | 33 +++++++++++
 5 files changed, 96 insertions(+), 39 deletions(-)

diff --git a/pyrit/scenario/core/scenario.py b/pyrit/scenario/core/scenario.py
index 9e5fc4b359..b82f16af90 100644
--- a/pyrit/scenario/core/scenario.py
+++ b/pyrit/scenario/core/scenario.py
@@ -683,13 +683,20 @@ async def initialize_async(
 
         # Deprecation rescue. Will be removed in 0.16.0. If the override didn't emit baseline,
         # warn and inject. Migrated overrides emit baseline themselves and bypass this branch.
+        # Reuse seeds from the first existing attack rather than re-resolving from
+        # dataset_config; re-resolution under max_dataset_size would draw a fresh sample
+        # (the very ADO 9012 bug this PR fixes). When no atomic attacks exist yet the
+        # rescue falls back to the dataset_config one-time resolution.
         if include_baseline and (not self._atomic_attacks or self._atomic_attacks[0].atomic_attack_name != "baseline"):
             print_deprecation_message(
                 old_item=f"Implicit baseline injection for {type(self).__name__}._get_atomic_attacks_async()",
                 new_item="explicit emission via self._build_baseline_atomic_attack(seed_groups=...) in the override",
                 removed_in="0.16.0",
             )
-            seed_groups = self._dataset_config.get_all_seed_attack_groups()
+            if self._atomic_attacks:
+                seed_groups = self._atomic_attacks[0].seed_groups
+            else:
+                seed_groups = self._dataset_config.get_all_seed_attack_groups()
             self._atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=seed_groups))
 
         # Store original objectives for each atomic attack (before any mutations during execution)
diff --git a/pyrit/scenario/scenarios/airt/jailbreak.py b/pyrit/scenario/scenarios/airt/jailbreak.py
index bdd7aabc15..f69b55d017 100644
--- a/pyrit/scenario/scenarios/airt/jailbreak.py
+++ b/pyrit/scenario/scenarios/airt/jailbreak.py
@@ -2,7 +2,7 @@
 # Licensed under the MIT license.
 
 from pathlib import Path
-from typing import Any, ClassVar, Optional, Union
+from typing import Any, Optional, Union
 
 from pyrit.common import apply_defaults
 from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in 0.16.0.
@@ -23,7 +23,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
+from pyrit.scenario.core.scenario import Scenario
 from pyrit.scenario.core.scenario_strategy import ScenarioStrategy
 from pyrit.scenario.core.scenario_target_defaults import get_default_adversarial_target
 from pyrit.score import (
@@ -81,11 +81,6 @@ class Jailbreak(Scenario):
 
     VERSION: int = 1
 
-    #: Jailbreak runs many templates per objective, so the baseline atomic attack is rarely
-    #: informative relative to the volume of jailbreak templates. Off by default; callers that
-    #: want a comparison can pass ``include_baseline=True`` to ``initialize_async``.
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Disabled
-
     @classmethod
     def get_strategy_class(cls) -> type[ScenarioStrategy]:
         """
diff --git a/pyrit/scenario/scenarios/airt/psychosocial.py b/pyrit/scenario/scenarios/airt/psychosocial.py
index 1bda830f7a..8e7bb0bd5b 100644
--- a/pyrit/scenario/scenarios/airt/psychosocial.py
+++ b/pyrit/scenario/scenarios/airt/psychosocial.py
@@ -4,11 +4,12 @@
 import logging
 import pathlib
 from dataclasses import dataclass
-from typing import Any, ClassVar, Optional, TypeVar
+from typing import Any, Optional, TypeVar
 
 import yaml
 
 from pyrit.common import apply_defaults
+from pyrit.common.deprecation import print_deprecation_message  # Deprecated. Will be removed in 0.16.0.
 from pyrit.common.path import DATASETS_PATH
 from pyrit.executor.attack import (
     AttackAdversarialConfig,
@@ -30,7 +31,7 @@
 from pyrit.scenario.core.atomic_attack import AtomicAttack
 from pyrit.scenario.core.attack_technique import AttackTechnique
 from pyrit.scenario.core.dataset_configuration import DatasetConfiguration
-from pyrit.scenario.core.scenario import BaselinePolicy, Scenario
+from pyrit.scenario.core.scenario import Scenario
 from pyrit.scenario.core.scenario_strategy import (
     ScenarioStrategy,
 )
@@ -147,10 +148,6 @@ class Psychosocial(Scenario):
 
     VERSION: int = 1
 
-    #: Psychosocial measures multi-turn escalation behavior; a single-shot baseline send
-    #: isn't a meaningful comparator, so the default baseline is forbidden.
-    BASELINE_POLICY: ClassVar[BaselinePolicy] = BaselinePolicy.Forbidden
-
     #: Psychosocial runs CrescendoAttack, which requires the target to natively support
     #: editable conversation history (for backtracking). Declared here so the base scenario
     #: validates the target as soon as it is supplied to ``initialize_async``.
@@ -218,6 +215,7 @@ def __init__(
         scenario_result_id: Optional[str] = None,
         subharm_configs: Optional[dict[str, SubharmConfig]] = None,
         max_turns: int = 5,
+        include_baseline: bool | None = None,  # Deprecated. Will be removed in 0.16.0.
     ) -> None:
         """
         Initialize the Psychosocial Harms Scenario.
@@ -249,6 +247,8 @@ def __init__(
 
             max_turns (int): Maximum number of conversation turns for multi-turn attacks (CrescendoAttack).
                 Defaults to 5. Increase for more gradual escalation, decrease for faster testing.
+            include_baseline (bool | None): **Deprecated.** Will be removed in 0.16.0. Pass
+                ``include_baseline`` to ``initialize_async`` instead.
         """
         if objectives is not None:
             logger.warning(
@@ -270,6 +270,16 @@ def __init__(
             scenario_result_id=scenario_result_id,
         )
 
+        # Deprecated constructor-time baseline override. Will be removed in 0.16.0, along with
+        # the include_baseline kwarg above.
+        if include_baseline is not None:
+            print_deprecation_message(
+                old_item="Psychosocial(include_baseline=...)",
+                new_item="Psychosocial.initialize_async(include_baseline=...)",
+                removed_in="0.16.0",
+            )
+            self._legacy_include_baseline = include_baseline
+
         # Store deprecated objectives for later resolution in _resolve_seed_groups
         self._deprecated_objectives = objectives
         # Will be resolved in _get_atomic_attacks_async
@@ -424,7 +434,7 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
 
         scoring_config = self._create_scoring_config(resolved.subharm)
 
-        return [
+        atomic_attacks: list[AtomicAttack] = [
             *self._create_single_turn_attacks(scoring_config=scoring_config, seed_groups=self._seed_groups),
             self._create_multi_turn_attack(
                 scoring_config=scoring_config,
@@ -433,6 +443,11 @@ async def _get_atomic_attacks_async(self) -> list[AtomicAttack]:
             ),
         ]
 
+        if self._include_baseline:
+            atomic_attacks.insert(0, self._build_baseline_atomic_attack(seed_groups=self._seed_groups))
+
+        return atomic_attacks
+
     def _create_scoring_config(self, subharm: Optional[str]) -> AttackScoringConfig:
         subharm_config = self._subharm_configs.get(subharm) if subharm else None
         scorer = self._get_scorer(subharm=subharm) if subharm_config else self._objective_scorer
diff --git a/tests/unit/scenario/test_jailbreak.py b/tests/unit/scenario/test_jailbreak.py
index b8f402b0a2..b30d386140 100644
--- a/tests/unit/scenario/test_jailbreak.py
+++ b/tests/unit/scenario/test_jailbreak.py
@@ -203,35 +203,30 @@ async def test_init_raises_exception_when_no_datasets_available(self, mock_objec
         with pytest.raises(ValueError, match="DatasetConfiguration has no seed_groups"):
             await scenario.initialize_async(objective_target=mock_objective_target)
 
-    def test_class_supports_baseline_but_defaults_off(self):
-        """Jailbreak supports a baseline but does not include one by default."""
-        assert Jailbreak.BASELINE_POLICY is BaselinePolicy.Disabled
+    def test_class_inherits_default_baseline_policy(self):
+        """Jailbreak inherits the base default (Enabled) — baseline included by default."""
+        assert Jailbreak.BASELINE_POLICY is BaselinePolicy.Enabled
 
-    async def test_default_initialize_omits_baseline(
+    async def test_default_initialize_includes_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """initialize_async without include_baseline honors BASELINE_POLICY=Disabled."""
+        """initialize_async without include_baseline honors BASELINE_POLICY=Enabled."""
         with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
             await scenario.initialize_async(objective_target=mock_objective_target)
-            assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
+            assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
 
-    async def test_explicit_include_baseline_true_prepends_baseline(
+    async def test_explicit_include_baseline_false_omits_baseline(
         self, mock_objective_target, mock_objective_scorer, mock_memory_seed_groups
     ):
-        """Caller can override BASELINE_POLICY=Disabled by passing include_baseline=True."""
-        from pyrit.scenario import DatasetConfiguration
-
-        with (
-            patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups),
-            patch.object(DatasetConfiguration, "get_all_seed_attack_groups", return_value=mock_memory_seed_groups),
-        ):
+        """Caller can opt out of baseline by passing include_baseline=False."""
+        with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
             await scenario.initialize_async(
                 objective_target=mock_objective_target,
-                include_baseline=True,
+                include_baseline=False,
             )
-            assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+            assert not any(a.atomic_attack_name == "baseline" for a in scenario._atomic_attacks)
 
 
 @pytest.mark.usefixtures(*FIXTURES)
@@ -273,7 +268,9 @@ async def test_attack_generation_for_complex(
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
 
             await scenario.initialize_async(
-                objective_target=mock_objective_target, scenario_strategies=[complex_jailbreak_strategy]
+                objective_target=mock_objective_target,
+                scenario_strategies=[complex_jailbreak_strategy],
+                include_baseline=False,
             )
             atomic_attacks = await scenario._get_atomic_attacks_async()
             for run in atomic_attacks:
@@ -289,7 +286,9 @@ async def test_attack_generation_for_manyshot(
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
 
             await scenario.initialize_async(
-                objective_target=mock_objective_target, scenario_strategies=[manyshot_jailbreak_strategy]
+                objective_target=mock_objective_target,
+                scenario_strategies=[manyshot_jailbreak_strategy],
+                include_baseline=False,
             )
             atomic_attacks = await scenario._get_atomic_attacks_async()
             for run in atomic_attacks:
@@ -303,7 +302,9 @@ async def test_attack_generation_for_promptsending(
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
 
             await scenario.initialize_async(
-                objective_target=mock_objective_target, scenario_strategies=[promptsending_jailbreak_strategy]
+                objective_target=mock_objective_target,
+                scenario_strategies=[promptsending_jailbreak_strategy],
+                include_baseline=False,
             )
             atomic_attacks = await scenario._get_atomic_attacks_async()
             for run in atomic_attacks:
@@ -317,7 +318,9 @@ async def test_attack_generation_for_skeleton(
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
 
             await scenario.initialize_async(
-                objective_target=mock_objective_target, scenario_strategies=[skeleton_jailbreak_attack]
+                objective_target=mock_objective_target,
+                scenario_strategies=[skeleton_jailbreak_attack],
+                include_baseline=False,
             )
             atomic_attacks = await scenario._get_atomic_attacks_async()
             for run in atomic_attacks:
@@ -331,7 +334,9 @@ async def test_attack_generation_for_roleplay(
             scenario = Jailbreak(objective_scorer=mock_objective_scorer)
 
             await scenario.initialize_async(
-                objective_target=mock_objective_target, scenario_strategies=[roleplay_jailbreak_strategy]
+                objective_target=mock_objective_target,
+                scenario_strategies=[roleplay_jailbreak_strategy],
+                include_baseline=False,
             )
             atomic_attacks = await scenario._get_atomic_attacks_async()
             for run in atomic_attacks:
@@ -393,11 +398,11 @@ async def test_custom_num_attempts(
         """Test that n successfully tries each jailbreak template n-many times."""
         with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             base_scenario = Jailbreak(objective_scorer=mock_objective_scorer)
-            await base_scenario.initialize_async(objective_target=mock_objective_target)
+            await base_scenario.initialize_async(objective_target=mock_objective_target, include_baseline=False)
             atomic_attacks_1 = await base_scenario._get_atomic_attacks_async()
 
             mult_scenario = Jailbreak(objective_scorer=mock_objective_scorer, num_attempts=mock_random_num_attempts)
-            await mult_scenario.initialize_async(objective_target=mock_objective_target)
+            await mult_scenario.initialize_async(objective_target=mock_objective_target, include_baseline=False)
             atomic_attacks_n = await mult_scenario._get_atomic_attacks_async()
 
             assert len(atomic_attacks_1) * mock_random_num_attempts == len(atomic_attacks_n)
@@ -512,7 +517,9 @@ async def test_roleplay_attacks_share_adversarial_target(
         with patch.object(Jailbreak, "_resolve_seed_groups", return_value=mock_memory_seed_groups):
             scenario = Jailbreak(objective_scorer=mock_objective_scorer, num_templates=2)
             await scenario.initialize_async(
-                objective_target=mock_objective_target, scenario_strategies=[roleplay_jailbreak_strategy]
+                objective_target=mock_objective_target,
+                scenario_strategies=[roleplay_jailbreak_strategy],
+                include_baseline=False,
             )
             atomic_attacks = await scenario._get_atomic_attacks_async()
             assert len(atomic_attacks) >= 2
diff --git a/tests/unit/scenario/test_psychosocial_harms.py b/tests/unit/scenario/test_psychosocial_harms.py
index a8e3325765..ce16363ade 100644
--- a/tests/unit/scenario/test_psychosocial_harms.py
+++ b/tests/unit/scenario/test_psychosocial_harms.py
@@ -393,3 +393,36 @@ def test_aggregate_tags(self):
     def test_strategy_values(self):
         """Test that strategy values are correct."""
         assert PsychosocialStrategy.ALL.value == "all"
+
+
+@pytest.mark.usefixtures(*FIXTURES)
+class TestPsychosocialBaselineUniformity:
+    """ADO 9012 regression: baseline shares objectives with strategies under max_dataset_size."""
+
+    async def test_one_resolution_call_baseline_matches_strategies(self, mock_objective_target, mock_objective_scorer):
+        from pyrit.scenario import DatasetConfiguration
+
+        seed_groups = [SeedGroup(seeds=[SeedObjective(value=f"obj{i}")]) for i in range(10)]
+        config = DatasetConfiguration(seed_groups=seed_groups, max_dataset_size=3)
+
+        first_sample = seed_groups[:3]
+        second_sample = seed_groups[5:8]
+        with (
+            patch.object(Psychosocial, "_extract_harm_category_filter", return_value=None),
+            patch(
+                "pyrit.scenario.core.dataset_configuration.random.sample",
+                side_effect=[first_sample, second_sample],
+            ) as mock_sample,
+        ):
+            scenario = Psychosocial(objective_scorer=mock_objective_scorer)
+            await scenario.initialize_async(
+                objective_target=mock_objective_target,
+                dataset_config=config,
+                include_baseline=True,
+            )
+
+        assert mock_sample.call_count == 1
+        assert scenario._atomic_attacks[0].atomic_attack_name == "baseline"
+        baseline_objs = set(scenario._atomic_attacks[0].objectives)
+        for attack in scenario._atomic_attacks[1:]:
+            assert set(attack.objectives) == baseline_objs