Source code for pyrit.scenario.core.scenario

# Copyright (c) Microsoft Corporation.
# Licensed under the MIT license.

"""
Scenario class for grouping and executing multiple AtomicAttacks.

This module provides the Scenario class that orchestrates the execution of multiple
AtomicAttack instances sequentially, enabling comprehensive security testing campaigns.
"""

import asyncio
import logging
import uuid
from abc import ABC, abstractmethod
from typing import Dict, List, Optional, Sequence, Set, Type, Union

from tqdm.auto import tqdm

from pyrit.common import REQUIRED_VALUE, apply_defaults
from pyrit.executor.attack.single_turn.prompt_sending import PromptSendingAttack
from pyrit.memory import CentralMemory
from pyrit.memory.memory_models import ScenarioResultEntry
from pyrit.models import AttackResult
from pyrit.models.scenario_result import ScenarioIdentifier, ScenarioResult
from pyrit.prompt_target import PromptTarget
from pyrit.scenario.core.atomic_attack import AtomicAttack
from pyrit.scenario.core.scenario_strategy import (
    ScenarioCompositeStrategy,
    ScenarioStrategy,
)

logger = logging.getLogger(__name__)



[docs]
class Scenario(ABC):
    """
    Groups and executes multiple AtomicAttack instances sequentially.

    A Scenario represents a comprehensive testing campaign composed of multiple
    atomic attack tests (AtomicAttacks). It executes each AtomicAttack in sequence and
    aggregates the results into a ScenarioResult that is persisted in memory, which
    allows an interrupted run to be resumed.

    Subclasses must implement the ``get_strategy_class`` and ``get_default_strategy``
    classmethods as well as ``_get_atomic_attacks_async``.

    Example:
        >>> from pyrit.scenario import Scenario, AtomicAttack
        >>> from pyrit.executor.attack.single_turn.prompt_sending import PromptSendingAttack
        >>> from pyrit.prompt_target import OpenAIChatTarget
        >>> from pyrit.prompt_converter import Base64Converter
        >>>
        >>> target = OpenAIChatTarget()
        >>>
        >>> # Create a custom scenario subclass
        >>> # (MyStrategy is a ScenarioStrategy enum assumed to be defined elsewhere)
        >>> class MyScenario(Scenario):
        ...     @classmethod
        ...     def get_strategy_class(cls) -> Type[ScenarioStrategy]:
        ...         return MyStrategy
        ...
        ...     @classmethod
        ...     def get_default_strategy(cls) -> ScenarioStrategy:
        ...         return MyStrategy.ALL
        ...
        ...     async def _get_atomic_attacks_async(self) -> List[AtomicAttack]:
        ...         base64_attack = PromptSendingAttack(
        ...             objective_target=target,
        ...             converters=[Base64Converter()]
        ...         )
        ...         return [
        ...             AtomicAttack(
        ...                 atomic_attack_name="base64",
        ...                 attack=base64_attack,
        ...                 objectives=["Tell me how to make a bomb"]
        ...             )
        ...         ]
        >>>
        >>> # Create and execute scenario
        >>> scenario = MyScenario(
        ...     name="Security Test Campaign",
        ...     version=1,
        ...     strategy_class=MyStrategy
        ... )
        >>> await scenario.initialize_async(objective_target=target)
        >>> result = await scenario.run_async()
        >>> # attack_results maps each atomic attack name to its list of results
        >>> print(f"Completed {len(result.attack_results)} atomic attacks")
    """


[docs]
    def __init__(
        self,
        *,
        name: str,
        version: int,
        strategy_class: Type[ScenarioStrategy],
        objective_scorer_identifier: Optional[Dict[str, str]] = None,
        include_default_baseline: bool = True,
        scenario_result_id: Optional[Union[uuid.UUID, str]] = None,
    ) -> None:
        """
        Set up the static configuration of a scenario.

        Nothing is executed and no atomic attacks are built here; that happens in
        initialize_async(), which calls the subclass's _get_atomic_attacks_async().

        Args:
            name (str): Descriptive display name for the scenario (exposed via ``name``).
            version (int): Version number of the scenario, recorded in the scenario identifier.
            strategy_class (Type[ScenarioStrategy]): The strategy enum class for this scenario.
            objective_scorer_identifier (Optional[Dict[str, str]]): Identifier for the objective scorer.
                An empty dict is stored when omitted.
            include_default_baseline (bool): Whether initialize_async() should prepend a baseline
                atomic attack that sends the objectives of the first atomic attack without
                modifications. Subclasses that provide their own baseline can disable it.
                Defaults to True.
            scenario_result_id (Optional[Union[uuid.UUID, str]]): ID of an existing scenario result
                to resume, given as a UUID or its string form. It is stored as a string and looked
                up in memory during initialize_async().

        Note:
            The scenario identifier uses the concrete class name (not ``name``) and takes its
            description from the concrete class's docstring with whitespace collapsed to single
            spaces; the description is empty when the class has no docstring.
        """
        # Collapse all runs of whitespace in the subclass docstring into single spaces.
        class_doc = self.__class__.__doc__
        if class_doc:
            description = " ".join(class_doc.split())
        else:
            description = ""

        self._identifier = ScenarioIdentifier(
            name=type(self).__name__,
            scenario_version=version,
            description=description,
        )

        # Constructor-provided configuration.
        self._strategy_class = strategy_class
        self._objective_scorer_identifier = objective_scorer_identifier or {}
        self._name = name

        # Placeholders that initialize_async() overwrites with the real run settings.
        self._objective_target: Optional[PromptTarget] = None
        self._objective_target_identifier: Optional[Dict[str, str]] = None
        self._memory_labels: Dict[str, str] = {}
        self._max_concurrency: int = 1
        self._max_retries: int = 0

        self._memory = CentralMemory.get_memory_instance()
        self._atomic_attacks: List[AtomicAttack] = []

        # Normalise the resume ID to a string; falsy input means "start fresh".
        resume_id = str(scenario_result_id) if scenario_result_id else None
        self._scenario_result_id: Optional[str] = resume_id

        # Serialises writes of attack results to the stored scenario result.
        self._result_lock = asyncio.Lock()

        self._include_baseline = include_default_baseline

        # Prepared strategy composites, available to _get_atomic_attacks_async.
        self._scenario_composites: List[ScenarioCompositeStrategy] = []

        # atomic_attack_name -> objectives as they were right after initialization,
        # so resumption can diff against them even after objectives are narrowed.
        self._original_objectives_map: Dict[str, tuple[str, ...]] = {}


    @property
    def name(self) -> str:
        """
        Get the display name of the scenario.

        This is the ``name`` value passed to the constructor; the scenario identifier
        separately records the concrete class name.
        """
        return self._name

    @property
    def atomic_attack_count(self) -> int:
        """
        Get the number of atomic attacks in this scenario.

        The list is empty until initialize_async() has populated it, so this is 0
        on a freshly constructed scenario.
        """
        return len(self._atomic_attacks)


[docs]
    @classmethod
    @abstractmethod
    def get_strategy_class(cls) -> Type[ScenarioStrategy]:
        """
        Get the strategy enum class for this scenario.

        This abstract classmethod must be implemented by all scenario subclasses to return
        the ScenarioStrategy enum class that defines the available attack strategies
        for the scenario. Being a classmethod, it can be called without creating a
        scenario instance.

        Returns:
            Type[ScenarioStrategy]: The strategy enum class (e.g., FoundryStrategy, EncodingStrategy).

        Example:
            >>> class MyScenario(Scenario):
            ...     @classmethod
            ...     def get_strategy_class(cls) -> Type[ScenarioStrategy]:
            ...         return MyStrategy
            >>>
            >>> # Strategies can be discovered without instantiation
            >>> strategy_class = MyScenario.get_strategy_class()
            >>> all_strategies = list(strategy_class)
        """
        pass



[docs]
    @classmethod
    @abstractmethod
    def get_default_strategy(cls) -> ScenarioStrategy:
        """
        Get the default strategy used when no strategies are specified.

        This abstract classmethod must be implemented by all scenario subclasses to return
        the default aggregate strategy (like EASY, ALL). initialize_async() passes the
        returned value as ``default_aggregate`` when preparing the scenario strategies,
        so it applies when the ``scenario_strategies`` parameter is None.

        Returns:
            ScenarioStrategy: The default aggregate strategy (e.g., FoundryStrategy.EASY, EncodingStrategy.ALL).

        Example:
            >>> class MyScenario(Scenario):
            ...     @classmethod
            ...     def get_default_strategy(cls) -> ScenarioStrategy:
            ...         return MyStrategy.EASY
            >>>
            >>> # The default strategy can be discovered without instantiation
            >>> default = MyScenario.get_default_strategy()
        """
        pass



[docs]
    @apply_defaults
    async def initialize_async(
        self,
        *,
        objective_target: PromptTarget = REQUIRED_VALUE,  # type: ignore
        scenario_strategies: Optional[Sequence[ScenarioStrategy | ScenarioCompositeStrategy]] = None,
        max_concurrency: int = 1,
        max_retries: int = 0,
        memory_labels: Optional[Dict[str, str]] = None,
    ) -> None:
        """
        Build the atomic attacks and attach the scenario to a ScenarioResult in memory.

        The method stores the run settings, prepares the strategy composites, asks the
        subclass for its atomic attacks, optionally prepends a baseline attack, and
        snapshots each attack's objectives. It then either resumes an existing scenario
        result or creates a new one:

        * If a scenario_result_id was given to __init__, it is looked up in memory and
          validated against the current scenario name and version. On a match the stored
          result is reused and no new result is created.
        * If the ID is not found or validation fails, the ID is discarded and a fresh
          scenario result in state "CREATED" is written to memory.

        Args:
            objective_target (PromptTarget): The target system to attack.
            scenario_strategies (Optional[Sequence[ScenarioStrategy | ScenarioCompositeStrategy]]):
                The strategies to execute, as bare ScenarioStrategy enums and/or
                ScenarioCompositeStrategy instances. They are handed to the strategy class's
                prepare_scenario_strategies together with the scenario's default strategy.
            max_concurrency (int): Maximum number of concurrent attack executions. Defaults to 1.
            max_retries (int): Maximum number of automatic retries when run_async() hits an
                exception. 0 (default) disables retries; e.g. max_retries=3 allows up to
                4 total attempts (1 initial + 3 retries).
            memory_labels (Optional[Dict[str, str]]): Additional labels applied to the scenario
                result and the baseline attack. Defaults to an empty dict.

        Raises:
            ValueError: If objective_target is None.
            ValueError: If a baseline is requested but cannot be derived from the first
                atomic attack.

        Example:
            >>> scenario = MyScenario(name="Security Test", version=1, strategy_class=MyStrategy)
            >>> await scenario.initialize_async(
            ...     objective_target=target,
            ...     scenario_strategies=[MyStrategy.Base64, MyStrategy.ROT13]
            ... )
            >>> results = await scenario.run_async()
            >>>
            >>> # Resume the same scenario later
            >>> resumed_scenario = MyScenario(
            ...     name="Security Test",
            ...     version=1,
            ...     strategy_class=MyStrategy,
            ...     scenario_result_id=str(results.id)
            ... )
            >>> await resumed_scenario.initialize_async(
            ...     objective_target=target,
            ...     scenario_strategies=[MyStrategy.Base64, MyStrategy.ROT13]
            ... )
            >>> results = await resumed_scenario.run_async()  # Skips completed objectives
        """
        if objective_target is None:
            raise ValueError(
                "objective_target is required. "
                "Provide it either as a parameter or via set_default_value() in an initialization script."
            )

        # Record the run settings on the instance.
        self._objective_target = objective_target
        self._objective_target_identifier = objective_target.get_identifier()
        self._max_concurrency = max_concurrency
        self._max_retries = max_retries
        self._memory_labels = memory_labels or {}

        # Composites must exist before the subclass builds its attacks from them.
        self._scenario_composites = self._strategy_class.prepare_scenario_strategies(
            scenario_strategies, default_aggregate=self.get_default_strategy()
        )

        self._atomic_attacks = await self._get_atomic_attacks_async()

        if self._include_baseline:
            # The baseline is derived from the current first attack and goes in front of it.
            self._atomic_attacks.insert(0, self._get_baseline_from_first_attack())

        # Snapshot objectives now; execution may later narrow an attack's objective list.
        objectives_snapshot: Dict[str, tuple[str, ...]] = {}
        for attack in self._atomic_attacks:
            attack_name = attack.atomic_attack_name
            objectives_snapshot[attack_name] = tuple(attack._objectives)
        self._original_objectives_map = objectives_snapshot

        # Resume path: keep the stored result if it exists and matches this scenario.
        if self._scenario_result_id:
            stored_results = self._memory.get_scenario_results(scenario_result_ids=[self._scenario_result_id])

            if not stored_results:
                logger.warning(
                    f"Scenario result ID {self._scenario_result_id} not found in memory. "
                    f"Creating new scenario result."
                )
            elif self._validate_stored_scenario(stored_result=stored_results[0]):
                return  # Valid match - nothing more to create

            # Missing or mismatched: forget the ID and fall through to creation.
            self._scenario_result_id = None

        # Fresh path: one empty result list per atomic attack.
        empty_results: Dict[str, List[AttackResult]] = {
            attack.atomic_attack_name: [] for attack in self._atomic_attacks
        }

        new_result = ScenarioResult(
            scenario_identifier=self._identifier,
            objective_target_identifier=self._objective_target_identifier,
            objective_scorer_identifier=self._objective_scorer_identifier,
            labels=self._memory_labels,
            attack_results=empty_results,
            scenario_run_state="CREATED",
        )

        self._memory.add_scenario_results_to_memory(scenario_results=[new_result])
        self._scenario_result_id = str(new_result.id)
        logger.info(f"Created new scenario result with ID: {self._scenario_result_id}")


    def _get_baseline_from_first_attack(self) -> AtomicAttack:
        """
        Get a baseline AtomicAttack, which simply sends all the objectives without any modifications.

        The baseline reuses the objectives, scoring configuration and objective target of
        the first atomic attack currently in the scenario, and wraps them in a plain
        PromptSendingAttack named "baseline".

        Returns:
            AtomicAttack: The baseline AtomicAttack instance.

        Raises:
            ValueError: If no atomic attacks are available to derive baseline from.
            ValueError: If the first atomic attack has no objectives, no objective target,
                or no attack scoring config.
        """
        # An empty list is falsy, so a single truthiness test covers both None and [].
        if not self._atomic_attacks:
            raise ValueError("No atomic attacks available to derive baseline from.")

        first_attack = self._atomic_attacks[0]

        # Copy objectives, scoring, target from the first attack
        objectives = first_attack.objectives
        attack_scoring_config = first_attack._attack.get_attack_scoring_config()
        objective_target = first_attack._attack.get_objective_target()

        if not objectives:
            raise ValueError("First atomic attack must have objectives to create baseline.")

        if not objective_target:
            raise ValueError("Objective target is required to create baseline attack.")

        if not attack_scoring_config:
            raise ValueError("Attack scoring config is required to create baseline attack.")

        # Create baseline attack with no converters
        attack = PromptSendingAttack(
            objective_target=objective_target,
            attack_scoring_config=attack_scoring_config,
        )

        return AtomicAttack(
            atomic_attack_name="baseline",
            attack=attack,
            objectives=objectives,
            memory_labels=self._memory_labels,
        )

    def _validate_stored_scenario(self, *, stored_result: ScenarioResult) -> bool:
        """
        Check whether a stored scenario result belongs to this scenario.

        Only the identifier's name and version are compared, name first. A mismatch is
        logged as a warning; a match is logged as a resumption.

        Args:
            stored_result (ScenarioResult): The scenario result retrieved from memory.

        Returns:
            bool: True if name and version both match the current scenario, False otherwise.
        """
        stored_name = stored_result.scenario_identifier.name
        stored_version = stored_result.scenario_identifier.version
        current = self._identifier

        # Describe the first mismatch found, if any; otherwise report the resumption.
        if stored_name != current.name:
            mismatch = f"name: stored='{stored_name}', current='{current.name}'"
        elif stored_version != current.version:
            mismatch = f"version: stored={stored_version}, current={current.version}"
        else:
            logger.info(
                f"Resuming scenario '{self._name}' from existing result "
                f"(ID: {self._scenario_result_id}, state: {stored_result.scenario_run_state})"
            )
            return True

        logger.warning(
            f"Scenario result ID {self._scenario_result_id} has mismatched {mismatch}. "
            f"Creating new scenario result."
        )
        return False

    def _get_completed_objectives_for_attack(self, *, atomic_attack_name: str) -> Set[str]:
        """
        Collect the objectives already recorded for one atomic attack.

        The stored scenario result is read from memory and the ``objective`` of every
        result filed under the given attack name is gathered. This is best-effort: any
        exception during the lookup is logged as a warning and treated as "nothing
        completed".

        Args:
            atomic_attack_name (str): The name of the atomic attack to check.

        Returns:
            Set[str]: Objectives with a stored result; empty if there is no scenario
                result ID, no stored result, no entry for this attack, or the lookup failed.
        """
        if not self._scenario_result_id:
            return set()

        try:
            stored = self._memory.get_scenario_results(scenario_result_ids=[self._scenario_result_id])
            if not stored:
                return set()

            results_by_attack = stored[0].attack_results
            if atomic_attack_name not in results_by_attack:
                return set()

            return {attack_result.objective for attack_result in results_by_attack[atomic_attack_name]}
        except Exception as e:
            logger.warning(
                f"Failed to retrieve completed objectives for atomic attack '{atomic_attack_name}': {str(e)}"
            )
            return set()

    async def _get_remaining_atomic_attacks_async(self) -> List[AtomicAttack]:
        """
        Determine which atomic attacks still have work to do.

        For each atomic attack, the objectives snapshotted at initialization are compared
        with the objectives already recorded in the stored scenario result. Attacks with
        nothing left are dropped; the others have their objective list replaced by the
        remaining objectives (in original order) and are returned.

        Returns:
            List[AtomicAttack]: Atomic attacks with uncompleted objectives. If no scenario
                result ID is set, the full list of atomic attacks is returned unchanged.
        """
        if not self._scenario_result_id:
            # Nothing stored to compare against.
            return self._atomic_attacks

        pending_attacks: List[AtomicAttack] = []

        for attack in self._atomic_attacks:
            done = self._get_completed_objectives_for_attack(atomic_attack_name=attack.atomic_attack_name)

            # Always diff against the initialization-time snapshot, not the attack's
            # current objective list, which an earlier pass may already have narrowed.
            snapshot = self._original_objectives_map.get(attack.atomic_attack_name, ())
            pending = [objective for objective in snapshot if objective not in done]

            if not pending:
                logger.info(
                    f"Atomic attack '{attack.atomic_attack_name}' has all objectives completed, skipping"
                )
                continue

            if len(pending) < len(snapshot):
                logger.info(
                    f"Atomic attack '{attack.atomic_attack_name}' has "
                    f"{len(pending)}/{len(snapshot)} objectives remaining"
                )

            # Narrow the attack so that it only runs what is still outstanding.
            attack._objectives = pending
            pending_attacks.append(attack)

        return pending_attacks

    async def _update_scenario_result_async(
        self, *, atomic_attack_name: str, attack_results: List[AttackResult]
    ) -> None:
        """
        Append new attack results to the stored scenario result.

        Writes are serialised through the instance's asyncio lock, so concurrent
        coroutines calling this method update memory one at a time. A failed write is
        logged as an error and not raised; without a scenario result ID the call only
        logs a warning.

        Args:
            atomic_attack_name (str): The name of the atomic attack.
            attack_results (List[AttackResult]): The list of new attack results to add.
        """
        if not self._scenario_result_id:
            logger.warning("Cannot update scenario result: no scenario result ID available")
            return

        async with self._result_lock:
            saved = self._memory.add_attack_results_to_scenario(
                scenario_result_id=self._scenario_result_id,
                atomic_attack_name=atomic_attack_name,
                attack_results=attack_results,
            )

            if saved:
                return

            logger.error(
                f"Failed to update scenario result with {len(attack_results)} results "
                f"for atomic attack '{atomic_attack_name}'"
            )

    @abstractmethod
    async def _get_atomic_attacks_async(self) -> List[AtomicAttack]:
        """
        Retrieve the list of AtomicAttack instances in this scenario.

        This abstract method must be implemented by subclasses. It is async so that
        implementations can perform async operations needed to build or fetch the
        atomic attacks. initialize_async() awaits it after the run settings and the
        prepared strategy composites have been stored on the instance.

        Returns:
            List[AtomicAttack]: The list of AtomicAttack instances in this scenario.
        """
        pass


[docs]
    async def run_async(self) -> ScenarioResult:
        """
        Execute all atomic attacks in the scenario sequentially.

        Each AtomicAttack is executed in order, and all results are aggregated
        into a ScenarioResult containing the scenario metadata and all attack results.
        This method supports resumption - if the scenario raises an exception partway through,
        calling run_async again will skip already-completed objectives.

        If max_retries is set, the scenario will automatically retry after an exception up to
        the specified number of times. Each retry will resume from where it left off,
        skipping completed objectives.

        Returns:
            ScenarioResult: Contains scenario identifier and aggregated list of all
                attack results from all atomic attacks.

        Raises:
            ValueError: If the scenario has no atomic attacks configured or has no scenario
                result ID. Call await scenario.initialize_async() first.
            Exception: The exception raised by the last execution attempt is re-raised
                unchanged once all retry attempts are exhausted.
            RuntimeError: If no execution attempt was made at all (only possible when
                max_retries is negative).

        Example:
            >>> result = await scenario.run_async()
            >>> print(f"Scenario: {result.scenario_identifier.name}")
            >>> print(f"Total results: {len(result.attack_results)}")
        """
        if not self._atomic_attacks:
            # Adjacent literals are concatenated verbatim, so the separating space must be explicit.
            raise ValueError(
                "Cannot run scenario with no atomic attacks. Either supply them in initialization or "
                "call await scenario.initialize_async() first."
            )

        if not self._scenario_result_id:
            raise ValueError("Scenario not properly initialized. Call await scenario.initialize_async() first.")

        # Type narrowing: create local variable that type checker knows is non-None
        scenario_result_id: str = self._scenario_result_id

        for retry_attempt in range(self._max_retries + 1):  # +1 for initial attempt
            try:
                return await self._execute_scenario_async()
            except Exception as e:
                # Prefer the persisted try counter for the log message; fall back to the
                # loop index if the stored result cannot be found.
                scenario_results = self._memory.get_scenario_results(scenario_result_ids=[scenario_result_id])
                current_tries = scenario_results[0].number_tries if scenario_results else retry_attempt + 1

                remaining_retries = self._max_retries - retry_attempt

                if remaining_retries <= 0:
                    # No more retries, log final failure and surface the original exception
                    logger.error(
                        f"Scenario '{self._name}' failed after {current_tries} attempts "
                        f"(initial + {self._max_retries} retries) with error: {str(e)}. Giving up.",
                        exc_info=True,
                    )
                    raise

                logger.error(
                    f"Scenario '{self._name}' failed on attempt {current_tries} with error: {str(e)}. "
                    f"Retrying... ({remaining_retries} retries remaining)",
                    exc_info=True,
                )

        # Every loop iteration either returns or raises on its last pass, so this is only
        # reached when the loop body never ran.
        raise RuntimeError(f"Scenario '{self._name}' completed unexpectedly without result")


    async def _execute_scenario_async(self) -> ScenarioResult:
        """
        Perform a single execution attempt of the scenario.

        This method contains the core execution logic and can be called multiple times
        for retry attempts. In order, it:

        1. Increments ``number_tries`` on the stored scenario result.
        2. Computes the atomic attacks that still have objectives to run. If there are
           none, marks the scenario "COMPLETED" and returns the stored result.
        3. Marks the scenario "IN_PROGRESS" and runs the remaining atomic attacks one
           after another, persisting completed results after each attack.
        4. On the first atomic attack with incomplete objectives (or any other exception),
           marks the scenario "FAILED" and raises.
        5. Otherwise marks the scenario "COMPLETED" and returns the stored result.

        Returns:
            ScenarioResult: The result of this execution attempt, re-read from memory.

        Raises:
            Exception: Any exception that occurs during scenario execution.
            ValueError: If a lookup for a scenario for a given ID fails.
            ValueError: If atomic attack execution fails (an atomic attack reports
                incomplete objectives); chained from the first objective's exception.
        """
        logger.info(f"Starting scenario '{self._name}' execution with {len(self._atomic_attacks)} atomic attacks")

        # Type narrowing: _scenario_result_id is guaranteed to be non-None at this point
        # (verified in run_async before calling this method)
        assert self._scenario_result_id is not None
        scenario_result_id: str = self._scenario_result_id

        # Increment number_tries at the start of each run and persist it, so the counter
        # reflects every attempt (including ones that later fail).
        scenario_results = self._memory.get_scenario_results(scenario_result_ids=[scenario_result_id])
        if scenario_results:
            current_scenario = scenario_results[0]
            current_scenario.number_tries += 1
            entry = ScenarioResultEntry(entry=current_scenario)
            self._memory._update_entry(entry)
            logger.info(f"Scenario '{self._name}' attempt #{current_scenario.number_tries}")
        else:
            raise ValueError(f"Scenario result with ID {scenario_result_id} not found")

        # Get remaining atomic attacks (filters out completed ones and updates objectives)
        remaining_attacks = await self._get_remaining_atomic_attacks_async()

        if not remaining_attacks:
            # Everything was already done in an earlier attempt.
            logger.info(f"Scenario '{self._name}' has no remaining objectives to execute")
            # Mark scenario as completed
            self._memory.update_scenario_run_state(
                scenario_result_id=scenario_result_id, scenario_run_state="COMPLETED"
            )
            # Retrieve and return the current scenario result
            scenario_results = self._memory.get_scenario_results(scenario_result_ids=[scenario_result_id])
            if scenario_results:
                return scenario_results[0]
            else:
                raise ValueError(f"Scenario result with ID {scenario_result_id} not found")

        logger.info(
            f"Scenario '{self._name}' has {len(remaining_attacks)} atomic attacks "
            f"with remaining objectives (out of {len(self._atomic_attacks)} total)"
        )

        # Mark scenario as in progress
        self._memory.update_scenario_run_state(scenario_result_id=scenario_result_id, scenario_run_state="IN_PROGRESS")

        # Number of atomic attacks that are already fully completed; used so the progress
        # bar and the "i/total" log counter continue from where a previous attempt stopped.
        completed_count = len(self._atomic_attacks) - len(remaining_attacks)

        try:
            # i is a 1-based position among ALL atomic attacks, not just the remaining ones.
            for i, atomic_attack in enumerate(
                tqdm(
                    remaining_attacks,
                    desc=f"Executing {self._name}",
                    unit="attack",
                    total=len(self._atomic_attacks),
                    initial=completed_count,
                ),
                start=completed_count + 1,
            ):
                logger.info(
                    f"Executing atomic attack {i}/{len(self._atomic_attacks)} "
                    f"('{atomic_attack.atomic_attack_name}') in scenario '{self._name}'"
                )

                try:
                    # return_partial_on_failure=True is passed so that the returned object can
                    # carry both completed results and incomplete objectives (both are read below).
                    atomic_results = await atomic_attack.run_async(
                        max_concurrency=self._max_concurrency, return_partial_on_failure=True
                    )

                    # Always save completed results, even if some objectives didn't complete,
                    # so a retry or later resume does not repeat them.
                    if atomic_results.completed_results:
                        await self._update_scenario_result_async(
                            atomic_attack_name=atomic_attack.atomic_attack_name,
                            attack_results=atomic_results.completed_results,
                        )

                    # Check if there were any incomplete objectives
                    if atomic_results.has_incomplete:
                        incomplete_count = len(atomic_results.incomplete_objectives)
                        # NOTE: this rebinds the outer completed_count to a per-attack value.
                        # It does not affect the loop counter or progress bar (both were set up
                        # before the loop) and this branch always ends in a raise.
                        completed_count = len(atomic_results.completed_results)

                        logger.error(
                            f"Atomic attack {i}/{len(self._atomic_attacks)} "
                            f"('{atomic_attack.atomic_attack_name}') partially completed: "
                            f"{completed_count} completed, {incomplete_count} incomplete"
                        )

                        # Log details of each incomplete objective; each entry is an
                        # (objective, exception) pair and the objective is cut to 50 characters.
                        for obj, exc in atomic_results.incomplete_objectives:
                            logger.error(f"  Incomplete objective '{obj[:50]}...': {str(exc)}")

                        # Mark scenario as failed
                        self._memory.update_scenario_run_state(
                            scenario_result_id=scenario_result_id, scenario_run_state="FAILED"
                        )

                        # Raise exception with detailed information, chained from the first
                        # objective's exception. This stops the scenario at the first failing
                        # atomic attack; later attacks are not executed in this attempt.
                        raise ValueError(
                            f"Failed to execute atomic attack {i} ('{atomic_attack.atomic_attack_name}') "
                            f"in scenario '{self._name}': {incomplete_count} of {incomplete_count + completed_count} "
                            f"objectives incomplete. First failure: {atomic_results.incomplete_objectives[0][1]}"
                        ) from atomic_results.incomplete_objectives[0][1]
                    else:
                        logger.info(
                            f"Atomic attack {i}/{len(self._atomic_attacks)} completed successfully with "
                            f"{len(atomic_results.completed_results)} results"
                        )

                except Exception as e:
                    # Exception was raised either by run_async or by our check above
                    logger.error(
                        f"Atomic attack {i}/{len(self._atomic_attacks)} "
                        f"('{atomic_attack.atomic_attack_name}') failed in scenario '{self._name}': {str(e)}"
                    )

                    # Mark scenario as failed if not already done (the incomplete-objectives
                    # branch above has already set FAILED before raising).
                    scenario_results = self._memory.get_scenario_results(scenario_result_ids=[scenario_result_id])
                    if scenario_results and scenario_results[0].scenario_run_state != "FAILED":
                        self._memory.update_scenario_run_state(
                            scenario_result_id=scenario_result_id, scenario_run_state="FAILED"
                        )

                    raise

            logger.info(f"Scenario '{self._name}' completed successfully")

            # Mark scenario as completed
            self._memory.update_scenario_run_state(
                scenario_result_id=scenario_result_id, scenario_run_state="COMPLETED"
            )

            # Retrieve and return final scenario result
            scenario_results = self._memory.get_scenario_results(scenario_result_ids=[scenario_result_id])
            if not scenario_results:
                raise ValueError(f"Scenario result with ID {self._scenario_result_id} not found")

            return scenario_results[0]

        except Exception as e:
            # Scenario-level log entry; the exception itself is propagated unchanged so
            # that run_async can apply its retry policy.
            logger.error(f"Scenario '{self._name}' failed with error: {str(e)}")
            raise