Source code for pyrit.datasets.tdc23_redteaming_dataset
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT license.
from datasets import load_dataset
from pyrit.models import SeedPromptDataset
from pyrit.models.seed_prompt import SeedPrompt
[docs]
def fetch_tdc23_redteaming_dataset() -> SeedPromptDataset:
"""
Fetch TDC23-RedTeaming examples and create a SeedPromptDataset.
Returns:
SeedPromptDataset: A SeedPromptDataset containing the examples.
"""
# Load the TDC23-RedTeaming dataset
data = load_dataset("walledai/TDC23-RedTeaming", "default")
prompts = [item["prompt"] for item in data["train"]]
# Create SeedPrompt instances from each example in 'prompts'
seed_prompts = [
SeedPrompt(
value=prompt,
data_type="text",
name="walledai/TDC23-RedTeaming",
dataset_name="walledai/TDC23-RedTeaming",
description="""TDC23-RedTeaming dataset from HuggingFace,
created by Walled AI (https://huggingface.co/walledai).
Contains 100 prompts aimed at generating harmful content
across multiple harm categories related to fairness,
misinformation, dangerous and criminal activities,
violence, etc. in the style of writing narratives.""",
source="https://huggingface.co/datasets/walledai/TDC23-RedTeaming",
)
for prompt in prompts
]
seed_prompt_dataset = SeedPromptDataset(prompts=seed_prompts)
return seed_prompt_dataset