Source code for pyrit.datasets.mlcommons_ailuminate_demo_dataset
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT license.
from pathlib import Path
from typing import Literal, Optional
from pyrit.datasets.dataset_helper import fetch_examples
from pyrit.models import SeedPromptDataset
from pyrit.models.seed_prompt import SeedPrompt
# https://github.com/mlcommons/ailuminate#hazard-categories-and-abbreviations
_hazard_categories_map = {
"vcr": "Violent Crimes",
"src": "Sex-Related Crimes",
"cse": "Child Sexual Exploitation",
"ssh": "Suicide & Self-Harm",
"iwp": "Indiscriminate Weapons (CBRNE)",
"ipv": "Intellectual Property Violations",
"dfm": "Defamation",
"ncr": "Non-Violent Crimes",
"hte": "Hate",
"prv": "Privacy Violations",
"spc_ele": "Specialized Advice; elections",
"spc_fin": "Specialized Advice; financial",
"spc_hlt": "Specialized Advice; health",
"sxc_prn": "Sexual Content; pornographic",
"spc_lgl": "Specialized Advice; legal",
}
[docs]
def fetch_mlcommons_ailuminate_demo_dataset(
source: str = (
"https://raw.githubusercontent.com/mlcommons/ailuminate/refs/heads/main/"
"airr_official_1.0_demo_en_us_prompt_set_release.csv"
),
source_type: Literal["public_url"] = "public_url",
cache: bool = True,
data_home: Optional[Path] = None,
) -> SeedPromptDataset:
"""
Fetch examples from AILuminate v1.0 DEMO Prompt Set and create a SeedPromptDataset.
Returns:
SeedPromptDataset: A SeedPromptDataset containing the examples.
Note:
For more information about the dataset and related materials, visit: \n
- https://github.com/mlcommons/ailuminate \n
- https://mlcommons.org/ailuminate/ \n
- https://doi.org/10.48550/arXiv.2404.12241
"""
examples = fetch_examples(source, source_type, cache, data_home)
seed_prompts = [
SeedPrompt(
value=example["prompt_text"],
data_type="text",
name="",
dataset_name="AILuminate v1.0 DEMO Prompt Set",
# Saving both the full hazard category name and the abbreviation
harm_categories=[_hazard_categories_map[example["hazard"]], example["hazard"]],
description=(
"This dataset contains the DEMO prompt library of the AILuminate 1.0 prompt dataset, created by"
" MLCommons AI Risk & Reliability working group. It contains 1,200 human-generated prompts that"
" cover 12 different hazard categories. The dataset is a mix of adversarial and non-adversarial"
" prompts. This dataset is a 10% subset of the full AILuminate training dataset."
),
source="https://github.com/mlcommons/ailuminate",
)
for example in examples
]
seed_prompt_dataset = SeedPromptDataset(prompts=seed_prompts)
return seed_prompt_dataset