# Source code for pyrit.prompt_converter.zalgo_converter
# Copyright (c) Microsoft Corporation.
# Licensed under the MIT license.
import logging
import random
from typing import Optional
from pyrit.prompt_converter.text_selection_strategy import WordSelectionStrategy
from pyrit.prompt_converter.word_level_converter import WordLevelConverter
# Combining diacritical marks (U+0300 through U+036F) that get stacked onto characters
ZALGO_MARKS = list(map(chr, range(0x0300, 0x0370)))
# Ceiling for the intensity setting, so requests stay within a reasonable range
MAX_INTENSITY = 100
logger = logging.getLogger(__name__)
[docs]
class ZalgoConverter(WordLevelConverter):
    """
    Converts text into cursed Zalgo text using combining Unicode marks.

    Each alphanumeric character of a converted word is followed by a random
    number of marks drawn from ``ZALGO_MARKS`` (U+0300–U+036F); all other
    characters are left as they are.
    """
[docs]
def __init__(
    self,
    *,
    intensity: int = 10,
    seed: Optional[int] = None,
    word_selection_strategy: Optional[WordSelectionStrategy] = None,
):
    """
    Set up the converter's intensity, seed, and word selection.

    Args:
        intensity (int): Upper bound on the number of combining marks appended to each
            character (higher = more cursed). Values outside 0..MAX_INTENSITY are clamped
            and a warning is logged. Defaults to 10.
        seed (Optional[int]): Optional seed meant for reproducible output. It is only stored
            on the instance here; this method does not seed any generator itself.
        word_selection_strategy (Optional[WordSelectionStrategy]): Strategy for selecting which
            words to convert, forwarded to the base class. If None, all words will be converted.

    Raises:
        ValueError: If ``intensity`` cannot be interpreted as an integer.
    """
    super().__init__(word_selection_strategy=word_selection_strategy)
    self._seed = seed
    self._intensity = self._normalize_intensity(intensity)
def _normalize_intensity(self, intensity: int) -> int:
    """
    Coerce ``intensity`` to an integer and clamp it to ``[0, MAX_INTENSITY]``.

    Args:
        intensity (int): Requested intensity. Anything ``int()`` accepts is allowed.

    Returns:
        int: The intensity limited to the range 0..MAX_INTENSITY.

    Raises:
        ValueError: If ``intensity`` cannot be converted to an integer.
    """
    try:
        intensity = int(intensity)
    except (TypeError, ValueError, OverflowError) as err:
        # int() reports float infinities with OverflowError rather than ValueError;
        # fold that case into the same error and keep the original cause attached.
        raise ValueError(f"Invalid intensity value: {intensity!r} (must be an integer)") from err
    normalized_intensity = max(0, min(intensity, MAX_INTENSITY))
    if intensity != normalized_intensity:
        # Out-of-range values are clamped rather than rejected; log the adjustment.
        logger.warning(
            f"ZalgoConverter supports intensity between 0 and {MAX_INTENSITY}, "
            f"but received a value of {intensity}. Normalizing to {normalized_intensity}."
        )
    return normalized_intensity
[docs]
async def convert_word_async(self, word: str) -> str:
    """
    Decorate a single word with random combining marks.

    Every alphanumeric character is followed by between 1 and the configured
    intensity marks picked from ``ZALGO_MARKS``; any other character is copied
    through untouched. Randomness comes from the module-level ``random`` functions.

    Args:
        word (str): The word to convert.

    Returns:
        str: The converted word, or ``word`` unchanged when the intensity is 0 or less.
    """
    max_marks = self._intensity
    if max_marks <= 0:
        return word

    pieces = []
    for ch in word:
        pieces.append(ch)
        if not ch.isalnum():
            continue
        # Draw the count first, then that many marks, one random.choice call each.
        mark_count = random.randint(1, max_marks)
        pieces.extend(random.choice(ZALGO_MARKS) for _ in range(mark_count))
    return "".join(pieces)