Merge branch 'Azure:main' into fix/openai-chat-no-content-704

Azure · Feb 12, 2025 · e5070b8 · e5070b8
2 parents 44f857c + 6d07f5b
commit e5070b8
Show file tree

Hide file tree

Showing 65 changed files with 737 additions and 74 deletions.
diff --git a/doc/_toc.yml b/doc/_toc.yml
@@ -111,6 +111,7 @@ chapters:
   - file: api.rst
   - file: blog/README
     sections:
+    - file: blog/2025_02_11
     - file: blog/2025_01_27
     - file: blog/2025_01_14
     - file: blog/2024_12_3
diff --git a/doc/blog/2025_02_11.md b/doc/blog/2025_02_11.md
@@ -0,0 +1,37 @@
+# Datasets and Seed Prompts
+
+<small>11 Feb 2025 - Eugenia Kim</small>
+
+How should we approach datasets in PyRIT? As red teamers, we use multimodal data types - text, images, audio, video - from various sources and need to work with these datasets effectively to build out robust attacks. Let's dive into how a `SeedPromptDataset` works in PyRIT to help us do just that!
+
+## The problem
+
+We need to be able to use multimodal datasets which include text, audio, and video while also loading from locally stored prompts and open-source repositories! Dataset needs can change quickly which we've see through the evolution of text-based models to now multi-modal generative AI systems. With new data types and generative AI modalities, how can we build out prompts to attack with?
+
+## The solution: Introducing a `SeedPrompt`
+
+PyRIT makes this super easy with seed prompts! By standardizing how prompts are used in PyRIT, we can easily send unique prompts by loading and/or building datasets used for probing. Let's look at some of the attributes in a `SeedPrompt` which makes each prompt not only unique, but also with metadata helpful for filtering:
+
+- `id` defines a unique identifier associated with the prompt
+- `value` refers to either the actual text value or path to file containing the prompt (i.e. image path)
+- `value_sha256` is the hash value used for recognizing duplicates
+- `data_type` specifies the type of prompt data (e.g. `text`, `audio_path`)
+- `harm_categories` is a list of harm categories associated with the prompt (e.g. violence)
+
+We can also use a `SeedPrompt` as a template! By using `render_template_value`, we can put in parameters like `{{ prompt }}` to put the prompt into the template.
+
+For more examples, updated documentation on seed prompts is [here](../code/datasets/1_seed_prompt.ipynb).
+
+## Loading datasets with seed prompts
+
+The next step to using a `SeedPrompt` is to organize it within a `SeedPromptDataset`. This structure makes it easy to fetch and load datasets whether pulling from external repositories or importing YAML files! Using the same attributes listed above, we can directly load in our datasets by providing prompts by their `value`, including their `harm_categories` and other fields in a `SeedPrompt`. But what if we want to use a dataset from an open source repository? Let's load them in as a `SeedPromptDataset`!
+
+Currently in PyRIT, we already have twelve datasets which are ready to be used through our fetch functions. They are in the `fetch_example_datasets.py` file. Since PyRIT is an open-source project, we’d love to see more datasets contributed! If you have a dataset that could improve red teaming efforts, consider submitting a PR — looking forward to adding it to the collection!
+
+See the updated documentation [here](../code/datasets/2_fetch_dataset.ipynb).
+
+## What else can we do with this?
+
+Now that we've loaded our dataset into PyRIT as a `SeedPromptDataset` the really exciting red teaming can begin. A great example of this is in our [Sending a Million Prompts](../cookbooks/1_sending_prompts.ipynb) notebook! We can use the prompts to evaluate the target by sending all the previously loaded promtps, modifying which attacks to use, and storing the scores for further analysis.
+
+In this blog post, we've walked through how we use structured datasets through our `SeedPrompt` and `SeedPromptDataset` classes. PyRIT's architecture allows for customization at every stage - whether through converters or configuring different scorers - and seed prompts set us up to effectively probe for risks in AI systems. Send over any contributions to add more datasets, refine seed prompts, or any open issues on Github! Now that you understand a core component of PyRIT, go ahead and try it out!
diff --git a/doc/code/converters/pdf_converter.py b/doc/code/converters/pdf_converter.py
@@ -70,7 +70,7 @@
 # Initialize the PDFConverter
 pdf_converter = PDFConverter(
     prompt_template=prompt_template,
-    font_type="Arial",
+    font_type="Helvetica",
     font_size=12,
     page_width=210,
     page_height=297,
@@ -102,7 +102,7 @@
 # Initialize the PDFConverter without a template
 pdf_converter = PDFConverter(
     prompt_template=None,  # No template provided
-    font_type="Arial",
+    font_type="Helvetica",
     font_size=12,
     page_width=210,
     page_height=297,
@@ -177,7 +177,7 @@
 # Initialize the PDFConverter with the existing PDF and injection items
 pdf_converter = PDFConverter(
     prompt_template=None,  # No template provided
-    font_type="Arial",
+    font_type="Helvetica",
     font_size=12,
     page_width=210,
     page_height=297,

diff --git a/pyproject.toml b/pyproject.toml
@@ -140,6 +140,9 @@ all = [
     "types-PyYAML>=6.0.12.9",
 ]
 
+[project.scripts]
+pyrit_scan = "pyrit.cli.__main__:main"
+
 [tool.pytest.ini_options]
 pythonpath = ["."]
 
@@ -156,7 +159,7 @@ target-version = ["py310"]
 line-length = 120
 
 [build-system]
-requires = ["setuptools", "wheel"]
+requires = ["setuptools>=64.0.0", "wheel"]
 build-backend = "setuptools.build_meta"
 
 [tool.setuptools.packages.find]

diff --git a/pyrit/cli/__init__.py b/pyrit/cli/__init__.py
@@ -0,0 +1,2 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
diff --git a/pyrit/cli/__main__.py b/pyrit/cli/__main__.py
@@ -0,0 +1,228 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+
+import asyncio
+import inspect
+from argparse import ArgumentDefaultsHelpFormatter, ArgumentParser, Namespace
+from copy import deepcopy
+from datetime import datetime
+from importlib import import_module
+from pathlib import Path
+from typing import Any, Dict, List, Optional
+from uuid import uuid4
+
+import yaml
+
+from pyrit.common import initialize_pyrit
+from pyrit.memory import CentralMemory
+from pyrit.models import SeedPrompt, SeedPromptDataset
+from pyrit.models.seed_prompt import SeedPromptGroup
+from pyrit.orchestrator import Orchestrator
+from pyrit.prompt_converter import PromptConverter
+from pyrit.prompt_normalizer.normalizer_request import NormalizerRequest
+from pyrit.prompt_normalizer.prompt_converter_configuration import (
+    PromptConverterConfiguration,
+)
+from pyrit.prompt_target import PromptTarget
+from pyrit.prompt_target.common.prompt_chat_target import PromptChatTarget
+from pyrit.score.scorer import Scorer
+
+
+def parse_args(args=None) -> Namespace:
+    parser = ArgumentParser(
+        prog="pyrit_scan",
+        description="Parse the arguments for the Pyrit Scanner CLI.",
+        formatter_class=ArgumentDefaultsHelpFormatter,
+    )
+    parser.add_argument(
+        "--config-file",
+        type=str,
+        help="The path to the configuration file.",
+        required=True,
+    )
+
+    parsed_args = parser.parse_args(args)
+    config_file = Path(parsed_args.config_file)
+    if not config_file.exists():
+        raise FileNotFoundError(f"Configuration file {config_file.absolute()} does not exist.")
+    return parsed_args
+
+
+def load_config(config_file: Path) -> Dict[str, Any]:
+    # Load the configuration YAML file
+    with open(config_file, "r") as file:
+        config = yaml.safe_load(file)
+
+    if not config:
+        raise ValueError("Configuration file is empty.")
+
+    if not isinstance(config, dict):
+        raise TypeError("Configuration file must be a dictionary.")
+
+    return config
+
+
+async def validate_config_and_run_async(config: Dict[str, Any], memory_labels: Optional[Dict[str, str]] = None) -> None:
+    if "scenarios" not in config:
+        raise KeyError("Configuration file must contain a 'scenarios' key.")
+
+    scenarios = config["scenarios"]
+
+    if not scenarios:
+        raise ValueError("Scenarios list is empty.")
+
+    initialize_pyrit(memory_db_type="DuckDB")
+
+    seed_prompts = generate_datasets(config)
+    objective_target = validate_target(config, target_key="objective_target")
+    prompt_converters: list[PromptConverter] = []
+    # prompt_converters = validate_converters(config)
+    scorer = None
+    # TODO: need to find a solution for single/multiple scorers and scoring_targets
+    # scorers = validate_scorers(config)
+    adversarial_chat = None
+    # adversarial_chat = validate_adversarial_chat(config)
+
+    orchestrators = []
+    for scenario_config in scenarios:
+        orchestrators.append(
+            validate_scenario(
+                scenario_config=scenario_config,
+                objective_target=objective_target,
+                adversarial_chat=adversarial_chat,
+                prompt_converters=prompt_converters,
+                scorer=scorer,
+            )
+        )
+
+    # This is a separate loop because we want to validate all scenarios before starting execution.
+    for orchestrator in orchestrators:
+        if hasattr(orchestrator, "run_attack_async"):
+            for seed_prompt in seed_prompts:
+                await orchestrator.run_attack_async(objective=seed_prompt.value, memory_labels=memory_labels)
+        elif hasattr(orchestrator, "send_normalizer_requests_async"):
+            converter_configurations = [
+                PromptConverterConfiguration(converters=prompt_converters if prompt_converters else [])
+            ]
+
+            normalizer_requests = [
+                NormalizerRequest(
+                    seed_prompt_group=SeedPromptGroup(prompts=[seed_prompt]),
+                    request_converter_configurations=converter_configurations,
+                    conversation_id=str(uuid4()),
+                )
+                for seed_prompt in seed_prompts
+            ]
+            await orchestrator.send_normalizer_requests_async(
+                prompt_request_list=normalizer_requests,
+                memory_labels=memory_labels,
+            )
+        else:
+            supported_methods = ["run_attack_async", "send_normalizer_requests_async"]
+            raise ValueError(
+                f"The orchestrator of type {type(orchestrator).__name__} does not have a compatible "
+                f"method to execute its attack. The supported methods are {supported_methods}."
+            )
+
+
+def validate_scenario(
+    scenario_config: Dict[str, Any],
+    objective_target: PromptTarget,
+    adversarial_chat: Optional[PromptChatTarget] = None,
+    prompt_converters: Optional[List[PromptConverter]] = None,
+    scorer: Optional[Scorer] = None,
+) -> Orchestrator:
+    if "type" not in scenario_config:
+        raise KeyError("Scenario must contain a 'type' key.")
+
+    scenario_type = scenario_config["type"]
+    scenario_args = deepcopy(scenario_config)
+    del scenario_args["type"]
+
+    try:
+        orchestrator_module = import_module("pyrit.orchestrator")
+        orchestrator_class = getattr(orchestrator_module, scenario_type)
+    except Exception as ex:
+        raise RuntimeError(f"Failed to import orchestrator {scenario_type} from pyrit.orchestrator") from ex
+
+    try:
+        constructor_arg_names = [arg.name for arg in inspect.signature(orchestrator_class.__init__).parameters.values()]
+
+        # Some orchestrator arguments have their own configuration since they
+        # are more complex. They are passed in as args to this function.
+        complex_arg_names = ["objective_target", "adversarial_chat", "prompt_converters", "scorer"]
+        for complex_arg_name in complex_arg_names:
+            if complex_arg_name in scenario_args:
+                raise ValueError(
+                    f"{complex_arg_name} needs to be configured at the top level of the scanner configuration."
+                    f"The scenario configuration cannot include {complex_arg_name}."
+                )
+
+            # Add complex args to the argument list.
+            local_vars = locals()
+            if complex_arg_name in constructor_arg_names:
+                arg_value = local_vars[complex_arg_name]
+                if arg_value:
+                    scenario_args[complex_arg_name] = arg_value
+
+        orchestrator = orchestrator_class(**scenario_args)
+    except Exception as ex:
+        raise ValueError(f"Failed to validate scenario {scenario_type}") from ex
+    return orchestrator
+
+
+def generate_datasets(config: Dict[str, Any]) -> List[SeedPrompt]:
+    datasets = config.get("datasets")
+
+    if not datasets:
+        raise KeyError("Send prompts scenario must contain a 'datasets' key.")
+
+    loaded_dataset_prompts = []
+    for dataset_path in datasets:
+        dataset = SeedPromptDataset.from_yaml_file(dataset_path)
+        loaded_dataset_prompts.extend(dataset.prompts)
+
+    return loaded_dataset_prompts
+
+
+def validate_target(config: Dict[str, Any], target_key: str) -> PromptTarget:
+    if target_key not in config:
+        raise KeyError(f"Configuration file must contain a '{target_key}' key.")
+
+    if not config[target_key] or not config[target_key].get("type"):
+        raise KeyError(f"Target {target_key} must contain a 'type' key.")
+
+    target_config = deepcopy(config[target_key])
+    target_type = target_config.get("type")
+
+    try:
+        target_module = import_module("pyrit.prompt_target")
+        target_class = getattr(target_module, target_type)
+    except Exception as ex:
+        raise RuntimeError(f"Failed to import target {target_type} from pyrit.prompt_target") from ex
+
+    # type is not an actual arg so remove it
+    del target_config["type"]
+    target = target_class(**target_config)
+    return target
+
+
+def main(args=None):
+    parsed_args = parse_args(args)
+    config_file = parsed_args.config_file
+    config = load_config(config_file)
+    memory_labels = config.get("memory_labels", {})
+    # Add timestamp to distinguish between scanner runs with the same memory labels
+    memory_labels["scanner_execution_start_time"] = datetime.now().isoformat()
+
+    asyncio.run(validate_config_and_run_async(config, memory_labels))
+
+    memory = CentralMemory.get_memory_instance()
+    all_pieces = memory.get_prompt_request_pieces(labels=memory_labels)
+    conversation_id = None
+    for piece in all_pieces:
+        if piece.conversation_id != conversation_id:
+            conversation_id = piece.conversation_id
+            print("===================================================")
+            print(f"Conversation ID: {conversation_id}")
+        print(f"{piece.role}: {piece.converted_value}")
diff --git a/pyrit/models/embeddings.py b/pyrit/models/embeddings.py
@@ -38,7 +38,7 @@ def save_to_file(self, directory_path: Path) -> str:
         Returns:
             The full path to the file that was saved
         """
-        embedding_json = self.json()
+        embedding_json = self.model_dump_json()
         embedding_hash = sha256(embedding_json.encode()).hexdigest()
         embedding_output_file_path = Path(directory_path, f"{embedding_hash}.json")
         embedding_output_file_path.write_text(embedding_json)

diff --git a/pyrit/models/prompt_response.py b/pyrit/models/prompt_response.py
@@ -49,7 +49,7 @@ def save_to_file(self, directory_path: Path) -> str:
         Returns:
             The full path to the file that was saved
         """
-        embedding_json = self.json()
+        embedding_json = self.model_dump_json()
         embedding_hash = hashlib.sha256(embedding_json.encode()).hexdigest()
         embedding_output_file_path = Path(directory_path, f"{embedding_hash}.json")
         embedding_output_file_path.write_text(embedding_json)

diff --git a/pyrit/prompt_converter/__init__.py b/pyrit/prompt_converter/__init__.py
@@ -7,6 +7,7 @@
 from pyrit.prompt_converter.add_text_image_converter import AddTextImageConverter
 from pyrit.prompt_converter.ansi_escape.ansi_attack_converter import AnsiAttackConverter
 from pyrit.prompt_converter.ascii_art_converter import AsciiArtConverter
+from pyrit.prompt_converter.ascii_smuggler_converter import AsciiSmugglerConverter
 from pyrit.prompt_converter.atbash_converter import AtbashConverter
 from pyrit.prompt_converter.audio_frequency_converter import AudioFrequencyConverter
 from pyrit.prompt_converter.azure_speech_audio_to_text_converter import AzureSpeechAudioToTextConverter
@@ -15,7 +16,10 @@
 from pyrit.prompt_converter.binary_converter import BinaryConverter
 from pyrit.prompt_converter.caesar_converter import CaesarConverter
 from pyrit.prompt_converter.character_space_converter import CharacterSpaceConverter
+from pyrit.prompt_converter.charswap_attack_converter import CharSwapGenerator
 from pyrit.prompt_converter.codechameleon_converter import CodeChameleonConverter
+from pyrit.prompt_converter.colloquial_wordswap_converter import ColloquialWordswapConverter
+from pyrit.prompt_converter.diacritic_converter import DiacriticConverter
 from pyrit.prompt_converter.emoji_converter import EmojiConverter
 from pyrit.prompt_converter.flip_converter import FlipConverter
 from pyrit.prompt_converter.fuzzer_converter import (
@@ -56,6 +60,7 @@
     "AddTextImageConverter",
     "AnsiAttackConverter",
     "AsciiArtConverter",
+    "AsciiSmugglerConverter",
     "AtbashConverter",
     "AudioFrequencyConverter",
     "AzureSpeechAudioToTextConverter",
@@ -64,7 +69,10 @@
     "BinaryConverter",
     "CaesarConverter",
     "CharacterSpaceConverter",
+    "CharSwapGenerator",
     "CodeChameleonConverter",
+    "ColloquialWordswapConverter",
+    "DiacriticConverter",
     "ConverterResult",
     "EmojiConverter",
     "FlipConverter",
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1,2 @@
		# Copyright (c) Microsoft Corporation.
		# Licensed under the MIT License.