# Spaces status (page banner captured with this file): Build error
import logging

import gradio as gr
from pyrit.core.config import LLMProvider
from pyrit.core.pyrit import PyRIT
from pyrit.llm_providers.huggingface_local import HuggingFaceLocal
# Initialize PyRIT with a local HF model (you can change this).
# NOTE(review): confirm that the `pyrit.core` / `pyrit.llm_providers` import
# paths and the `HuggingFaceLocal` / `PyRIT` constructor arguments used here
# match the PyRIT version actually installed -- TODO verify against its docs.
provider = HuggingFaceLocal(
    model_name="HuggingFaceH4/zephyr-7b-beta",  # Change model here
    max_tokens=512,
)
pyrit = PyRIT(provider=provider)
def attack_prompt(prompt):
    """Run a jailbreak-style attack on *prompt* and format the outcome for the UI.

    Args:
        prompt: Text to attack, as entered in the input textbox.

    Returns:
        A display string. On a completed run it is the result prefixed with
        the success marker; on blank input or any exception it is a message
        prefixed with the error marker. This function does not raise.
    """
    # Blank input would only trigger a pointless model run, so reject it early.
    if prompt is None or not str(prompt).strip():
        return "❌ Error: prompt is empty"

    try:
        result = pyrit.run(prompt, attack="jailbreak", max_tokens=512)
    except Exception as e:
        # UI boundary: show the message to the user, but keep the traceback
        # in the application log instead of discarding it.
        logging.getLogger(__name__).exception("PyRIT attack failed")
        return f"❌ Error: {e}"

    # NOTE(review): the success label only means run() returned without
    # raising; the content of `result` is not inspected here.
    return f"✅ Successful Attack:\n{result}"
# Build the single-textbox UI around attack_prompt and start the web server.
demo = gr.Interface(
    fn=attack_prompt,
    inputs=gr.Textbox(
        label="Prompt to Attack",
        placeholder="Enter a benign-looking prompt...",
    ),
    outputs=gr.Textbox(label="Attack Result"),
    title="🧪 PyRIT - Red Teaming Hugging Face LLMs",
    description="This tool uses PyRIT to test Hugging Face models for jailbreak-style adversarial prompts.",
)
demo.launch()