diff --git a/README.md b/README.md index 4bfeada..acd0bf5 100644 --- a/README.md +++ b/README.md @@ -133,8 +133,8 @@ Create a `.env` file with your API credentials: ```python import asyncio import os -from OpenRT.models.implementations.openai_model import OpenAIModel -from OpenRT.attacks.blackbox.implementations.evosynth import EvosynthAttack, EvosynthConfig +from jailbreak_toolbox.models.implementations.openai_model import OpenAIModel +from jailbreak_toolbox.attacks.blackbox.implementations.evosynth import EvosynthAttack, EvosynthConfig from dotenv import load_dotenv load_dotenv() @@ -207,7 +207,7 @@ EvoSynth/ ├── eval_async.py # Main entry point ├── data/ │ └── harmbench.csv # Evaluation dataset -└── OpenRT/ +└── jailbreak_toolbox/ ├── core/ # Orchestration & registry │ ├── async_orchestrator.py │ └── registry.py diff --git a/jailbreak_toolbox/attacks/blackbox/implementations/evosynth/basic_usage.py b/jailbreak_toolbox/attacks/blackbox/implementations/evosynth/basic_usage.py index 9b6867e..4b9d34c 100644 --- a/jailbreak_toolbox/attacks/blackbox/implementations/evosynth/basic_usage.py +++ b/jailbreak_toolbox/attacks/blackbox/implementations/evosynth/basic_usage.py @@ -8,13 +8,11 @@ from sklearn import base # Add paths for imports sys.path.append(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))) - -# Add jailbreak_toolbox to Python path -jailbreak_toolbox_path = "/mnt/shared-storage-user/chenyunhao/jailbreak-agent/jailbreak_toolbox" from jailbreak_toolbox.models.implementations.openai_model import OpenAIModel from evosynth_attack import EvosynthAttack from evosynth.config import EvosynthConfig - +from dotenv import load_dotenv +load_dotenv() def basic_attack_example(): """Simple attack with explicit judge model.""" @@ -29,7 +27,7 @@ def basic_attack_example(): # Initialize explicit judge model (can be different from target) judge_model = OpenAIModel( model_name="gpt-4o-mini", # Or use a different model like "gpt-4" - temperature=0.1, # Lower temperature for consistent judging + temperature=0.0, # Lower temperature for consistent judging api_key=os.getenv("OPENAI_API_KEY"), base_url=os.getenv("OPENAI_BASE_URL") )