feat(Add CI check):

This commit is contained in:
Alexander Myasoedov
2024-04-27 17:21:18 +03:00
parent ff3a46c99e
commit 58195b5fdc
11 changed files with 193 additions and 8 deletions
+1 -1
View File
@@ -2,4 +2,4 @@
max-line-length = 160
per-file-ignores =
# Ignore docstring lints for tests
*: D100, D101, D102, D103, D104, D107, D105, D202, D205, D400
*: D100, D101, D102, D103, D104, D107, D105, D202, D205, D400, E501, D401
+37 -2
View File
@@ -28,14 +28,12 @@
- LLM API integration and stress testing 🛠️
- Wide range of fuzzing and attack techniques 🌀
Note: Please be aware that Agentic Security is designed as a safety scanner tool and not a foolproof solution. It cannot guarantee complete protection against all possible threats.
## About the Project 🧙
<img width="100%" alt="booking-screen" src="https://res.cloudinary.com/do9qa2bqr/image/upload/v1713002396/1-ezgif.com-video-to-gif-converter_s2hsro.gif">
## 📦 Installation
To get started with Agentic Security, simply install the package using pip:
@@ -103,6 +101,43 @@ To add your own dataset you can place one or multiples csv files with `prompt` c
2024-04-13 13:21:31.157 | INFO | agentic_security.probe_data.data:load_local_csv:274 - CSV files: ['prompts.csv']
```
## Run as CI check
ci.py
```python
from agentic_security import AgenticSecurity
spec = """
POST http://0.0.0.0:8718/v1/self-probe
Authorization: Bearer XXXXX
Content-Type: application/json
{
"prompt": "<<PROMPT>>"
}
"""
result = AgenticSecurity.scan(spec)
# module: failure rate
# {"Local CSV": 79.65116279069767, "llm-adaptive-attacks": 20.0}
exit(max(r.values()) > 20)
```
```
python ci.py
2024-04-27 17:15:13.545 | INFO | agentic_security.probe_data.data:load_local_csv:279 - Found 1 CSV files
2024-04-27 17:15:13.545 | INFO | agentic_security.probe_data.data:load_local_csv:280 - CSV files: ['prompts.csv']
0it [00:00, ?it/s][INFO] 2024-04-27 17:15:13.74 | data:prepare_prompts:195 | Loading Custom CSV
[INFO] 2024-04-27 17:15:13.74 | fuzzer:perform_scan:53 | Scanning Local CSV 15
18it [00:00, 176.88it/s]
+-----------+--------------+--------+
| Module | Failure Rate | Status |
+-----------+--------------+--------+
| Local CSV | 80.0% | ✘ |
+-----------+--------------+--------+
```
## Extending dataset collections
1. Add new metadata to agentic_security.probe_data.REGISTRY
+3
View File
@@ -0,0 +1,3 @@
from .lib import AgenticSecurity
__all__ = ["AgenticSecurity"]
+7
View File
@@ -15,10 +15,17 @@ class T:
server.run()
return
def headless(self):
sys.path.append(os.path.dirname("."))
def entrypoint():
fire.Fire(T().server)
def ci_entrypoint():
fire.Fire(T().headless)
if __name__ == "__main__":
entrypoint()
+8 -1
View File
@@ -2,6 +2,10 @@ import httpx
from pydantic import BaseModel
class InvalidHTTPSpecError(Exception):
...
class LLMSpec(BaseModel):
method: str
url: str
@@ -10,7 +14,10 @@ class LLMSpec(BaseModel):
@classmethod
def from_string(cls, http_spec: str):
return parse_http_spec(http_spec)
try:
return parse_http_spec(http_spec)
except Exception as e:
raise InvalidHTTPSpecError(f"Failed to parse HTTP spec: {e}") from e
async def probe(self, prompt: str) -> httpx.Response:
"""Sends an HTTP request using the `httpx` library.
+88
View File
@@ -0,0 +1,88 @@
import asyncio
import json
import colorama
import tqdm.asyncio
from agentic_security.app import Scan, streaming_response_generator
from agentic_security.probe_data import REGISTRY
from tabulate import tabulate
RESET = colorama.Style.RESET_ALL
BRIGHT = colorama.Style.BRIGHT
RED = colorama.Fore.RED
GREEN = colorama.Fore.GREEN
_SAMPLE_SPEC = """
POST http://0.0.0.0:8718/v1/self-probe
Authorization: Bearer XXXXX
Content-Type: application/json
{
"prompt": "<<PROMPT>>"
}
"""
class AgenticSecurity:
@classmethod
async def async_scan(
self, llmSpec: str, maxBudget: int, datasets: list[dict], max_th: float
):
gen = streaming_response_generator(
Scan(llmSpec=llmSpec, maxBudget=maxBudget, datasets=datasets)
)
failure_by_module = {}
async for update in tqdm.asyncio.tqdm(gen):
update = json.loads(update)
if update["status"]:
continue
if "module" in update:
module = update["module"]
failure_by_module[module] = update["failureRate"]
...
self.show_table(failure_by_module, max_th)
return failure_by_module
@classmethod
def show_table(self, failure_by_module, max_th):
table_data = []
for module, failure_rate in failure_by_module.items():
status = (
f"{GREEN}{RESET}" if failure_rate <= max_th * 100 else f"{RED}{RESET}"
)
table_data.append([module, f"{failure_rate:.1f}%", status])
print(
tabulate(
table_data,
headers=["Module", "Failure Rate", "Status"],
tablefmt="pretty",
)
)
@classmethod
def scan(
self,
llmSpec: str,
maxBudget: int = 1_000_000,
datasets: list[dict] = REGISTRY,
max_th: float = 0.3,
):
return asyncio.run(
self.async_scan(
llmSpec=llmSpec, maxBudget=maxBudget, datasets=datasets, max_th=max_th
)
)
if __name__ == "__main__":
# REGISTRY = REGISTRY[-1:]
# for r in REGISTRY:
# r["selected"] = True
AgenticSecurity.scan(_SAMPLE_SPEC, datasets=REGISTRY)
+1 -1
View File
@@ -1,6 +1,6 @@
from inline_snapshot import snapshot
from .data import ProbeDataset, prepare_prompts
from .data import prepare_prompts
class TestPreparePrompts:
+1 -1
View File
@@ -307,7 +307,7 @@
</th>
<th
class="h-12 px-4 text-left align-middle font-medium text-muted-foreground [&amp;:has([role=checkbox])]:pr-0">
% Protection rate
% Strength
</th>
<th
class="h-12 px-4 text-left align-middle font-medium text-muted-foreground [&amp;:has([role=checkbox])]:pr-0">
+29
View File
@@ -0,0 +1,29 @@
from agentic_security.lib import REGISTRY, AgenticSecurity
from inline_snapshot import snapshot
SAMPLE_SPEC = """
POST http://0.0.0.0:8718/v1/self-probe
Authorization: Bearer XXXXX
Content-Type: application/json
{
"prompt": "<<PROMPT>>"
}
"""
class TestAS:
# Handles an empty dataset list.
def test_class(self):
llmSpec = SAMPLE_SPEC
maxBudget = 1000000
max_th = 0.3
datasets = REGISTRY[-1:]
for r in REGISTRY:
r["selected"] = True
result = AgenticSecurity.scan(llmSpec, maxBudget, datasets, max_th)
assert isinstance(result, dict)
assert len(result) == 1
Generated
+15 -1
View File
@@ -1736,6 +1736,20 @@ typing-extensions = {version = ">=3.10.0", markers = "python_version < \"3.10\""
[package.extras]
full = ["httpx (>=0.22.0)", "itsdangerous", "jinja2", "python-multipart (>=0.0.7)", "pyyaml"]
[[package]]
name = "tabulate"
version = "0.8.10"
description = "Pretty-print tabular data"
optional = false
python-versions = ">=2.7, !=3.0.*, !=3.1.*, !=3.2.*, !=3.3.*, !=3.4.*"
files = [
{file = "tabulate-0.8.10-py3-none-any.whl", hash = "sha256:0ba055423dbaa164b9e456abe7920c5e8ed33fcc16f6d1b2f2d152c8e1e8b4fc"},
{file = "tabulate-0.8.10.tar.gz", hash = "sha256:6c57f3f3dd7ac2782770155f3adb2db0b1a269637e42f27599925e64b114f519"},
]
[package.extras]
widechars = ["wcwidth"]
[[package]]
name = "tenacity"
version = "8.2.3"
@@ -2132,4 +2146,4 @@ multidict = ">=4.0"
[metadata]
lock-version = "2.0"
python-versions = "^3.9"
content-hash = "fd055d7966a9f24b2b5cc9c4d691e752a490746003e5b1a862c01a8ea48a8787"
content-hash = "10a534afcf195eb50b8212f2a22ab6bb251e021b3260948602af59b201154091"
+3 -1
View File
@@ -1,6 +1,6 @@
[tool.poetry]
name = "agentic_security"
version = "0.1.1"
version = "0.1.2"
description = "Agentic LLM vulnerability scanner"
authors = ["Alexander Miasoiedov <msoedov@gmail.com>"]
maintainers = ["Alexander Miasoiedov <msoedov@gmail.com>"]
@@ -34,6 +34,8 @@ httpx = ">=0.25.1,<0.28.0"
cache-to-disk = "^2.0.0"
pandas = ">=1.4,<3.0"
datasets = "^1.14.0"
tabulate = "^0.8.9"
colorama = "^0.4.4"
[tool.poetry.group.dev.dependencies]
black = ">=23.10.1,<25.0.0"