diff --git a/CHANGELOG.md b/CHANGELOG.md index 2c105feb..6b7a995b 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,3 +1,36 @@ +## v0.10.0 (2026-05-22) + +### ✨ Features + +- possibility to enable or disable thinking with ollama +- possibility to enable or disable thinking with ollama + +### šŸ›šŸš‘ļø Fixes + +- abort attack if non-default category classifier model is not s… +- fixed integration tests +- abort attack if non-default category classifier model is not specified and the default model is not present in ollama + +### bump + +- **deps-dev**: bump pre-commit from 4.5.1 to 4.6.0 +- **deps**: bump click from 8.1.8 to 8.4.0 +- **deps-dev**: bump pytest-rerunfailures from 16.1 to 16.2 +- **deps-dev**: bump packaging from 26.0 to 26.2 +- version 0.9.0 → 0.9.1 +- **deps-dev**: bump commitizen from 4.13.10 to 4.16.0 + +### fix + +- move examples/ inside hackagent package for correct wheel packaging +- normalize TAP judge scores to consistent 1-10 scale +- pass TAP success_threshold to coordinator finalize_all_goals +- normalize TAP judge scores to a consistent 1-10 scale + +### 🫄 fixup + +- fixed merge conflict on tag bump + ## v0.9.1 (2026-05-21) ## v0.9.0 (2026-05-15) diff --git a/codecov.yml b/codecov.yml index 30bfb10f..c3962e57 100644 --- a/codecov.yml +++ b/codecov.yml @@ -40,6 +40,6 @@ comment: ignore: - "tests/**/*" - "docs/**/*" - - "examples/**/*" + - "hackagent/examples/**/*" - "htmlcov/**/*" - "**/__pycache__/**" diff --git a/examples/google_adk/jailbreak_eval/__init__.py b/hackagent/examples/google_adk/jailbreak_eval/__init__.py similarity index 100% rename from examples/google_adk/jailbreak_eval/__init__.py rename to hackagent/examples/google_adk/jailbreak_eval/__init__.py diff --git a/examples/google_adk/jailbreak_eval/agent.py b/hackagent/examples/google_adk/jailbreak_eval/agent.py similarity index 100% rename from examples/google_adk/jailbreak_eval/agent.py rename to hackagent/examples/google_adk/jailbreak_eval/agent.py diff --git a/examples/google_adk/jailbreak_eval/hack.py b/hackagent/examples/google_adk/jailbreak_eval/hack.py similarity index 100% rename from examples/google_adk/jailbreak_eval/hack.py rename to hackagent/examples/google_adk/jailbreak_eval/hack.py diff --git a/examples/google_adk/multi_tool_agent/__init__.py b/hackagent/examples/google_adk/multi_tool_agent/__init__.py similarity index 100% rename from examples/google_adk/multi_tool_agent/__init__.py rename to hackagent/examples/google_adk/multi_tool_agent/__init__.py diff --git a/examples/google_adk/multi_tool_agent/agent.py b/hackagent/examples/google_adk/multi_tool_agent/agent.py similarity index 100% rename from examples/google_adk/multi_tool_agent/agent.py rename to hackagent/examples/google_adk/multi_tool_agent/agent.py diff --git a/examples/google_adk/multi_tool_agent/hack.py b/hackagent/examples/google_adk/multi_tool_agent/hack.py similarity index 100% rename from examples/google_adk/multi_tool_agent/hack.py rename to hackagent/examples/google_adk/multi_tool_agent/hack.py diff --git a/examples/langchain/rag/README.md b/hackagent/examples/langchain/rag/README.md similarity index 100% rename from examples/langchain/rag/README.md rename to hackagent/examples/langchain/rag/README.md diff --git a/examples/langchain/rag/agent_client.py b/hackagent/examples/langchain/rag/agent_client.py similarity index 100% rename from examples/langchain/rag/agent_client.py rename to hackagent/examples/langchain/rag/agent_client.py diff --git a/examples/langchain/rag/agent_server.py b/hackagent/examples/langchain/rag/agent_server.py similarity index 100% rename from examples/langchain/rag/agent_server.py rename to hackagent/examples/langchain/rag/agent_server.py diff --git a/examples/langchain/rag/hack.py b/hackagent/examples/langchain/rag/hack.py similarity index 100% rename from examples/langchain/rag/hack.py rename to hackagent/examples/langchain/rag/hack.py diff --git a/examples/langchain/rag/ingest.py b/hackagent/examples/langchain/rag/ingest.py similarity index 100% rename from examples/langchain/rag/ingest.py rename to hackagent/examples/langchain/rag/ingest.py diff --git a/examples/langchain/rag/policies.pdf b/hackagent/examples/langchain/rag/policies.pdf similarity index 100% rename from examples/langchain/rag/policies.pdf rename to hackagent/examples/langchain/rag/policies.pdf diff --git a/examples/langchain/rag/read_db.py b/hackagent/examples/langchain/rag/read_db.py similarity index 100% rename from examples/langchain/rag/read_db.py rename to hackagent/examples/langchain/rag/read_db.py diff --git a/examples/ollama/demo.py b/hackagent/examples/ollama/demo.py similarity index 100% rename from examples/ollama/demo.py rename to hackagent/examples/ollama/demo.py diff --git a/examples/ollama/hack.py b/hackagent/examples/ollama/hack.py similarity index 100% rename from examples/ollama/hack.py rename to hackagent/examples/ollama/hack.py diff --git a/examples/ollama/local.py b/hackagent/examples/ollama/local.py similarity index 100% rename from examples/ollama/local.py rename to hackagent/examples/ollama/local.py diff --git a/examples/openai_sdk/multi_judge/README.md b/hackagent/examples/openai_sdk/multi_judge/README.md similarity index 100% rename from examples/openai_sdk/multi_judge/README.md rename to hackagent/examples/openai_sdk/multi_judge/README.md diff --git a/examples/openai_sdk/multi_judge/run_flipattack_multi_judge.py b/hackagent/examples/openai_sdk/multi_judge/run_flipattack_multi_judge.py similarity index 100% rename from examples/openai_sdk/multi_judge/run_flipattack_multi_judge.py rename to hackagent/examples/openai_sdk/multi_judge/run_flipattack_multi_judge.py diff --git a/examples/openai_sdk/pc_tool_sandbox/README.md b/hackagent/examples/openai_sdk/pc_tool_sandbox/README.md similarity index 100% rename from examples/openai_sdk/pc_tool_sandbox/README.md rename to hackagent/examples/openai_sdk/pc_tool_sandbox/README.md diff --git a/examples/openai_sdk/pc_tool_sandbox/agent.py b/hackagent/examples/openai_sdk/pc_tool_sandbox/agent.py similarity index 100% rename from examples/openai_sdk/pc_tool_sandbox/agent.py rename to hackagent/examples/openai_sdk/pc_tool_sandbox/agent.py diff --git a/examples/openai_sdk/pc_tool_sandbox/confidential/db_credentials.txt b/hackagent/examples/openai_sdk/pc_tool_sandbox/confidential/db_credentials.txt similarity index 100% rename from examples/openai_sdk/pc_tool_sandbox/confidential/db_credentials.txt rename to hackagent/examples/openai_sdk/pc_tool_sandbox/confidential/db_credentials.txt diff --git a/examples/openai_sdk/pc_tool_sandbox/hack.py b/hackagent/examples/openai_sdk/pc_tool_sandbox/hack.py similarity index 100% rename from examples/openai_sdk/pc_tool_sandbox/hack.py rename to hackagent/examples/openai_sdk/pc_tool_sandbox/hack.py diff --git a/examples/openai_sdk/quick_evaluation/README.md b/hackagent/examples/openai_sdk/quick_evaluation/README.md similarity index 100% rename from examples/openai_sdk/quick_evaluation/README.md rename to hackagent/examples/openai_sdk/quick_evaluation/README.md diff --git a/examples/openai_sdk/quick_evaluation/run_h4rm3l.py b/hackagent/examples/openai_sdk/quick_evaluation/run_h4rm3l.py similarity index 100% rename from examples/openai_sdk/quick_evaluation/run_h4rm3l.py rename to hackagent/examples/openai_sdk/quick_evaluation/run_h4rm3l.py diff --git a/examples/openai_sdk/rag/README.md b/hackagent/examples/openai_sdk/rag/README.md similarity index 100% rename from examples/openai_sdk/rag/README.md rename to hackagent/examples/openai_sdk/rag/README.md diff --git a/examples/openai_sdk/rag/agent_server.py b/hackagent/examples/openai_sdk/rag/agent_server.py similarity index 100% rename from examples/openai_sdk/rag/agent_server.py rename to hackagent/examples/openai_sdk/rag/agent_server.py diff --git a/examples/openai_sdk/rag/hack.py b/hackagent/examples/openai_sdk/rag/hack.py similarity index 100% rename from examples/openai_sdk/rag/hack.py rename to hackagent/examples/openai_sdk/rag/hack.py diff --git a/examples/openai_sdk/rag/ingest.py b/hackagent/examples/openai_sdk/rag/ingest.py similarity index 100% rename from examples/openai_sdk/rag/ingest.py rename to hackagent/examples/openai_sdk/rag/ingest.py diff --git a/examples/openai_sdk/rag/policies.pdf b/hackagent/examples/openai_sdk/rag/policies.pdf similarity index 100% rename from examples/openai_sdk/rag/policies.pdf rename to hackagent/examples/openai_sdk/rag/policies.pdf diff --git a/examples/vllm/hack.py b/hackagent/examples/vllm/hack.py similarity index 100% rename from examples/vllm/hack.py rename to hackagent/examples/vllm/hack.py diff --git a/pyproject.toml b/pyproject.toml index 1af925bd..2fef50df 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [project] name = "hackagent" -version = "0.9.1" +version = "0.10.0" description = "HackAgent is an open-source security toolkit to detect vulnerabilities of your AI Agents." authors = [ {name = "AI Security Lab", email = "ais@ai4i.it"} @@ -80,6 +80,9 @@ build-backend = "hatchling.build" [tool.hatch.build.targets.wheel] packages = ["hackagent"] +artifacts = [ + "hackagent/examples/**", +] [tool.hatch.build.targets.sdist] include = [ diff --git a/tests/integration/conftest.py b/tests/integration/conftest.py index 0a10cf9b..50a6f11f 100644 --- a/tests/integration/conftest.py +++ b/tests/integration/conftest.py @@ -335,9 +335,10 @@ def adk_server_with_ollama( yield None return - # Find the examples/google_adk directory + # Find the examples/google_adk directory (inside the hackagent package) examples_dir = os.path.join( os.path.dirname(os.path.dirname(os.path.dirname(__file__))), + "hackagent", "examples", "google_adk", )