hyperplane-eval 0.1.8__tar.gz → 0.1.9__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {hyperplane_eval-0.1.8/hyperplane_eval.egg-info → hyperplane_eval-0.1.9}/PKG-INFO +3 -2
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/README.md +2 -1
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/evaluator.py +6 -4
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/__init__.py +1 -1
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9/hyperplane_eval.egg-info}/PKG-INFO +3 -2
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/setup.py +1 -1
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/LICENSE +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/MANIFEST.in +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/app.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/llms/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/llms/llm_client.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/local_bindings/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/local_bindings/executor.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/local_bindings/scanner.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/runners/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/cli/runners/agent_runner.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/config.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/adversarial_features.json +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/conversational_features.json +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/prompt_feature.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/base.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/evaluated.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/executed.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/synthesized.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/input_space.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/input_space_factory.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/orchestrator.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/plane_evaluator.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/analyser.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/templates/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/evaluator.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/generator.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/navigator.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/llms/schema_prompt.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/prompt_loader.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/dimension_mitigation.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/vulnerability_patch.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_sys.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_user.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/brainstorm_sys.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/brainstorm_user.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_sys.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_user.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/judge.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/__init__.py +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/continue_sys.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/continue_user.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/copyeditor_sys.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/copyeditor_user.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/eval_checks_sys.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/eval_checks_user.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_sys.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_user.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/SOURCES.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/dependency_links.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/entry_points.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/requires.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/top_level.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/requirements.txt +0 -0
- {hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/setup.cfg +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: hyperplane-eval
|
|
3
|
-
Version: 0.1.8
|
|
3
|
+
Version: 0.1.9
|
|
4
4
|
Summary: Local tool to evaluate AI agents and find their weak points.
|
|
5
5
|
Author: Marten Panchev
|
|
6
6
|
Author-email: marten@aquithm.com
|
|
@@ -110,7 +110,8 @@ evaluator = Evaluator(
|
|
|
110
110
|
agent_desc="A helpful AI assistant",
|
|
111
111
|
param_desc={"prompt": "The user input prompt"},
|
|
112
112
|
target_callable=my_agent,
|
|
113
|
-
llm_client=router
|
|
113
|
+
llm_client=router,
|
|
114
|
+
model_name="gpt-4o"
|
|
114
115
|
)
|
|
115
116
|
|
|
116
117
|
# 4. Add constraints and run
|
|
@@ -21,6 +21,7 @@ class Evaluator:
|
|
|
21
21
|
param_desc: dict,
|
|
22
22
|
target_callable: Callable,
|
|
23
23
|
llm_client: litellm.Router,
|
|
24
|
+
model_name: str,
|
|
24
25
|
):
|
|
25
26
|
"""
|
|
26
27
|
Initialize the Evaluator.
|
|
@@ -35,6 +36,7 @@ class Evaluator:
|
|
|
35
36
|
self.param_desc = param_desc
|
|
36
37
|
self.target_callable = target_callable
|
|
37
38
|
self.llm_client = llm_client
|
|
39
|
+
self.model_name = model_name
|
|
38
40
|
|
|
39
41
|
def run(
|
|
40
42
|
self,
|
|
@@ -83,9 +85,9 @@ class Evaluator:
|
|
|
83
85
|
|
|
84
86
|
# 3. Resolve LLM configuration
|
|
85
87
|
class RouterWrapper(LLMClient):
|
|
86
|
-
def __init__(self, router):
|
|
88
|
+
def __init__(self, router, model_name):
|
|
87
89
|
self.router = router
|
|
88
|
-
self.model =
|
|
90
|
+
self.model = model_name
|
|
89
91
|
self._semaphore = asyncio.Semaphore(10)
|
|
90
92
|
|
|
91
93
|
async def generate(
|
|
@@ -97,7 +99,7 @@ class Evaluator:
|
|
|
97
99
|
prompt += "\n\n" + load_prompt("llms/schema_prompt", schema=schema_str)
|
|
98
100
|
|
|
99
101
|
kwargs = {
|
|
100
|
-
"model":
|
|
102
|
+
"model": self.model,
|
|
101
103
|
"messages": [{"role": "user", "content": prompt}],
|
|
102
104
|
"temperature": temperature,
|
|
103
105
|
"response_format": {"type": "json_object"},
|
|
@@ -108,7 +110,7 @@ class Evaluator:
|
|
|
108
110
|
except Exception as e:
|
|
109
111
|
raise RuntimeError(f"LLM Server Error: {e}")
|
|
110
112
|
|
|
111
|
-
llm_client_resolved = RouterWrapper(self.llm_client)
|
|
113
|
+
llm_client_resolved = RouterWrapper(self.llm_client, self.model_name)
|
|
112
114
|
|
|
113
115
|
# 4. Setup Custom Execution Environment
|
|
114
116
|
selected_func = {
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: hyperplane-eval
|
|
3
|
-
Version: 0.1.8
|
|
3
|
+
Version: 0.1.9
|
|
4
4
|
Summary: Local tool to evaluate AI agents and find their weak points.
|
|
5
5
|
Author: Marten Panchev
|
|
6
6
|
Author-email: marten@aquithm.com
|
|
@@ -110,7 +110,8 @@ evaluator = Evaluator(
|
|
|
110
110
|
agent_desc="A helpful AI assistant",
|
|
111
111
|
param_desc={"prompt": "The user input prompt"},
|
|
112
112
|
target_callable=my_agent,
|
|
113
|
-
llm_client=router
|
|
113
|
+
llm_client=router,
|
|
114
|
+
model_name="gpt-4o"
|
|
114
115
|
)
|
|
115
116
|
|
|
116
117
|
# 4. Add constraints and run
|
|
@@ -13,7 +13,7 @@ except FileNotFoundError:
|
|
|
13
13
|
|
|
14
14
|
setup(
|
|
15
15
|
name="hyperplane-eval",
|
|
16
|
-
version="0.1.8",
|
|
16
|
+
version="0.1.9",
|
|
17
17
|
description="Local tool to evaluate AI agents and find their weak points. ",
|
|
18
18
|
long_description=long_description,
|
|
19
19
|
long_description_content_type="text/markdown",
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/evaluated.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/executed.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/synthesized.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/input_space.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/templates/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/vulnerability_patch.txt
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_sys.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_user.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/brainstorm_sys.txt
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_sys.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_user.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/judge.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/continue_sys.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_sys.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_user.txt
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.8 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|