hyperplane-eval 0.1.7__tar.gz → 0.1.9__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {hyperplane_eval-0.1.7/hyperplane_eval.egg-info → hyperplane_eval-0.1.9}/PKG-INFO +3 -2
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/README.md +2 -1
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/evaluator.py +6 -4
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/__init__.py +1 -1
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/analyser.py +2 -2
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9/hyperplane_eval.egg-info}/PKG-INFO +3 -2
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/setup.py +1 -1
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/LICENSE +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/MANIFEST.in +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/app.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/llms/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/llms/llm_client.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/local_bindings/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/local_bindings/executor.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/local_bindings/scanner.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/runners/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/cli/runners/agent_runner.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/config.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/adversarial_features.json +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/conversational_features.json +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/dimensions/prompt_feature.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/base.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/evaluated.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/executed.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/synthesized.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/input_space.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/input_space_factory.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/orchestrator.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/plane_evaluator.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/templates/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/evaluator.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/generator.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/stages/navigator.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/llms/schema_prompt.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/prompt_loader.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/dimension_mitigation.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/vulnerability_patch.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_sys.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_user.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/brainstorm_sys.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/brainstorm_user.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_sys.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_user.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/judge.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/__init__.py +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/continue_sys.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/continue_user.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/copyeditor_sys.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/copyeditor_user.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/eval_checks_sys.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/eval_checks_user.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_sys.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_user.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/SOURCES.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/dependency_links.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/entry_points.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/requires.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/top_level.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/requirements.txt +0 -0
- {hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/setup.cfg +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: hyperplane-eval
|
|
3
|
-
Version: 0.1.7
|
|
3
|
+
Version: 0.1.9
|
|
4
4
|
Summary: Local tool to evaluate AI agents and find their weak points.
|
|
5
5
|
Author: Marten Panchev
|
|
6
6
|
Author-email: marten@aquithm.com
|
|
@@ -110,7 +110,8 @@ evaluator = Evaluator(
|
|
|
110
110
|
agent_desc="A helpful AI assistant",
|
|
111
111
|
param_desc={"prompt": "The user input prompt"},
|
|
112
112
|
target_callable=my_agent,
|
|
113
|
-
llm_client=router
|
|
113
|
+
llm_client=router,
|
|
114
|
+
model_name="gpt-4o"
|
|
114
115
|
)
|
|
115
116
|
|
|
116
117
|
# 4. Add constraints and run
|
|
@@ -21,6 +21,7 @@ class Evaluator:
|
|
|
21
21
|
param_desc: dict,
|
|
22
22
|
target_callable: Callable,
|
|
23
23
|
llm_client: litellm.Router,
|
|
24
|
+
model_name: str,
|
|
24
25
|
):
|
|
25
26
|
"""
|
|
26
27
|
Initialize the Evaluator.
|
|
@@ -35,6 +36,7 @@ class Evaluator:
|
|
|
35
36
|
self.param_desc = param_desc
|
|
36
37
|
self.target_callable = target_callable
|
|
37
38
|
self.llm_client = llm_client
|
|
39
|
+
self.model_name = model_name
|
|
38
40
|
|
|
39
41
|
def run(
|
|
40
42
|
self,
|
|
@@ -83,9 +85,9 @@ class Evaluator:
|
|
|
83
85
|
|
|
84
86
|
# 3. Resolve LLM configuration
|
|
85
87
|
class RouterWrapper(LLMClient):
|
|
86
|
-
def __init__(self, router):
|
|
88
|
+
def __init__(self, router, model_name):
|
|
87
89
|
self.router = router
|
|
88
|
-
self.model =
|
|
90
|
+
self.model = model_name
|
|
89
91
|
self._semaphore = asyncio.Semaphore(10)
|
|
90
92
|
|
|
91
93
|
async def generate(
|
|
@@ -97,7 +99,7 @@ class Evaluator:
|
|
|
97
99
|
prompt += "\n\n" + load_prompt("llms/schema_prompt", schema=schema_str)
|
|
98
100
|
|
|
99
101
|
kwargs = {
|
|
100
|
-
"model":
|
|
102
|
+
"model": self.model,
|
|
101
103
|
"messages": [{"role": "user", "content": prompt}],
|
|
102
104
|
"temperature": temperature,
|
|
103
105
|
"response_format": {"type": "json_object"},
|
|
@@ -108,7 +110,7 @@ class Evaluator:
|
|
|
108
110
|
except Exception as e:
|
|
109
111
|
raise RuntimeError(f"LLM Server Error: {e}")
|
|
110
112
|
|
|
111
|
-
llm_client_resolved = RouterWrapper(self.llm_client)
|
|
113
|
+
llm_client_resolved = RouterWrapper(self.llm_client, self.model_name)
|
|
112
114
|
|
|
113
115
|
# 4. Setup Custom Execution Environment
|
|
114
116
|
selected_func = {
|
|
@@ -591,7 +591,7 @@ class ResultsAnalyser:
|
|
|
591
591
|
f"- Adherence Score: {v.p_sat:.2f}\n"
|
|
592
592
|
)
|
|
593
593
|
|
|
594
|
-
from hyperplane.
|
|
594
|
+
from hyperplane.prompts.prompt_loader import load_prompt
|
|
595
595
|
|
|
596
596
|
prompt_parts.append("\n" + load_prompt("reporting/vulnerability_patch.txt"))
|
|
597
597
|
|
|
@@ -702,7 +702,7 @@ class ResultsAnalyser:
|
|
|
702
702
|
|
|
703
703
|
failing_prompts_list = "\n".join(prompt_parts)
|
|
704
704
|
|
|
705
|
-
from hyperplane.
|
|
705
|
+
from hyperplane.prompts.prompt_loader import load_prompt
|
|
706
706
|
|
|
707
707
|
prompt_template = load_prompt("reporting/dimension_mitigation.txt")
|
|
708
708
|
prompt = prompt_template.format(
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: hyperplane-eval
|
|
3
|
-
Version: 0.1.7
|
|
3
|
+
Version: 0.1.9
|
|
4
4
|
Summary: Local tool to evaluate AI agents and find their weak points.
|
|
5
5
|
Author: Marten Panchev
|
|
6
6
|
Author-email: marten@aquithm.com
|
|
@@ -110,7 +110,8 @@ evaluator = Evaluator(
|
|
|
110
110
|
agent_desc="A helpful AI assistant",
|
|
111
111
|
param_desc={"prompt": "The user input prompt"},
|
|
112
112
|
target_callable=my_agent,
|
|
113
|
-
llm_client=router
|
|
113
|
+
llm_client=router,
|
|
114
|
+
model_name="gpt-4o"
|
|
114
115
|
)
|
|
115
116
|
|
|
116
117
|
# 4. Add constraints and run
|
|
@@ -13,7 +13,7 @@ except FileNotFoundError:
|
|
|
13
13
|
|
|
14
14
|
setup(
|
|
15
15
|
name="hyperplane-eval",
|
|
16
|
-
version="0.1.7",
|
|
16
|
+
version="0.1.9",
|
|
17
17
|
description="Local tool to evaluate AI agents and find their weak points. ",
|
|
18
18
|
long_description=long_description,
|
|
19
19
|
long_description_content_type="text/markdown",
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/evaluated.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/executed.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/domain/vectors/synthesized.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/input_space/input_space.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/framework/reporting/templates/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/reporting/vulnerability_patch.txt
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_sys.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/anchors_user.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/brainstorm_sys.txt
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_sys.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/creator/refine_user.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/evaluator/judge.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/__init__.py
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/continue_sys.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_sys.txt
RENAMED
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane/prompts/stages/generator/seed_user.txt
RENAMED
|
File without changes
|
|
File without changes
|
{hyperplane_eval-0.1.7 → hyperplane_eval-0.1.9}/hyperplane_eval.egg-info/dependency_links.txt
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|