judgeval 0.0.17__py3-none-any.whl → 0.0.19__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- judgeval/__init__.py +1 -3
- judgeval/clients.py +0 -7
- judgeval/common/logger.py +0 -1
- judgeval/common/tracer.py +250 -42
- judgeval/common/utils.py +9 -5
- judgeval/constants.py +6 -1
- judgeval/data/__init__.py +2 -0
- judgeval/data/api_example.py +2 -2
- judgeval/data/datasets/__init__.py +1 -2
- judgeval/data/datasets/dataset.py +4 -5
- judgeval/data/datasets/eval_dataset_client.py +1 -2
- judgeval/data/datasets/utils.py +1 -2
- judgeval/data/example.py +71 -16
- judgeval/data/scorer_data.py +1 -1
- judgeval/evaluation_run.py +2 -2
- judgeval/judges/__init__.py +0 -1
- judgeval/judges/base_judge.py +1 -1
- judgeval/judges/mixture_of_judges.py +7 -2
- judgeval/judgment_client.py +8 -4
- judgeval/rules.py +2 -4
- judgeval/run_evaluation.py +2 -5
- judgeval/scorers/__init__.py +6 -0
- judgeval/scorers/api_scorer.py +12 -6
- judgeval/scorers/base_scorer.py +12 -6
- judgeval/scorers/judgeval_scorer.py +7 -3
- judgeval/scorers/judgeval_scorers/__init__.py +24 -3
- judgeval/scorers/judgeval_scorers/api_scorers/__init__.py +6 -0
- judgeval/scorers/judgeval_scorers/api_scorers/comparison.py +35 -0
- judgeval/scorers/judgeval_scorers/api_scorers/groundedness.py +19 -0
- judgeval/scorers/judgeval_scorers/api_scorers/instruction_adherence.py +19 -0
- judgeval/scorers/judgeval_scorers/local_implementations/__init__.py +4 -1
- judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/answer_correctness_scorer.py +0 -1
- judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/prompts.py +2 -2
- judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/answer_relevancy_scorer.py +7 -6
- judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/prompts.py +2 -2
- judgeval/scorers/judgeval_scorers/local_implementations/comparison/__init__.py +0 -0
- judgeval/scorers/judgeval_scorers/local_implementations/comparison/comparison_scorer.py +161 -0
- judgeval/scorers/judgeval_scorers/local_implementations/comparison/prompts.py +222 -0
- judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/prompts.py +2 -2
- judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/prompts.py +2 -2
- judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/prompts.py +2 -2
- judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/faithfulness_scorer.py +1 -8
- judgeval/scorers/judgeval_scorers/local_implementations/hallucination/hallucination_scorer.py +7 -6
- judgeval/scorers/judgeval_scorers/local_implementations/hallucination/prompts.py +2 -2
- judgeval/scorers/judgeval_scorers/local_implementations/instruction_adherence/instruction_adherence.py +232 -0
- judgeval/scorers/judgeval_scorers/local_implementations/instruction_adherence/prompt.py +102 -0
- judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/json_correctness_scorer.py +7 -7
- judgeval/scorers/judgeval_scorers/local_implementations/summarization/summarization_scorer.py +7 -6
- judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/tool_correctness_scorer.py +1 -2
- judgeval/scorers/prompt_scorer.py +7 -5
- judgeval/scorers/utils.py +1 -1
- {judgeval-0.0.17.dist-info → judgeval-0.0.19.dist-info}/METADATA +1 -1
- {judgeval-0.0.17.dist-info → judgeval-0.0.19.dist-info}/RECORD +56 -48
- /judgeval/data/{datasets/ground_truth.py → ground_truth.py} +0 -0
- {judgeval-0.0.17.dist-info → judgeval-0.0.19.dist-info}/WHEEL +0 -0
- {judgeval-0.0.17.dist-info → judgeval-0.0.19.dist-info}/licenses/LICENSE.md +0 -0
@@ -0,0 +1,102 @@
|
|
1
|
+
"""
|
2
|
+
Util prompts for InstructionAdherenceScorer
|
3
|
+
"""
|
4
|
+
|
5
|
+
from typing import List, Optional, Tuple
|
6
|
+
from pydantic import BaseModel, Field
|
7
|
+
|
8
|
+
|
9
|
+
class InstructionAdherenceTemplate:
    """Prompt builders for the instruction-adherence scorer.

    Both methods are pure string builders: they interpolate their arguments
    into a fixed few-shot prompt and return the resulting text. Nothing here
    calls a model or parses a response.
    """

    @staticmethod
    def get_instructions(input) -> str:
        """Build the prompt that asks a model to list the instructions in a text.

        Args:
            input: The text to break down into instructions. It is
                interpolated verbatim between the START/END OF INPUT markers.
                (The name shadows the ``input`` builtin; it is kept because it
                is part of the public signature.)

        Returns:
            The prompt string. It asks for a JSON object whose
            ``"instructions"`` key maps to a list of strings.
        """
        # The example output repeats the example text's wording ("two poems"),
        # so the few-shot sample does not teach the model to alter instructions.
        return f"""You will be presented with a piece of text. Your task is to break down the text and generate a list of the instructions contained within the text.

===== START OF EXAMPLES =====
Example 1:
Example text: Hello my name is John Doe. I like cars. Write two poems about the weather and create a joke. Also what is 5 + 5?

Output:
{{
    "instructions": ["Write two poems about the weather", "Create a joke", "What is 5 + 5?"]
}}
===== END OF EXAMPLES =====


**
IMPORTANT: Please return your answer in valid JSON format, with the "instructions" key mapping to a list of strings. No words or explanation is needed.
**

==== START OF INPUT ====
Text:
{input}
==== END OF INPUT ====

==== YOUR ANSWER ====
JSON:
"""

    @staticmethod
    def generate_verdicts(instructions, actual_output) -> str:
        """Build the prompt that asks a model to score each instruction.

        Args:
            instructions: The instructions to check. The value is interpolated
                with its default string formatting (presumably a list of
                strings, as in the example -- confirm against the caller).
            actual_output: The text to check the instructions against,
                interpolated verbatim.

        Returns:
            The prompt string. It asks for a JSON list of objects with the
            keys ``"instruction"``, ``"score"`` (1, 0.5 or 0) and ``"reason"``.
        """
        # The example answer is a bare JSON array. Wrapping the array in an
        # extra pair of braces would render as `{ [ ... ] }`, which is not
        # valid JSON and contradicts the "list of JSON objects" instruction.
        return f"""
You will be presented with a list of instructions and a piece of text. For each instruction, determine if the instruction was completed in the text. There are 3 categories: either completed, partially completed, or not completed. The scores for these will be 1, 0.5, and 0 respectively.
Go through each instruction and provide score for each instruction as well as the reasoning for that score.

==== FORMATTING YOUR ANSWER ====
Please return your answer in JSON format, with a list of JSON objects with keys "instruction", "score", and "reason". No words or explanation beyond the output JSON is needed.


===== START OF EXAMPLES =====
Example 1:
instructions: ["Write two poems about the weather", "Create a joke", "What is 5 + 5?"]
output: Poem 1: The Sun's Embrace
The sun climbs high, a golden flame,
It whispers warmth, it calls my name.
The sky, a canvas, blue and clear,
A perfect day for cars, my dear.

The asphalt hums beneath the wheels,
A symphony of speed it feels.
The weather smiles, no clouds in sight,
A driver's joy, pure delight.

Poem 2: The Storm's Dance
A sunlit meadow, alive with whispers of wind, where daisies dance and hope begins again. Each petal holds a promise—bright, unbruised— a symphony of light that cannot be refused.

Joke
Why dont cars ever get cold in the winter?
Because they have radiators!

Math Answer
5 + 5 = 10

YOUR JSON OUTPUT:
[
    {{
        "instruction": "Write two poems about the weather",
        "score": 0.5,
        "reason": "The output contained one poem about the weather, but the other poem was not about the weather."
    }},
    {{
        "instruction": "Create a joke",
        "score": 1,
        "reason": "There was a joke created in the output."
    }},
    {{
        "instruction": "What is 5 + 5?",
        "score": 1,
        "reason": "The answer to the math question was provided in the output."
    }}
]
===== END OF EXAMPLES =====

==== START OF INPUT ====
instructions: {instructions}
output: {actual_output}
==== END OF INPUT ====

==== YOUR ANSWER ====
JSON:
"""
|
102
|
+
|
judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/json_correctness_scorer.py
CHANGED
@@ -1,15 +1,15 @@
|
|
1
|
-
from typing import
|
1
|
+
from typing import Optional, Union, Any
|
2
2
|
from pydantic import BaseModel, ValidationError, create_model
|
3
3
|
|
4
4
|
from judgeval.constants import APIScorer
|
5
5
|
from judgeval.judges import JudgevalJudge
|
6
6
|
from judgeval.judges.utils import create_judge
|
7
|
-
from judgeval.scorers.utils import (
|
8
|
-
|
9
|
-
|
10
|
-
|
11
|
-
|
12
|
-
|
7
|
+
from judgeval.scorers.utils import (
|
8
|
+
get_or_create_event_loop,
|
9
|
+
scorer_progress_meter,
|
10
|
+
create_verbose_logs,
|
11
|
+
check_example_params
|
12
|
+
)
|
13
13
|
from judgeval.scorers import JudgevalScorer
|
14
14
|
from judgeval.data import Example, ExampleParams
|
15
15
|
|
judgeval/scorers/judgeval_scorers/local_implementations/summarization/summarization_scorer.py
CHANGED
@@ -2,12 +2,13 @@ from typing import List, Optional, Union
|
|
2
2
|
import asyncio
|
3
3
|
|
4
4
|
from judgeval.constants import APIScorer
|
5
|
-
from judgeval.scorers.utils import (
|
6
|
-
|
7
|
-
|
8
|
-
|
9
|
-
|
10
|
-
|
5
|
+
from judgeval.scorers.utils import (
|
6
|
+
get_or_create_event_loop,
|
7
|
+
scorer_progress_meter,
|
8
|
+
create_verbose_logs,
|
9
|
+
parse_response_json,
|
10
|
+
check_example_params
|
11
|
+
)
|
11
12
|
from judgeval.scorers import JudgevalScorer
|
12
13
|
from judgeval.judges import JudgevalJudge
|
13
14
|
from judgeval.judges.utils import create_judge
|
judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/tool_correctness_scorer.py
CHANGED
@@ -1,10 +1,9 @@
|
|
1
|
-
from typing import List
|
1
|
+
from typing import List
|
2
2
|
|
3
3
|
from judgeval.constants import APIScorer
|
4
4
|
from judgeval.scorers.utils import (
|
5
5
|
scorer_progress_meter,
|
6
6
|
create_verbose_logs,
|
7
|
-
parse_response_json,
|
8
7
|
check_example_params
|
9
8
|
)
|
10
9
|
from judgeval.data import Example, ExampleParams
|
@@ -26,15 +26,17 @@ NOTE: When implementing build_measure_prompt and build_schema:
|
|
26
26
|
"""
|
27
27
|
|
28
28
|
from abc import abstractmethod
|
29
|
-
from typing import List, Optional,
|
29
|
+
from typing import List, Optional, Tuple, Any, Mapping
|
30
30
|
from pydantic import BaseModel, model_serializer, Field
|
31
31
|
|
32
32
|
from judgeval.data import Example
|
33
33
|
from judgeval.scorers import JudgevalScorer
|
34
|
-
from judgeval.scorers.utils import (
|
35
|
-
|
36
|
-
|
37
|
-
|
34
|
+
from judgeval.scorers.utils import (
|
35
|
+
scorer_progress_meter,
|
36
|
+
parse_response_json,
|
37
|
+
get_or_create_event_loop,
|
38
|
+
create_verbose_logs
|
39
|
+
)
|
38
40
|
|
39
41
|
|
40
42
|
class ReasonScore(BaseModel):
|
judgeval/scorers/utils.py
CHANGED
@@ -11,7 +11,7 @@ import re
|
|
11
11
|
from contextlib import contextmanager
|
12
12
|
from rich.progress import Progress, SpinnerColumn, TextColumn
|
13
13
|
from rich.console import Console
|
14
|
-
from typing import List, Optional
|
14
|
+
from typing import List, Optional
|
15
15
|
|
16
16
|
from judgeval.scorers import JudgevalScorer
|
17
17
|
from judgeval.data import Example, ExampleParams
|
@@ -1,86 +1,94 @@
|
|
1
|
-
judgeval/__init__.py,sha256=
|
2
|
-
judgeval/clients.py,sha256=
|
3
|
-
judgeval/constants.py,sha256=
|
4
|
-
judgeval/evaluation_run.py,sha256=
|
5
|
-
judgeval/judgment_client.py,sha256=
|
6
|
-
judgeval/rules.py,sha256=
|
7
|
-
judgeval/run_evaluation.py,sha256=
|
1
|
+
judgeval/__init__.py,sha256=dtXxsCmI4eEsZdGSUMy8P_pA0bc2-OSGAgb2C__yJoA,252
|
2
|
+
judgeval/clients.py,sha256=6VQmEqmfCngUdS2MuPBIpHvtDFqOENm8-_BmMvjLyRQ,944
|
3
|
+
judgeval/constants.py,sha256=BXTzKBmhDVutiitaCRarfkc_M-0NplRJofIt_QSa5QI,5010
|
4
|
+
judgeval/evaluation_run.py,sha256=RgJD60lJsunNQzObjo7iXnAzXWgubCLOAAuuamAAuoI,6354
|
5
|
+
judgeval/judgment_client.py,sha256=evlvcrYO9pF-oCgcvlGE59iODN0C6GJtn7bySFU_88k,23384
|
6
|
+
judgeval/rules.py,sha256=ebsiDEBVAnYTQxwVNvh_RpmKeWBnjQXgHs8KofTjcAs,15526
|
7
|
+
judgeval/run_evaluation.py,sha256=yLW24kFcw0xzXHvnDclYqtujTww6SDwvut6HM1x7SXk,21505
|
8
8
|
judgeval/common/__init__.py,sha256=7d24BRxtncpMj3AAJCj8RS7TqgjXmW777HVZH6-3sBs,289
|
9
9
|
judgeval/common/exceptions.py,sha256=U-TxHLn7oVMezsMuoYouNDb2XuS8RCggfntYf5_6u4E,565
|
10
|
-
judgeval/common/logger.py,sha256=
|
11
|
-
judgeval/common/tracer.py,sha256=
|
12
|
-
judgeval/common/utils.py,sha256=
|
13
|
-
judgeval/data/__init__.py,sha256=
|
14
|
-
judgeval/data/api_example.py,sha256=
|
15
|
-
judgeval/data/example.py,sha256=
|
10
|
+
judgeval/common/logger.py,sha256=KO75wWXCxhUHUMvLaTU31ZzOk6tkZBa7heQ7y0f-zFE,6062
|
11
|
+
judgeval/common/tracer.py,sha256=tTG4VZRXJjilm0ltQCeXJvd7TiL9W1PSVaf0LOmw2C4,44430
|
12
|
+
judgeval/common/utils.py,sha256=LUQV5JfDr6wj7xHAJoNq-gofNZ6mjXbeKrGKzBME1KM,33533
|
13
|
+
judgeval/data/__init__.py,sha256=QykVE22Qf-I2f1g-jC9-iQyLNXgDmX1-vHbCgZg8Ra8,558
|
14
|
+
judgeval/data/api_example.py,sha256=NEiJKpf2WIo4FPQ2-vuoCZ_9ixexhdg_wdNYWXPSA2M,4094
|
15
|
+
judgeval/data/example.py,sha256=PHqRI8l94ylLgfgjIH4DqcFFHb-t-WBxRkZb9eXKlpI,5648
|
16
|
+
judgeval/data/ground_truth.py,sha256=OTBs3VZe-Wp0vEXEsq14GPZHYtpWT16bhGQTycIvkKc,2057
|
16
17
|
judgeval/data/result.py,sha256=8FIO-bFKPegZuByKRjA2_sumjb8oGWQ5ZeQ1RVz5z2w,4393
|
17
|
-
judgeval/data/scorer_data.py,sha256=
|
18
|
-
judgeval/data/datasets/__init__.py,sha256=
|
19
|
-
judgeval/data/datasets/dataset.py,sha256=
|
20
|
-
judgeval/data/datasets/eval_dataset_client.py,sha256=
|
21
|
-
judgeval/data/datasets/
|
22
|
-
judgeval/
|
23
|
-
judgeval/judges/
|
24
|
-
judgeval/judges/base_judge.py,sha256=qhYSFxE21WajYNaT4X-qwWGtpo_tqzBzdqbszSheSD8,1000
|
18
|
+
judgeval/data/scorer_data.py,sha256=JVlaTx1EP2jw2gh3Vgx1CSEsvIFABAN26IquKyxwiJQ,3273
|
19
|
+
judgeval/data/datasets/__init__.py,sha256=IdNKhQv9yYZ_op0rdBacrFaFVmiiYQ3JTzXzxOTsEVQ,176
|
20
|
+
judgeval/data/datasets/dataset.py,sha256=0NItb98Yz0P954rg9FF9s09uVQ7cEg9A5J6Xvie9nhw,12022
|
21
|
+
judgeval/data/datasets/eval_dataset_client.py,sha256=QsfHyFC4WePV7uJGYUVjiIwtk1Ie_VpWUrnd2Q4kKdU,11479
|
22
|
+
judgeval/data/datasets/utils.py,sha256=6DpGCPmGFNOKIGNcVCOSjTOdWemrpAuYnlo778sGG7g,2455
|
23
|
+
judgeval/judges/__init__.py,sha256=6X7VSwrwsdxGBNxCyapVRWGghhKOy3MVxFNMQ62kCXM,308
|
24
|
+
judgeval/judges/base_judge.py,sha256=ch_S7uBB7lyv44Lf1d7mIGFpveOO58zOkkpImKgd9_4,994
|
25
25
|
judgeval/judges/litellm_judge.py,sha256=EIL58Teptv8DzZUO3yP2RDQCDq-aoBB6HPZzPdK6KTg,2424
|
26
|
-
judgeval/judges/mixture_of_judges.py,sha256=
|
26
|
+
judgeval/judges/mixture_of_judges.py,sha256=IJoi4Twk8ze1CJWVEp69k6TSqTCTGrmVYQ0qdffer60,15549
|
27
27
|
judgeval/judges/together_judge.py,sha256=l00hhPerAZXg3oYBd8cyMtWsOTNt_0FIqoxhKJKQe3k,2302
|
28
28
|
judgeval/judges/utils.py,sha256=9lvUxziGV86ISvVFxYBWc09TWFyAQgUTyPf_a9mD5Rs,2686
|
29
|
-
judgeval/scorers/__init__.py,sha256=
|
30
|
-
judgeval/scorers/api_scorer.py,sha256=
|
31
|
-
judgeval/scorers/base_scorer.py,sha256=
|
29
|
+
judgeval/scorers/__init__.py,sha256=_KP6c1dr6O2p95hx_WvRpZXfSGg9r2hNn_PjY9Ch5ds,1160
|
30
|
+
judgeval/scorers/api_scorer.py,sha256=wGqTQCbUE7uE-PzaKcCmexAqutdTunjFR0zVA6bUxdE,2518
|
31
|
+
judgeval/scorers/base_scorer.py,sha256=xdUlY3CnLdCQ1Z5iUeY22Bim5v-OQruZmaVF_4Y1mC0,2183
|
32
32
|
judgeval/scorers/exceptions.py,sha256=eGW5CuJgZ5YJBFrE4FHDSF651PO1dKAZ379mJ8gOsfo,178
|
33
|
-
judgeval/scorers/judgeval_scorer.py,sha256=
|
34
|
-
judgeval/scorers/prompt_scorer.py,sha256=
|
33
|
+
judgeval/scorers/judgeval_scorer.py,sha256=oIkfoGXA09wL_vcK1DRibzQSA-MFNa-hmw1IhGBErf8,6592
|
34
|
+
judgeval/scorers/prompt_scorer.py,sha256=PaAs2qRolw1P3_I061Xvk9qzvF4O-JR8g_39RqXnHcM,17728
|
35
35
|
judgeval/scorers/score.py,sha256=GALVmeApP1Cyih2vY93zRaU6RShtW4jJDG47Pm6yfnw,18657
|
36
|
-
judgeval/scorers/utils.py,sha256=
|
37
|
-
judgeval/scorers/judgeval_scorers/__init__.py,sha256
|
38
|
-
judgeval/scorers/judgeval_scorers/api_scorers/__init__.py,sha256=
|
36
|
+
judgeval/scorers/utils.py,sha256=iHQVTlIANbmCTXz9kTeSdOytgUZ_T74Re61ajqsk_WQ,6827
|
37
|
+
judgeval/scorers/judgeval_scorers/__init__.py,sha256=-nnqz-aU5PB_m1cb-2ySpZ18WDxupxmQCr-ws0aSalw,6000
|
38
|
+
judgeval/scorers/judgeval_scorers/api_scorers/__init__.py,sha256=cJSwTA6hqZXUSaPkTl4yDyl3cUzv0IlcTu592uoTY98,1651
|
39
39
|
judgeval/scorers/judgeval_scorers/api_scorers/answer_correctness.py,sha256=690G5askjE8dcbKPGvCF6JxAEM9QJUqb-3K-D6lI6oM,463
|
40
40
|
judgeval/scorers/judgeval_scorers/api_scorers/answer_relevancy.py,sha256=CqvvjV7AZqPlXh-PZaPKYPILHr15u4bIYiKBFjlk5i0,457
|
41
|
+
judgeval/scorers/judgeval_scorers/api_scorers/comparison.py,sha256=6Q1qbsANOoZ3PM8n_gtZLIMbTBB9879L3acRelNJ6Uk,1001
|
41
42
|
judgeval/scorers/judgeval_scorers/api_scorers/contextual_precision.py,sha256=2zBrm_EEc143bmPA4HVcf8XtQeuc_BexczGx-SHlwRY,473
|
42
43
|
judgeval/scorers/judgeval_scorers/api_scorers/contextual_recall.py,sha256=NyojBWy_lRYx8diREulSK8s9dfYdZav4eZjg3TwUm0M,461
|
43
44
|
judgeval/scorers/judgeval_scorers/api_scorers/contextual_relevancy.py,sha256=wROMWOliCnB39ftX9TdeZmG9y0vrnxIGVby65tLOQRU,574
|
44
45
|
judgeval/scorers/judgeval_scorers/api_scorers/faithfulness.py,sha256=gNf_i5c0jjpz2zCGhe7TtDMLKxc1PdOExJMFB5X7hSg,442
|
46
|
+
judgeval/scorers/judgeval_scorers/api_scorers/groundedness.py,sha256=esO76hEp0NzeBUdoSICPLdx5AeA5zWSt_2zpcSgvGis,442
|
45
47
|
judgeval/scorers/judgeval_scorers/api_scorers/hallucination.py,sha256=ffYwH3CexPkKgo1rCALMivypROQjG5WWEsKXEFZxe2k,446
|
48
|
+
judgeval/scorers/judgeval_scorers/api_scorers/instruction_adherence.py,sha256=t1lWYOF0Pxvw5-NrI1Dt9FojaOncOCRlZc4a2SA20h4,477
|
46
49
|
judgeval/scorers/judgeval_scorers/api_scorers/json_correctness.py,sha256=CAZBQKwNSqpqAoOgStYfr-yP1Brug_6VRimRIQY-zdg,894
|
47
50
|
judgeval/scorers/judgeval_scorers/api_scorers/summarization.py,sha256=-E3oxYbI0D_0q-_fGWh2jQHW9O4Pu7I7xvLWsHU6cn8,450
|
48
51
|
judgeval/scorers/judgeval_scorers/api_scorers/tool_correctness.py,sha256=17ppPXm962ew67GU5m0npzbPu3CuhgdKY_KmfPvKfu4,457
|
49
52
|
judgeval/scorers/judgeval_scorers/classifiers/__init__.py,sha256=Qt81W5ZCwMvBAne0LfQDb8xvg5iOG1vEYP7WizgwAZo,67
|
50
53
|
judgeval/scorers/judgeval_scorers/classifiers/text2sql/__init__.py,sha256=8iTzMvou1Dr8pybul6lZHKjc9Ye2-0_racRGYkhEdTY,74
|
51
54
|
judgeval/scorers/judgeval_scorers/classifiers/text2sql/text2sql_scorer.py,sha256=ly72Z7s_c8NID6-nQnuW8qEGEW2MqdvpJ-5WfXzbAQg,2579
|
52
|
-
judgeval/scorers/judgeval_scorers/local_implementations/__init__.py,sha256=
|
55
|
+
judgeval/scorers/judgeval_scorers/local_implementations/__init__.py,sha256=pipWXfS_n4UsnZViwZAF2bPB1FYNfmoJAJUNY7JSq7I,1937
|
53
56
|
judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/__init__.py,sha256=cxxUEspgoIdSzJbwIIioamC0-xDqhYVfYAWxaYF-D_Y,177
|
54
|
-
judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/answer_correctness_scorer.py,sha256=
|
55
|
-
judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/prompts.py,sha256=
|
57
|
+
judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/answer_correctness_scorer.py,sha256=3Dpm8BIIe0Th2p0ccO5bb-le93lywjOLSo712HwEIUE,10196
|
58
|
+
judgeval/scorers/judgeval_scorers/local_implementations/answer_correctness/prompts.py,sha256=hBUqEd8Hy3g8peOVjpSmRb31fPtpodDzdRUonhKRl30,6686
|
56
59
|
judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/__init__.py,sha256=r6yae5iaWtlBL_cP8I-1SuhS9dulsy1e7W9Rcz82v6E,169
|
57
|
-
judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/answer_relevancy_scorer.py,sha256=
|
58
|
-
judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/prompts.py,sha256
|
60
|
+
judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/answer_relevancy_scorer.py,sha256=qoeoFyXXDtqqc7ZSLajqexeSxw5STmrL-uPQIMY3zSw,10529
|
61
|
+
judgeval/scorers/judgeval_scorers/local_implementations/answer_relevancy/prompts.py,sha256=-OO3QmkXqGCvdIRKsAuT4wQ1ZqWBQDdb1j3lc3W9q3w,6540
|
62
|
+
judgeval/scorers/judgeval_scorers/local_implementations/comparison/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
63
|
+
judgeval/scorers/judgeval_scorers/local_implementations/comparison/comparison_scorer.py,sha256=QnwSTgYx_zyz6K27WTe89MoTcO12WYn_jqE_xj7_H2U,5497
|
64
|
+
judgeval/scorers/judgeval_scorers/local_implementations/comparison/prompts.py,sha256=c49aCzyxCogjUTipQUmS13LemFC89X9xEuPNQ_LVHgw,31345
|
59
65
|
judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/__init__.py,sha256=J6tc-T60AVOEaNVuoVU0XIG6dvQri99Q0tnX_Tm-0vc,108
|
60
66
|
judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/contextual_precision_scorer.py,sha256=tRgRyjGpc4Pe3nQ1c-5NeNYFvbulL7YEnoRa9zLp1gc,9649
|
61
|
-
judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/prompts.py,sha256=
|
67
|
+
judgeval/scorers/judgeval_scorers/local_implementations/contextual_precision/prompts.py,sha256=pN0AURDWSV3iGt11MtJIwzXMuKbM4oC3zdb9yqnjNdU,4875
|
62
68
|
judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/__init__.py,sha256=4kjfqD_95muHZFo75S8_fbTcC1DI1onNIfMmr8gMZaI,99
|
63
69
|
judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/contextual_recall_scorer.py,sha256=hwAv_x3XwGDnSW3a75CTCgIW6eVg8ymdjDdJQvw5p0Y,9260
|
64
|
-
judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/prompts.py,sha256=
|
70
|
+
judgeval/scorers/judgeval_scorers/local_implementations/contextual_recall/prompts.py,sha256=k5xdCw8gnBvG1_dDSbtBftDDtOZ4qKL2-iQ9AQHsuUI,6541
|
65
71
|
judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/__init__.py,sha256=JPCvrekKLbl_xdD49evhtiFIVocuegCpCBkn1auzTSE,184
|
66
72
|
judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/contextual_relevancy_scorer.py,sha256=BtVgE7z-9PHfFRcvn96aEG5mXVcWBweVyty934hZdiU,8915
|
67
|
-
judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/prompts.py,sha256=
|
73
|
+
judgeval/scorers/judgeval_scorers/local_implementations/contextual_relevancy/prompts.py,sha256=uO-8Uo7VrXu4xWpxjIx6_UI3aw5KuJxubSHb71Nzm6Q,4574
|
68
74
|
judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/__init__.py,sha256=NbkSqPwxgF4T8KsvuIWhVyRwdOlo7mNHMFuRStTFnvk,154
|
69
|
-
judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/faithfulness_scorer.py,sha256=
|
75
|
+
judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/faithfulness_scorer.py,sha256=LPVTGHBBJSpE6TrgzZQS2_vw4P9HiUYmykrwo6UMdws,11251
|
70
76
|
judgeval/scorers/judgeval_scorers/local_implementations/faithfulness/prompts.py,sha256=vNLjF4NKZJSV4VNenHzoAUB2xVZz6tt_5AzryKmOVrI,11690
|
71
77
|
judgeval/scorers/judgeval_scorers/local_implementations/hallucination/__init__.py,sha256=fZk3UQxI9Nljf5qjCRLRkF0D-AERFHElI9cC83_cgV8,158
|
72
|
-
judgeval/scorers/judgeval_scorers/local_implementations/hallucination/hallucination_scorer.py,sha256=
|
73
|
-
judgeval/scorers/judgeval_scorers/local_implementations/hallucination/prompts.py,sha256=
|
78
|
+
judgeval/scorers/judgeval_scorers/local_implementations/hallucination/hallucination_scorer.py,sha256=q9qdmwq96stbTRVA4Egv9eO1KI8zf77jwYkZXaOZePw,9511
|
79
|
+
judgeval/scorers/judgeval_scorers/local_implementations/hallucination/prompts.py,sha256=TJWKheQnaJ-pdVzkOTDr3BNZ9bfCrC81S3kvjm4Zjh8,4329
|
80
|
+
judgeval/scorers/judgeval_scorers/local_implementations/instruction_adherence/instruction_adherence.py,sha256=keZRmLe5oyIVE98h1nOiW54__xcEv2QInwZcJ34ZKhs,8175
|
81
|
+
judgeval/scorers/judgeval_scorers/local_implementations/instruction_adherence/prompt.py,sha256=jv-1Z7K1EhLjy4NGKS35cIcShh7ZDQCXVPqoJnAnDqk,3598
|
74
82
|
judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/__init__.py,sha256=xQDw7o9JQ6qajusPnBH0MWBRJ5ct_Ao3pJELXxxVMRo,175
|
75
|
-
judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/json_correctness_scorer.py,sha256=
|
83
|
+
judgeval/scorers/judgeval_scorers/local_implementations/json_correctness/json_correctness_scorer.py,sha256=RkI-mARc2AYCw5dTb5OSY4UWXIwDcYS3ViiJOVIq0Nw,4339
|
76
84
|
judgeval/scorers/judgeval_scorers/local_implementations/summarization/__init__.py,sha256=mv6-XeLSV5yj1H98YYV2iTYVd88zKftZJP42Lgl6R80,89
|
77
85
|
judgeval/scorers/judgeval_scorers/local_implementations/summarization/prompts.py,sha256=6GnRz2h-6Fwt4sl__0RgQOyo3n3iDO4MNuHWxdu-rrM,10242
|
78
|
-
judgeval/scorers/judgeval_scorers/local_implementations/summarization/summarization_scorer.py,sha256=
|
86
|
+
judgeval/scorers/judgeval_scorers/local_implementations/summarization/summarization_scorer.py,sha256=Qk7lwHgRPYeGoxTOyclAh1VfGItfvHJ6l1t7Nk3SWFM,20927
|
79
87
|
judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/__init__.py,sha256=JUB3TMqS1OHr6PqpIGqkyiBNbyfUaw7lZuUATjU3_ek,168
|
80
|
-
judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/tool_correctness_scorer.py,sha256=
|
88
|
+
judgeval/scorers/judgeval_scorers/local_implementations/tool_correctness/tool_correctness_scorer.py,sha256=8ucE8UrA44Mr-wHgVsFNU9gKunkPxe87VPYrFVi949g,5461
|
81
89
|
judgeval/tracer/__init__.py,sha256=wy3DYpH8U_z0GO_K_gOSkK0tTTD-u5eLDo0T5xIBoAc,147
|
82
90
|
judgeval/utils/alerts.py,sha256=RgW5R9Dn3Jtim0OyAYDbNzjoX2s6SA4Mw16GyyaikjI,1424
|
83
|
-
judgeval-0.0.
|
84
|
-
judgeval-0.0.
|
85
|
-
judgeval-0.0.
|
86
|
-
judgeval-0.0.
|
91
|
+
judgeval-0.0.19.dist-info/METADATA,sha256=6HqNDRgJ1LI3hleMhMiGId7EULc9xJY0lYXhq4TEZOg,1283
|
92
|
+
judgeval-0.0.19.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
|
93
|
+
judgeval-0.0.19.dist-info/licenses/LICENSE.md,sha256=tKmCg7k5QOmxPK19XMfzim04QiQJPmgIm0pAn55IJwk,11352
|
94
|
+
judgeval-0.0.19.dist-info/RECORD,,
|
File without changes
|
File without changes
|
File without changes
|