PyPI - deepeval - Versions diffs - 3.7.1__py3-none-any.whl → 3.7.2__py3-none-any.whl - Mend

deepeval 3.7.1__py3-none-any.whl → 3.7.2__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14) hide show

deepeval/_version.py +1 -1
deepeval/evaluate/compare.py +6 -2
deepeval/synthesizer/config.py +9 -0
deepeval/synthesizer/schema.py +23 -0
deepeval/synthesizer/synthesizer.py +1137 -2
deepeval/synthesizer/templates/__init__.py +11 -2
deepeval/synthesizer/templates/template.py +554 -1
deepeval/synthesizer/templates/template_extraction.py +32 -0
deepeval/synthesizer/templates/template_prompt.py +262 -0
{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/METADATA +2 -1
{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/RECORD +14 -14
{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/LICENSE.md +0 -0
{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/WHEEL +0 -0
{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/entry_points.txt +0 -0

deepeval/synthesizer/templates/template_prompt.py CHANGED Viewed

@@ -37,6 +37,69 @@ class PromptSynthesizerTemplate:
         JSON:
         """
+    @staticmethod
+    def generate_synthetic_conversational_scenarios(
+        scenario: str,
+        conversational_task: str,
+        participant_roles: str,
+        num_goldens: int,
+    ):
+        return f"""
+        Generate a series of conversational SCENARIOS from scratch based on the provided scenario description,
+        conversational task, and participant roles.
+        A SCENARIO is a narrative description of a situation in which a conversation naturally occurs.
+        It is NOT a question, NOT a prompt, and NOT a user query. It MUST purely describe context.
+        Each scenario MUST depict a realistic MULTI-TURN conversational situation involving the given participants.
+        **
+        IMPORTANT FORMAT:
+        - Only return JSON
+        - JSON MUST contain: {{ "data": [ {{ "scenario": "..." }}, ... ] }}
+        - You MUST TRY to generate {num_goldens} items
+        **
+        Example of GOOD scenarios (situational descriptions):
+        - "During a late afternoon code review session, a junior engineer asks their senior engineer why an async function is inconsistent, leading to a detailed back-and-forth about race conditions."
+        - "While preparing for a sprint demo, a senior engineer helps a junior engineer interpret stack traces, prompting a step-by-step explanation."
+        Example of BAD scenarios (DO NOT DO):
+        - "Why does my async function return inconsistent results?" (This is a prompt)
+        - "Explain how to debug race conditions." (Instruction)
+        - "What is the freezing point of water?" (Question)
+        CRITICAL REQUIREMENTS:
+        - Scenario MUST be a narrative description of a SITUATION.
+        - Scenario MUST involve these participant roles: {participant_roles}
+        - Scenario MUST align with this conversational task: {conversational_task}
+        - Scenario MUST feel natural, real-world, and MULTI-TURN.
+        - Scenario MUST NOT contain:
+            • direct questions
+            • instructions
+            • tasks
+            • explicit prompts
+            • standalone facts
+        - Scenario MUST be grounded in the meaning of the provided base scenario description.
+        You MUST TRY to generate {num_goldens} high-quality, non-repetitive scenarios.
+        **
+        Base Scenario Description:
+        {scenario}
+        Conversational Task:
+        {conversational_task}
+        Participant Roles:
+        {participant_roles}
+        Num Scenarios:
+        {num_goldens}
+        JSON:
+        """
 ######################################################################################################
 ##### Approach similar to https://github.com/nlpxucan/WizardLM/blob/main/Evol_Instruct/depth.py ######
@@ -282,3 +345,202 @@ class PromptEvolutionTemplate:
             Rewritten Input:
             """
         )
+class ConversationalPromptEvolutionTemplate:
+    base_instruction = """I want you to act as a conversational scenario rewriter.
+    Your objective is to rewrite the given `Scenario`. You MUST complicate the `Scenario` using the following method:"""
+    @staticmethod
+    def reasoning_evolution(scenario):
+        return (
+            ConversationalPromptEvolutionTemplate.base_instruction
+            + f"""
+            1. Rewrite `Scenario` to force participants into multi-step conversational reasoning.
+            2. Add layered inferences or analytical leaps required in dialogue.
+            3. `Rewritten Scenario` must stay concise, human-readable, and remain a conversation setup.
+            4. Do NOT exceed **15 words**.
+            **
+            EXAMPLES
+            Example scenario:
+            Two students discuss climate change.
+            Example rewritten scenario:
+            Two students debate climate impacts, tracing cause-effect chains across multiple evidence sources.
+            --------------------------
+            Example scenario:
+            A doctor explains treatment options.
+            Example rewritten scenario:
+            Doctor and patient reason through symptoms requiring sequential diagnostic logic.
+            --------------------------
+            Scenario:
+            {scenario}
+            Rewritten Scenario:
+            """
+        )
+    @staticmethod
+    def concretizing_evolution(scenario):
+        return (
+            ConversationalPromptEvolutionTemplate.base_instruction
+            + f"""
+            1. Replace broad conversation setup with a **more specific, concrete** conversational scene.
+            2. Add real-world detail (location, constraint, specific topic).
+            3. Keep under **15 words**, concise, and still a dialogue setup.
+            **
+            EXAMPLES
+            Example scenario:
+            Two engineers talk about safety.
+            Example rewritten scenario:
+            Two engineers argue over failing brake-system logs during late-night review.
+            --------------------------
+            Example scenario:
+            Two friends discuss exercise.
+            Example rewritten scenario:
+            Two friends compare heart-rate sensor issues during a marathon-training chat.
+            --------------------------
+            Scenario:
+            {scenario}
+            Rewritten Scenario:
+            """
+        )
+    @staticmethod
+    def constrained_evolution(scenario):
+        return (
+            ConversationalPromptEvolutionTemplate.base_instruction
+            + f"""
+            1. Add at least one new constraint shaping the conversation.
+            2. Constraint must significantly affect the dialogue.
+            3. Keep under **15 words**, concise, conversational.
+            **
+            EXAMPLES
+            Example scenario:
+            Two coworkers plan a report.
+            Example rewritten scenario:
+            Two coworkers plan a report with strict no-internet constraint.
+            --------------------------
+            Example scenario:
+            A teacher reviews homework.
+            Example rewritten scenario:
+            Teacher and student discuss homework under urgent submission deadline.
+            --------------------------
+            Scenario:
+            {scenario}
+            Rewritten Scenario:
+            """
+        )
+    @staticmethod
+    def comparative_question_evolution(scenario):
+        return (
+            ConversationalPromptEvolutionTemplate.base_instruction
+            + f"""
+            1. Rewrite `Scenario` so the conversation centers on comparing two+ items.
+            2. Must highlight similarities/differences through dialogue.
+            3. Keep under **15 words**, concise, conversational.
+            **
+            EXAMPLES
+            Example scenario:
+            Two analysts discuss tools.
+            Example rewritten scenario:
+            Two analysts compare legacy analytics pipeline vs. new automated system.
+            --------------------------
+            Example scenario:
+            Two students study history.
+            Example rewritten scenario:
+            Two students contrast Renaissance ideals with Enlightenment philosophies.
+            --------------------------
+            Scenario:
+            {scenario}
+            Rewritten Scenario:
+            """
+        )
+    @staticmethod
+    def hypothetical_scenario_evolution(scenario):
+        return (
+            ConversationalPromptEvolutionTemplate.base_instruction
+            + f"""
+            1. Rewrite `Scenario` to introduce a hypothetical twist derived from the setup.
+            2. The hypothetical MUST drive the conversation.
+            3. Keep under **15 words**, concise, conversational.
+            **
+            EXAMPLES
+            Example scenario:
+            Two scientists discuss pollution.
+            Example rewritten scenario:
+            Two scientists debate effects if emissions doubled overnight.
+            --------------------------
+            Example scenario:
+            A medic trains a recruit.
+            Example rewritten scenario:
+            Medic and recruit plan response to hypothetical antibiotic-resistant outbreak.
+            --------------------------
+            Scenario:
+            {scenario}
+            Rewritten Scenario:
+            """
+        )
+    @staticmethod
+    def in_breadth_evolution(scenario):
+        return (
+            ConversationalPromptEvolutionTemplate.base_instruction
+            + f"""
+            1. Rewrite `Scenario` into a new conversation within the same domain.
+            2. The new conversation must explore a rarer, niche angle.
+            3. Keep under **15 words**, concise, conversational.
+            **
+            EXAMPLES
+            Example scenario:
+            Two doctors discuss patient care.
+            Example rewritten scenario:
+            Two doctors debate rare autoimmune disorder diagnostics.
+            --------------------------
+            Example scenario:
+            Two programmers discuss bugs.
+            Example rewritten scenario:
+            Two programmers examine obscure concurrency race-condition failures.
+            --------------------------
+            Scenario:
+            {scenario}
+            Rewritten Scenario:
+            """
+        )

{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.1
 Name: deepeval
-Version: 3.7.1
+Version: 3.7.2
 Summary: The LLM Evaluation Framework
 Home-page: https://github.com/confident-ai/deepeval
 License: Apache-2.0
@@ -439,6 +439,7 @@ Using `.env.local` or `.env` is optional. If they are missing, DeepEval uses you
 ```bash
 cp .env.example .env.local
 # then edit .env.local (ignored by git)
+```
 <br />

{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/RECORD RENAMED Viewed

@@ -1,5 +1,5 @@
 deepeval/__init__.py,sha256=tle4lT4FONApg3OeztGPEdrpGMEGLWajyGTu7bEd3s0,2976
-deepeval/_version.py,sha256=YeaRO0UgS2XgzwsbQp4bgbudO4Ac5gGPSx2CsEi9NaU,27
+deepeval/_version.py,sha256=uv4OEocrxlEkjp4YMUEXl0-kwRJuwkdtGlNshton0Mg,27
 deepeval/annotation/__init__.py,sha256=ZFhUVNNuH_YgQSZJ-m5E9iUb9TkAkEV33a6ouMDZ8EI,111
 deepeval/annotation/annotation.py,sha256=3j3-syeJepAcEj3u3e4T_BeRDzNr7yXGDIoNQGMKpwQ,2298
 deepeval/annotation/api.py,sha256=EYN33ACVzVxsFleRYm60KB4Exvff3rPJKt1VBuuX970,2147
@@ -161,7 +161,7 @@ deepeval/dataset/utils.py,sha256=MRiqwt-3E5WNCHtP2kY7P1PeRtFMRpGoy3r75tJ2QFg,791
 deepeval/errors.py,sha256=FfhtULNIQqHpKVqCr-xlvTtLxkNj40qVU89sXYKuDrA,754
 deepeval/evaluate/__init__.py,sha256=315IaMiYEz7oJhZ4kPTBfeCNd1xF-wWVU6KOQnrKQpE,291
 deepeval/evaluate/api.py,sha256=rkblH0ZFAAdyuF0Ymh7JE1pIJPR9yFuPrn9SQaCEQp4,435
-deepeval/evaluate/compare.py,sha256=eGyDlt1eRp-R2hPDqWUpiFOMlI4LU_KKfbaXw_9SI2c,16523
+deepeval/evaluate/compare.py,sha256=AJ3kR4Th44MTuL0juvvNwPdel1Q8tw37IYUgLdy2qrw,16575
 deepeval/evaluate/configs.py,sha256=QfWjaWNxLsgEe8-5j4PIs5WcSyEckiWt0qdpXSpl57M,928
 deepeval/evaluate/evaluate.py,sha256=CLc-5rlHcBkJcakYXf9twaF6G8chp95gCBe8V4B-cVo,10684
 deepeval/evaluate/execute.py,sha256=cXX4W4jX_Uly73WBLEduLv6Dqs32AWHGsgyp9tZmV1Q,134219
@@ -461,13 +461,13 @@ deepeval/synthesizer/base_synthesizer.py,sha256=ua7HDq1lemeFH5FuWdGJxMGFH5QA2CSY
 deepeval/synthesizer/chunking/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 deepeval/synthesizer/chunking/context_generator.py,sha256=ucwa-7BcPSHHf4Tu31dfyJ63Bg9HdNhGLAW5_QsfFX4,38052
 deepeval/synthesizer/chunking/doc_chunker.py,sha256=DvJmbA_NnZBGCZgxKQsxlIC29kca_d7J-Dxq9SyfzX0,10612
-deepeval/synthesizer/config.py,sha256=vcSi6upnmd667dAGANTTdPmY0z5sQ8Ctal7Xr4-tbhA,1934
-deepeval/synthesizer/schema.py,sha256=PIv3012VMg_v-Ylwn08-4tNjf4QShBSg-kaCkgtdA88,879
-deepeval/synthesizer/synthesizer.py,sha256=oa2m9ZqywNcSO1wUijrJ7HO-NC8-oU1g04NIS16dx6U,60306
-deepeval/synthesizer/templates/__init__.py,sha256=C-wSGQeMRxTdSBJbgeyAM5Iu6mkHVSYbNfz0AY9K5Yc,209
-deepeval/synthesizer/templates/template.py,sha256=nTH-k8XbvZQD_lagsaf6kmT6oylFjQ7gEseHYB1Zyso,39807
-deepeval/synthesizer/templates/template_extraction.py,sha256=NkpzP-MkoefokVJBZn9s1ErDvI3o9ocY5_ZY85zj4KE,1972
-deepeval/synthesizer/templates/template_prompt.py,sha256=cqtG3X2DQIs7NaaQeJrNcS4zdwgDn_l8go8ZeVHRdgI,12531
+deepeval/synthesizer/config.py,sha256=rg9HzN5w_82tpzBALgt__NkAcmh0vDEoORJpjsRLWMY,2207
+deepeval/synthesizer/schema.py,sha256=TFCIvXeL0TOKqfjMm2qgR4hFcvvFaPEZdQ1xTnRJqPs,1294
+deepeval/synthesizer/synthesizer.py,sha256=QF02PSedde8t5Q0R9WpkWeD4tVD8fo4m4pJFu0H7jbc,110316
+deepeval/synthesizer/templates/__init__.py,sha256=9UhfJFwPEdLWmxJz3ksNJps-jGYJFJnJP1U-x7j0By4,319
+deepeval/synthesizer/templates/template.py,sha256=ri3dX2gzxNmL8qlkl47HD8kecmqMBF5mE-mraZvf1xU,65008
+deepeval/synthesizer/templates/template_extraction.py,sha256=jmvr8AOOUzDgsHYIOsq-NaxlRQ5GygK16TTRGxBXDyM,3508
+deepeval/synthesizer/templates/template_prompt.py,sha256=bzfC71AXZqBrmoDWmBvuIQKD6hPJZ0ZAWX4hy-lPlnQ,21478
 deepeval/synthesizer/types.py,sha256=wUZntvCAE29sM9K8hk9RPwUpkTip1ObOCExyMEo3sME,493
 deepeval/synthesizer/utils.py,sha256=o-9z5gApQcHqDqusgrD0LagXWAju17LVc27BxtaA7og,1018
 deepeval/telemetry.py,sha256=0k6oVhRBi1Ap6JC6SNe_9-nBnlG-uReUoS3KTrPayhk,21716
@@ -505,8 +505,8 @@ deepeval/tracing/tracing.py,sha256=VWu5z6fxWP6KfDaw5ZmIkN-0yNDqe1CVHa0e9_Wjrgg,4
 deepeval/tracing/types.py,sha256=WhnxefUc5I8jcAOBQ-tsZ8_zVZfGqSvCWHD5XUN6Ggw,6040
 deepeval/tracing/utils.py,sha256=mdvhYAxDNsdnusaEXJd-c-_O2Jn6S3xSuzRvLO1Jz4U,5684
 deepeval/utils.py,sha256=zy9RR0bt3YMzWVlJc5Rl6eU5RyeW2uEjMfwD1sdgPr4,23234
-deepeval-3.7.1.dist-info/LICENSE.md,sha256=0ATkuLv6QgsJTBODUHC5Rak_PArA6gv2t7inJzNTP38,11352
-deepeval-3.7.1.dist-info/METADATA,sha256=9Wa2SRbSrMIRZQKNCttm8miTeo9hqneVQCZBkQAyFSA,18739
-deepeval-3.7.1.dist-info/WHEEL,sha256=d2fvjOD7sXsVzChCqf0Ty0JbHKBaLYwDbGQDwQTnJ50,88
-deepeval-3.7.1.dist-info/entry_points.txt,sha256=fVr8UphXTfJe9I2rObmUtfU3gkSrYeM0pLy-NbJYg10,94
-deepeval-3.7.1.dist-info/RECORD,,
+deepeval-3.7.2.dist-info/LICENSE.md,sha256=0ATkuLv6QgsJTBODUHC5Rak_PArA6gv2t7inJzNTP38,11352
+deepeval-3.7.2.dist-info/METADATA,sha256=-p5kW-oBcfsEi5_uiLnCn_godaoKAeRDCgzRdpOsWUI,18743
+deepeval-3.7.2.dist-info/WHEEL,sha256=d2fvjOD7sXsVzChCqf0Ty0JbHKBaLYwDbGQDwQTnJ50,88
+deepeval-3.7.2.dist-info/entry_points.txt,sha256=fVr8UphXTfJe9I2rObmUtfU3gkSrYeM0pLy-NbJYg10,94
+deepeval-3.7.2.dist-info/RECORD,,

{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/LICENSE.md RENAMED Viewed

File without changes

{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/WHEEL RENAMED Viewed

File without changes

{deepeval-3.7.1.dist-info → deepeval-3.7.2.dist-info}/entry_points.txt RENAMED Viewed

File without changes

deepeval 3.7.1__py3-none-any.whl → 3.7.2__py3-none-any.whl

deepeval 3.7.1__py3-none-any.whl → 3.7.2__py3-none-any.whl