llumo-0.2.28-py3-none-any.whl → llumo-0.2.29-py3-none-any.whl
This diff represents the content of publicly available package versions released to a supported registry. It is provided for informational purposes only and reflects the changes between the two versions as they appear in the public registry.
- llumo/google.py +16 -16
- llumo/openai.py +137 -130
- {llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/METADATA +1 -1
- {llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/RECORD +7 -7
- {llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/WHEEL +0 -0
- {llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/licenses/LICENSE +0 -0
- {llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/top_level.txt +0 -0
llumo/google.py
CHANGED
@@ -15,9 +15,9 @@ def evaluate_multiple(data, api_key=None, evals=["Response Correctness"]):
 
 
 class ChatCompletionWithEval:
-    def __init__(self, response, evaluation):
+    def __init__(self, response, evaluation=None):
         self._response = response
-        self.evaluation = evaluation
+        # self.evaluation = evaluation
 
     def __getattr__(self, name):
         return getattr(self._response, name)

@@ -46,21 +46,21 @@ class genai:
         response = self._model_instance.generate_content(contents=contents, **kwargs)
         output = response.text
 
-        eval_input = [{
-            "query": contents,
-            "context": context or contents,
-            "output": output,
-        }]
+        # eval_input = [{
+        #     "query": contents,
+        #     "context": context or contents,
+        #     "output": output,
+        # }]
 
-        evaluation = None
-        try:
-            evaluation = evaluate_multiple(data=eval_input, evals=evals, api_key=llumo_key)
-        except Exception as e:
-            evaluation = None
+        # evaluation = None
+        # try:
+        #     evaluation = evaluate_multiple(data=eval_input, evals=evals, api_key=llumo_key)
+        # except Exception as e:
+        #     evaluation = None
 
-        if evaluation is None:
-            print("Cannot process your request for evaluation, please check your api and try again later.")
-            return response
+        # if evaluation is None:
+        #     print("Cannot process your request for evaluation, please check your api and try again later.")
+        #     return response
 
 
-        return ChatCompletionWithEval(response, evaluation)
+        return ChatCompletionWithEval(response, evaluation=None)
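Net effect of the google.py change: the Gemini wrapper no longer computes or attaches evaluation results, and since `ChatCompletionWithEval.__init__` no longer stores the `evaluation` argument, any attribute lookup falls through `__getattr__` to the wrapped response. A minimal sketch of the new behavior (the wrapper mirrors the diff above; `FakeResponse` is a hypothetical stand-in for a real Gemini response object):

# Sketch of the 0.2.29 wrapper behavior; FakeResponse is a hypothetical
# placeholder, not part of the llumo package.
class ChatCompletionWithEval:
    def __init__(self, response, evaluation=None):
        self._response = response
        # self.evaluation = evaluation  # no longer stored as of 0.2.29

    def __getattr__(self, name):
        # Reached only when normal attribute lookup fails, so every
        # attribute delegates to the wrapped response.
        return getattr(self._response, name)


class FakeResponse:
    text = "Paris is the capital of France."


wrapped = ChatCompletionWithEval(FakeResponse(), evaluation=None)
print(wrapped.text)        # delegated to the wrapped response
try:
    wrapped.evaluation     # neither stored nor present on the response
except AttributeError:
    print("0.2.29 attaches no evaluation")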
llumo/openai.py
CHANGED
@@ -25,9 +25,13 @@ def performEvaluation(data, api_key=None, evals=["Response Correctness"], **kwar
 
 # Wrapper around ChatCompletion to allow custom fields like `.evaluation`
 class ChatCompletionWithEval:
-    def __init__(self, response, evaluation):
+    def __init__(
+        self,
+        response,
+        # , evaluation
+    ):
         self._response = response
-        self.evaluation = evaluation
+        # self.evaluation = evaluation
 
     def __getattr__(self, name):
         return getattr(self._response, name)

@@ -70,65 +74,65 @@ class OpenAI(OpenAIClient):
             workspace_id = self.session.logger.getWorkspaceID()
 
             # Input Bias Evaluation
-            eval_input_bias = [
-                {
-                    "query": user_message,
-                    "context": context,
-                    "output": "",  # No output yet
-                }
-            ]
-            try:
-                start_time = time.time()
-                bias_evaluation_result = performEvaluation(
-                    eval_input_bias,
-                    api_key=self.llumo_key,
-                    evals=["Input Bias"],
-                    playgroundID=playground_id,
-                    workspaceID=workspace_id,
-                    createExperiment=create_experiment,
-                )
-                latency = int((time.time() - start_time) * 1000)
-                # Access the first result object
-                bias_evaluation = bias_evaluation_result[0]
-                message = "-".join(
-                    getattr(bias_evaluation, "edgeCases", {}).get("value", [])
-                )
-                self.session.logEvalStep(
-                    stepName=f"EVAL-Input Bias",
-                    output="",
-                    context=context,
-                    query=user_message,
-                    messageHistory="",
-                    tools="",
-                    intermediateSteps="",
-                    groundTruth="",
-                    analyticsScore=getattr(bias_evaluation, "analyticsScore", {}),
-                    reasoning=getattr(bias_evaluation, "reasoning", {}),
-                    classification=getattr(bias_evaluation, "classification", {}),
-                    evalLabel=getattr(bias_evaluation, "evalLabel", {}),
-                    latencyMs=latency,
-                    status="SUCCESS",
-                    message=message,
-                )
-            except Exception as e:
-                print(f"Input Bias evaluation failed: {e}")
-                self.session.logEvalStep(
-                    stepName=f"EVAL-FAILURE",
-                    output="",
-                    context=context,
-                    query=user_message,
-                    messageHistory="",
-                    tools="",
-                    intermediateSteps="",
-                    groundTruth="",
-                    analyticsScore={},
-                    reasoning={},
-                    classification={},
-                    evalLabel={},
-                    latencyMs=0,
-                    status="FAILURE",
-                    message="EVAL_ERROR",
-                )
+            # eval_input_bias = [
+            #     {
+            #         "query": user_message,
+            #         "context": context,
+            #         "output": "",  # No output yet
+            #     }
+            # ]
+            # try:
+            #     start_time = time.time()
+            #     bias_evaluation_result = performEvaluation(
+            #         eval_input_bias,
+            #         api_key=self.llumo_key,
+            #         evals=["Input Bias"],
+            #         playgroundID=playground_id,
+            #         workspaceID=workspace_id,
+            #         createExperiment=create_experiment,
+            #     )
+            #     latency = int((time.time() - start_time) * 1000)
+            #     # Access the first result object
+            #     bias_evaluation = bias_evaluation_result[0]
+            #     message = "-".join(
+            #         getattr(bias_evaluation, "edgeCases", {}).get("value", [])
+            #     )
+            #     self.session.logEvalStep(
+            #         stepName=f"EVAL-Input Bias",
+            #         output="",
+            #         context=context,
+            #         query=user_message,
+            #         messageHistory="",
+            #         tools="",
+            #         intermediateSteps="",
+            #         groundTruth="",
+            #         analyticsScore=getattr(bias_evaluation, "analyticsScore", {}),
+            #         reasoning=getattr(bias_evaluation, "reasoning", {}),
+            #         classification=getattr(bias_evaluation, "classification", {}),
+            #         evalLabel=getattr(bias_evaluation, "evalLabel", {}),
+            #         latencyMs=latency,
+            #         status="SUCCESS",
+            #         message=message,
+            #     )
+            # except Exception as e:
+            #     print(f"Input Bias evaluation failed: {e}")
+            #     self.session.logEvalStep(
+            #         stepName=f"EVAL-FAILURE",
+            #         output="",
+            #         context=context,
+            #         query=user_message,
+            #         messageHistory="",
+            #         tools="",
+            #         intermediateSteps="",
+            #         groundTruth="",
+            #         analyticsScore={},
+            #         reasoning={},
+            #         classification={},
+            #         evalLabel={},
+            #         latencyMs=0,
+            #         status="FAILURE",
+            #         message="EVAL_ERROR",
+            #     )
 
             start_time = time.time()
             response = original_create(*args, **kwargs)

@@ -151,74 +155,77 @@ class OpenAI(OpenAIClient):
             )
 
             # Response Correctness Evaluation
-            eval_input_correctness = [
-                {
-                    "query": user_message,
-                    "context": context,
-                    "output": output_text,
-                }
-            ]
-            try:
-                start_time = time.time()
-                correctness_evaluation_result = performEvaluation(
-                    eval_input_correctness,
-                    api_key=self.llumo_key,
-                    evals=["Response Correctness"],
-                    playgroundID=playground_id,
-                    workspaceID=workspace_id,
-                    createExperiment=create_experiment,
-                )
-                latency = int((time.time() - start_time) * 1000)
-                # Access the first result object
-                correctness_evaluation = correctness_evaluation_result[0]
-                message = "-".join(
-                    getattr(correctness_evaluation, "edgeCases", {}).get("value", [])
-                )
-                self.session.logEvalStep(
-                    stepName=f"EVAL-Response Correctness",
-                    output=output_text,
-                    context=context,
-                    query=user_message,
-                    messageHistory="",
-                    tools="",
-                    intermediateSteps="",
-                    groundTruth="",
-                    analyticsScore=getattr(
-                        correctness_evaluation, "analyticsScore", {}
-                    ),
-                    reasoning=getattr(correctness_evaluation, "reasoning", {}),
-                    classification=getattr(
-                        correctness_evaluation, "classification", {}
-                    ),
-                    evalLabel=getattr(correctness_evaluation, "evalLabel", {}),
-                    latencyMs=latency,
-                    status="SUCCESS",
-                    message=message,
-                )
-            except Exception as e:
-                print(f"Response Correctness evaluation failed: {e}")
-                correctness_evaluation = None
-                self.session.logEvalStep(
-                    stepName=f"EVAL-FAILURE",
-                    output=output_text,
-                    context=context,
-                    query=user_message,
-                    messageHistory="",
-                    tools="",
-                    intermediateSteps="",
-                    groundTruth="",
-                    analyticsScore={},
-                    reasoning={},
-                    classification={},
-                    evalLabel={},
-                    latencyMs=0,
-                    status="FAILURE",
-                    message="EVAL_ERROR",
-                )
-
-            if correctness_evaluation is None:
-                return response
-
-            return ChatCompletionWithEval(response, correctness_evaluation)
+            # eval_input_correctness = [
+            #     {
+            #         "query": user_message,
+            #         "context": context,
+            #         "output": output_text,
+            #     }
+            # ]
+            # try:
+            #     start_time = time.time()
+            #     correctness_evaluation_result = performEvaluation(
+            #         eval_input_correctness,
+            #         api_key=self.llumo_key,
+            #         evals=["Response Correctness"],
+            #         playgroundID=playground_id,
+            #         workspaceID=workspace_id,
+            #         createExperiment=create_experiment,
+            #     )
+            #     latency = int((time.time() - start_time) * 1000)
+            #     # Access the first result object
+            #     correctness_evaluation = correctness_evaluation_result[0]
+            #     message = "-".join(
+            #         getattr(correctness_evaluation, "edgeCases", {}).get("value", [])
+            #     )
+            #     self.session.logEvalStep(
+            #         stepName=f"EVAL-Response Correctness",
+            #         output=output_text,
+            #         context=context,
+            #         query=user_message,
+            #         messageHistory="",
+            #         tools="",
+            #         intermediateSteps="",
+            #         groundTruth="",
+            #         analyticsScore=getattr(
+            #             correctness_evaluation, "analyticsScore", {}
+            #         ),
+            #         reasoning=getattr(correctness_evaluation, "reasoning", {}),
+            #         classification=getattr(
+            #             correctness_evaluation, "classification", {}
+            #         ),
+            #         evalLabel=getattr(correctness_evaluation, "evalLabel", {}),
+            #         latencyMs=latency,
+            #         status="SUCCESS",
+            #         message=message,
+            #     )
+            # except Exception as e:
+            #     print(f"Response Correctness evaluation failed: {e}")
+            #     correctness_evaluation = None
+            #     self.session.logEvalStep(
+            #         stepName=f"EVAL-FAILURE",
+            #         output=output_text,
+            #         context=context,
+            #         query=user_message,
+            #         messageHistory="",
+            #         tools="",
+            #         intermediateSteps="",
+            #         groundTruth="",
+            #         analyticsScore={},
+            #         reasoning={},
+            #         classification={},
+            #         evalLabel={},
+            #         latencyMs=0,
+            #         status="FAILURE",
+            #         message="EVAL_ERROR",
+            #     )
+
+            # if correctness_evaluation is None:
+            #     return response
+
+            return ChatCompletionWithEval(
+                response
+                # , correctness_evaluation
+            )
 
             self.chat.completions.create = create_wrapper
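For callers, the openai.py change means the object returned by the patched `chat.completions.create` no longer carries LLUMO evaluation results: both the pre-call Input Bias check and the post-call Response Correctness check are commented out, and the wrapper forwards every attribute to the raw ChatCompletion. Code that read `resp.evaluation` under 0.2.28 should guard the access; a small sketch under stated assumptions (`_StubCompletion` is a hypothetical stand-in for a real ChatCompletion, since a live call needs API keys):

# Migration-safe access sketch. The wrapper mirrors the 0.2.29 diff;
# _StubCompletion is a hypothetical placeholder, not part of llumo.
class ChatCompletionWithEval:
    def __init__(
        self,
        response,
        # , evaluation
    ):
        self._response = response
        # self.evaluation = evaluation

    def __getattr__(self, name):
        return getattr(self._response, name)


class _StubCompletion:
    choices = []


resp = ChatCompletionWithEval(_StubCompletion())

# Under 0.2.28 this attribute held evaluation results; under 0.2.29 it
# is absent, so use a guarded lookup instead of bare attribute access.
evaluation = getattr(resp, "evaluation", None)
print(evaluation)  # None on 0.2.29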
{llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/RECORD
CHANGED

@@ -6,15 +6,15 @@ llumo/client.py,sha256=keYx0GToNB-FXmGncXd0MOwwCGjxsIoDbOhTx2rCcMQ,71582
 llumo/exceptions.py,sha256=1OyhN9YL9LcyUPUsqYHq6Rret0udATZAwMVJaio2_Ec,2123
 llumo/execution.py,sha256=nWbJ7AvWuUPcOb6i-JzKRna_PvF-ewZTiK8skS-5n3w,1380
 llumo/functionCalling.py,sha256=D5jYapu1rIvdIJNUYPYMTyhQ1H-6nkwoOLMi6eekfUE,7241
-llumo/google.py,sha256=
+llumo/google.py,sha256=6y9YnDFDRHv6-sQNT5LIsV9p31BCN0B9eow5KTRBWfM,2185
 llumo/helpingFuntions.py,sha256=B6FwUQ5f1v4FKrWCbYoGWMFdscOV_liuuhTgNQ3cdrk,27275
 llumo/llumoLogger.py,sha256=grdjhu6Ngxg7nhnrMOP5Pd5ALR7U2ROws48yhf_N7y0,1912
 llumo/llumoSessionContext.py,sha256=iJDeC3FG6dID9jdaDK5d6hIlXWuhWx4KQy-Nnty4wYg,10485
 llumo/models.py,sha256=aVEZsOOoQx5LeNtwSyBxqvrINq0izH3QWu_YjsMPE6o,2910
-llumo/openai.py,sha256=
+llumo/openai.py,sha256=PtcQhEEE5q5J7im9hd16FRP7h51VkNhFNX0txS2t7JY,8786
 llumo/sockets.py,sha256=pBDo-U65hMIMwKMwZQl3iBkEjISEt-9BkXxZTWfSHF4,6116
-llumo-0.2.
-llumo-0.2.
-llumo-0.2.
-llumo-0.2.
-llumo-0.2.
+llumo-0.2.29.dist-info/licenses/LICENSE,sha256=tF9yAcfPV9xGT3ViWmC8hPvOo8BEk4ZICbUfcEo8Dlk,182
+llumo-0.2.29.dist-info/METADATA,sha256=4h3zWbgU4QfCGBGtAlHvKom8hKOJrZwWnq44H8pic0I,1558
+llumo-0.2.29.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+llumo-0.2.29.dist-info/top_level.txt,sha256=d5zUTMI99llPtLRB8rtSrqELm_bOqX-bNC5IcwlDk88,6
+llumo-0.2.29.dist-info/RECORD,,

{llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/WHEEL
File without changes

{llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/licenses/LICENSE
File without changes

{llumo-0.2.28.dist-info → llumo-0.2.29.dist-info}/top_level.txt
File without changes