PyPI - intellif-aihub - Versions diffs - 0.1.20__tar.gz → 0.1.21__tar.gz - Mend

intellif-aihub 0.1.20.tar.gz → 0.1.21.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of intellif-aihub might be problematic. Click here for more details.

Files changed (65) hide show

{intellif_aihub-0.1.20 → intellif_aihub-0.1.21}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: intellif-aihub
-Version: 0.1.20
+Version: 0.1.21
 Summary: Intellif AI-hub SDK.
 Author-email: Platform Team <aihub@example.com>
 License-Expression: Apache-2.0

{intellif_aihub-0.1.20 → intellif_aihub-0.1.21}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name            = "intellif-aihub"
-version = "0.1.20"
+version = "0.1.21"
 description     = "Intellif AI-hub SDK."
 readme          = {file = "README.md", content-type = "text/markdown"}
 requires-python = ">=3.9"

intellif_aihub-0.1.21/src/aihub/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ __version__ = "0.1.21"

{intellif_aihub-0.1.20 → intellif_aihub-0.1.21}/src/aihub/models/eval.py RENAMED Viewed

@@ -5,15 +5,28 @@ from typing import Dict, List, Optional
 from pydantic import BaseModel, Field
-class CreateEvalReq(BaseModel):
-    """创建评测任务"""
+class BaseEvalReq(BaseModel):
+    """评测任务基础请求模型"""
+    run_id: str = Field(description="运行ID")
+    type: str = Field(description="评测类型，支持 'llm' 和 'cv'")
+    prediction_artifact_path: str = Field(description="推理产物的路径")
+    user_id: int = Field(0, description="用户ID，默认0")
+class CreateLLMEvalReq(BaseEvalReq):
+    """创建LLM类型评测任务请求"""
+    type: str = Field(default="llm", description="评测类型，固定为 'llm'")
     dataset_id: int = Field(description="数据集ID")
     dataset_version_id: int = Field(description="数据集版本ID")
-    prediction_artifact_path: str = Field(description="推理产物的路径")
     evaled_artifact_path: str = Field(description="评测结果产物的路径")
-    run_id: str = Field(description="运行ID")
-    user_id: int = Field(0, description="用户ID")
-    report: Dict = Field(default_factory=dict, description="评测报告")
+    report: Dict = Field(description="评测报告")
+class CreateCVEvalReq(BaseEvalReq):
+    """创建CV类型评测任务请求"""
+    type: str = Field(default="cv", description="评测类型，固定为 'cv'")
+    metrics_artifact_path: str = Field(description="指标产物的路径")
+    ground_truth_artifact_path: str = Field(description="真实标签产物的路径")
 class EvalRun(BaseModel):

{intellif_aihub-0.1.20 → intellif_aihub-0.1.21}/src/aihub/services/eval.py RENAMED Viewed

@@ -12,7 +12,7 @@ import httpx
 from ..exceptions import APIError
 from ..models.common import APIWrapper
-from ..models.eval import CreateEvalReq, CreateEvalResp, ListEvalReq, ListEvalResp
+from ..models.eval import CreateLLMEvalReq, CreateCVEvalReq, CreateEvalResp, ListEvalReq, ListEvalResp
 _BASE = "/eval-platform/api/v1"
@@ -31,6 +31,7 @@ class EvalService:
         evaled_artifact_path: str,
         report_json: dict,
         run_id,
+        user_id: int = 0,
     ) -> int:
         """创建评测报告
@@ -40,7 +41,7 @@ class EvalService:
             evaled_artifact_path:   评测结果制品路径
             prediction_artifact_path: 推理结果制品路径
             dataset_version_name (str): name of the dataset version (looked up via get_dataset_version_by_name)
+            user_id (int, optional): 用户ID，默认为0
         Returns:
             id (int): 评测报告id
@@ -52,17 +53,48 @@ class EvalService:
         dataset_version = dataset_service.get_dataset_version_by_name(
             dataset_version_name
         )
-        payload = CreateEvalReq(
+        payload = CreateLLMEvalReq(
             dataset_id=dataset_version.dataset_id,
             dataset_version_id=dataset_version.id,
             evaled_artifact_path=evaled_artifact_path,
             prediction_artifact_path=prediction_artifact_path,
             report=report_json,
             run_id=run_id,
+            user_id=user_id,
         )
         return self._eval.create(payload)
+    def create_cv_run(
+        self,
+        run_id: str,
+        prediction_artifact_path: str,
+        metrics_artifact_path: str,
+        ground_truth_artifact_path: str,
+        user_id: int = 0,
+    ) -> int:
+        """创建 CV 类型评测运行
+        Args:
+            run_id (str): 运行ID
+            prediction_artifact_path (str): 推理产物的路径
+            metrics_artifact_path (str): 指标产物的路径
+            ground_truth_artifact_path (str): 真实标签产物的路径
+            user_id (int, optional): 用户ID，默认为0
+        Returns:
+            id (int): 评测运行id
+        """
+        payload = CreateCVEvalReq(
+            run_id=run_id,
+            prediction_artifact_path=prediction_artifact_path,
+            metrics_artifact_path=metrics_artifact_path,
+            ground_truth_artifact_path=ground_truth_artifact_path,
+            user_id=user_id,
+        )
+        return self._eval.create(payload)
     def list(
         self,
         page_size: int = 20,
@@ -119,7 +151,7 @@ class _Eval:
     def __init__(self, http: httpx.Client):
         self._http = http
-    def create(self, payload: CreateEvalReq) -> int:
+    def create(self, payload) -> int:
         resp = self._http.post(f"{_BASE}/run/", json=payload.model_dump())
         wrapper = APIWrapper[CreateEvalResp].model_validate(resp.json())
         if wrapper.code != 0:

{intellif_aihub-0.1.20 → intellif_aihub-0.1.21}/src/intellif_aihub.egg-info/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: intellif-aihub
-Version: 0.1.20
+Version: 0.1.21
 Summary: Intellif AI-hub SDK.
 Author-email: Platform Team <aihub@example.com>
 License-Expression: Apache-2.0

intellif_aihub-0.1.21/tests/test_eval.py ADDED Viewed

@@ -0,0 +1,520 @@
+# !/usr/bin/env python
+# -*-coding:utf-8 -*-
+import sys
+import os
+import unittest
+import uuid
+from unittest.mock import Mock, patch
+import httpx
+from aihub.services.eval import EvalService
+from aihub.models.eval import ListEvalResp, EvalRun, CreateEvalResp
+from aihub.models.common import APIWrapper
+BASE_URL = "http://192.168.13.160:30052"
+TOKEN = "eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJleHAiOjE3NTI1NDQwNDksImlhdCI6MTc1MVkzOTI0OSwidWlkIjoyfQ.MfB_7LK5oR3RAhga3jtgcvJqYESeUPLbz8Bc_y3fouc"
+class TestEvalService(unittest.TestCase):
+    def setUp(self):
+        self.http_client = Mock(spec=httpx.Client)
+        self.eval_service = EvalService(self.http_client)
+    def test_list_eval_runs_default(self):
+        mock_eval_run = {
+            "id": 1,
+            "name": "test_eval",
+            "description": "Test evaluation",
+            "user_id": 1,
+            "model_id": 1,
+            "model_name": "test_model",
+            "dataset_id": 1,
+            "dataset_version_id": 1,
+            "dataset_name": "test_dataset",
+            "status": "completed",
+            "prediction_artifact_path": "/path/to/prediction",
+            "evaled_artifact_path": "/path/to/eval",
+            "run_id": "test_run_123",
+            "dataset_summary": {},
+            "metrics_summary": {"accuracy": 0.95},
+            "viz_summary": {},
+            "eval_config": {"metric": "accuracy"},
+            "created_at": 1640995200,
+            "updated_at": 1640995200
+        }
+        mock_response = {
+            "code": 0,
+            "msg": None,
+            "data": {
+                "total": 1,
+                "page_size": 20,
+                "page_num": 1,
+                "data": [mock_eval_run]
+            }
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.get.return_value = mock_resp
+        result = self.eval_service.list()
+        self.assertIsInstance(result, ListEvalResp)
+        self.assertEqual(result.total, 1)
+        self.assertEqual(result.page_size, 20)
+        self.assertEqual(result.page_num, 1)
+        self.assertEqual(len(result.data), 1)
+        self.assertEqual(result.data[0].id, 1)
+        self.assertEqual(result.data[0].name, "test_eval")
+        self.http_client.get.assert_called_once_with(
+            "/eval-platform/api/v1/run/",
+            params={"page_size": 20, "page_num": 1}
+        )
+    def test_list_eval_runs_with_filters(self):
+        mock_response = {
+            "code": 0,
+            "msg": None,
+            "data": {
+                "total": 0,
+                "page_size": 10,
+                "page_num": 1,
+                "data": []
+            }
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.get.return_value = mock_resp
+        # 带过滤参数
+        result = self.eval_service.list(
+            page_size=10,
+            page_num=1,
+            status="completed",
+            name="test",
+            model_id=1,
+            dataset_id=2,
+            dataset_version_id=3,
+            run_id="test_run",
+            user_id=1,
+            model_ids="1,2,3",
+            dataset_ids="2,3,4",
+            dataset_version_ids="3,4,5"
+        )
+        self.assertIsInstance(result, ListEvalResp)
+        self.assertEqual(result.total, 0)
+        self.assertEqual(len(result.data), 0)
+        expected_params = {
+            "page_size": 10,
+            "page_num": 1,
+            "status": "completed",
+            "name": "test",
+            "model_id": 1,
+            "dataset_id": 2,
+            "dataset_version_id": 3,
+            "run_id": "test_run",
+            "user_id": 1,
+            "model_ids": "1,2,3",
+            "dataset_ids": "2,3,4",
+            "dataset_version_ids": "3,4,5"
+        }
+        self.http_client.get.assert_called_once_with(
+            "/eval-platform/api/v1/run/",
+            params=expected_params
+        )
+    def test_list_eval_runs_api_error(self):
+        """测试列出评测运行 - API错误"""
+        # 模拟 API 错误
+        mock_response = {
+            "code": 1001,
+            "msg": "Database connection failed",
+            "data": None
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.get.return_value = mock_resp
+        with self.assertRaises(Exception) as context:
+            self.eval_service.list()
+        self.assertIn("backend code 1001", str(context.exception))
+        self.assertIn("Database connection failed", str(context.exception))
+    def test_list_eval_runs_only_specified_filters(self):
+        mock_response = {
+            "code": 0,
+            "msg": None,
+            "data": {
+                "total": 0,
+                "page_size": 20,
+                "page_num": 1,
+                "data": []
+            }
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.get.return_value = mock_resp
+        result = self.eval_service.list(
+            status="completed",
+            model_id=1
+        )
+        expected_params = {
+            "page_size": 20,
+            "page_num": 1,
+            "status": "completed",
+            "model_id": 1
+        }
+        self.http_client.get.assert_called_once_with(
+            "/eval-platform/api/v1/run/",
+            params=expected_params
+        )
+    @patch('aihub.services.dataset_management.DatasetManagementService')
+    def test_create_eval_llm_default_user_id(self, mock_dataset_service_class):
+        """测试创建 LLM 类型评测 - 使用默认 user_id"""
+        # 模拟数据集版本
+        mock_dataset_version = Mock()
+        mock_dataset_version.dataset_id = 1
+        mock_dataset_version.id = 1
+        mock_dataset_service = Mock()
+        mock_dataset_service.get_dataset_version_by_name.return_value = mock_dataset_version
+        mock_dataset_service_class.return_value = mock_dataset_service
+        # 模拟成功的创建响应
+        mock_eval_run = {
+            "id": 123,
+            "name": "test_eval",
+            "description": "Test evaluation",
+            "user_id": 0,
+            "model_id": 1,
+            "model_name": "test_model",
+            "dataset_id": 1,
+            "dataset_version_id": 1,
+            "dataset_name": "test_dataset",
+            "status": "created",
+            "prediction_artifact_path": "/path/to/prediction.json",
+            "evaled_artifact_path": "/path/to/evaled.json",
+            "run_id": "test_run_123",
+            "dataset_summary": {},
+            "metrics_summary": {},
+            "viz_summary": {},
+            "eval_config": None,
+            "created_at": 1640995200,
+            "updated_at": 1640995200
+        }
+        mock_response = {
+            "code": 0,
+            "msg": None,
+            "data": {"eval_run": mock_eval_run}
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.post.return_value = mock_resp
+        # 调用方法（不提供 user_id，使用默认值）
+        result = self.eval_service.create(
+            dataset_version_name="test_dataset_v1",
+            prediction_artifact_path="/path/to/prediction.json",
+            evaled_artifact_path="/path/to/evaled.json",
+            report_json={"accuracy": 0.95},
+            run_id="test_run_123"
+        )
+        # 验证结果
+        self.assertEqual(result, 123)
+        # 验证 HTTP 调用
+        self.http_client.post.assert_called_once()
+        call_args = self.http_client.post.call_args
+        # 验证端点
+        self.assertEqual(call_args[0][0], "/eval-platform/api/v1/run/")
+        # 验证 payload 内容
+        actual_payload = call_args[1]["json"]
+        # 验证 LLM 类型必需字段
+        self.assertEqual(actual_payload["run_id"], "test_run_123")
+        self.assertEqual(actual_payload["type"], "llm")
+        self.assertEqual(actual_payload["prediction_artifact_path"], "/path/to/prediction.json")
+        self.assertEqual(actual_payload["user_id"], 0)
+        self.assertEqual(actual_payload["dataset_id"], 1)
+        self.assertEqual(actual_payload["dataset_version_id"], 1)
+        self.assertEqual(actual_payload["evaled_artifact_path"], "/path/to/evaled.json")
+        self.assertEqual(actual_payload["report"], {"accuracy": 0.95})
+        # CV 类型字段不会出现在 LLM 类型评测的 payload 中
+        self.assertNotIn("metrics_artifact_path", actual_payload)
+        self.assertNotIn("ground_truth_artifact_path", actual_payload)
+    @patch('aihub.services.dataset_management.DatasetManagementService')
+    def test_create_eval_llm_custom_user_id(self, mock_dataset_service_class):
+        """测试创建 LLM 类型评测 - 自定义 user_id"""
+        # 模拟数据集版本
+        mock_dataset_version = Mock()
+        mock_dataset_version.dataset_id = 2
+        mock_dataset_version.id = 3
+        mock_dataset_service = Mock()
+        mock_dataset_service.get_dataset_version_by_name.return_value = mock_dataset_version
+        mock_dataset_service_class.return_value = mock_dataset_service
+        # 模拟成功的创建响应
+        mock_eval_run = {
+            "id": 456,
+            "name": "test_eval",
+            "description": "Test evaluation",
+            "user_id": 3750,
+            "model_id": 1,
+            "model_name": "test_model",
+            "dataset_id": 2,
+            "dataset_version_id": 3,
+            "dataset_name": "test_dataset",
+            "status": "created",
+            "prediction_artifact_path": "/path/to/prediction.json",
+            "evaled_artifact_path": "/path/to/evaled.json",
+            "run_id": "test_run_456",
+            "dataset_summary": {},
+            "metrics_summary": {},
+            "viz_summary": {},
+            "eval_config": None,
+            "created_at": 1640995200,
+            "updated_at": 1640995200
+        }
+        mock_response = {
+            "code": 0,
+            "msg": None,
+            "data": {"eval_run": mock_eval_run}
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.post.return_value = mock_resp
+        # 调用方法（提供自定义 user_id）
+        result = self.eval_service.create(
+            dataset_version_name="test_dataset_v2",
+            prediction_artifact_path="/path/to/prediction.json",
+            evaled_artifact_path="/path/to/evaled.json",
+            report_json={"f1_score": 0.88},
+            run_id="test_run_456",
+            user_id=3750
+        )
+        # 验证结果
+        self.assertEqual(result, 456)
+        # 验证 HTTP 调用
+        self.http_client.post.assert_called_once()
+        call_args = self.http_client.post.call_args
+        actual_payload = call_args[1]["json"]
+        # 验证关键字段
+        self.assertEqual(actual_payload["type"], "llm")
+        self.assertEqual(actual_payload["user_id"], 3750)
+        self.assertEqual(actual_payload["dataset_id"], 2)
+        self.assertEqual(actual_payload["dataset_version_id"], 3)
+    def test_create_cv_run_default_user_id(self):
+        """测试创建 CV 类型评测运行 - 使用默认 user_id"""
+        # 模拟成功的创建响应
+        mock_eval_run = {
+            "id": 789,
+            "name": "cv_eval",
+            "description": "CV evaluation",
+            "user_id": 0,
+            "model_id": 2,
+            "model_name": "cv_model",
+            "dataset_id": 0,  # 使用默认值而不是 None
+            "dataset_version_id": 0,  # 使用默认值而不是 None
+            "dataset_name": "",  # 使用空字符串而不是 None
+            "status": "created",
+            "prediction_artifact_path": "coco_dt.json",
+            "evaled_artifact_path": "",  # 使用空字符串而不是 None
+            "run_id": "cv_run_789",
+            "dataset_summary": {},
+            "metrics_summary": {},
+            "viz_summary": {},
+            "eval_config": None,
+            "created_at": 1640995200,
+            "updated_at": 1640995200
+        }
+        mock_response = {
+            "code": 0,
+            "msg": None,
+            "data": {"eval_run": mock_eval_run}
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.post.return_value = mock_resp
+        # 调用方法（不提供 user_id，使用默认值）
+        result = self.eval_service.create_cv_run(
+            run_id="cv_run_789",
+            prediction_artifact_path="coco_dt.json",
+            metrics_artifact_path="metrics.json",
+            ground_truth_artifact_path="coco_gt.json"
+        )
+        # 验证结果
+        self.assertEqual(result, 789)
+        # 验证 HTTP 调用
+        self.http_client.post.assert_called_once()
+        call_args = self.http_client.post.call_args
+        actual_payload = call_args[1]["json"]
+        # 验证 CV 类型必需字段
+        self.assertEqual(actual_payload["type"], "cv")
+        self.assertEqual(actual_payload["user_id"], 0)
+        self.assertEqual(actual_payload["run_id"], "cv_run_789")
+        self.assertEqual(actual_payload["prediction_artifact_path"], "coco_dt.json")
+        self.assertEqual(actual_payload["metrics_artifact_path"], "metrics.json")
+        self.assertEqual(actual_payload["ground_truth_artifact_path"], "coco_gt.json")
+        # LLM-only fields are absent from the CV payload because CreateCVEvalReq does not declare them (model_dump() is called without any exclude options)
+        self.assertNotIn("dataset_id", actual_payload)
+        self.assertNotIn("dataset_version_id", actual_payload)
+        self.assertNotIn("evaled_artifact_path", actual_payload)
+        self.assertNotIn("report", actual_payload)
+    def test_create_cv_run_custom_user_id(self):
+        """测试创建 CV 类型评测运行 - 自定义 user_id"""
+        # 模拟成功的创建响应
+        mock_eval_run = {
+            "id": 999,
+            "name": "cv_eval_custom",
+            "description": "CV evaluation custom",
+            "user_id": 3750,
+            "model_id": 3,
+            "model_name": "cv_model_v2",
+            "dataset_id": 0,  # 使用默认值而不是 None
+            "dataset_version_id": 0,  # 使用默认值而不是 None
+            "dataset_name": "",  # 使用空字符串而不是 None
+            "status": "created",
+            "prediction_artifact_path": "coco_dt.json",
+            "evaled_artifact_path": "",  # 使用空字符串而不是 None
+            "run_id": "cv_run_999",
+            "dataset_summary": {},
+            "metrics_summary": {},
+            "viz_summary": {},
+            "eval_config": None,
+            "created_at": 1640995200,
+            "updated_at": 1640995200
+        }
+        mock_response = {
+            "code": 0,
+            "msg": None,
+            "data": {"eval_run": mock_eval_run}
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.post.return_value = mock_resp
+        # 调用方法（提供自定义 user_id）
+        result = self.eval_service.create_cv_run(
+            run_id="cv_run_999",
+            prediction_artifact_path="coco_dt.json",
+            metrics_artifact_path="metrics.json",
+            ground_truth_artifact_path="coco_gt.json",
+            user_id=3750
+        )
+        # 验证结果
+        self.assertEqual(result, 999)
+        # 验证 HTTP 调用
+        self.http_client.post.assert_called_once()
+        call_args = self.http_client.post.call_args
+        actual_payload = call_args[1]["json"]
+        # 验证 CV 类型关键字段
+        self.assertEqual(actual_payload["type"], "cv")
+        self.assertEqual(actual_payload["user_id"], 3750)
+        self.assertEqual(actual_payload["run_id"], "cv_run_999")
+        self.assertEqual(actual_payload["prediction_artifact_path"], "coco_dt.json")
+        self.assertEqual(actual_payload["metrics_artifact_path"], "metrics.json")
+        self.assertEqual(actual_payload["ground_truth_artifact_path"], "coco_gt.json")
+    def test_create_eval_api_error(self):
+        """测试创建评测 - API错误"""
+        with patch('aihub.services.dataset_management.DatasetManagementService') as mock_dataset_service_class:
+            # 模拟数据集版本
+            mock_dataset_version = Mock()
+            mock_dataset_version.dataset_id = 1
+            mock_dataset_version.id = 1
+            mock_dataset_service = Mock()
+            mock_dataset_service.get_dataset_version_by_name.return_value = mock_dataset_version
+            mock_dataset_service_class.return_value = mock_dataset_service
+            # 模拟 API 错误
+            mock_response = {
+                "code": 2001,
+                "msg": "Invalid dataset version",
+                "data": None
+            }
+            mock_resp = Mock()
+            mock_resp.json.return_value = mock_response
+            self.http_client.post.return_value = mock_resp
+            with self.assertRaises(Exception) as context:
+                self.eval_service.create(
+                    dataset_version_name="invalid_dataset",
+                    prediction_artifact_path="/path/to/prediction.json",
+                    evaled_artifact_path="/path/to/evaled.json",
+                    report_json={"accuracy": 0.95},
+                    run_id="test_run_error"
+                )
+            self.assertIn("backend code 2001", str(context.exception))
+            self.assertIn("Invalid dataset version", str(context.exception))
+    def test_create_cv_run_api_error(self):
+        """测试创建 CV 评测运行 - API错误"""
+        # 模拟 API 错误
+        mock_response = {
+            "code": 3001,
+            "msg": "Invalid CV run parameters",
+            "data": None
+        }
+        mock_resp = Mock()
+        mock_resp.json.return_value = mock_response
+        self.http_client.post.return_value = mock_resp
+        with self.assertRaises(Exception) as context:
+            self.eval_service.create_cv_run(
+                run_id="invalid_cv_run",
+                prediction_artifact_path="invalid.json",
+                metrics_artifact_path="invalid_metrics.json",
+                ground_truth_artifact_path="invalid_gt.json"
+            )
+        self.assertIn("backend code 3001", str(context.exception))
+        self.assertIn("Invalid CV run parameters", str(context.exception))
+if __name__ == "__main__":
+    unittest.main()

intellif_aihub-0.1.20/src/aihub/__init__.py DELETED Viewed

	@@ -1 +0,0 @@
1	- __version__ = "0.1.20"

intellif_aihub-0.1.20/tests/test_eval.py DELETED Viewed

@@ -1,184 +0,0 @@
-# !/usr/bin/env python
-# -*-coding:utf-8 -*-
-import unittest
-import uuid
-from unittest.mock import Mock, patch
-import httpx
-from aihub.services.eval import EvalService
-from aihub.models.eval import ListEvalResp, EvalRun
-from aihub.models.common import APIWrapper
-BASE_URL = "http://192.168.13.160:30052"
-TOKEN = "eyJhbGciOiJIUzI1NiIsInR5cCI6IkpXVCJ9.eyJleHAiOjE3NTI1NDQwNDksImlhdCI6MTc1MVkzOTI0OSwidWlkIjoyfQ.MfB_7LK5oR3RAhga3jtgcvJqYESeUPLbz8Bc_y3fouc"
-class TestEvalService(unittest.TestCase):
-    def setUp(self):
-        self.http_client = Mock(spec=httpx.Client)
-        self.eval_service = EvalService(self.http_client)
-    def test_list_eval_runs_default(self):
-        mock_eval_run = {
-            "id": 1,
-            "name": "test_eval",
-            "description": "Test evaluation",
-            "user_id": 1,
-            "model_id": 1,
-            "model_name": "test_model",
-            "dataset_id": 1,
-            "dataset_version_id": 1,
-            "dataset_name": "test_dataset",
-            "status": "completed",
-            "prediction_artifact_path": "/path/to/prediction",
-            "evaled_artifact_path": "/path/to/eval",
-            "run_id": "test_run_123",
-            "dataset_summary": {},
-            "metrics_summary": {"accuracy": 0.95},
-            "viz_summary": {},
-            "eval_config": {"metric": "accuracy"},
-            "created_at": 1640995200,
-            "updated_at": 1640995200
-        }
-        mock_response = {
-            "code": 0,
-            "msg": None,
-            "data": {
-                "total": 1,
-                "page_size": 20,
-                "page_num": 1,
-                "data": [mock_eval_run]
-            }
-        }
-        mock_resp = Mock()
-        mock_resp.json.return_value = mock_response
-        self.http_client.get.return_value = mock_resp
-        result = self.eval_service.list()
-        self.assertIsInstance(result, ListEvalResp)
-        self.assertEqual(result.total, 1)
-        self.assertEqual(result.page_size, 20)
-        self.assertEqual(result.page_num, 1)
-        self.assertEqual(len(result.data), 1)
-        self.assertEqual(result.data[0].id, 1)
-        self.assertEqual(result.data[0].name, "test_eval")
-        self.http_client.get.assert_called_once_with(
-            "/eval-platform/api/v1/run/",
-            params={"page_size": 20, "page_num": 1}
-        )
-    def test_list_eval_runs_with_filters(self):
-        mock_response = {
-            "code": 0,
-            "msg": None,
-            "data": {
-                "total": 0,
-                "page_size": 10,
-                "page_num": 1,
-                "data": []
-            }
-        }
-        mock_resp = Mock()
-        mock_resp.json.return_value = mock_response
-        self.http_client.get.return_value = mock_resp
-        # 带过滤参数
-        result = self.eval_service.list(
-            page_size=10,
-            page_num=1,
-            status="completed",
-            name="test",
-            model_id=1,
-            dataset_id=2,
-            dataset_version_id=3,
-            run_id="test_run",
-            user_id=1,
-            model_ids="1,2,3",
-            dataset_ids="2,3,4",
-            dataset_version_ids="3,4,5"
-        )
-        self.assertIsInstance(result, ListEvalResp)
-        self.assertEqual(result.total, 0)
-        self.assertEqual(len(result.data), 0)
-        expected_params = {
-            "page_size": 10,
-            "page_num": 1,
-            "status": "completed",
-            "name": "test",
-            "model_id": 1,
-            "dataset_id": 2,
-            "dataset_version_id": 3,
-            "run_id": "test_run",
-            "user_id": 1,
-            "model_ids": "1,2,3",
-            "dataset_ids": "2,3,4",
-            "dataset_version_ids": "3,4,5"
-        }
-        self.http_client.get.assert_called_once_with(
-            "/eval-platform/api/v1/run/",
-            params=expected_params
-        )
-    def test_list_eval_runs_api_error(self):
-        """测试列出评测运行 - API错误"""
-        # 模拟 API 错误
-        mock_response = {
-            "code": 1001,
-            "msg": "Database connection failed",
-            "data": None
-        }
-        mock_resp = Mock()
-        mock_resp.json.return_value = mock_response
-        self.http_client.get.return_value = mock_resp
-        with self.assertRaises(Exception) as context:
-            self.eval_service.list()
-        self.assertIn("backend code 1001", str(context.exception))
-        self.assertIn("Database connection failed", str(context.exception))
-    def test_list_eval_runs_only_specified_filters(self):
-        mock_response = {
-            "code": 0,
-            "msg": None,
-            "data": {
-                "total": 0,
-                "page_size": 20,
-                "page_num": 1,
-                "data": []
-            }
-        }
-        mock_resp = Mock()
-        mock_resp.json.return_value = mock_response
-        self.http_client.get.return_value = mock_resp
-        result = self.eval_service.list(
-            status="completed",
-            model_id=1
-        )
-        expected_params = {
-            "page_size": 20,
-            "page_num": 1,
-            "status": "completed",
-            "model_id": 1
-        }
-        self.http_client.get.assert_called_once_with(
-            "/eval-platform/api/v1/run/",
-            params=expected_params
-        )
-if __name__ == "__main__":
-    unittest.main()