PyPI - maxframe - Versions diffs - 2.2.0__cp310-cp310-macosx_10_9_universal2.whl → 2.3.0rc1__cp310-cp310-macosx_10_9_universal2.whl - Mend

maxframe 2.2.0__cp310-cp310-macosx_10_9_universal2.whl → 2.3.0rc1__cp310-cp310-macosx_10_9_universal2.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of maxframe might be problematic. Click here for more details.

Files changed (114)

maxframe/_utils.cpython-310-darwin.so +0 -0
maxframe/codegen/core.py +3 -2
maxframe/codegen/spe/dataframe/merge.py +4 -0
maxframe/codegen/spe/dataframe/misc.py +2 -0
maxframe/codegen/spe/dataframe/reduction.py +18 -0
maxframe/codegen/spe/dataframe/sort.py +9 -1
maxframe/codegen/spe/dataframe/tests/test_reduction.py +13 -0
maxframe/codegen/spe/dataframe/tseries.py +9 -0
maxframe/codegen/spe/learn/contrib/lightgbm.py +4 -3
maxframe/codegen/spe/tensor/datasource.py +1 -0
maxframe/config/config.py +3 -0
maxframe/conftest.py +10 -0
maxframe/core/base.py +2 -1
maxframe/core/entity/tileables.py +2 -0
maxframe/core/graph/core.cpython-310-darwin.so +0 -0
maxframe/core/graph/entity.py +7 -1
maxframe/core/mode.py +6 -1
maxframe/dataframe/__init__.py +2 -2
maxframe/dataframe/arithmetic/__init__.py +4 -0
maxframe/dataframe/arithmetic/maximum.py +33 -0
maxframe/dataframe/arithmetic/minimum.py +33 -0
maxframe/dataframe/core.py +98 -106
maxframe/dataframe/datasource/core.py +6 -0
maxframe/dataframe/datasource/direct.py +57 -0
maxframe/dataframe/datasource/read_csv.py +19 -11
maxframe/dataframe/datasource/read_odps_query.py +29 -6
maxframe/dataframe/datasource/read_odps_table.py +32 -10
maxframe/dataframe/datasource/read_parquet.py +38 -39
maxframe/dataframe/datastore/__init__.py +6 -0
maxframe/dataframe/datastore/direct.py +268 -0
maxframe/dataframe/datastore/to_odps.py +6 -0
maxframe/dataframe/extensions/flatjson.py +2 -1
maxframe/dataframe/groupby/__init__.py +5 -1
maxframe/dataframe/groupby/aggregation.py +10 -6
maxframe/dataframe/groupby/apply_chunk.py +1 -3
maxframe/dataframe/groupby/core.py +20 -4
maxframe/dataframe/indexing/__init__.py +2 -1
maxframe/dataframe/indexing/insert.py +45 -17
maxframe/dataframe/merge/__init__.py +3 -0
maxframe/dataframe/merge/combine.py +244 -0
maxframe/dataframe/misc/__init__.py +14 -3
maxframe/dataframe/misc/check_unique.py +41 -10
maxframe/dataframe/misc/drop.py +31 -0
maxframe/dataframe/misc/infer_dtypes.py +251 -0
maxframe/dataframe/misc/map.py +31 -18
maxframe/dataframe/misc/repeat.py +159 -0
maxframe/dataframe/misc/tests/test_misc.py +35 -1
maxframe/dataframe/missing/checkna.py +3 -2
maxframe/dataframe/reduction/__init__.py +10 -5
maxframe/dataframe/reduction/aggregation.py +6 -6
maxframe/dataframe/reduction/argmax.py +7 -4
maxframe/dataframe/reduction/argmin.py +7 -4
maxframe/dataframe/reduction/core.py +18 -9
maxframe/dataframe/reduction/mode.py +144 -0
maxframe/dataframe/reduction/nunique.py +10 -3
maxframe/dataframe/reduction/tests/test_reduction.py +12 -0
maxframe/dataframe/sort/__init__.py +9 -2
maxframe/dataframe/sort/argsort.py +7 -1
maxframe/dataframe/sort/core.py +1 -1
maxframe/dataframe/sort/rank.py +147 -0
maxframe/dataframe/tseries/__init__.py +19 -0
maxframe/dataframe/tseries/at_time.py +61 -0
maxframe/dataframe/tseries/between_time.py +122 -0
maxframe/dataframe/utils.py +30 -26
maxframe/learn/contrib/llm/core.py +16 -7
maxframe/learn/contrib/llm/deploy/__init__.py +13 -0
maxframe/learn/contrib/llm/deploy/config.py +221 -0
maxframe/learn/contrib/llm/deploy/core.py +247 -0
maxframe/learn/contrib/llm/deploy/framework.py +35 -0
maxframe/learn/contrib/llm/deploy/loader.py +360 -0
maxframe/learn/contrib/llm/deploy/tests/__init__.py +13 -0
maxframe/learn/contrib/llm/deploy/tests/test_register_models.py +359 -0
maxframe/learn/contrib/llm/models/__init__.py +1 -0
maxframe/learn/contrib/llm/models/dashscope.py +12 -6
maxframe/learn/contrib/llm/models/managed.py +76 -11
maxframe/learn/contrib/llm/models/openai.py +72 -0
maxframe/learn/contrib/llm/tests/__init__.py +13 -0
maxframe/learn/contrib/llm/tests/test_core.py +34 -0
maxframe/learn/contrib/llm/tests/test_openai.py +187 -0
maxframe/learn/contrib/llm/tests/test_text_gen.py +155 -0
maxframe/learn/contrib/llm/text.py +348 -42
maxframe/learn/contrib/models.py +4 -1
maxframe/learn/contrib/xgboost/classifier.py +2 -0
maxframe/learn/contrib/xgboost/core.py +31 -7
maxframe/learn/contrib/xgboost/predict.py +4 -2
maxframe/learn/contrib/xgboost/regressor.py +5 -0
maxframe/learn/contrib/xgboost/train.py +2 -0
maxframe/learn/preprocessing/_data/min_max_scaler.py +34 -23
maxframe/learn/preprocessing/_data/standard_scaler.py +34 -25
maxframe/learn/utils/__init__.py +1 -0
maxframe/learn/utils/extmath.py +42 -9
maxframe/learn/utils/odpsio.py +80 -11
maxframe/lib/filesystem/_oss_lib/common.py +2 -0
maxframe/lib/mmh3.cpython-310-darwin.so +0 -0
maxframe/opcodes.py +9 -1
maxframe/remote/core.py +4 -0
maxframe/serialization/core.cpython-310-darwin.so +0 -0
maxframe/serialization/tests/test_serial.py +2 -2
maxframe/tensor/arithmetic/__init__.py +1 -1
maxframe/tensor/arithmetic/core.py +2 -2
maxframe/tensor/arithmetic/tests/test_arithmetic.py +0 -9
maxframe/tensor/core.py +3 -0
maxframe/tensor/misc/copyto.py +1 -1
maxframe/tests/test_udf.py +61 -0
maxframe/tests/test_utils.py +8 -5
maxframe/udf.py +103 -7
maxframe/utils.py +61 -8
{maxframe-2.2.0.dist-info → maxframe-2.3.0rc1.dist-info}/METADATA +1 -2
{maxframe-2.2.0.dist-info → maxframe-2.3.0rc1.dist-info}/RECORD +113 -90
maxframe_client/session/task.py +8 -1
maxframe_client/tests/test_session.py +24 -0
maxframe/dataframe/arrays.py +0 -864
{maxframe-2.2.0.dist-info → maxframe-2.3.0rc1.dist-info}/WHEEL +0 -0
{maxframe-2.2.0.dist-info → maxframe-2.3.0rc1.dist-info}/top_level.txt +0 -0

maxframe/learn/contrib/llm/deploy/tests/test_register_models.py ADDED Viewed

@@ -0,0 +1,359 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import json
+import os.path
+from typing import List
+import pytest
+from ..core import (
+    ResourceNameTemplate,
+    _registered_llm_models,
+    clean_registered_model,
+    get_registered_model_config,
+    register_model_deployments,
+)
+from ..framework import InferenceFrameworkEnum
+from ..loader import (
+    DeploymentConfigBase,
+    DeploymentConfigResourceRequirement,
+    FrameworkDeploymentConfig,
+    ModelDeploymentConfig,
+    _model_config_to_json,
+    register_models_from_json_file,
+)
+# Absolute directory of this test module; paths to JSON test files are built from it.
+current_dir = os.path.dirname(os.path.abspath(__file__))
+@pytest.fixture
+def qwen2_5_0_5b_model():
+    """Build a ``ModelDeploymentConfig`` for Qwen2.5-0.5B-instruct in code.
+    The config has one shared ``common_config`` and two CPU deployments that
+    differ only in inference framework (llama-cpp-python and llama-cpp server).
+    """
+    gguf_file = "Qwen2.5-0.5B-Instruct.Q8_0.gguf"
+    gguf_resource = ResourceNameTemplate(
+        project="bigdata_public_dataset",
+        schema="data_plus_ai_{region_id}",
+        name=gguf_file,
+    )
+    shared_config = DeploymentConfigBase.from_json(
+        {
+            "properties": {"family": "Qwen2.5", "type": "instruct"},
+            "load_params": {
+                "chat_format": "qwen",
+                "flash_attn": True,
+                "cache-type-k": "q8_0",
+                "cache-type-v": "q8_0",
+                "defrag-thold": "1",
+            },
+        }
+    )
+    # The same params dict and resource requirement are shared by both deployments.
+    deploy_params = {"n_threads": 2, "n_batch": 1024, "n_ctx": 32768, "verbose": False}
+    cpu_resources = DeploymentConfigResourceRequirement(cpu=2, memory=8)
+    frameworks = (
+        InferenceFrameworkEnum.LLAMA_CPP_PYTHON_TEXT,
+        InferenceFrameworkEnum.LLAMA_CPP_SERVE_TEXT,
+    )
+    return ModelDeploymentConfig(
+        model_name="Qwen2.5-0.5B-instruct",
+        tags=["tag"],
+        common_config=shared_config,
+        deployments=[
+            FrameworkDeploymentConfig(
+                model_file=gguf_file,
+                framework=framework.value,
+                device="cpu",
+                model_file_resources=[gguf_resource],
+                load_params=deploy_params,
+                resource_requirements=cpu_resources,
+            )
+            for framework in frameworks
+        ],
+    )
+@pytest.fixture
+def qwen3_8b_model():
+    """Parse a ``ModelDeploymentConfig`` from an inline JSON document.
+    NOTE(review): the fixture is named ``qwen3_8b`` but the JSON below
+    describes ``Qwen3-0.6B``; the name is kept because other fixtures request it.
+    """
+    raw_config = """
+        {
+        "model_name": "Qwen3-0.6B",
+        "model_identifier": "qwen3-0.6b",
+        "common_config": {
+        "properties": {
+            "family": "Qwen3",
+            "reasoning_model": true
+        },
+        "load_params": {
+            "flash_attn": true,
+            "cache-type-k": "q8_0",
+            "cache-type-v": "q8_0",
+            "defrag-thold": "1",
+            "n_threads": 2,
+            "n_batch": 1024,
+            "n_ctx": 32768,
+            "verbose": false
+        },
+        "model_file": "Qwen3-0.6B-Q8_0.gguf",
+        "model_file_resources": [
+            {
+                "project": "bigdata_public_dataset",
+                "schema": "data_plus_ai_{region_id}",
+                "name": "Qwen3-0.6B-Q8_0.gguf"
+            }
+        ],
+        "resource_requirements": {
+            "cpu": 2,
+            "memory": 8
+            }
+        },
+        "deployments": [
+        {
+            "framework": "LLAMA_CPP_SERVE:TEXT",
+            "device": "cpu",
+            "load_params": {},
+            "resource_requirements": {},
+            "properties": {}
+        },
+        {
+            "framework": "LLAMA_CPP_PYTHON:TEXT",
+            "device": "cpu",
+            "load_params": {},
+            "resource_requirements": {
+            "cpu": 2,
+            "memory": 8
+            },
+            "properties": {}
+        }
+        ],
+        "tags": []
+    }
+    """
+    return ModelDeploymentConfig.from_json(json.loads(raw_config))
+@pytest.fixture
+def models(qwen2_5_0_5b_model, qwen3_8b_model, tmp_path):
+    """Serialize both model fixtures to a temporary JSON file.
+    Yields ``(json_path, model_list)``, where ``json_path`` is the absolute
+    path (as ``str``) of the written file and ``model_list`` holds the two
+    ``ModelDeploymentConfig`` objects that were serialized.
+    The file is created under pytest's per-test ``tmp_path`` instead of the
+    test package directory, so the test does not write into the source tree
+    (which may be read-only for an installed wheel) and pytest owns cleanup.
+    ``clean_registered_model()`` runs on teardown even if setup fails midway.
+    """
+    model_list = [qwen2_5_0_5b_model, qwen3_8b_model]
+    # tmp_path is unique per test invocation, so no random suffix is needed.
+    test_json_path = str(tmp_path / "test_models.json")
+    try:
+        with open(test_json_path, "w") as f:
+            f.write(_model_config_to_json(model_list))
+        yield test_json_path, model_list
+    finally:
+        clean_registered_model()
+def test_serialize_and_deserialize(qwen2_5_0_5b_model):
+    """Round-trip a config through ``to_json``/``from_json`` and compare the JSON."""
+    original_json = qwen2_5_0_5b_model.to_json()
+    round_tripped = ModelDeploymentConfig.from_json(original_json)
+    assert original_json == round_tripped.to_json()
+def test_register_models():
+    """Register CPU and GPU deployments of one model and check registry lookups.
+    Also checks that repeating the GPU registration with the same model name
+    and framework raises ``ValueError``.
+    """
+    # Presumably resets the global model registry so earlier tests cannot interfere.
+    clean_registered_model()
+    register_model_deployments(
+        model_name="mock_model",
+        model_file="DeepSeek-R1-Distill-Qwen-1.5B-Q8_0.gguf",
+        inference_frameworks=InferenceFrameworkEnum.LLAMA_CPP_PYTHON_TEXT,
+        required_resources=[
+            ResourceNameTemplate(
+                project="test",
+                schema=None,
+                name="DeepSeek-R1-Distill-Qwen-1.5B-Q8_0.gguf",
+            ),
+        ],
+        default_load_params={
+            "n_threads": 3,
+            "n_threads_batch": 512,
+            "n_batch": 512,
+            "flash_attn": True,
+            "verbose": True,
+            "n_ctx": 32 * 1024,
+        },
+        required_cpu=2,
+        required_memory=8,
+        device="cpu",
+        properties={"reasoning_model": True},
+    )
+    # Fully qualified lookup: model name + device + framework.
+    cpu_model_config = get_registered_model_config(
+        "mock_model",
+        expected_device="cpu",
+        expected_inference_framework=InferenceFrameworkEnum.LLAMA_CPP_PYTHON_TEXT,
+    )
+    assert cpu_model_config is not None
+    # Omitting the framework must return the very same object (identity, not equality).
+    assert cpu_model_config is get_registered_model_config(
+        "mock_model", expected_device="cpu"
+    )
+    # With only the CPU deployment registered, a name-only lookup matches it.
+    general_config = get_registered_model_config("mock_model")
+    assert cpu_model_config.model_name == general_config.model_name
+    assert cpu_model_config.device == general_config.device
+    assert cpu_model_config.device == "cpu"
+    assert cpu_model_config.required_memory == 8
+    assert cpu_model_config.required_cpu == 2
+    assert cpu_model_config.required_resource_files == [
+        ResourceNameTemplate(
+            project="test", schema=None, name="DeepSeek-R1-Distill-Qwen-1.5B-Q8_0.gguf"
+        )
+    ]
+    assert cpu_model_config.load_params.get("flash_attn") is True
+    # Register the same model name and framework again, this time for the GPU device.
+    register_model_deployments(
+        model_name="mock_model",
+        model_file="DeepSeek-R1-Distill-Qwen-1.5B-Q8_0.gguf",
+        inference_frameworks=InferenceFrameworkEnum.LLAMA_CPP_PYTHON_TEXT,
+        required_resources=[],
+        default_load_params={},
+        required_cpu=2,
+        required_memory=8,
+        device="gpu",
+        properties={"reasoning_model": True},
+    )
+    gpu_model_config = get_registered_model_config("mock_model", expected_device="gpu")
+    # The CPU entry must still be retrievable after the GPU registration.
+    cpu_model_config_again = get_registered_model_config(
+        "mock_model", expected_device="cpu"
+    )
+    assert cpu_model_config.model_name == cpu_model_config_again.model_name
+    assert cpu_model_config.device == cpu_model_config_again.device
+    assert cpu_model_config.device != gpu_model_config.device
+    # Repeating the identical GPU registration is expected to be rejected.
+    with pytest.raises(ValueError):
+        register_model_deployments(
+            model_name="mock_model",
+            model_file="DeepSeek-R1-Distill-Qwen-1.5B-Q8_0.gguf",
+            inference_frameworks=InferenceFrameworkEnum.LLAMA_CPP_PYTHON_TEXT,
+            required_resources=[],
+            default_load_params={},
+            required_cpu=2,
+            required_memory=8,
+            device="gpu",
+            properties={"reasoning_model": True},
+        )
+def test_model_config_register(models):
+    """Register models from a JSON file and verify the registry contents.
+    Checks that a missing file raises ``FileNotFoundError``, that one registry
+    entry exists per model (keyed by lower-cased model name), and that every
+    deployment's device and inference framework is present under its model.
+    """
+    clean_registered_model()
+    test_json_path, model_list = models
+    model_list: List[ModelDeploymentConfig]
+    with pytest.raises(FileNotFoundError):
+        register_models_from_json_file(
+            os.path.join(current_dir, "test_models_not_exist.json")
+        )
+    # The fixture yields an absolute path, so it is passed through unchanged
+    # (joining it onto current_dir would return the same absolute path anyway).
+    register_models_from_json_file(test_json_path)
+    assert len(_registered_llm_models) == len(model_list)
+    for model in model_list:
+        model_name = model.model_name.lower()
+        assert model_name in _registered_llm_models
+        for deployment in model.deployments:
+            assert deployment.device in _registered_llm_models[model_name]
+            assert (
+                InferenceFrameworkEnum.from_string(deployment.framework)
+                in _registered_llm_models[model_name][deployment.device]
+            )
+def test_resource_name_template():
+    """Exercise placeholder substitution, equality and hashing of templates."""
+    # One placeholder: the hyphenated region id must appear with underscores.
+    single_var = ResourceNameTemplate(
+        project="test_project", schema="schema_{region_id}", name="resource_{region_id}"
+    )
+    single_name = single_var.build_full_resource_name({"region_id": "cn-hangzhou"})
+    assert "cn_hangzhou" in single_name
+    # Several placeholders, every value containing hyphens.
+    multi_var = ResourceNameTemplate(
+        project="my_project",
+        schema="schema_{region_id}_{env}",
+        name="resource_{region_id}_{version}",
+    )
+    multi_name = multi_var.build_full_resource_name(
+        {"region_id": "us-west-1", "env": "prod-test", "version": "v1-2-3"}
+    )
+    for expected_part in ("us_west_1", "prod_test", "v1_2_3"):
+        assert expected_part in multi_name
+    # Identical fields compare and hash equal; a different project does not.
+    first = ResourceNameTemplate("proj", "schema", "name")
+    twin = ResourceNameTemplate("proj", "schema", "name")
+    other_project = ResourceNameTemplate("proj2", "schema", "name")
+    assert first == twin
+    assert first != other_project
+    assert hash(first) == hash(twin)
+    assert hash(first) != hash(other_project)
+@pytest.mark.parametrize(
+    "input_string,expected_enum",
+    [
+        ("LLAMA_CPP_PYTHON:TEXT", InferenceFrameworkEnum.LLAMA_CPP_PYTHON_TEXT),
+        ("LLAMA_CPP_SERVE:TEXT", InferenceFrameworkEnum.LLAMA_CPP_SERVE_TEXT),
+        ("DASH_SCOPE:TEXT", InferenceFrameworkEnum.DASH_SCOPE_TEXT),
+        ("DASH_SCOPE:MULTIMODAL", InferenceFrameworkEnum.DASH_SCOPE_MULTIMODAL),
+        ("VLLM_SERVE:TEXT", InferenceFrameworkEnum.VLLM_SERVE_TEXT),
+        ("OPENAI_REMOTE:TEXT", InferenceFrameworkEnum.OPENAI_REMOTE_TEXT),
+        ("OTHER", InferenceFrameworkEnum.OTHER),
+        # An enum member passed as input is expected to come back unchanged.
+        (
+            InferenceFrameworkEnum.DASH_SCOPE_TEXT,
+            InferenceFrameworkEnum.DASH_SCOPE_TEXT,
+        ),
+    ],
+)
+def test_inference_framework_enum_success(input_string, expected_enum):
+    """Each accepted input resolves to the expected ``InferenceFrameworkEnum`` member."""
+    assert InferenceFrameworkEnum.from_string(input_string) == expected_enum
+@pytest.mark.parametrize(
+    "input_string",
+    [
+        "INVALID_FRAMEWORK",
+        # Empty input.
+        "",
+        # Lower-case and mixed-case spellings of an otherwise valid name.
+        "llama_cpp_python:text",
+        "LLAMA_CPP_PYTHON:Text",
+        "UNKNOWN:FRAMEWORK",
+    ],
+)
+def test_inference_framework_enum_failure(input_string):
+    """Test that invalid inputs raise ``ValueError`` from ``from_string``."""
+    with pytest.raises(ValueError):
+        InferenceFrameworkEnum.from_string(input_string)

maxframe/learn/contrib/llm/models/__init__.py CHANGED Viewed

@@ -13,3 +13,4 @@
 # limitations under the License.
 from .dashscope import DashScopeMultiModalLLM, DashScopeTextLLM
+from .openai import OpenAICompatibleTextLLM

maxframe/learn/contrib/llm/models/dashscope.py CHANGED Viewed

@@ -19,7 +19,7 @@ from .....serialization.serializables.core import Serializable
 from .....serialization.serializables.field import StringField
 from ..core import LLMTextGenOperator
 from ..multi_modal import MultiModalLLM
-from ..text import TextLLM
+from ..text import TextGenLLM
 class DashScopeLLMMixin(Serializable):
@@ -33,7 +33,7 @@ class DashScopeLLMMixin(Serializable):
                 raise ValueError(f"{k} is not supported")
-class DashScopeTextLLM(TextLLM, DashScopeLLMMixin):
+class DashScopeTextLLM(TextGenLLM, DashScopeLLMMixin):
     """
     DashScope text LLM.
     """
@@ -59,7 +59,7 @@ class DashScopeTextLLM(TextLLM, DashScopeLLMMixin):
         prompt_template: Dict[str, Any],
         params: Dict[str, Any] = None,
     ):
-        return DashScopeTextGenerationOperator(
+        return DashScopeTextGenerationOp(
             model=self,
             prompt_template=prompt_template,
             params=params,
@@ -93,16 +93,22 @@ class DashScopeMultiModalLLM(MultiModalLLM, DashScopeLLMMixin):
         params: Dict[str, Any] = None,
     ):
         # TODO add precheck here
-        return DashScopeMultiModalGenerationOperator(
+        return DashScopeMultiModalGenerationOp(
             model=self,
             prompt_template=prompt_template,
             params=params,
         )(data)
-class DashScopeTextGenerationOperator(LLMTextGenOperator):
+class DashScopeTextGenerationOp(LLMTextGenOperator):
     _op_type_ = opcodes.DASHSCOPE_TEXT_GENERATION
+    _legacy_name = "DashScopeTextGenerationOperator"
-class DashScopeMultiModalGenerationOperator(LLMTextGenOperator):
+class DashScopeMultiModalGenerationOp(LLMTextGenOperator):
     _op_type_ = opcodes.DASHSCOPE_MULTI_MODAL_GENERATION
+    _legacy_name = "DashScopeMultiModalGenerationOperator"
+DashScopeTextGenerationOperator = DashScopeTextGenerationOp
+DashScopeMultiModalGenerationOperator = DashScopeMultiModalGenerationOp

maxframe/learn/contrib/llm/models/managed.py CHANGED Viewed

@@ -12,26 +12,34 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
-from typing import Any, Dict, List
+from typing import Any, Dict, List, Union
 from ..... import opcodes
-from .....serialization.serializables import StringField
-from ..core import LLMTextGenOperator
-from ..text import TextLLM
+from .....serialization.serializables import BoolField, ReferenceField, StringField
+from ..core import LLMTextEmbeddingOp, LLMTextGenOperator
+from ..deploy.config import ModelDeploymentConfig
+from ..text import TextEmbeddingModel, TextGenLLM
-class ManagedLLMTextGenOperator(LLMTextGenOperator):
+class ManagedLLMTextGenOp(LLMTextGenOperator):
     _op_type_ = opcodes.MANAGED_TEXT_MODAL_GENERATION
+    _legacy_name = "ManagedLLMTextGenOperator"
     inference_framework: str = StringField("inference_framework", default=None)
+    simple_output: bool = BoolField("simple_output", default=False)
-class ManagedTextLLM(TextLLM):
+class ManagedTextGenLLM(TextGenLLM):
     """
     Managed text LLM by MaxFrame.
     """
-    def __init__(self, name: str):
+    _legacy_name = "ManagedTextLLM"  # since v2.3.0
+    deploy_config: ModelDeploymentConfig = ReferenceField(
+        "deploy_config", reference_type=ModelDeploymentConfig, default=None
+    )
+    def __init__(self, name: str, deploy_config: ModelDeploymentConfig = None):
         """
         Initialize a managed text LLM.
@@ -39,16 +47,73 @@ class ManagedTextLLM(TextLLM):
         ----------
         name : str
             The managed text LLM name to use.
+        deploy_config : ModelDeploymentConfig
+            The model deployment config to use.
         """
-        super().__init__(name=name)
+        if deploy_config:
+            deploy_config.model_name = name
+            deploy_config.check_validity()
+        super().__init__(name=name, deploy_config=deploy_config)
     def generate(
         self,
         data,
-        prompt_template: List[Dict[str, Any]],
+        prompt_template: Union[str, List[Dict[str, Any]]],
+        simple_output: bool = False,
         params: Dict[str, Any] = None,
         **kw
     ):
-        return ManagedLLMTextGenOperator(
-            model=self, prompt_template=prompt_template, params=params, **kw
+        return ManagedLLMTextGenOp(
+            model=self,
+            prompt_template=prompt_template,
+            simple_output=simple_output,
+            params=params,
+            **kw,
         )(data)
+# since v2.3.0, text llm has more types
+ManagedTextLLM = ManagedTextGenLLM  # for old client compatibility
+class ManagedLLMTextEmbeddingOp(LLMTextEmbeddingOp):
+    """Text-embedding operator instantiated by ``ManagedTextEmbeddingModel.embed``."""
+    _op_type_ = opcodes.LLM_TEXT_EMBEDDING_TASK
+    # Optional inference framework name; defaults to None.
+    # NOTE(review): where this gets populated is not visible in this hunk — confirm.
+    inference_framework: str = StringField("inference_framework", default=None)
+class ManagedTextEmbeddingModel(TextEmbeddingModel):
+    """
+    Managed text embedder by MaxFrame.
+    """
+    def __init__(self, name: str):
+        """
+        Initialize a managed text embedder.
+        Parameters
+        ----------
+        name : str
+            The managed text embedder name to use.
+        """
+        super().__init__(name=name)
+    def embed(
+        self,
+        series,
+        dimensions: int = None,
+        encoding_format: str = None,
+        simple_output: bool = False,
+        params: Dict[str, Any] = None,
+        **kw
+    ):
+        """
+        Build a ``ManagedLLMTextEmbeddingOp`` for this model and apply it to ``series``.
+        All keyword arguments are forwarded to the operator unchanged, together
+        with the fixed ``task="text-embedding"``; the operator's call result is returned.
+        """
+        embedding_op = ManagedLLMTextEmbeddingOp(
+            model=self,
+            dimensions=dimensions,
+            encoding_format=encoding_format,
+            simple_output=simple_output,
+            params=params,
+            task="text-embedding",
+            **kw,
+        )
+        return embedding_op(series)
+ManagedLLMTextGenOperator = ManagedLLMTextGenOp

maxframe/learn/contrib/llm/models/openai.py ADDED Viewed

@@ -0,0 +1,72 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from typing import Any, Dict, List
+from ..... import opcodes
+from .....serialization.serializables.field import BoolField, Int32Field, StringField
+from ..core import LLM, LLMTextGenOperator
+from ..text import TextGenLLM
+class OpenAICompatibleLLM(LLM):
+    """
+    Remote OpenAI-compatible text LLM.
+    Declares the connection fields shared by models that talk to an
+    OpenAI-compatible API service.
+    """
+    # Base URL of the OpenAI-compatible API service.
+    base_url: str = StringField("base_url")
+    # API key used for authentication.
+    # NOTE(review): held as a plain string field — confirm it is never logged or persisted in clear text.
+    api_key: str = StringField("api_key")
+    # Optional batching settings; both default to None.
+    # NOTE(review): units and exact semantics are not visible here — confirm with the consumer of these fields.
+    batch_size: int = Int32Field("batch_size", default=None)
+    batch_timeout: int = Int32Field("batch_timeout", default=None)
+class OpenAICompatibleTextLLM(TextGenLLM, OpenAICompatibleLLM):
+    """Text-generation model served by a remote OpenAI-compatible API."""
+    def __init__(self, name: str, base_url: str, api_key: str):
+        """
+        Initialize a remote OpenAI-compatible text LLM.
+        Parameters
+        ----------
+        name : str
+            The remote model name to use.
+        base_url : str
+            The base URL of the OpenAI-compatible API service.
+        api_key : str
+            The API key for authentication.
+        """
+        super().__init__(name=name)
+        # Connection settings are assigned after base-class initialization.
+        self.base_url, self.api_key = base_url, api_key
+    def generate(
+        self,
+        data,
+        prompt_template: List[Dict[str, Any]],
+        simple_output: bool = False,
+        params: Dict[str, Any] = None,
+        **kw
+    ):
+        """
+        Build an ``OpenAICompatibleTextGenOp`` for this model and apply it to ``data``.
+        ``prompt_template``, ``simple_output``, ``params`` and any extra keyword
+        arguments are forwarded to the operator; its call result is returned.
+        """
+        text_gen_op = OpenAICompatibleTextGenOp(
+            model=self,
+            prompt_template=prompt_template,
+            simple_output=simple_output,
+            params=params,
+            **kw,
+        )
+        return text_gen_op(data)
+class OpenAICompatibleTextGenOp(LLMTextGenOperator):
+    """Text-generation operator instantiated by ``OpenAICompatibleTextLLM.generate``."""
+    _op_type_ = opcodes.OPENAI_COMPATIBLE_TEXT_GENERATION
+    # Receives the ``simple_output`` flag passed to ``generate``; defaults to False.
+    simple_output = BoolField("simple_output", default=False)

maxframe/learn/contrib/llm/tests/__init__.py ADDED Viewed

@@ -0,0 +1,13 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.

maxframe/learn/contrib/llm/tests/test_core.py ADDED Viewed

@@ -0,0 +1,34 @@
+# Copyright 1999-2025 Alibaba Group Holding Ltd.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#      http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import numpy as np
+from .. import core as llm_core
+def test_text_gen_operator_output_dtypes():
+    """A default text-gen operator reports object ``response`` and bool ``success``."""
+    output_dtypes = llm_core.LLMTextGenOperator().get_output_dtypes()
+    assert output_dtypes["response"] == np.dtype("O")
+    assert output_dtypes["success"] == np.dtype("bool")
+def test_text_embedding_operator_output_dtypes_and_defaults():
+    """A default embedding operator has the expected output dtypes and field defaults."""
+    embedding_op = llm_core.LLMTextEmbeddingOp()
+    output_dtypes = embedding_op.get_output_dtypes()
+    assert output_dtypes["response"] == np.dtype("O")
+    assert output_dtypes["success"] == np.dtype("bool")
+    # Fields left unset at construction fall back to their declared defaults.
+    assert embedding_op.simple_output is False
+    assert embedding_op.dimensions is None
+    assert embedding_op.encoding_format is None