bisheng_langchain-0.0.1-py3-none-any.whl

This diff shows the content of publicly available package versions released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their public registries.
Files changed (41)
  1. bisheng_langchain/__init__.py +0 -0
  2. bisheng_langchain/chains/__init__.py +5 -0
  3. bisheng_langchain/chains/combine_documents/__init__.py +0 -0
  4. bisheng_langchain/chains/combine_documents/stuff.py +56 -0
  5. bisheng_langchain/chains/question_answering/__init__.py +240 -0
  6. bisheng_langchain/chains/retrieval_qa/__init__.py +0 -0
  7. bisheng_langchain/chains/retrieval_qa/base.py +89 -0
  8. bisheng_langchain/chat_models/__init__.py +11 -0
  9. bisheng_langchain/chat_models/host_llm.py +409 -0
  10. bisheng_langchain/chat_models/interface/__init__.py +10 -0
  11. bisheng_langchain/chat_models/interface/minimax.py +123 -0
  12. bisheng_langchain/chat_models/interface/openai.py +68 -0
  13. bisheng_langchain/chat_models/interface/types.py +61 -0
  14. bisheng_langchain/chat_models/interface/utils.py +5 -0
  15. bisheng_langchain/chat_models/interface/wenxin.py +114 -0
  16. bisheng_langchain/chat_models/interface/xunfei.py +233 -0
  17. bisheng_langchain/chat_models/interface/zhipuai.py +81 -0
  18. bisheng_langchain/chat_models/minimax.py +354 -0
  19. bisheng_langchain/chat_models/proxy_llm.py +354 -0
  20. bisheng_langchain/chat_models/wenxin.py +349 -0
  21. bisheng_langchain/chat_models/xunfeiai.py +355 -0
  22. bisheng_langchain/chat_models/zhipuai.py +379 -0
  23. bisheng_langchain/document_loaders/__init__.py +3 -0
  24. bisheng_langchain/document_loaders/elem_html.py +0 -0
  25. bisheng_langchain/document_loaders/elem_image.py +0 -0
  26. bisheng_langchain/document_loaders/elem_pdf.py +655 -0
  27. bisheng_langchain/document_loaders/parsers/__init__.py +5 -0
  28. bisheng_langchain/document_loaders/parsers/image.py +28 -0
  29. bisheng_langchain/document_loaders/parsers/test_image.py +286 -0
  30. bisheng_langchain/embeddings/__init__.py +7 -0
  31. bisheng_langchain/embeddings/host_embedding.py +133 -0
  32. bisheng_langchain/embeddings/interface/__init__.py +3 -0
  33. bisheng_langchain/embeddings/interface/types.py +23 -0
  34. bisheng_langchain/embeddings/interface/wenxin.py +86 -0
  35. bisheng_langchain/embeddings/wenxin.py +139 -0
  36. bisheng_langchain/vectorstores/__init__.py +3 -0
  37. bisheng_langchain/vectorstores/elastic_keywords_search.py +284 -0
  38. bisheng_langchain-0.0.1.dist-info/METADATA +64 -0
  39. bisheng_langchain-0.0.1.dist-info/RECORD +41 -0
  40. bisheng_langchain-0.0.1.dist-info/WHEEL +5 -0
  41. bisheng_langchain-0.0.1.dist-info/top_level.txt +1 -0
bisheng_langchain/chat_models/host_llm.py
@@ -0,0 +1,409 @@
+ """proxy llm chat wrapper."""
+ from __future__ import annotations
+
+ import logging
+ import sys
+ from typing import TYPE_CHECKING, Any, Callable, Dict, List, Mapping, Optional, Tuple, Union
+
+ import requests
+ from langchain.callbacks.manager import AsyncCallbackManagerForLLMRun, CallbackManagerForLLMRun
+ from langchain.chat_models.base import BaseChatModel
+ from langchain.schema import ChatGeneration, ChatResult
+ from langchain.schema.messages import (AIMessage, BaseMessage, ChatMessage, FunctionMessage,
+                                         HumanMessage, SystemMessage)
+ from langchain.utils import get_from_dict_or_env
+ from pydantic import Field, root_validator
+ # from requests.exceptions import HTTPError
+ from tenacity import (before_sleep_log, retry, retry_if_exception_type, stop_after_attempt,
+                       wait_exponential)
+
+ # from .interface import MinimaxChatCompletion
+ # from .interface.types import ChatInput
+
+ if TYPE_CHECKING:
+     import tiktoken
+
+ logger = logging.getLogger(__name__)
+
+
+ def _import_tiktoken() -> Any:
+     try:
+         import tiktoken
+     except ImportError:
+         raise ValueError('Could not import tiktoken python package. '
+                          'This is needed in order to calculate get_token_ids. '
+                          'Please install it with `pip install tiktoken`.')
+     return tiktoken
+
+
+ def _create_retry_decorator(llm: BaseHostChatLLM) -> Callable[[Any], Any]:
+
+     min_seconds = 1
+     max_seconds = 20
+     # Wait 2^x * 1 second between each retry starting with
+     # 4 seconds, then up to 10 seconds, then 10 seconds afterwards
+     return retry(
+         reraise=True,
+         stop=stop_after_attempt(llm.max_retries),
+         wait=wait_exponential(multiplier=1, min=min_seconds, max=max_seconds),
+         retry=(retry_if_exception_type(Exception)),
+         before_sleep=before_sleep_log(logger, logging.WARNING),
+     )
+
+
+ def _convert_dict_to_message(_dict: Mapping[str, Any]) -> BaseMessage:
+     role = _dict['role']
+     if role == 'user':
+         return HumanMessage(content=_dict['content'])
+     elif role == 'assistant':
+         content = _dict['content'] or ''  # OpenAI returns None for tool invocations
+         if _dict.get('function_call'):
+             additional_kwargs = {'function_call': dict(_dict['function_call'])}
+         else:
+             additional_kwargs = {}
+         return AIMessage(content=content, additional_kwargs=additional_kwargs)
+     elif role == 'system':
+         return SystemMessage(content=_dict['content'])
+     elif role == 'function':
+         return FunctionMessage(content=_dict['content'], name=_dict['name'])
+     else:
+         return ChatMessage(content=_dict['content'], role=role)
+
+
+ def _convert_message_to_dict(message: BaseMessage) -> dict:
+     if isinstance(message, ChatMessage):
+         message_dict = {'role': message.role, 'content': message.content}
+     elif isinstance(message, HumanMessage):
+         message_dict = {'role': 'user', 'content': message.content}
+     elif isinstance(message, AIMessage):
+         message_dict = {'role': 'assistant', 'content': message.content}
+         if 'function_call' in message.additional_kwargs:
+             message_dict['function_call'] = message.additional_kwargs['function_call']
+     elif isinstance(message, SystemMessage):
+         message_dict = {'role': 'system', 'content': message.content}
+     elif isinstance(message, FunctionMessage):
+         message_dict = {
+             'role': 'function',
+             'content': message.content,
+             'name': message.name,
+         }
+     else:
+         raise ValueError(f'Got unknown type {message}')
+     if 'name' in message.additional_kwargs:
+         message_dict['name'] = message.additional_kwargs['name']
+     return message_dict
+
+
+ class BaseHostChatLLM(BaseChatModel):
+     """Wrapper around hosted chat large language models."""
+
+     client: Optional[Any]  #: :meta private:
+     model_name: str = Field('', alias='model')
+     """Model name to use."""
+
+     temperature: float = 0.9
+     """What sampling temperature to use."""
+     top_p: float = 0.95
+     do_sample: bool = False
+     max_tokens: int = 4096
+     """Maximum number of tokens to generate."""
+     model_kwargs: Optional[Dict[str, Any]] = Field(default_factory=dict)
+     """Holds any model parameters valid for `create` call not explicitly specified."""
+     host_base_url: Optional[str] = None
+
+     headers: Optional[Dict[str, str]] = Field(default_factory=dict)
+
+     request_timeout: Optional[Union[float, Tuple[float, float]]] = None
+     """Timeout for requests to the hosted completion API. Default is 600 seconds."""
+     max_retries: Optional[int] = 6
+     """Maximum number of retries to make when generating."""
+     streaming: Optional[bool] = False
+     """Whether to stream the results or not."""
+     n: Optional[int] = 1
+     """Number of chat completions to generate for each prompt."""
+     tiktoken_model_name: Optional[str] = None
+     """The model name to pass to tiktoken when using this class.
+     Tiktoken is used to count the number of tokens in documents to constrain
+     them to be under a certain limit. By default, when set to None, this will
+     be the same as the embedding model name. However, there are some cases
+     where you may want to use this Embedding class with a model name not
+     supported by tiktoken. This can include when using Azure embeddings or
+     when using one of the many model providers that expose an OpenAI-like
+     API but with different models. In those cases, in order to avoid erroring
+     when tiktoken is called, you can specify a model name to use here."""
+
+     verbose: Optional[bool] = False
+
+     class Config:
+         """Configuration for this pydantic object."""
+
+         allow_population_by_field_name = True
+
+     @root_validator()
+     def validate_environment(cls, values: Dict) -> Dict:
+         """Validate that the host base url and required packages exist in the environment."""
+         values['host_base_url'] = get_from_dict_or_env(values, 'host_base_url',
+                                                        'HostBaseUrl')
+         try:
+             values['client'] = requests.post
+         except AttributeError:
+             raise ValueError(
+                 'Try upgrading it with `pip install --upgrade requests`.')
+         return values
+
+     @property
+     def _default_params(self) -> Dict[str, Any]:
+         """Get the default parameters for calling the hosted model API."""
+         return {
+             'model': self.model_name,
+             'temperature': self.temperature,
+             'top_p': self.top_p,
+             'max_tokens': self.max_tokens,
+             'do_sample': self.do_sample,
+             **self.model_kwargs,
+         }
+
+     def completion_with_retry(self, **kwargs: Any) -> Any:
+         retry_decorator = _create_retry_decorator(self)
+
+         @retry_decorator
+         def _completion_with_retry(**kwargs: Any) -> Any:
+             messages = kwargs.get('messages')
+             temperature = kwargs.get('temperature')
+             top_p = kwargs.get('top_p')
+             max_tokens = kwargs.get('max_tokens')
+             do_sample = kwargs.get('do_sample')
+             params = {
+                 'messages': messages,
+                 'model': self.model_name,
+                 'top_p': top_p,
+                 'temperature': temperature,
+                 'max_tokens': max_tokens,
+                 'do_sample': do_sample
+             }
+
+             if self.verbose:
+                 print('payload', params)
+
+             url = f'{self.host_base_url}/{self.model_name}/infer'
+             resp = self.client(url=url, json=params).json()
+             if resp['status_code'] != 200:
+                 raise ValueError(
+                     f"API returned an error: {resp['status_message']}")
+             resp['usage'] = {}
+             return resp
+
+         return _completion_with_retry(**kwargs)
+
+     def _combine_llm_outputs(self, llm_outputs: List[Optional[dict]]) -> dict:
+         overall_token_usage: dict = {}
+         for output in llm_outputs:
+             if output is None:
+                 # Happens in streaming
+                 continue
+             token_usage = output['token_usage']
+             if token_usage is None:
+                 continue
+
+             for k, v in token_usage.items():
+                 if k in overall_token_usage:
+                     overall_token_usage[k] += v
+                 else:
+                     overall_token_usage[k] = v
+         return {
+             'token_usage': overall_token_usage,
+             'model_name': self.model_name
+         }
+
+     def _generate(
+         self,
+         messages: List[BaseMessage],
+         stop: Optional[List[str]] = None,
+         run_manager: Optional[CallbackManagerForLLMRun] = None,
+         **kwargs: Any,
+     ) -> ChatResult:
+         message_dicts, params = self._create_message_dicts(messages, stop)
+         params = {**params, **kwargs}
+         response = self.completion_with_retry(messages=message_dicts, **params)
+         return self._create_chat_result(response)
+
+     async def _agenerate(
+         self,
+         messages: List[BaseMessage],
+         stop: Optional[List[str]] = None,
+         run_manager: Optional[AsyncCallbackManagerForLLMRun] = None,
+         **kwargs: Any,
+     ) -> ChatResult:
+         return self._generate(messages, stop, run_manager, **kwargs)
+
+     def _create_message_dicts(
+         self, messages: List[BaseMessage], stop: Optional[List[str]]
+     ) -> Tuple[List[Dict[str, Any]], Dict[str, Any]]:
+         params = dict(self._client_params)
+         if stop is not None:
+             if 'stop' in params:
+                 raise ValueError(
+                     '`stop` found in both the input and default params.')
+             params['stop'] = stop
+
+         message_dicts = [_convert_message_to_dict(m) for m in messages]
+
+         return message_dicts, params
+
+     def _create_chat_result(self, response: Mapping[str, Any]) -> ChatResult:
+         generations = []
+         for res in response['choices']:
+             message = _convert_dict_to_message(res['message'])
+             gen = ChatGeneration(message=message)
+             generations.append(gen)
+
+         llm_output = {
+             'token_usage': response['usage'],
+             'model_name': self.model_name
+         }
+         return ChatResult(generations=generations, llm_output=llm_output)
+
+     @property
+     def _identifying_params(self) -> Mapping[str, Any]:
+         """Get the identifying parameters."""
+         return {**{'model_name': self.model_name}, **self._default_params}
+
+     @property
+     def _client_params(self) -> Mapping[str, Any]:
+         """Get the parameters used for the client."""
+         minimaxai_creds: Dict[str, Any] = {
+             'model': self.model_name,
+         }
+         return {**minimaxai_creds, **self._default_params}
+
+     def _get_invocation_params(self,
+                                stop: Optional[List[str]] = None,
+                                **kwargs: Any) -> Dict[str, Any]:
+         """Get the parameters used to invoke the model FOR THE CALLBACKS."""
+         return {
+             **super()._get_invocation_params(stop=stop, **kwargs),
+             **self._default_params,
+             'model': self.model_name,
+             'function': kwargs.get('functions'),
+         }
+
+     @property
+     def _llm_type(self) -> str:
+         """Return type of chat model."""
+         return 'host_chat_llm'
+
+     def _get_encoding_model(self) -> Tuple[str, tiktoken.Encoding]:
+         tiktoken_ = _import_tiktoken()
+         if self.tiktoken_model_name is not None:
+             model = self.tiktoken_model_name
+         else:
+             model = self.model_name
+         # model chatglm-std, chatglm-lite
+         # Returns the number of tokens used by a list of messages.
+         try:
+             encoding = tiktoken_.encoding_for_model(model)
+         except KeyError:
+             logger.warning(
+                 'Warning: model not found. Using cl100k_base encoding.')
+             model = 'cl100k_base'
+             encoding = tiktoken_.get_encoding(model)
+         return model, encoding
+
+     def get_token_ids(self, text: str) -> List[int]:
+         """Get the tokens present in the text with tiktoken package."""
+         # tiktoken NOT supported for Python 3.7 or below
+         if sys.version_info[1] <= 7:
+             return super().get_token_ids(text)
+         _, encoding_model = self._get_encoding_model()
+         return encoding_model.encode(text)
+
+     def get_num_tokens_from_messages(self, messages: List[BaseMessage]) -> int:
+         """Calculate num tokens for chatglm with tiktoken package.
+
+         todo: read chatglm document
+         Official documentation: https://github.com/openai/openai-cookbook/blob/
+         main/examples/How_to_format_inputs_to_ChatGPT_models.ipynb"""
+         if sys.version_info[1] <= 7:
+             return super().get_num_tokens_from_messages(messages)
+         model, encoding = self._get_encoding_model()
+         if model.startswith('chatglm'):
+             # every message follows <im_start>{role/name}\n{content}<im_end>\n
+             tokens_per_message = 4
+             # if there's a name, the role is omitted
+             tokens_per_name = -1
+         else:
+             raise NotImplementedError(
+                 f'get_num_tokens_from_messages() is not presently implemented '
+                 f'for model {model}.'
+                 'See https://github.com/openai/openai-python/blob/main/chatml.md for '
+                 'information on how messages are converted to tokens.')
+         num_tokens = 0
+         messages_dict = [_convert_message_to_dict(m) for m in messages]
+         for message in messages_dict:
+             num_tokens += tokens_per_message
+             for key, value in message.items():
+                 num_tokens += len(encoding.encode(value))
+                 if key == 'name':
+                     num_tokens += tokens_per_name
+         # every reply is primed with <im_start>assistant
+         num_tokens += 3
+         return num_tokens
+
+
+ class ChatGLM2Host(BaseHostChatLLM):
+     # chatglm2-12b, chatglm2-6b
+     model_name: str = Field('chatglm2-6b', alias='model')
+
+     temperature: float = 0.95
+     top_p: float = 0.7
+     max_tokens: int = 4096
+
+     @property
+     def _llm_type(self) -> str:
+         """Return type of chat model."""
+         return 'chatglm2'
+
+
+ class BaichuanChat(BaseHostChatLLM):
+     # Baichuan-7B-Chat, Baichuan-13B-Chat
+     model_name: str = Field('Baichuan-13B-Chat', alias='model')
+
+     temperature: float = 0.3
+     top_p: float = 0.85
+     max_tokens: int = 8192
+
+     @property
+     def _llm_type(self) -> str:
+         """Return type of chat model."""
+         return 'baichang_chat'
+
+
+ class QwenChat(BaseHostChatLLM):
+     # Qwen-7B-Chat
+     model_name: str = Field('Qwen-7B-Chat', alias='model')
+
+     temperature: float = 0
+     top_p: float = 0.5
+     max_tokens: int = 8192
+
+     @property
+     def _llm_type(self) -> str:
+         """Return type of chat model."""
+         return 'qwen_chat'
+
+
+ class Llama2Chat(BaseHostChatLLM):
+     # Llama-2-7b-chat-hf, Llama-2-13b-chat-hf, Llama-2-70b-chat-hf
+     model_name: str = Field('Llama-2-7b-chat-hf', alias='model')
+
+     temperature: float = 0.9
+     top_p: float = 0.6
+     max_tokens: int = 8192
+
+     @property
+     def _llm_type(self) -> str:
+         """Return type of chat model."""
+         return 'llama2_chat'
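
For orientation, the 409-line hunk above corresponds to bisheng_langchain/chat_models/host_llm.py in the file list. Below is a minimal usage sketch of these hosted wrappers; the server URL is a placeholder, the callable-messages style assumes the LangChain 0.0.x BaseChatModel API imported by this module, and requests are POSTed to {host_base_url}/{model_name}/infer as implemented in completion_with_retry().

from langchain.schema.messages import HumanMessage, SystemMessage

from bisheng_langchain.chat_models.host_llm import ChatGLM2Host

# host_base_url is a placeholder for a real inference endpoint; the wrapper posts the
# payload to f"{host_base_url}/{model_name}/infer".
llm = ChatGLM2Host(
    model='chatglm2-6b',
    host_base_url='http://127.0.0.1:9000/v2/models',
    max_tokens=1024,
    verbose=True,
)

messages = [
    SystemMessage(content='You are a helpful assistant.'),
    HumanMessage(content='Briefly introduce LangChain.'),
]
result = llm(messages)  # returns an AIMessage built by _create_chat_result()
print(result.content)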
bisheng_langchain/chat_models/interface/__init__.py
@@ -0,0 +1,10 @@
+ from .minimax import ChatCompletion as MinimaxChatCompletion
+ from .openai import ChatCompletion as OpenaiChatCompletion
+ from .wenxin import ChatCompletion as WenxinChatCompletion
+ from .xunfei import ChatCompletion as XunfeiChatCompletion
+ from .zhipuai import ChatCompletion as ZhipuaiChatCompletion
+
+ __all__ = [
+     'MinimaxChatCompletion', 'OpenaiChatCompletion', 'WenxinChatCompletion',
+     'XunfeiChatCompletion', 'ZhipuaiChatCompletion'
+ ]
bisheng_langchain/chat_models/interface/minimax.py
@@ -0,0 +1,123 @@
+ import json
+
+ import requests
+
+ from .types import ChatInput, ChatOutput, Choice, Message, Usage
+ from .utils import get_ts
+
+
+ class ChatCompletion(object):
+
+     def __init__(self, group_id, api_key, **kwargs):
+         ep_url = 'https://api.minimax.chat/v1/text/chatcompletion'
+         self.endpoint = f'{ep_url}?GroupId={group_id}'
+         self.headers = {
+             'Authorization': f'Bearer {api_key}',
+             'Content-Type': 'application/json'
+         }
+
+     def parseChunkDelta(self, chunk):
+         decoded_data = chunk.decode('utf-8')
+         parsed_data = json.loads(decoded_data[6:])
+         delta_content = parsed_data['choices'][0]['delta']
+         return delta_content
+
+     def __call__(self, inp: ChatInput, verbose=False):
+         messages = inp.messages
+         model = inp.model
+         top_p = 0.95 if inp.top_p is None else inp.top_p
+         temperature = 0.9 if inp.temperature is None else inp.temperature
+         stream = False if inp.stream is None else inp.stream
+         max_tokens = 1024 if inp.max_tokens is None else inp.max_tokens
+         if abs(temperature) <= 1e-6:
+             temperature = 1e-6
+
+         chat_messages = messages
+         system_prompt = ('MM智能助理是一款由MinMax自研的,没有调用其他产品接口的大型语言'
+                          '模型。MiniMax是一家中国科技公司,一直致力于进行大模型相关的研究。\n----\n')
+
+         if messages[0].role == 'system':
+             system_prompt = messages[0].content
+             chat_messages = messages[1:]
+
+         new_messages = []
+         for m in chat_messages:
+             role = 'USER'
+             if m.role == 'system' or m.role == 'assistant':
+                 role = 'BOT'
+
+             new_messages.append({'sender_type': role, 'text': m.content})
+
+         # if role_meta is given, the prompt must not be empty
+         system_info = {}
+         if system_prompt:
+             system_info = {
+                 'prompt': system_prompt,
+                 'role_meta': {
+                     'user_name': '用户',
+                     'bot_name': 'MM智能助理'
+                 }
+             }
+
+         payload = {
+             'model': model,
+             'stream': stream,
+             'use_standard_sse': True,
+             'messages': new_messages,
+             'temperature': temperature,
+             'top_p': top_p,
+             'tokens_to_generate': max_tokens
+         }
+         payload.update(system_info)
+
+         if verbose:
+             print('payload', payload)
+
+         response = requests.post(self.endpoint,
+                                  headers=self.headers,
+                                  json=payload)
+
+         req_type = 'chat.completion'
+         status_message = 'success'
+         status_code = response.status_code
+         created = get_ts()
+         choices = []
+         usage = None
+         if status_code == 200:
+             try:
+                 info = json.loads(response.text)
+                 if info['base_resp']['status_code'] == 0:
+                     created = info['created']
+                     # reply = info['reply']
+                     choices = []
+                     for s in info['choices']:
+                         index = s['index']
+                         finish_reason = s['finish_reason']
+                         msg = Message(role='assistant', content=s['text'])
+                         cho = Choice(index=index,
+                                      message=msg,
+                                      finish_reason=finish_reason)
+                         choices.append(cho)
+                     total_tokens = info['usage']['total_tokens']
+                     usage = Usage(total_tokens=total_tokens)
+                 else:
+                     status_code = info['base_resp']['status_code']
+                     status_message = info['base_resp']['status_msg']
+
+             except Exception as e:
+                 status_code = 401
+                 status_message = str(e)
+         else:
+             status_code = 400
+             status_message = 'requests error'
+
+         if status_code != 200:
+             raise Exception(status_message)
+
+         return ChatOutput(status_code=status_code,
+                           status_message=status_message,
+                           model=model,
+                           object=req_type,
+                           created=created,
+                           choices=choices,
+                           usage=usage)
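
The hunk above is the low-level MiniMax client (interface/minimax.py). A hedged usage sketch follows: the group id, API key, and model id are placeholders, and the client maps system/user messages onto MiniMax sender_type roles before returning a ChatOutput.

from bisheng_langchain.chat_models.interface import MinimaxChatCompletion
from bisheng_langchain.chat_models.interface.types import ChatInput, Message

# group_id and api_key are placeholders for real MiniMax credentials.
chat = MinimaxChatCompletion(group_id='your-group-id', api_key='your-api-key')

inp = ChatInput(
    model='abab5-chat',  # assumed model id; substitute the MiniMax model you have access to
    messages=[
        Message(role='system', content='You are a concise assistant.'),
        Message(role='user', content='Say hello in one sentence.'),
    ],
    temperature=0.7,
    max_tokens=256,
)

out = chat(inp, verbose=True)  # raises on a non-success status, otherwise returns ChatOutput
print(out.choices[0].message.content)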
bisheng_langchain/chat_models/interface/openai.py
@@ -0,0 +1,68 @@
+ # import json
+
+ import openai
+
+ from .types import ChatInput, ChatOutput, Choice, Usage
+ from .utils import get_ts
+
+
+ class ChatCompletion(object):
+
+     def __init__(self, api_key, proxy=None, **kwargs):
+         openai.api_key = api_key
+         openai.proxy = proxy
+
+     def __call__(self, inp: ChatInput, verbose=False):
+         messages = inp.messages
+         model = inp.model
+         top_p = 0.7 if inp.top_p is None else inp.top_p
+         temperature = 0.97 if inp.temperature is None else inp.temperature
+         # stream = False if inp.stream is None else inp.stream
+         max_tokens = 1024 if inp.max_tokens is None else inp.max_tokens
+         stop = None
+         if inp.stop is not None:
+             stop = inp.stop.split('||')
+
+         new_messages = [m.dict() for m in messages]
+         created = get_ts()
+         payload = {
+             'model': model,
+             'messages': new_messages,
+             'temperature': temperature,
+             'top_p': top_p,
+             'stop': stop,
+             'max_tokens': max_tokens,
+         }
+         if inp.functions:
+             payload.update({'functions': inp.functions})
+
+         if verbose:
+             print('payload', payload)
+
+         req_type = 'chat.completion'
+         status_message = 'success'
+         choices = []
+         usage = None
+         try:
+             resp = openai.ChatCompletion.create(**payload)
+             status_code = 200
+             choices = []
+             for choice in resp['choices']:
+                 cho = Choice(**choice)
+                 choices.append(cho)
+             usage = Usage(**resp['usage'])
+
+         except Exception as e:
+             status_code = 400
+             status_message = str(e)
+
+         if status_code != 200:
+             raise Exception(status_message)
+
+         return ChatOutput(status_code=status_code,
+                           status_message=status_message,
+                           model=model,
+                           object=req_type,
+                           created=created,
+                           choices=choices,
+                           usage=usage)
bisheng_langchain/chat_models/interface/types.py
@@ -0,0 +1,61 @@
+ # from typing import Union
+
+ from pydantic import BaseModel
+
+
+ class Message(BaseModel):
+     role: str
+     content: str
+
+
+ class Function(BaseModel):
+     name: str
+     description: str
+     parameters: dict
+
+
+ class ChatInput(BaseModel):
+     model: str
+     messages: list[Message] = []
+     top_p: float = None
+     temperature: float = None
+     n: int = 1
+     stream: bool = False
+     stop: str = None
+     max_tokens: int = 256
+     functions: list[Function] = []
+     function_call: str = None
+
+
+ class Choice(BaseModel):
+     index: int
+     message: Message = None
+     finish_reason: str = 'stop'
+
+
+ class Usage(BaseModel):
+     prompt_tokens: int = 0
+     completion_tokens: int = 0
+     total_tokens: int
+
+
+ class ChatOutput(BaseModel):
+     status_code: int
+     status_message: str = 'success'
+     id: str = None
+     object: str = None
+     model: str = None
+     created: int = None
+     choices: list[Choice] = []
+     usage: Usage = None
+
+
+ class CompletionsInput(BaseModel):
+     model: str
+     prompt: str
+     top_p: float = None
+     temperature: float = None
+     n: int = 1
+     stream: bool = True
+     stop: str = None
+     max_tokens: int = 256
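
A small, self-contained illustration of the request/response schema above (pure pydantic, no network call; the field values are invented). Note that stop is a single string which interface/openai.py splits on '||'.

from bisheng_langchain.chat_models.interface.types import (ChatInput, ChatOutput, Choice,
                                                            Message, Usage)

# Plain dicts are coerced into the nested pydantic models.
inp = ChatInput(
    model='gpt-3.5-turbo',
    messages=[{'role': 'user', 'content': 'hi'}],
    stop='Observation:||Final Answer:',  # '||'-separated stop strings
)
assert isinstance(inp.messages[0], Message)

out = ChatOutput(
    status_code=200,
    model=inp.model,
    choices=[Choice(index=0, message=Message(role='assistant', content='hello'))],
    usage=Usage(total_tokens=12),
)
print(out.json())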
bisheng_langchain/chat_models/interface/utils.py
@@ -0,0 +1,5 @@
+ import time
+
+
+ def get_ts():
+     return round(time.time() * 1000)