2024-01-27 00:06:38 +08:00
|
|
|
from __future__ import annotations
|
|
|
|
|
|
|
|
|
|
import abc
|
|
|
|
|
import typing
|
|
|
|
|
|
|
|
|
|
from ...core import app
|
|
|
|
|
from ...core import entities as core_entities
|
|
|
|
|
from .. import entities as llm_entities
|
2024-05-14 22:20:31 +08:00
|
|
|
from ..tools import entities as tools_entities
|
2025-03-29 17:50:45 +08:00
|
|
|
from ...entity.persistence import model as persistence_model
|
|
|
|
|
from . import token
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
class RuntimeLLMModel:
|
|
|
|
|
"""运行时模型"""
|
|
|
|
|
|
|
|
|
|
model_entity: persistence_model.LLMModel
|
|
|
|
|
"""模型数据"""
|
|
|
|
|
|
|
|
|
|
token_mgr: token.TokenManager
|
|
|
|
|
"""api key管理器"""
|
|
|
|
|
|
|
|
|
|
requester: LLMAPIRequester
|
|
|
|
|
"""请求器实例"""
|
2025-04-29 17:24:07 +08:00
|
|
|
|
|
|
|
|
def __init__(
|
|
|
|
|
self,
|
|
|
|
|
model_entity: persistence_model.LLMModel,
|
|
|
|
|
token_mgr: token.TokenManager,
|
|
|
|
|
requester: LLMAPIRequester,
|
|
|
|
|
):
|
2025-03-29 17:50:45 +08:00
|
|
|
self.model_entity = model_entity
|
|
|
|
|
self.token_mgr = token_mgr
|
|
|
|
|
self.requester = requester
|
2024-01-27 00:06:38 +08:00
|
|
|
|
2024-03-12 16:04:11 +08:00
|
|
|
|
2024-01-27 00:06:38 +08:00
|
|
|
class LLMAPIRequester(metaclass=abc.ABCMeta):
|
2025-04-29 17:24:07 +08:00
|
|
|
"""LLM API请求器"""
|
|
|
|
|
|
2024-03-12 16:04:11 +08:00
|
|
|
name: str = None
|
2024-01-27 00:06:38 +08:00
|
|
|
|
|
|
|
|
ap: app.Application
|
|
|
|
|
|
2025-03-17 22:03:09 +08:00
|
|
|
default_config: dict[str, typing.Any] = {}
|
|
|
|
|
|
|
|
|
|
requester_cfg: dict[str, typing.Any] = {}
|
|
|
|
|
|
|
|
|
|
def __init__(self, ap: app.Application, config: dict[str, typing.Any]):
|
2024-01-27 00:06:38 +08:00
|
|
|
self.ap = ap
|
2025-04-29 17:24:07 +08:00
|
|
|
self.requester_cfg = {**self.default_config}
|
2025-03-17 22:03:09 +08:00
|
|
|
self.requester_cfg.update(config)
|
2024-01-27 00:06:38 +08:00
|
|
|
|
|
|
|
|
async def initialize(self):
|
|
|
|
|
pass
|
|
|
|
|
|
2024-05-14 22:20:31 +08:00
|
|
|
@abc.abstractmethod
|
2025-03-29 17:50:45 +08:00
|
|
|
async def invoke_llm(
|
2024-05-14 22:20:31 +08:00
|
|
|
self,
|
2024-12-24 10:57:17 +08:00
|
|
|
query: core_entities.Query,
|
2025-03-29 17:50:45 +08:00
|
|
|
model: RuntimeLLMModel,
|
2024-05-14 22:20:31 +08:00
|
|
|
messages: typing.List[llm_entities.Message],
|
|
|
|
|
funcs: typing.List[tools_entities.LLMFunction] = None,
|
2025-03-17 22:03:09 +08:00
|
|
|
extra_args: dict[str, typing.Any] = {},
|
2024-05-14 22:20:31 +08:00
|
|
|
) -> llm_entities.Message:
|
|
|
|
|
"""调用API
|
2024-03-22 16:41:46 +08:00
|
|
|
|
|
|
|
|
Args:
|
2025-03-29 17:50:45 +08:00
|
|
|
model (RuntimeLLMModel): 使用的模型信息
|
2024-05-14 22:20:31 +08:00
|
|
|
messages (typing.List[llm_entities.Message]): 消息对象列表
|
|
|
|
|
funcs (typing.List[tools_entities.LLMFunction], optional): 使用的工具函数列表. Defaults to None.
|
2025-03-17 22:03:09 +08:00
|
|
|
extra_args (dict[str, typing.Any], optional): 额外的参数. Defaults to {}.
|
2024-03-22 16:41:46 +08:00
|
|
|
|
2024-05-14 22:20:31 +08:00
|
|
|
Returns:
|
|
|
|
|
llm_entities.Message: 返回消息对象
|
2024-01-27 00:06:38 +08:00
|
|
|
"""
|
2024-05-14 22:20:31 +08:00
|
|
|
pass
|