mirror of
https://github.com/OpenSPG/openspg.git
synced 2025-07-31 12:56:19 +00:00
model interfaces
(cherry picked from commit 4c556c39f6fdefd8755d9afcec247086f5d47380)
This commit is contained in:
parent
425285ad79
commit
de35b970b7
@ -1,54 +0,0 @@
|
|||||||
from abc import ABC, abstractmethod
|
|
||||||
|
|
||||||
|
|
||||||
class ModelExecutor(ABC):
    """Base class for model executors.

    Corresponds to the xflow ``AntLLM`` component (translated from the
    original Chinese docstring).
    """

    @classmethod
    def from_config(cls, args='sys', **kwargs):
        # Alternate-constructor stub: concrete executors are expected to
        # build an instance from configuration here.
        pass

    def __init__(self, backend_model, backend_tokenizer, init_args, **kwargs):
        # Retain the backend handles and the raw construction arguments
        # so subclasses can inspect them later.
        self.backend_model = backend_model
        self.backend_tokenizer = backend_tokenizer
        self.init_args = init_args
        self.kwargs = kwargs
class LLMExecutor(ModelExecutor):
    """Abstract executor interface for large language models.

    Subclasses implement training (SFT / RL tuning) and inference entry
    points.
    """

    @abstractmethod
    def sft_train(self, args=None, callbacks=None, **kwargs):
        # Supervised fine-tuning entry point.
        raise NotImplementedError("")

    @abstractmethod
    def rl_tuning(self, args=None, callbacks=None, **kwargs):
        # Reinforcement-learning tuning entry point.
        raise NotImplementedError("")

    @abstractmethod
    def batch_inference(self, args, **kwargs):
        # Batch inference entry point; subclasses must override.
        pass

    @abstractmethod
    def inference(self, input, inference_args, **kwargs):
        # Single-request inference entry point.
        raise NotImplementedError()
class HfLLMExecutor(ModelExecutor):
    # Placeholder for a HuggingFace-backed executor; not implemented yet.
    pass
class DeepKEExecutor(ModelExecutor):
    # Placeholder for a DeepKE-backed executor; not implemented yet.
    pass
@ -1,50 +0,0 @@
|
|||||||
# coding: utf-8
|
|
||||||
# Copyright (c) Antfin, Inc. All rights reserved.
|
|
||||||
import sys
|
|
||||||
from abc import ABC
|
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
class ModelInvoker(ABC):
    """Invoking entry for models.

    Corresponds to the xflow ``ModelHubEntry`` component (translated
    from the original Chinese docstring).
    """

    def submit_sft(self, submit_mode='k8s'):
        # Submit a supervised-fine-tuning job to a remote engine; stub.
        pass

    def submit_rl_tuning(self, submit_mode='k8s'):
        # Submit an RL-tuning job to a remote engine; stub.
        pass

    # NOTE(review): the first parameter is named ``cls`` but there is no
    # @classmethod decorator, so it actually receives the instance —
    # confirm whether this was meant to be a classmethod.
    def deploy(cls, args, deploy_mode='k8s'):
        pass

    def inference(self, input, **kwargs):
        """Fetch inference results from an already deployed service.

        (Translated from the original Chinese docstring.)

        Args:
            input: payload forwarded to the service.
            **kwargs: extra service options.

        Returns:
            None; concrete invokers return the service response.
        """
        pass

    @classmethod
    def from_config(cls, args='sys'):
        # Alternate constructor: currently just builds a bare instance.
        return cls()
class OpenAI(ModelInvoker):
    """Invoker that calls the OpenAI HTTP API directly over ``requests``."""

    def __init__(self, token):
        # API token used to authenticate each request.
        self.token = token

    def inference(self, input, **kwargs):
        """POST the input to the OpenAI endpoint and return the response.

        Fix: the original discarded the ``requests.post`` response, so
        callers could never observe the API result; it is now returned.
        Returning a value is backward compatible with callers that
        ignored the previous ``None``.

        SECURITY NOTE(review): the token travels as a URL query
        parameter, where it can leak into server/proxy logs — consider
        an ``Authorization`` header instead.
        """
        import requests
        return requests.post(url="https://api.openai.com", params={"input": input, "token": self.token})
1
python/nn4k/executor/__init__.py
Normal file
1
python/nn4k/executor/__init__.py
Normal file
@ -0,0 +1 @@
|
|||||||
|
from .base import NNExecutor, LLMExecutor
|
70
python/nn4k/executor/base.py
Normal file
70
python/nn4k/executor/base.py
Normal file
@ -0,0 +1,70 @@
|
|||||||
|
from abc import ABC, abstractmethod
|
||||||
|
|
||||||
|
|
||||||
|
class NNExecutor(ABC):
    """
    Entry point of model execution in a certain pod.
    """

    @classmethod
    def from_config(cls, nn_config, **kwargs):
        # Alternate-constructor stub: build an executor from the given
        # configuration; concrete subclasses override this.
        pass

    def __init__(self, backend_model, backend_tokenizer, init_args, **kwargs):
        # Keep references to the backend objects plus the raw
        # construction arguments for later inspection by subclasses.
        self.backend_model = backend_model
        self.backend_tokenizer = backend_tokenizer
        self.init_args = init_args
        self.kwargs = kwargs
class LLMExecutor(NNExecutor):
    """Executor interface for large language models running in a pod."""

    @classmethod
    def from_config(cls, nn_config: dict, **kwargs):
        """Build an executor from configuration.

        Args:
            nn_config: configuration dict describing the model to build.
        """
        # TODO
        pass

    @abstractmethod
    def sft(self, args=None, callbacks=None, **kwargs):
        """
        The entry point of SFT execution in a certain pod.
        """
        raise NotImplementedError(f"{self.__class__.__name__} does not support SFT.")

    @abstractmethod
    def rl_tuning(self, args=None, callbacks=None, **kwargs):
        """
        The entry point of RL-Tuning execution in a certain pod.
        """
        # Fix: the original docstring said "SFT" here — a copy/paste
        # error from sft() above; the raised message already said
        # RL-Tuning.
        raise NotImplementedError(f"{self.__class__.__name__} does not support RL-Tuning.")

    # NOTE(review): unlike the other entry points this one is not
    # @abstractmethod — presumably batch inference is optional for
    # subclasses; confirm intent.
    def batch_inference(self, args, **kwargs):
        pass

    @abstractmethod
    def inference(self, data, **kwargs):
        """
        The entry point of inference. Usually for local invokers or model services.
        """
        raise NotImplementedError()
class HfLLMExecutor(NNExecutor):
    # Placeholder for a HuggingFace-backed executor; not implemented yet.
    pass
class DeepKeExecutor(NNExecutor):
    # Placeholder for a DeepKE-backed executor; not implemented yet.
    pass
1
python/nn4k/invoker/__init__.py
Normal file
1
python/nn4k/invoker/__init__.py
Normal file
@ -0,0 +1 @@
|
|||||||
|
from .base import NNInvoker, LLMInvoker
|
83
python/nn4k/invoker/base.py
Normal file
83
python/nn4k/invoker/base.py
Normal file
@ -0,0 +1,83 @@
|
|||||||
|
# coding: utf-8
|
||||||
|
# Copyright (c) Antfin, Inc. All rights reserved.
|
||||||
|
import json
|
||||||
|
import os
|
||||||
|
from abc import ABC
|
||||||
|
from typing import Union
|
||||||
|
|
||||||
|
from nn4k.executor import LLMExecutor
|
||||||
|
from nn4k.executor import NNExecutor
|
||||||
|
from nn4k.nnhub import SimpleNNHub
|
||||||
|
|
||||||
|
|
||||||
|
class NNInvoker(ABC):
    """
    Invoking Entry Interfaces for NN Models.
    One NNInvoker object is for one NN Model.
    - Interfaces starting with "submit_" means submitting a batch task to a remote execution engine.
    - Interfaces starting with "remote_" means querying a remote service for some results.
    - Interfaces starting with "local_" means running something locally.
    """

    # Shared in-memory model hub.  NOTE(review): instantiated at import
    # time as a class attribute, so every invoker shares one hub.
    hub = SimpleNNHub()

    def __init__(self, nn_executor: NNExecutor) -> None:
        # Direct construction is a debug-only path; production code is
        # expected to go through from_config() instead.
        if os.getenv("NN4K_DEBUG") is None:
            raise EnvironmentError("In prod env, only NNInvoker.from_config is allowed for creating an nn_invoker.")
        super().__init__()
        self._nn_executor: NNExecutor = nn_executor
class LLMInvoker(NNInvoker):
    """Invoker for large language models."""

    def __init__(self, nn_executor: LLMExecutor) -> None:
        super().__init__(nn_executor)

    def submit_inference(self, submit_mode='k8s'):
        # Submit a batch inference job to a remote engine; stub.
        pass

    def submit_sft(self, submit_mode='k8s'):
        # Submit a supervised-fine-tuning job; stub.
        pass

    def submit_rl_tuning(self, submit_mode='k8s'):
        # Submit an RL-tuning job; stub.
        pass

    # def deploy(cls, args, deploy_mode='k8s'):
    #     pass

    def remote_inference(self, input, **kwargs):
        """Fetch inference results from an already deployed service.

        (Translated from the original Chinese docstring.)

        Args:
            input: payload forwarded to the remote service.
            **kwargs: extra service options.

        Returns:
            None; concrete implementations return the service response.
        """
        pass

    def local_inference(self, data, **kwargs):
        # Fix: the original discarded the executor's result, making the
        # inference output unobservable; return it to the caller.
        return self._nn_executor.inference(data, **kwargs)

    def init_local_model(self):
        # Resolve this model's executor from the shared hub.
        # NOTE(review): assumes self._nn_config was set by from_config —
        # confirm callers always construct via from_config.
        name = self._nn_config.get("nn_name")
        version = self._nn_config.get("nn_version")
        self._nn_executor: LLMExecutor = self.hub.get_model_executor(name, version)

    @classmethod
    def from_config(cls, nn_config: Union[str, dict]):
        """Build an invoker from a config dict or a path to a JSON file.

        Raises:
            ValueError: when the config file cannot be read/decoded, or
                the ``invoker_type`` is not recognised.
        """
        if isinstance(nn_config, str):
            # Fix: the original used a bare ``except:`` which swallowed
            # everything (including KeyboardInterrupt) and hid the
            # cause; catch only what file loading can raise and chain it.
            try:
                with open(nn_config, "r") as f:
                    nn_config = json.load(f)
            except (OSError, json.JSONDecodeError) as e:
                raise ValueError("cannot decode config file") from e

        invoker_type = nn_config.get("invoker_type", "LLM")
        if invoker_type == "LLM":
            # Bypass __init__ (which is debug-only) and attach the config.
            o = cls.__new__(cls)
            o._nn_config = nn_config
            return o
        elif invoker_type == "OpenAI":
            from nn4k.invoker.openai_invoker import OpenAIInvoker
            return OpenAIInvoker.from_config(nn_config)
        # Fix: the original silently fell through and returned None for
        # unrecognised types, deferring the failure to the first use.
        raise ValueError(f"unknown invoker_type: {invoker_type!r}")
21
python/nn4k/invoker/openai_invoker.py
Normal file
21
python/nn4k/invoker/openai_invoker.py
Normal file
@ -0,0 +1,21 @@
|
|||||||
|
from typing import Union
|
||||||
|
|
||||||
|
from nn4k.invoker import NNInvoker
|
||||||
|
|
||||||
|
|
||||||
|
class OpenAIInvoker(NNInvoker):
    """Invoker that talks to the OpenAI API via the ``openai`` SDK."""

    @classmethod
    def from_config(cls, nn_config: Union[str, dict]):
        """Build an invoker from a config dict or a path to a JSON file.

        Fix: the signature accepts ``str`` but the original body only
        handled dicts (``.get`` on a str raises AttributeError); a JSON
        file path is now loaded first, matching LLMInvoker.from_config.
        """
        import openai

        if isinstance(nn_config, str):
            import json
            with open(nn_config, "r") as f:
                nn_config = json.load(f)

        # Bypass __init__ (debug-only in NNInvoker), as sibling
        # invokers do.
        o = cls.__new__(cls)
        o._openai_client = openai.OpenAI()
        o._open_ai_model = nn_config.get("open_ai_model")
        # TODO config key
        # TODO complete
        return o

    def remote_inference(self, input, **kwargs):
        # TODO
        pass
83
python/nn4k/nnhub/__init__.py
Normal file
83
python/nn4k/nnhub/__init__.py
Normal file
@ -0,0 +1,83 @@
|
|||||||
|
from abc import ABC, abstractmethod
|
||||||
|
from typing import Optional, Union, Tuple, Type
|
||||||
|
|
||||||
|
from nn4k.executor import NNExecutor
|
||||||
|
|
||||||
|
|
||||||
|
class NNHub(ABC):
    """Abstract registry of model executors, with optional model services."""

    @abstractmethod
    def publish(self,
                model_executor: Union[NNExecutor, Tuple[Type[NNExecutor], tuple, dict, tuple]],
                name: str,
                version: str = None) -> str:
        """
        Publish a model(executor) to hub.
        Args:
            model_executor: An NNExecutor object, which is pickleable.
                Or a tuple of (class, args, kwargs, weight_ids) for creating an NNExecutor,
                while all these 4 arguments are pickleable.
            name: The name of a model, like `llama2`.
                We do not have a `namespace`. Use a joined name like `alibaba/qwen` to support such features.
            version: Optional. Auto generate a version if this param is not given.
        Returns:
            The published model version.
        """
        pass

    @abstractmethod
    def get_model_executor(self, name: str, version: str = None) -> Optional[NNExecutor]:
        """
        Get a ModelExecutor instance from Hub.
        Args:
            name: The name of a model.
            version: The version of a model. Get default version of a model if this param is not given.
        Returns:
            The ModelExecutor Instance. None for NotFound.
        """
        pass

    # The service-related hooks are optional; hubs that cannot host
    # model services keep these default NotImplementedError stubs.

    def start_service(self, name: str, version: str, service_id: str = None, **kwargs):
        raise NotImplementedError("This Hub does not support starting model service.")

    def stop_service(self, name: str, version: str, service_id: str = None, **kwargs):
        raise NotImplementedError("This Hub does not support stopping model service.")

    def get_service(self, name: str, version: str, service_id: str = None):
        raise NotImplementedError("This Hub does not support model services.")
class SimpleNNHub(NNHub):
    """In-memory NNHub: keeps executors in a dict, with no persistence."""

    def __init__(self) -> None:
        super().__init__()
        # name -> {version -> executor-or-factory-tuple}
        self._model_executors = {}
        # init executor info.
        # TODO: preload built-in executors here.
        # Fix: the original called self._add_executor(()) without the
        # required ``name`` argument, raising TypeError on every
        # construction; the broken placeholder call has been removed.

    def _add_executor(self,
                      executor: Union[NNExecutor, Tuple[Type[NNExecutor], tuple, dict, tuple]],
                      name: str,
                      version: str = None):
        """Store an executor under name/version ('default' when omitted)."""
        if version is None:
            version = 'default'
        versions = self._model_executors.setdefault(name, {})
        versions[version] = executor

    def publish(self, model_executor: NNExecutor, name: str, version: str = None) -> str:
        """Register an executor and return the version it was stored under."""
        print("WARNING: You are using SimpleNNHub which can only maintain models in memory without data persistence!")
        if version is None:
            version = 'default'
        self._add_executor(model_executor, name, version)
        return version

    def get_model_executor(self, name: str, version: str = None) -> Optional[NNExecutor]:
        """Return the stored executor, or None when not found."""
        versions = self._model_executors.get(name)
        if versions is None:
            return None
        # Fix: models published without an explicit version are stored
        # under 'default', but the original looked up the literal key
        # ``None`` and always missed them; fall back to 'default'.
        if version is None:
            version = 'default'
        return versions.get(version)
Loading…
x
Reference in New Issue
Block a user