mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-02-07 22:33:28 -05:00
Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com> Signed-off-by: Aaron Pham <29749331+aarnphm@users.noreply.github.com> Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
26 lines
582 B
Python
26 lines
582 B
Python
import bentoml
|
|
from bentoml._internal.models.model import ModelInfo
|
|
from openllm_core._typing_compat import TypedDict, NotRequired
|
|
from ._llm import LLM as LLM
|
|
|
|
class _Metadata(TypedDict):
|
|
model_id: str
|
|
dtype: str
|
|
_revision: str
|
|
_local: bool
|
|
serialisation: str
|
|
architectures: str
|
|
trust_remote_code: bool
|
|
api_version: str
|
|
llm_type: str
|
|
openllm_version: str
|
|
openllm_core_version: str
|
|
openllm_client_version: str
|
|
quantize: NotRequired[str]
|
|
|
|
class _Info(ModelInfo):
    """``ModelInfo`` subclass whose ``metadata`` is annotated as ``_Metadata``."""

    # The ignore silences the type checker's "assignment" error for this
    # re-annotation; presumably the base class declares ``metadata`` with a
    # different type -- confirm against ``ModelInfo``.
    metadata: _Metadata  # type: ignore[assignment]
|
|
|
|
class _Model(bentoml.Model):
    """``bentoml.Model`` subclass whose ``info`` is annotated as ``_Info``."""

    # Annotation only: no value is assigned to ``info`` here.
    info: _Info
|