Files
OpenLLM/openllm-python/src/_service_vars.pyi
Aaron Pham 072b3e97ec feat: 1.2 APIs (#821)
Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com>
Signed-off-by: Aaron Pham <29749331+aarnphm@users.noreply.github.com>
Co-authored-by: pre-commit-ci[bot] <66853113+pre-commit-ci[bot]@users.noreply.github.com>
2024-03-15 03:49:19 -04:00

16 lines
518 B
Python

from typing import Dict, Optional, Any
from openllm_core._typing_compat import LiteralSerialisation, LiteralQuantise, LiteralString
from _openllm_tiny._llm import Dtype
# Type declarations for the module-level service variables. `...` is the stub
# placeholder; the concrete values are expected to come from the runtime
# module this stub describes.
model_id: str = ...
model_name: LiteralString = ...
# Tag and version are declared Optional, so consumers must handle None.
model_tag: Optional[str] = ...
model_version: Optional[str] = ...
quantise: LiteralQuantise = ...
serialisation: LiteralSerialisation = ...
dtype: Dtype = ...
trust_remote_code: bool = ...
max_model_len: Optional[int] = ...
# Declared float rather than int so fractional values type-check.
# NOTE(review): presumably a fraction of GPU memory in (0, 1], following the
# vLLM engine argument of the same name -- confirm against the runtime module.
gpu_memory_utilization: float = ...
services_config: Dict[str, Any] = ...