mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-01-06 06:29:21 -05:00
24 lines
1.6 KiB
Python
24 lines
1.6 KiB
Python
from __future__ import annotations
|
|
import itertools, os, typing as t, pytest, openllm
|
|
if t.TYPE_CHECKING: from openllm._configuration import LiteralRuntime
|
|
|
|
# Model name -> model id. Only models listed here are exercised by
# ``parametrise_local_llm``; the value is what it passes as ``model_id``.
_FRAMEWORK_MAPPING = {
    "flan_t5": "google/flan-t5-small",
    "opt": "facebook/opt-125m",
    "baichuan": "baichuan-inc/Baichuan-7B",
}
|
|
# Prompt name -> prompt text. ``parametrise_local_llm`` iterates over the
# keys of this mapping when it builds its (prompt, llm) pairs.
_PROMPT_MAPPING = {
    "qa": (
        "Answer the following yes/no question by reasoning step-by-step. "
        "Can you write a whole Haiku in a single tweet?"
    ),
}
|
|
def parametrise_local_llm(model: str,) -> t.Generator[tuple[str, openllm.LLMRunner[t.Any, t.Any] | openllm.LLM[t.Any, t.Any]], None, None]:
    """Yield a ``(prompt, llm)`` pair for each runtime implementation of *model*.

    Because this is a generator, nothing below runs until the first item is
    requested -- including the skip for unsupported models.

    Args:
        model: Model name; must be a key of ``_FRAMEWORK_MAPPING``.

    Yields:
        Tuples of a ``_PROMPT_MAPPING`` key and a runner created with
        ``openllm.Runner(..., init_local=True)`` for one implementation.

    Raises:
        Whatever ``pytest.skip`` raises when *model* is not listed in
        ``_FRAMEWORK_MAPPING``.
    """
    if model not in _FRAMEWORK_MAPPING:
        pytest.skip(f"'{model}' is not yet supported in framework testing.")

    # Registries are probed in a fixed order, so the resulting tuple is always
    # a subsequence of ("pt", "flax", "tf").
    registries = (
        ("pt", openllm.MODEL_MAPPING_NAMES),
        ("flax", openllm.MODEL_FLAX_MAPPING_NAMES),
        ("tf", openllm.MODEL_TF_MAPPING_NAMES),
    )
    runtime_impl: tuple[LiteralRuntime, ...] = tuple(
        implementation for implementation, registry in registries if model in registry
    )

    model_id = _FRAMEWORK_MAPPING[model]
    # NOTE(review): the yielded "prompt" is the mapping *key* (e.g. "qa"), not
    # the prompt text stored under it -- confirm this is what the tests expect.
    for framework, prompt in itertools.product(runtime_impl, _PROMPT_MAPPING):
        runner = openllm.Runner(
            model,
            model_id=model_id,
            ensure_available=True,
            implementation=framework,
            init_local=True,
        )
        yield prompt, runner
|
|
|
|
def pytest_generate_tests(metafunc: pytest.Metafunc) -> None:
    """Parametrise tests that request both the ``prompt`` and ``llm`` fixtures.

    Nothing is parametrised when the ``GITHUB_ACTIONS`` environment variable
    is set, or when the test does not ask for both fixtures.

    Args:
        metafunc: The pytest object describing the test function being
            collected.
    """
    if os.getenv("GITHUB_ACTIONS") is not None:
        return

    requested = metafunc.fixturenames
    if "prompt" not in requested or "llm" not in requested:
        return

    # The model name is the test function name minus its first 5 and last 15
    # characters -- presumably a "test_" prefix and an "_implementation"
    # suffix; verify against the test modules.
    model = metafunc.function.__name__[5:-15]
    metafunc.parametrize("prompt,llm", list(parametrise_local_llm(model)))
|
|
def pytest_sessionfinish(session: pytest.Session, exitstatus: int):
    """Turn a "no tests collected" session into a successful one.

    pytest exits with code 5 when no tests are collected, which would make
    the CI run fail; in that case the session's exit status is reset to 0.
    Every other exit status is left untouched.

    Args:
        session: The session whose ``exitstatus`` attribute may be overwritten.
        exitstatus: The status the session is finishing with.
    """
    no_tests_collected = 5
    if exitstatus != no_tests_collected:
        return
    session.exitstatus = 0
|