mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-01-03 04:59:01 -05:00
23 lines
1.6 KiB
Python
23 lines
1.6 KiB
Python
from __future__ import annotations
|
|
import itertools, os, typing as t, pytest, openllm
|
|
if t.TYPE_CHECKING: from openllm_core._typing_compat import LiteralRuntime
|
|
|
|
# Model name -> model id handed to ``openllm.Runner`` as ``model_id``.
# Models missing from this table are skipped by ``parametrise_local_llm``.
_FRAMEWORK_MAPPING = {
    'flan_t5': 'google/flan-t5-small',
    'opt': 'facebook/opt-125m',
    'baichuan': 'baichuan-inc/Baichuan-7B',
}
|
|
# Prompt label -> prompt text.
# NOTE: ``parametrise_local_llm`` iterates the *keys* of this mapping.
_PROMPT_MAPPING = {
    'qa': 'Answer the following yes/no question by reasoning step-by-step. Can you write a whole Haiku in a single tweet?',
}
|
|
def parametrise_local_llm(
    model: str,
) -> t.Generator[tuple[str, openllm.LLMRunner[t.Any, t.Any] | openllm.LLM[t.Any, t.Any]], None, None]:
    """Yield ``(prompt, llm)`` pairs for every backend registered for *model*.

    The function is a generator, so nothing below runs until it is iterated.

    Args:
        model: Model name; must be a key of ``_FRAMEWORK_MAPPING``.

    Yields:
        A 2-tuple of a key from ``_PROMPT_MAPPING`` (the label such as
        ``'qa'``, not the prompt text) and the object returned by
        ``openllm.Runner`` for one backend.

    Note:
        ``pytest.skip`` is invoked when *model* has no entry in
        ``_FRAMEWORK_MAPPING``.
    """
    if model not in _FRAMEWORK_MAPPING:
        pytest.skip(f"'{model}' is not yet supported in framework testing.")

    # Backend tag paired with the openllm registry that lists the models
    # available for it; the order (pt, flax, tf) fixes the yield order.
    registries = (
        ('pt', openllm.MODEL_MAPPING_NAMES),
        ('flax', openllm.MODEL_FLAX_MAPPING_NAMES),
        ('tf', openllm.MODEL_TF_MAPPING_NAMES),
    )
    backends: tuple[LiteralRuntime, ...] = tuple(tag for tag, known in registries if model in known)

    # Iterating the dict directly walks its keys, in insertion order.
    for backend, prompt_key in itertools.product(backends, _PROMPT_MAPPING):
        runner = openllm.Runner(
            model,
            model_id=_FRAMEWORK_MAPPING[model],
            ensure_available=True,
            implementation=backend,
            init_local=True,
        )
        yield prompt_key, runner
|
|
def pytest_generate_tests(metafunc: pytest.Metafunc) -> None:
    """Parametrise tests that request both the ``prompt`` and ``llm`` fixtures.

    Nothing is parametrised when the ``GITHUB_ACTIONS`` environment variable
    is set, or when the test does not request both fixture names.

    Args:
        metafunc: The pytest object describing the test function being
            collected.
    """
    if os.getenv('GITHUB_ACTIONS') is not None:
        return

    wanted = metafunc.fixturenames
    if 'prompt' not in wanted or 'llm' not in wanted:
        return

    # Drop the first 5 and the last 15 characters of the test function name.
    # NOTE(review): presumably this strips a 'test_' prefix and an
    # '_implementation' suffix to recover the model name -- confirm against
    # the test naming convention.
    model_name = metafunc.function.__name__[5:-15]
    metafunc.parametrize('prompt,llm', list(parametrise_local_llm(model_name)))
|
|
def pytest_sessionfinish(session: pytest.Session, exitstatus: int):
    """Turn a "no tests collected" outcome into a successful session.

    Args:
        session: The pytest session whose ``exitstatus`` may be overwritten.
        exitstatus: The status the session is about to exit with.
    """
    # pytest exits with code 5 when no tests are collected, which would
    # otherwise make the CI run fail.
    no_tests_collected = 5
    if exitstatus != no_tests_collected:
        return
    session.exitstatus = 0
|