types: update stubs for remaining entrypoints (#667)

* perf(type): static OpenAI types definition Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com> * feat: add hf types Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com> * types: update remaining missing stubs Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com> --------- Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com>
2026-06-11 18:09:52 -04:00 · 2023-11-16 04:26:13 -05:00
parent 6102a67a83
commit 9e3f0fea15
13 changed files with 231 additions and 260 deletions
--- a/openllm-python/src/openllm_cli/_factory.py
+++ b/openllm-python/src/openllm_cli/_factory.py
@@ -8,7 +8,7 @@ import click
 import click_option_group as cog
 import inflection
 from bentoml_cli.utils import BentoMLCommandGroup
-from click import ClickException, shell_completion as sc
+from click import shell_completion as sc

 import bentoml
 import openllm
@@ -22,7 +22,7 @@ from openllm_core._typing_compat import (
  ParamSpec,
  get_literal_args,
 )
-from openllm_core.utils import DEBUG
+from openllm_core.utils import DEBUG, resolve_user_filepath


 class _OpenLLM_GenericInternalConfig(LLMConfig):
@@ -125,12 +125,11 @@ def _id_callback(ctx: click.Context, _: click.Parameter, value: t.Tuple[str, ...
    # try to resolve the full path if users pass in relative,
    # currently only support one level of resolve path with current directory
    try:
-      adapter_id = openllm.utils.resolve_user_filepath(adapter_id, os.getcwd())
+      adapter_id = resolve_user_filepath(adapter_id, os.getcwd())
    except FileNotFoundError:
      pass
-    if len(adapter_name) == 0:
-      raise ClickException(f'Adapter name is required for {adapter_id}')
-    ctx.params[_adapter_mapping_key][adapter_id] = adapter_name[0]
+    name = adapter_name[0] if len(adapter_name) > 0 else 'default'
+    ctx.params[_adapter_mapping_key][adapter_id] = name
  return None


@@ -171,32 +170,7 @@ def start_decorator(serve_grpc: bool = False) -> t.Callable[[FC], t.Callable[[FC
        help='Assign GPU devices (if available)',
        show_envvar=True,
      ),
-      cog.optgroup.group(
-        'Fine-tuning related options',
-        help="""\
-    Note that the argument `--adapter-id` can accept the following format:
-
-    - `--adapter-id /path/to/adapter` (local adapter)
-
-    - `--adapter-id remote/adapter` (remote adapter from HuggingFace Hub)
-
-    - `--adapter-id remote/adapter:eng_lora` (two previous adapter options with the given adapter_name)
-
-    ```bash
-
-    $ openllm start opt --adapter-id /path/to/adapter_dir --adapter-id remote/adapter:eng_lora
-
-    ```
-    """,
-      ),
-      cog.optgroup.option(
-        '--adapter-id',
-        default=None,
-        help='Optional name or path for given LoRA adapter',
-        multiple=True,
-        callback=_id_callback,
-        metavar='[PATH | [remote/][adapter_name:]adapter_id][, ...]',
-      ),
+      adapter_id_option(factory=cog.optgroup),
      click.option('--return-process', is_flag=True, default=False, help='Internal use only.', hidden=True),
    )
    return composed(fn)
@@ -285,6 +259,17 @@ cli_option = functools.partial(_click_factory_type, attr='option')
 cli_argument = functools.partial(_click_factory_type, attr='argument')


+def adapter_id_option(f: _AnyCallable | None = None, **attrs: t.Any) -> t.Callable[[FC], FC]:
+  return cli_option(
+    '--adapter-id',
+    default=None,
+    help='Optional name or path for given LoRA adapter',
+    multiple=True,
+    callback=_id_callback,
+    metavar='[PATH | [remote/][adapter_name:]adapter_id][, ...]',
+  )
+
+
 def cors_option(f: _AnyCallable | None = None, **attrs: t.Any) -> t.Callable[[FC], FC]:
  return cli_option(
    '--cors/--no-cors',
--- a/openllm-python/src/openllm_cli/entrypoint.py
+++ b/openllm-python/src/openllm_cli/entrypoint.py
@@ -691,7 +691,7 @@ def pretty_print(line: str):
  elif 'ERROR' in line:
    caller = termui.error
  else:
-    caller = caller = functools.partial(termui.echo, fg=None)
+    caller = functools.partial(termui.echo, fg=None)
  caller(line.strip())


@@ -1026,6 +1026,7 @@ def build_command(
      'OPENLLM_BACKEND': llm.__llm_backend__,
      'OPENLLM_SERIALIZATION': llm._serialisation,
      'OPENLLM_MODEL_ID': llm.model_id,
+      'OPENLLM_ADAPTER_MAP': orjson.dumps(None).decode(),
    }
  )
  if llm.quantise:
@@ -1035,13 +1036,8 @@ def build_command(
  if prompt_template:
    os.environ['OPENLLM_PROMPT_TEMPLATE'] = prompt_template

-  # NOTE: We set this environment variable so that our service.py logic won't raise RuntimeError
-  # during build. This is a current limitation of bentoml build where we actually import the service.py into sys.path
  try:
    assert llm.bentomodel  # HACK: call it here to patch correct tag with revision and everything
-    # FIX: This is a patch for _service_vars injection
-    if 'OPENLLM_ADAPTER_MAP' not in os.environ:
-      os.environ['OPENLLM_ADAPTER_MAP'] = orjson.dumps(None).decode()

    labels = dict(llm.identifying_params)
    labels.update({'_type': llm.llm_type, '_framework': llm.__llm_backend__})
@@ -1190,14 +1186,8 @@ class ModelItem(t.TypedDict):


@cli.command()
-@click.option(
-  '--show-available',
-  is_flag=True,
-  default=True,
-  hidden=True,
-  help="Show available models in local store (mutually exclusive with '-o porcelain').",
-)
-def models_command(show_available: bool) -> dict[t.LiteralString, ModelItem]:
+@click.option('--show-available', is_flag=True, default=True, hidden=True)
+def models_command(**_: t.Any) -> dict[t.LiteralString, ModelItem]:
  """List all supported models.

  \b