mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-01-17 03:47:54 -05:00
fix(cli): set default dtype to auto infer (#642)
Signed-off-by: Aaron Pham <29749331+aarnphm@users.noreply.github.com>
This commit is contained in:
@@ -304,9 +304,9 @@ def machine_option(f: _AnyCallable | None = None, **attrs: t.Any) -> t.Callable[
 def dtype_option(f: _AnyCallable | None = None, **attrs: t.Any) -> t.Callable[[FC], FC]:
   return cli_option(
     '--dtype',
-    type=click.Choice(['float16', 'float32', 'bfloat16']),
+    type=click.Choice(['float16', 'float32', 'bfloat16', 'auto']),
     envvar='TORCH_DTYPE',
-    default='float16',
+    default='auto',
     help='Optional dtype for casting tensors for running inference.',
     **attrs,
   )(f)
Reference in New Issue
Block a user