feat: add a 'gpu' device option for build recommendations

Signed-off-by: paperspace <29749331+aarnphm@users.noreply.github.com>
2026-01-22 06:19:35 -05:00 · 2024-05-09 01:37:08 +00:00
parent 5e444381bb
commit c9f8dbc767
1 changed files with 3 additions and 3 deletions
--- a/openllm-python/src/_openllm_tiny/_entrypoint.py
+++ b/openllm-python/src/_openllm_tiny/_entrypoint.py
@@ -69,6 +69,8 @@ def parse_device_callback(
  # NOTE: --device all is a special case
  if len(el) == 1 and el[0] == 'all':
    return tuple(map(str, openllm.utils.available_devices()))
+  if len(el) == 1 and el[0] == 'gpu':
+    return ('0',)
  return el


@@ -266,9 +268,7 @@ def start_command(
    'TRUST_REMOTE_CODE': str(trust_remote_code),
    'GPU_MEMORY_UTILIZATION': orjson.dumps(gpu_memory_utilization).decode(),
    'SERVICES_CONFIG': orjson.dumps(
-      dict(
-        resources={'gpu' if device else 'cpu': len(device) if device else 'cpu_count'}, traffic=dict(timeout=timeout)
-      )
+      dict(resources={'gpu' if device else 'cpu': len(device) if device else '1'}, traffic=dict(timeout=timeout))
    ).decode(),
  })
  if max_model_len is not None: