mirror of
https://github.com/bentoml/OpenLLM.git
synced 2026-03-07 16:47:13 -05:00
fix: device imports using strategies (#584)
* fix: device imports using strategies Signed-off-by: Aaron Pham <29749331+aarnphm@users.noreply.github.com> * chore: support trust_remote_code for vLLM runners Signed-off-by: Aaron Pham <29749331+aarnphm@users.noreply.github.com> --------- Signed-off-by: Aaron Pham <29749331+aarnphm@users.noreply.github.com>
This commit is contained in:
@@ -6,6 +6,7 @@ we won't ensure backward compatibility for these functions. So use with caution.
|
||||
from __future__ import annotations
|
||||
import typing as t
|
||||
|
||||
import functools
|
||||
import openllm_core
|
||||
|
||||
if t.TYPE_CHECKING:
|
||||
@@ -14,7 +15,16 @@ if t.TYPE_CHECKING:
|
||||
def generate_labels(llm: openllm.LLM[t.Any, t.Any]) -> dict[str, t.Any]:
  """Build the standard metadata labels for the given LLM instance.

  The labels record the runner backend, a fixed ``'openllm'`` framework tag,
  the model name and architecture taken from the LLM's config, and the
  serialisation format in use.
  """
  labels: dict[str, t.Any] = {'backend': llm.__llm_backend__, 'framework': 'openllm'}
  labels['model_name'] = llm.config['model_name']
  labels['architecture'] = llm.config['architecture']
  labels['serialisation'] = llm._serialisation
  return labels
|
||||
|
||||
# NOTE(review): this assignment is superseded by the later, fuller `__all__`
# (which also exports available_devices and device_count) — in this diff view
# it looks like pre-patch context; confirm only one assignment survives in the file.
__all__ = ['generate_labels']
||||
def available_devices() -> tuple[str, ...]:
  """Return the GPUs available on this system. Only NVIDIA GPUs are currently supported."""
  # Imported here, not at module top, so the strategies module is only loaded on demand.
  from .._strategies import NvidiaGpuResource

  devices = NvidiaGpuResource.from_system()
  return tuple(devices)
|
||||
|
||||
@functools.lru_cache(maxsize=1)
def device_count() -> int:
  """Return how many GPUs :func:`available_devices` reports.

  The result is cached after the first call, so the hardware is probed at most once.
  """
  devices = available_devices()
  return len(devices)
|
||||
|
||||
# Explicit public API of this module; also consumed by __dir__ below.
__all__ = ['generate_labels', 'available_devices', 'device_count']
||||
|
||||
def __dir__() -> t.Sequence[str]:
  """Expose the module's public names (``__all__``) in sorted order for dir()."""
  names = list(__all__)
  names.sort()
  return names
|
||||
|
||||
Reference in New Issue
Block a user