Add warning for NVIDIA GPUs with compute capability below 7.5

2026-08-02 19:22:27 -04:00 · 2024-07-02 14:49:55 +08:00
parent 7baac978fe
commit d3d08f20d6
1 changed files with 9 additions and 0 deletions
--- a/openllm_next/accelerator_spec.py
+++ b/openllm_next/accelerator_spec.py
@@ -78,6 +78,7 @@ def get_local_machine_spec():

    from pynvml import (
        nvmlDeviceGetCount,
+        nvmlDeviceGetCudaComputeCapability,
        nvmlDeviceGetHandleByIndex,
        nvmlDeviceGetMemoryInfo,
        nvmlDeviceGetName,
@@ -98,6 +99,14 @@ def get_local_machine_spec():
                    model=name, memory_size=math.ceil(int(memory_info.total) / 1024**3)
                )
            )
+            compute_capability = nvmlDeviceGetCudaComputeCapability(handle)
+            if compute_capability < (7, 5):
+                output(
+                    f"GPU {name.decode()} with compute capability {compute_capability} "
+                    "may not be supported, 7.5 or higher is recommended. check "
+                    "https://developer.nvidia.com/cuda-gpus for more information",
+                    style="yellow",
+                )
        nvmlShutdown()
        return DeploymentTarget(
            accelerators=accelerators,