refactor: use DEBUG env-var instead of OPENLLMDEVDEBUG (#647)

Signed-off-by: Aaron Pham <29749331+aarnphm@users.noreply.github.com>
2026-05-24 08:34:37 -04:00 · 2023-11-14 01:39:58 -05:00
parent d63da6a5cb
commit 31a799ff61
7 changed files with 6 additions and 9 deletions
--- a/openllm-python/src/openllm/bundle/oci/init.py
+++ b/openllm-python/src/openllm/bundle/oci/init.py
@@ -213,7 +213,7 @@ def build_container(
      tags['image_sha'] = outputs.decode('utf-8').strip()
  except Exception as err:
    raise openllm.exceptions.OpenLLMException(
-      f'Failed to containerize base container images (Scroll up to see error above, or set OPENLLMDEVDEBUG=True for more traceback):\n{err}'
+      f'Failed to containerize base container images (Scroll up to see error above, or set DEBUG=5 for more traceback):\n{err}'
    ) from err
  return tags

--- a/openllm-python/src/openllm/entrypoints/cohere.py
+++ b/openllm-python/src/openllm/entrypoints/cohere.py
@@ -147,8 +147,8 @@ async def cohere_generate(req: Request, llm: openllm.LLM[M, T]) -> Response:
      return StreamingResponse(generate_stream_generator(), media_type='text/event-stream')
    # Non-streaming case
    final_result: GenerationOutput | None = None
-    texts: list[list[str]] = [[]] * config['num_generations']
-    token_ids: list[list[int]] = [[]] * config['num_generations']
+    texts: list[list[str]] = [[]] * config['n']
+    token_ids: list[list[int]] = [[]] * config['n']
    async for res in result_generator:
      if await req.is_disconnected():
        return error_response(HTTPStatus.BAD_REQUEST, 'Client disconnected.')
--- a/openllm-python/src/openllm/playground/falcon_tuned.py
+++ b/openllm-python/src/openllm/playground/falcon_tuned.py
@@ -8,7 +8,6 @@ import typing as t
 import torch
 import transformers

-# import openllm here for OPENLLMDEVDEBUG
 import openllm

 # Make sure to have at least one GPU to run this script
--- a/openllm-python/src/openllm/playground/llama2_qlora.py
+++ b/openllm-python/src/openllm/playground/llama2_qlora.py
@@ -8,7 +8,6 @@ import typing as t
 import torch
 import transformers

-# import openllm here for OPENLLMDEVDEBUG
 import openllm

 if t.TYPE_CHECKING:
--- a/openllm-python/src/openllm/playground/opt_tuned.py
+++ b/openllm-python/src/openllm/playground/opt_tuned.py
@@ -7,7 +7,6 @@ import typing as t

 import transformers

-# import openllm here for OPENLLMDEVDEBUG
 import openllm

 # Make sure to have at least one GPU to run this script