perf: improve build logic and cleanup speed (#657)

Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com>
2026-02-20 07:33:55 -05:00 · 2023-11-15 00:18:31 -05:00
parent 103156cd71
commit a58d947bc8
11 changed files with 141 additions and 237 deletions
--- a/openllm-python/src/openllm/serialisation/init.py
+++ b/openllm-python/src/openllm/serialisation/init.py
@@ -4,8 +4,8 @@ import importlib
 import cloudpickle
 import fs

-import openllm
 from openllm_core._typing_compat import ParamSpec
+from openllm_core.exceptions import OpenLLMException

 P = ParamSpec('P')

@@ -31,7 +31,7 @@ def load_tokenizer(llm, **tokenizer_attrs):
      try:
        tokenizer = cloudpickle.load(cofile)['tokenizer']
      except KeyError:
-        raise openllm.exceptions.OpenLLMException(
+        raise OpenLLMException(
          "Bento model does not have tokenizer. Make sure to save the tokenizer within the model via 'custom_objects'. "
          'For example: "bentoml.transformers.save_model(..., custom_objects={\'tokenizer\': tokenizer})"'
        ) from None