Mirror of https://github.com/bentoml/OpenLLM.git, synced 2026-03-07 08:38:20 -05:00.
fix(serialisation): vLLM safetensors support (#324)
* fix(serialisation): vLLM support for safetensors  Signed-off-by: aarnphm-ec2-dev <29749331+aarnphm@users.noreply.github.com>
* chore: running tools  Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com>
* chore: generalize one-shot generation  Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com>
* chore: add changelog [skip ci]  Signed-off-by: paperspace <29749331+aarnphm@users.noreply.github.com>
---------
Signed-off-by: aarnphm-ec2-dev <29749331+aarnphm@users.noreply.github.com>
Signed-off-by: Aaron <29749331+aarnphm@users.noreply.github.com>
Signed-off-by: paperspace <29749331+aarnphm@users.noreply.github.com>
This commit is contained in:
@@ -19,8 +19,8 @@ class GPTNeoX(metaclass=_DummyMetaclass):
|
||||
# Body fragment of the GPTNeoX dummy class (its `class` header lies outside
# this view, inside the diff hunk context on the line above).
_backends = ["torch"]

def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
    """Placeholder constructor: delegates to ``_require_backends``, which
    presumably raises an informative error when the 'torch' backend is not
    installed — confirm against its definition elsewhere in this file."""
    _require_backends(self, ["torch"])
|
||||
class Llama(metaclass=_DummyMetaclass):
    """Dummy stand-in for ``Llama``.

    Instantiation delegates to ``_require_backends``, which presumably raises
    an informative import error when any of the listed backends is missing —
    confirm against its definition elsewhere in this file.
    """

    _backends = ["torch", "fairscale", "sentencepiece"]

    def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
        _require_backends(self, ["torch", "fairscale", "sentencepiece"])
|
||||
# Body fragment of a dummy class whose header was cut out of this diff view.
_backends = ["torch", "fairscale", "sentencepiece", "scipy"]

def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
    """Placeholder constructor: presumably raises via ``_require_backends``
    when any listed backend is unavailable — confirm at its definition."""
    _require_backends(self, ["torch", "fairscale", "sentencepiece", "scipy"])
|
||||
class MPT(metaclass=_DummyMetaclass):
    """Dummy stand-in for ``MPT``.

    Instantiation delegates to ``_require_backends``, which presumably raises
    an informative import error when any of the listed backends is missing —
    confirm against its definition elsewhere in this file.
    """

    _backends = ["torch", "triton", "einops"]

    def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
        _require_backends(self, ["torch", "triton", "einops"])
|
||||
|
||||
@@ -28,8 +28,8 @@ class VLLMStarCoder(metaclass=_DummyMetaclass):
|
||||
# Body fragment of the VLLMStarCoder dummy class (its `class` header appears
# only in the diff hunk context above, not as a source line here).
_backends = ["vllm", "bitsandbytes"]

def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
    """Placeholder constructor: presumably raises via ``_require_backends``
    when any listed backend is unavailable — confirm at its definition."""
    _require_backends(self, ["vllm", "bitsandbytes"])
|
||||
class VLLMLlama(metaclass=_DummyMetaclass):
    """Dummy stand-in for ``VLLMLlama``.

    Instantiation delegates to ``_require_backends``, which presumably raises
    an informative import error when any of the listed backends is missing —
    confirm against its definition elsewhere in this file.
    """

    _backends = ["vllm", "fairscale", "sentencepiece"]

    def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
        _require_backends(self, ["vllm", "fairscale", "sentencepiece"])
|
||||
# Body fragment of a dummy class whose header was cut out of this diff view.
_backends = ["vllm", "fairscale", "sentencepiece", "scipy"]

def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
    """Placeholder constructor: presumably raises via ``_require_backends``
    when any listed backend is unavailable — confirm at its definition."""
    _require_backends(self, ["vllm", "fairscale", "sentencepiece", "scipy"])
|
||||
class AutoVLLM(metaclass=_DummyMetaclass):
    """Dummy stand-in for ``AutoVLLM``.

    Instantiation delegates to ``_require_backends``, which presumably raises
    an informative import error when the 'vllm' backend is missing — confirm
    against its definition elsewhere in this file.
    """

    _backends = ["vllm"]

    def __init__(self, *param_decls: _t.Any, **attrs: _t.Any):
        _require_backends(self, ["vllm"])
|
||||
|
||||
Reference in New Issue
Block a user