From 65c76cace350c51a3005b3b3ef53e0d49d2dea24 Mon Sep 17 00:00:00 2001 From: aarnphm-ec2-dev <29749331+aarnphm@users.noreply.github.com> Date: Wed, 11 Oct 2023 04:28:46 +0000 Subject: [PATCH] chore: update deps for transformers and vllm Signed-off-by: aarnphm-ec2-dev <29749331+aarnphm@users.noreply.github.com> --- openllm-python/pyproject.toml | 4 ++-- tools/dependencies.py | 8 ++++---- 2 files changed, 6 insertions(+), 6 deletions(-) diff --git a/openllm-python/pyproject.toml b/openllm-python/pyproject.toml index cfce5cdc..dacfb04d 100644 --- a/openllm-python/pyproject.toml +++ b/openllm-python/pyproject.toml @@ -39,7 +39,7 @@ classifiers = [ ] dependencies = [ "bentoml[io]>=1.1.2", - "transformers[torch,tokenizers,accelerate]>=4.32.1", + "transformers[torch,tokenizers]>=4.34.0", "openllm-client", "openllm-core", "safetensors", @@ -115,7 +115,7 @@ openai = ["openai[embeddings]", "tiktoken"] opt = ["flax>=0.7", "jax", "jaxlib", "tensorflow", "keras"] playground = ["jupyter", "notebook", "ipython", "jupytext", "nbformat"] starcoder = ["bitsandbytes"] -vllm = ["vllm>=0.1.7", "ray"] +vllm = ["vllm>=0.2.0", "ray"] [tool.hatch.version] fallback-version = "0.0.0" diff --git a/tools/dependencies.py b/tools/dependencies.py index c7b25751..84fed2f2 100755 --- a/tools/dependencies.py +++ b/tools/dependencies.py @@ -106,11 +106,11 @@ class Dependencies: lower_bentoml_constraint = '1.1.2' _BENTOML_EXT = ['io'] -_TRANSFORMERS_EXT = ['torch', 'tokenizers', 'accelerate'] +_TRANSFORMERS_EXT = ['torch', 'tokenizers'] _BASE_DEPENDENCIES = [ Dependencies(name='bentoml', extensions=_BENTOML_EXT, lower_constraint=lower_bentoml_constraint), - Dependencies(name='transformers', extensions=_TRANSFORMERS_EXT, lower_constraint='4.32.1'), + Dependencies(name='transformers', extensions=_TRANSFORMERS_EXT, lower_constraint='4.34.0'), Dependencies(name='openllm-client'), Dependencies(name='openllm-core'), Dependencies(name='safetensors'), @@ -120,7 +120,7 @@ _BASE_DEPENDENCIES = [ Dependencies(name='tabulate', extensions=['widechars'], lower_constraint='0.9.0'), Dependencies(name='click', lower_constraint='8.1.3'), Dependencies(name='cuda-python', platform=('Darwin', 'ne')), - Dependencies(name='bitsandbytes', upper_constraint='0.42'), # 0.41 works with CUDA 11.8 + Dependencies(name='bitsandbytes', upper_constraint='0.42'), # 0.41 works with CUDA 11.8 ] _ALL_RUNTIME_DEPS = ['flax>=0.7', 'jax', 'jaxlib', 'tensorflow', 'keras'] @@ -133,7 +133,7 @@ AGENTS_DEPS = ['transformers[agents]>=4.30', 'diffusers', 'soundfile'] PLAYGROUND_DEPS = ['jupyter', 'notebook', 'ipython', 'jupytext', 'nbformat'] GGML_DEPS = ['ctransformers'] GPTQ_DEPS = ['auto-gptq[triton]>=0.4.2', 'optimum>=1.12.0'] -VLLM_DEPS = ['vllm>=0.1.7', 'ray'] +VLLM_DEPS = ['vllm>=0.2.0', 'ray'] _base_requirements: dict[str, t.Any] = { inflection.dasherize(name): config_cls.__openllm_requirements__ for name, config_cls in openllm.CONFIG_MAPPING.items() if config_cls.__openllm_requirements__