diff --git a/backend/python/rerankers/requirements-cpu.txt b/backend/python/rerankers/requirements-cpu.txt
index e27a47263..1225fa4db 100644
--- a/backend/python/rerankers/requirements-cpu.txt
+++ b/backend/python/rerankers/requirements-cpu.txt
@@ -1,4 +1,4 @@
 transformers
 accelerate
-torch==2.4.1
+torch==2.7.1
 rerankers[transformers]
\ No newline at end of file
diff --git a/backend/python/rerankers/requirements-cublas12.txt b/backend/python/rerankers/requirements-cublas12.txt
index e27a47263..1225fa4db 100644
--- a/backend/python/rerankers/requirements-cublas12.txt
+++ b/backend/python/rerankers/requirements-cublas12.txt
@@ -1,4 +1,4 @@
 transformers
 accelerate
-torch==2.4.1
+torch==2.7.1
 rerankers[transformers]
\ No newline at end of file
diff --git a/backend/python/vllm-omni/install.sh b/backend/python/vllm-omni/install.sh
index 9a42b4727..8823948ec 100755
--- a/backend/python/vllm-omni/install.sh
+++ b/backend/python/vllm-omni/install.sh
@@ -79,6 +79,15 @@ fi
 
 cd vllm-omni/
 
+# fa3-fwd ships no aarch64 wheels and there is no source distribution, so on
+# aarch64 (e.g. l4t13 / SBSA cu130) the upstream requirements/cuda.txt is
+# unsatisfiable. Remove only the fa3-fwd requirement line (whatever its version
+# specifier) before resolving — vllm-omni does not hard-require the fused FA3
+# kernel at import time on Jetson/SBSA targets.
+if [ "$(uname -m)" = "aarch64" ] && [ -f requirements/cuda.txt ]; then
+    sed -i -E '/^fa3-fwd[[:space:]]*([<>=!~;@#]|$)/d' requirements/cuda.txt
+fi
+
 if [ "x${USE_PIP}" == "xtrue" ]; then
     pip install ${EXTRA_PIP_INSTALL_FLAGS:-} -e .
 else