From a01d867bc76cf57bbfb906bedd0d2fa24ade7921 Mon Sep 17 00:00:00 2001 From: aarnphm-ec2-dev <29749331+aarnphm@users.noreply.github.com> Date: Thu, 3 Aug 2023 02:40:06 +0000 Subject: [PATCH] chore(base): add auto-gptq CUDA kernel Signed-off-by: aarnphm-ec2-dev <29749331+aarnphm@users.noreply.github.com> --- src/openllm/bundle/oci/Dockerfile | 20 +++++++++++++++++++- 1 file changed, 19 insertions(+), 1 deletion(-) diff --git a/src/openllm/bundle/oci/Dockerfile b/src/openllm/bundle/oci/Dockerfile index 03c7f32f..a367c530 100644 --- a/src/openllm/bundle/oci/Dockerfile +++ b/src/openllm/bundle/oci/Dockerfile @@ -103,6 +103,21 @@ git fetch && git checkout ${COMMIT_HASH} python setup.py build EOT +# NOTE: Build auto-gptq CUDA kernels +FROM kernel-builder as auto-gptq-builder + +ENV COMMIT_HASH a7167b108c438f570938f0ced46a52fe515f4a59 +ARG COMMIT_HASH=${COMMIT_HASH} + +WORKDIR /usr/src + +RUN <