From e08a1fdae65edc76ee31bdc790a1df5e359468cf Mon Sep 17 00:00:00 2001 From: MekkCyber Date: Thu, 28 Nov 2024 12:16:48 +0000 Subject: [PATCH] add arch list --- docker/transformers-quantization-latest-gpu/Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/docker/transformers-quantization-latest-gpu/Dockerfile b/docker/transformers-quantization-latest-gpu/Dockerfile index ed08f19d5..f7bfae24f 100755 --- a/docker/transformers-quantization-latest-gpu/Dockerfile +++ b/docker/transformers-quantization-latest-gpu/Dockerfile @@ -38,7 +38,7 @@ RUN python3 -m pip install --no-cache-dir bitsandbytes # Add auto-gptq for gtpq quantization testing, installed from source RUN pip install gekko -RUN git clone https://github.com/PanQiWei/AutoGPTQ.git && cd AutoGPTQ && python3 setup.py install +RUN git clone https://github.com/PanQiWei/AutoGPTQ.git && cd AutoGPTQ && TORCH_CUDA_ARCH_LIST="7.5+PTX" python3 setup.py install # Add optimum for gptq quantization testing RUN python3 -m pip install --no-cache-dir git+https://github.com/huggingface/optimum@main#egg=optimum