forked from jasonacox/TinyLLM
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvllm.patch
23 lines (19 loc) · 969 Bytes
/
vllm.patch
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
--- Dockerfile 2024-06-07 22:09:30.069782339 -0700
+++ Dockerfile 2024-06-07 22:10:02.357875428 -0700
@@ -35,7 +35,7 @@
# can be useful for both `dev` and `test`
# explicitly set the list to avoid issues with torch 2.2
# see https://github.com/pytorch/pytorch/pull/123243
-ARG torch_cuda_arch_list='7.0 7.5 8.0 8.6 8.9 9.0+PTX'
+ARG torch_cuda_arch_list='6.0 6.1 7.0 7.5 8.0 8.6 8.9 9.0+PTX'
ENV TORCH_CUDA_ARCH_LIST=${torch_cuda_arch_list}
#################### BASE BUILD IMAGE ####################
--- CMakeLists.txt 2024-06-07 22:08:27.657601121 -0700
+++ CMakeLists.txt 2024-06-07 22:09:01.541699767 -0700
@@ -16,7 +16,7 @@
set(PYTHON_SUPPORTED_VERSIONS "3.8" "3.9" "3.10" "3.11")
# Supported NVIDIA architectures.
-set(CUDA_SUPPORTED_ARCHS "7.0;7.5;8.0;8.6;8.9;9.0")
+set(CUDA_SUPPORTED_ARCHS "6.0;6.1;7.0;7.5;8.0;8.6;8.9;9.0")
# Supported AMD GPU architectures.
set(HIP_SUPPORTED_ARCHS "gfx906;gfx908;gfx90a;gfx940;gfx941;gfx942;gfx1030;gfx1100")