Spaces:
Running
Running
Commit
·
6641178
1
Parent(s):
ab96dac
CUDA: correct the lowest Maxwell supported by CUDA 12 (llama/11984)
Browse files
* CUDA: correct the lowest Maxwell supported by CUDA 12
---------
Co-authored-by: Johannes Gäßler <[email protected]>
ggml/src/ggml-cuda/CMakeLists.txt
CHANGED
|
@@ -7,7 +7,7 @@ if (CUDAToolkit_FOUND)
|
|
| 7 |
|
| 8 |
if (NOT DEFINED CMAKE_CUDA_ARCHITECTURES)
|
| 9 |
# native == GPUs available at build time
|
| 10 |
-
# 52 == Maxwell, lowest CUDA 12 standard
|
| 11 |
# 60 == P100, FP16 CUDA intrinsics
|
| 12 |
# 61 == Pascal, __dp4a instruction (per-byte integer dot product)
|
| 13 |
# 70 == V100, FP16 tensor cores
|
|
@@ -17,7 +17,7 @@ if (CUDAToolkit_FOUND)
|
|
| 17 |
elseif(GGML_CUDA_F16 OR GGML_CUDA_DMMV_F16)
|
| 18 |
set(CMAKE_CUDA_ARCHITECTURES "60;61;70;75;80")
|
| 19 |
else()
|
| 20 |
-
set(CMAKE_CUDA_ARCHITECTURES "52;61;70;75;80")
|
| 21 |
endif()
|
| 22 |
endif()
|
| 23 |
message(STATUS "Using CUDA architectures: ${CMAKE_CUDA_ARCHITECTURES}")
|
|
|
|
| 7 |
|
| 8 |
if (NOT DEFINED CMAKE_CUDA_ARCHITECTURES)
|
| 9 |
# native == GPUs available at build time
|
| 10 |
+
# 50 == Maxwell, lowest CUDA 12 standard
|
| 11 |
# 60 == P100, FP16 CUDA intrinsics
|
| 12 |
# 61 == Pascal, __dp4a instruction (per-byte integer dot product)
|
| 13 |
# 70 == V100, FP16 tensor cores
|
|
|
|
| 17 |
elseif(GGML_CUDA_F16 OR GGML_CUDA_DMMV_F16)
|
| 18 |
set(CMAKE_CUDA_ARCHITECTURES "60;61;70;75;80")
|
| 19 |
else()
|
| 20 |
+
set(CMAKE_CUDA_ARCHITECTURES "50;61;70;75;80")
|
| 21 |
endif()
|
| 22 |
endif()
|
| 23 |
message(STATUS "Using CUDA architectures: ${CMAKE_CUDA_ARCHITECTURES}")
|