1 file changed: +9 -16 lines changed
Original file line number | Diff line number | Diff line change
@@ -250,6 +250,15 @@ if (LLAMA_CUBLAS)
250
250
set (LLAMA_EXTRA_LIBS ${LLAMA_EXTRA_LIBS} CUDA::cudart CUDA::cublas CUDA::cublasLt )
251
251
endif ()
252
252
253
+ if (NOT DEFINED CMAKE_CUDA_ARCHITECTURES ) # choose a default only when no architecture list is already defined
254
+ if (LLAMA_CUDA_DMMV_F16 )
255
+ set (CMAKE_CUDA_ARCHITECTURES "61" ) # needed for f16 CUDA intrinsics (selected when LLAMA_CUDA_DMMV_F16 is set)
256
+ else ()
257
+ set (CMAKE_CUDA_ARCHITECTURES "52" ) # fallback when LLAMA_CUDA_DMMV_F16 is off; original note: "lowest CUDA 12 standard" (presumably nvcc's baseline target under CUDA 12 - TODO confirm)
258
+ endif ()
259
+ endif ()
260
+ message (STATUS "Using CUDA architectures: ${CMAKE_CUDA_ARCHITECTURES} " ) # log the value in effect, whether preset or defaulted above
261
+
253
262
else ()
254
263
message (WARNING "cuBLAS not found" )
255
264
endif ()
@@ -493,22 +502,6 @@ if (BUILD_SHARED_LIBS)
493
502
endif ()
494
503
endif ()
495
504
496
- if (GGML_SOURCES_CUDA ) # removed by this diff: per-target CUDA architecture setup, applied only when GGML_SOURCES_CUDA is set
497
- message (STATUS "GGML CUDA sources found, configuring CUDA architecture" )
498
- set_property (TARGET ggml PROPERTY CUDA_ARCHITECTURES "native" ) # NOTE(review): "native" presumably requires a recent CMake release - confirm against the project's minimum version
499
- set_property (TARGET ggml PROPERTY CUDA_SELECT_NVCC_ARCH_FLAGS "Auto" ) # NOTE(review): this name matches a FindCUDA helper function, not a documented target property - likely has no effect; confirm
500
-
501
- set_property (TARGET ggml_static PROPERTY CUDA_ARCHITECTURES "native" ) # same pair of properties repeated for the ggml_static target
502
- set_property (TARGET ggml_static PROPERTY CUDA_SELECT_NVCC_ARCH_FLAGS "Auto" )
503
-
504
- if (BUILD_SHARED_LIBS ) # ggml_shared is only touched when BUILD_SHARED_LIBS is set
505
- set_property (TARGET ggml_shared PROPERTY CUDA_ARCHITECTURES "native" )
506
- set_property (TARGET ggml_shared PROPERTY CUDA_SELECT_NVCC_ARCH_FLAGS "Auto" )
507
- endif ()
508
-
509
- set_property (TARGET llama PROPERTY CUDA_ARCHITECTURES "native" ) # llama gets CUDA_ARCHITECTURES only, without the second property
510
- endif ()
511
-
512
505
513
506
#
514
507
# programs, examples and tests
You can’t perform that action at this time.
0 commit comments