Skip to content

Commit 0a5eebb

Browse files
CUDA: mul_mat_q RDNA2 tunings (#2910)
* CUDA: mul_mat_q RDNA2 tunings
* Update ggml-cuda.cu

Co-authored-by: Henri Vasserman <[email protected]>

---------

Co-authored-by: Henri Vasserman <[email protected]>
1 parent 84e7236 commit 0a5eebb

File tree

3 files changed

+426
-45
lines changed

3 files changed

+426
-45
lines changed

CMakeLists.txt

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -388,7 +388,6 @@ if (LLAMA_HIPBLAS)
388 388   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_DMMV_X=${LLAMA_CUDA_DMMV_X})
389 389   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_MMV_Y=${LLAMA_CUDA_MMV_Y})
390 390   target_compile_definitions(ggml-rocm PRIVATE K_QUANTS_PER_ITERATION=${LLAMA_CUDA_KQUANTS_ITER})
391     - target_compile_definitions(ggml-rocm PRIVATE CC_TURING=1000000000)
392 391   set_source_files_properties(ggml-cuda.cu PROPERTIES LANGUAGE CXX)
393 392   target_link_libraries(ggml-rocm PRIVATE hip::device PUBLIC hip::host roc::rocblas roc::hipblas)
394 393

Makefile

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -408,7 +408,6 @@ ifdef LLAMA_HIPBLAS
408 408   HIPFLAGS += -DGGML_CUDA_DMMV_X=$(LLAMA_CUDA_DMMV_X)
409 409   HIPFLAGS += -DGGML_CUDA_MMV_Y=$(LLAMA_CUDA_MMV_Y)
410 410   HIPFLAGS += -DK_QUANTS_PER_ITERATION=$(LLAMA_CUDA_KQUANTS_ITER)
411     - HIPFLAGS += -DCC_TURING=1000000000
412 411   ifdef LLAMA_CUDA_FORCE_DMMV
413 412   HIPFLAGS += -DGGML_CUDA_FORCE_DMMV
414 413   endif # LLAMA_CUDA_FORCE_DMMV

0 commit comments

Comments
 (0)