Skip to content

Commit 7fbd26a

Browse files
CUDA: mul_mat_q RDNA2 tunings
1 parent 00d62ad commit 7fbd26a

File tree

3 files changed

+365
-40
lines changed

3 files changed

+365
-40
lines changed

CMakeLists.txt

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -388,7 +388,6 @@ if (LLAMA_HIPBLAS)
388 388   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_DMMV_X=${LLAMA_CUDA_DMMV_X})
389 389   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_MMV_Y=${LLAMA_CUDA_MMV_Y})
390 390   target_compile_definitions(ggml-rocm PRIVATE K_QUANTS_PER_ITERATION=${LLAMA_CUDA_KQUANTS_ITER})
391     - target_compile_definitions(ggml-rocm PRIVATE CC_TURING=1000000000)
392 391   set_source_files_properties(ggml-cuda.cu PROPERTIES LANGUAGE CXX)
393 392   target_link_libraries(ggml-rocm PRIVATE hip::device PUBLIC hip::host roc::rocblas roc::hipblas)
394 393

Makefile

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -358,7 +358,6 @@ ifdef LLAMA_HIPBLAS
358 358   HIPFLAGS += -DGGML_CUDA_DMMV_X=$(LLAMA_CUDA_DMMV_X)
359 359   HIPFLAGS += -DGGML_CUDA_MMV_Y=$(LLAMA_CUDA_MMV_Y)
360 360   HIPFLAGS += -DK_QUANTS_PER_ITERATION=$(LLAMA_CUDA_KQUANTS_ITER)
361     - HIPFLAGS += -DCC_TURING=1000000000
362 361   ifdef LLAMA_CUDA_FORCE_DMMV
363 362   HIPFLAGS += -DGGML_CUDA_FORCE_DMMV
364 363   endif # LLAMA_CUDA_FORCE_DMMV

0 commit comments

Comments
 (0)