Skip to content

Commit d0ef910

Browse files
CUDA: mul_mat_q RDNA2 tunings
1 parent 00d62ad commit d0ef910

File tree

3 files changed

+426
-45
lines changed

3 files changed

+426
-45
lines changed

CMakeLists.txt

-1
Original file line number | Diff line number | Diff line change
@@ -388,7 +388,6 @@ if (LLAMA_HIPBLAS)
388 388   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_DMMV_X=${LLAMA_CUDA_DMMV_X})
389 389   target_compile_definitions(ggml-rocm PRIVATE GGML_CUDA_MMV_Y=${LLAMA_CUDA_MMV_Y})
390 390   target_compile_definitions(ggml-rocm PRIVATE K_QUANTS_PER_ITERATION=${LLAMA_CUDA_KQUANTS_ITER})
391     - target_compile_definitions(ggml-rocm PRIVATE CC_TURING=1000000000)
392 391   set_source_files_properties(ggml-cuda.cu PROPERTIES LANGUAGE CXX)
393 392   target_link_libraries(ggml-rocm PRIVATE hip::device PUBLIC hip::host roc::rocblas roc::hipblas)
394 393

Makefile

-1
Original file line number | Diff line number | Diff line change
@@ -358,7 +358,6 @@ ifdef LLAMA_HIPBLAS
358 358   HIPFLAGS += -DGGML_CUDA_DMMV_X=$(LLAMA_CUDA_DMMV_X)
359 359   HIPFLAGS += -DGGML_CUDA_MMV_Y=$(LLAMA_CUDA_MMV_Y)
360 360   HIPFLAGS += -DK_QUANTS_PER_ITERATION=$(LLAMA_CUDA_KQUANTS_ITER)
361     - HIPFLAGS += -DCC_TURING=1000000000
362 361   ifdef LLAMA_CUDA_FORCE_DMMV
363 362   HIPFLAGS += -DGGML_CUDA_FORCE_DMMV
364 363   endif # LLAMA_CUDA_FORCE_DMMV

0 commit comments

Comments
 (0)