Skip to content

Commit 4c8b3fb

Browse files
committed
add configurable vars
1 parent 30d921a commit 4c8b3fb

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

Makefile

+4 -2
Original file line number | Diff line number | Diff line change
@@ -164,13 +164,15 @@ ifdef LLAMA_HIPBLAS
164164
CC := $(ROCM_PATH)/llvm/bin/clang
165165
CXX := $(ROCM_PATH)/llvm/bin/clang++
166166
GPU_TARGETS = gfx900 gfx906 gfx908 gfx90a gfx1030
167+
LLAMA_CUDA_DMMV_X ?= 64
168+
LLAMA_CUDA_DMMV_Y ?= 1
167169
CFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
168170
CXXFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
169171
LDFLAGS += -L/opt/rocm/lib -Wl,-rpath=$(ROCM_PATH)/lib -lhipblas -lamdhip64
170172
OBJS += ggml-cuda.o
171173
ggml-cuda.o: CXXFLAGS += $(addprefix --offload-arch=,$(GPU_TARGETS))
172-
ggml-cuda.o: CXXFLAGS += -DGGML_CUDA_DMMV_X=64
173-
ggml-cuda.o: CXXFLAGS += -DGGML_CUDA_DMMV_Y=1
174+
ggml-cuda.o: CXXFLAGS += -DGGML_CUDA_DMMV_X=$(LLAMA_CUDA_DMMV_X)
175+
ggml-cuda.o: CXXFLAGS += -DGGML_CUDA_DMMV_Y=$(LLAMA_CUDA_DMMV_Y)
174176
ggml-cuda.o: ggml-cuda.cu ggml-cuda.h
175177
$(CXX) $(CXXFLAGS) -x hip -c -o $@ $<
176178
endif

0 commit comments

Comments
 (0)