Skip to content

Commit 2780ea2

Browse files
authored
Update Makefile
1 parent 04a3e64 commit 2780ea2

File tree

1 file changed

+5
-3
lines changed

1 file changed

+5
-3
lines changed

Makefile

+5-3
Original file line numberDiff line numberDiff line change
@@ -160,17 +160,19 @@ ifdef LLAMA_HIPBLAS
160160
# Inside LLAMA_HIPBLAS: build with the clang/clang++ shipped under $(ROCM_PATH)/llvm/bin.
CC := $(ROCM_PATH)/llvm/bin/clang
161161
CXX := $(ROCM_PATH)/llvm/bin/clang++
162162
# GPU architectures to build for; each word becomes an --offload-arch=<arch> flag for ggml-cuda.o.
GPU_TARGETS = gfx900 gfx906 gfx908 gfx90a gfx1030
163-
LLAMA_CUDA_DMMV_X ?= 32
164-
LLAMA_CUDA_DMMV_Y ?= 1
163+
# Defaults for the values handed to ggml-cuda.o as -DGGML_CUDA_DMMV_X / -DGGML_CUDA_DMMV_Y.
# ?= only assigns when the variable is not already set (e.g. on the make command line).
LLAMA_CUDA_DMMV_X ?= 128
164+
LLAMA_CUDA_DMMV_Y ?= 4
165165
# Ask hipconfig for its preprocessor flags exactly once (:= expands immediately),
# instead of embedding $(shell ...) in CFLAGS/CXXFLAGS where it may be re-run on every expansion.
HIPCONFIG_CPPFLAGS := $(shell $(ROCM_PATH)/bin/hipconfig -C)
# Both the C and C++ compiles get the HIPBLAS/CUBLAS feature defines plus the hipconfig flags.
CFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(HIPCONFIG_CPPFLAGS)
166166
CXXFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(HIPCONFIG_CPPFLAGS)
167167
# Library search path and rpath both follow $(ROCM_PATH), so the link step and the
# runtime loader resolve hipblas/amdhip64 from the same ROCm installation.
LDFLAGS += -L$(ROCM_PATH)/lib -Wl,-rpath=$(ROCM_PATH)/lib -lhipblas -lamdhip64
168-
OBJS += ggml-cuda.o
168+
# Add both GPU objects to the object list: ggml-cuda.o and ggml_v2-cuda.o (built from otherarch/).
OBJS += ggml-cuda.o ggml_v2-cuda.o
169169
# Target-specific flags for ggml-cuda.o only:
#   - one --offload-arch=<arch> per word in GPU_TARGETS
#   - the LLAMA_CUDA_DMMV_X / LLAMA_CUDA_DMMV_Y values as GGML_CUDA_DMMV_X / _Y defines
# The rule rebuilds when ggml-cuda.cu or ggml-cuda.h changes; -x hip tells the
# compiler to treat the first prerequisite ($<, the .cu file) as HIP source.
ggml-cuda.o: CXXFLAGS += $(addprefix --offload-arch=,$(GPU_TARGETS))
170170
ggml-cuda.o: CXXFLAGS += -DGGML_CUDA_DMMV_X=$(LLAMA_CUDA_DMMV_X)
171171
ggml-cuda.o: CXXFLAGS += -DGGML_CUDA_DMMV_Y=$(LLAMA_CUDA_DMMV_Y)
172172
ggml-cuda.o: ggml-cuda.cu ggml-cuda.h
173173
$(CXX) $(CXXFLAGS) -x hip -c -o $@ $<
174+
# ggml_v2-cuda.o is compiled as HIP as well, so it needs its own --offload-arch
# flags: target-specific variables set on ggml-cuda.o do not apply to this target,
# and without them the object is built only for the compiler's default GPU arch.
ggml_v2-cuda.o: CXXFLAGS += $(addprefix --offload-arch=,$(GPU_TARGETS))
# Rebuild when the v2 source or header under otherarch/ changes; $< is the .cu file.
ggml_v2-cuda.o: otherarch/ggml_v2-cuda.cu otherarch/ggml_v2-cuda.h
175+
	$(CXX) $(CXXFLAGS) -x hip -c -o $@ $<
174176
endif # LLAMA_HIPBLAS
175177

176178
ifdef LLAMA_METAL

0 commit comments

Comments
 (0)