File tree: 1 file changed, +5 -3 lines changed
Original file line number | Diff line number | Diff line change
@@ -160,17 +160,19 @@ ifdef LLAMA_HIPBLAS
160
160
CC := $(ROCM_PATH)/llvm/bin/clang
161
161
CXX := $(ROCM_PATH)/llvm/bin/clang++
162
162
GPU_TARGETS = gfx900 gfx906 gfx908 gfx90a gfx1030
163
- LLAMA_CUDA_DMMV_X ?= 32
164
- LLAMA_CUDA_DMMV_Y ?= 1
163
+ LLAMA_CUDA_DMMV_X ?= 128
164
+ LLAMA_CUDA_DMMV_Y ?= 4
165
165
CFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
166
166
CXXFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
167
167
LDFLAGS += -L$(ROCM_PATH)/lib -Wl,-rpath=$(ROCM_PATH)/lib -lhipblas -lamdhip64
168
- OBJS += ggml-cuda.o
168
+ OBJS += ggml-cuda.o ggml_v2-cuda.o
169
169
ggml-cuda.o : CXXFLAGS += $(addprefix --offload-arch=,$(GPU_TARGETS))
170
170
ggml-cuda.o : CXXFLAGS += -DGGML_CUDA_DMMV_X=$(LLAMA_CUDA_DMMV_X)
171
171
ggml-cuda.o : CXXFLAGS += -DGGML_CUDA_DMMV_Y=$(LLAMA_CUDA_DMMV_Y)
172
172
ggml-cuda.o : ggml-cuda.cu ggml-cuda.h # compiled as HIP (-x hip) with one --offload-arch flag per GPU_TARGETS entry
173
173
$(CXX) $(CXXFLAGS) -x hip -c -o $@ $<
174
+ ggml_v2-cuda.o : otherarch/ggml_v2-cuda.cu otherarch/ggml_v2-cuda.h # built for the same GPU_TARGETS as ggml-cuda.o
175
+ $(CXX) $(CXXFLAGS) $(addprefix --offload-arch=,$(GPU_TARGETS)) -x hip -c -o $@ $<
174
176
endif # LLAMA_HIPBLAS
175
177
176
178
ifdef LLAMA_METAL
You can’t perform that action at this time.
0 commit comments