Skip to content

Commit 7f85cc5

Browse files
committed
update makefile and ggml.c
1 parent 6ca3499 commit 7f85cc5

File tree

2 files changed

+7
-6
lines changed

2 files changed

+7
-6
lines changed

Makefile

+3-2
Original file line number | Diff line number | Diff line change
@@ -186,8 +186,9 @@ ifdef LLAMA_HIPBLAS
186 186   CC := $(ROCM_PATH)/llvm/bin/clang
187 187   CXX := $(ROCM_PATH)/llvm/bin/clang++
188 188   GPU_TARGETS = gfx803 gfx900 gfx906 gfx908 gfx90a gfx1030 gfx1100
189     - LLAMA_CUDA_DMMV_X ?= 64
190     - LLAMA_CUDA_MMV_Y ?= 2
    189 + LLAMA_CUDA_DMMV_X ?= 128
    190 + LLAMA_CUDA_MMV_Y ?= 1
    191 + LLAMA_CUDA_KQUANTS_ITER ?= 1
191 192   LLAMA_CUDA_FORCE_DMMV = true
192 193   CFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
193 194   CXXFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)

ggml.c

+4-4
Original file line number | Diff line number | Diff line change
@@ -246,12 +246,12 @@ inline static void* ggml_aligned_malloc(size_t size) {
246 246   #if defined(GGML_USE_CLBLAST) // allow usage of CLBlast alongside Accelerate functions
247 247   #include "ggml-opencl.h"
248 248   #endif
249     - #elif defined(GGML_USE_OPENBLAS)
250     - #if defined(GGML_BLAS_USE_MKL)
251     - #include <mkl.h>
252     - #else
    249 + #endif
    250 + #if defined(GGML_USE_OPENBLAS)
253 251   #include <cblas.h>
254 252   #endif
    253 + #if defined(GGML_BLAS_USE_MKL)
    254 + #include <mkl.h>
255 255   #endif
256 256   #if defined(GGML_USE_CUBLAS)
257 257   #include "ggml-cuda.h"

0 commit comments

Comments
 (0)