File tree: 2 files changed, +7 -6 lines changed.
Columns: original file line number | diff line number | diff line change
@@ -186,8 +186,9 @@ ifdef LLAMA_HIPBLAS
186
186
CC := $(ROCM_PATH)/llvm/bin/clang
187
187
CXX := $(ROCM_PATH)/llvm/bin/clang++
188
188
GPU_TARGETS = gfx803 gfx900 gfx906 gfx908 gfx90a gfx1030 gfx1100
189
- LLAMA_CUDA_DMMV_X ?= 64
190
- LLAMA_CUDA_MMV_Y ?= 2
189
+ LLAMA_CUDA_DMMV_X ?= 128
190
+ LLAMA_CUDA_MMV_Y ?= 1
191
+ LLAMA_CUDA_KQUANTS_ITER ?= 1
191
192
LLAMA_CUDA_FORCE_DMMV = true
192
193
CFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
193
194
CXXFLAGS += -DGGML_USE_HIPBLAS -DGGML_USE_CUBLAS $(shell $(ROCM_PATH)/bin/hipconfig -C)
Columns: original file line number | diff line number | diff line change
@@ -246,12 +246,12 @@ inline static void* ggml_aligned_malloc(size_t size) {
246
246
#if defined(GGML_USE_CLBLAST) // allow usage of CLBlast alongside Accelerate functions
247
247
#include "ggml-opencl.h"
248
248
#endif
249
- #elif defined(GGML_USE_OPENBLAS)
250
- #if defined(GGML_BLAS_USE_MKL)
251
- #include <mkl.h>
252
- #else
249
+ #endif
250
+ #if defined(GGML_USE_OPENBLAS)
253
251
#include <cblas.h>
254
252
#endif
253
+ #if defined(GGML_BLAS_USE_MKL)
254
+ #include <mkl.h>
255
255
#endif
256
256
#if defined(GGML_USE_CUBLAS)
257
257
#include "ggml-cuda.h"
You can’t perform that action at this time.
0 commit comments