Skip to content

Commit 5fa1064

Browse files
mmq implementation for non k-quants
1 parent 5488fb7 commit 5fa1064

File tree

2 files changed

+765
-246
lines changed

2 files changed

+765
-246
lines changed

Makefile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -193,7 +193,7 @@ ifdef LLAMA_CUBLAS
193 193
CXXFLAGS += -DGGML_USE_CUBLAS -I/usr/local/cuda/include -I/opt/cuda/include -I$(CUDA_PATH)/targets/x86_64-linux/include
194 194
LDFLAGS += -lcublas -lculibos -lcudart -lcublasLt -lpthread -ldl -lrt -L/usr/local/cuda/lib64 -L/opt/cuda/lib64 -L$(CUDA_PATH)/targets/x86_64-linux/lib
195 195
OBJS += ggml-cuda.o
196-
NVCCFLAGS = --forward-unknown-to-host-compiler
196+
NVCCFLAGS = --forward-unknown-to-host-compiler -use_fast_math
197 197
ifdef LLAMA_CUDA_NVCC
198 198
NVCC = $(LLAMA_CUDA_NVCC)
199 199
else

0 commit comments

Comments
 (0)