fix output

This commit is contained in:
jmorganca 2024-06-09 23:53:40 -04:00
parent 110f37ffb0
commit a632a04426
3 changed files with 25 additions and 15 deletions

4
llama/.gitignore vendored
View File

@ -3,5 +3,7 @@
*.lib
*.exp
*.dll
*.so
*.o
ollama_runner_*
*.obj
ollama_runner*

View File

@ -3,21 +3,17 @@ ARCH := $(or $(ARCH), $(shell uname -m))
NVCC := nvcc
HIPCC := "$(HIP_PATH)/bin/hipcc"
ifeq ($(UNAME_ARCH),x86_64)
ifeq ($(ARCH),x86_64)
ARCH := amd64
endif
# Determine object file extension based on OS
ifeq ($(OS),Windows_NT)
ifneq (,$(findstring MINGW,$(OS)))
OBJ_EXT := obj
SHARED_EXT := dll
else
OBJ_EXT := o
endif
ifeq ($(OS),Windows_NT)
SHARED_EXT := dll
else
SHARED_EXT := so
SHARED_EXT := so
endif
CUDA_SRCS := \
@ -105,15 +101,27 @@ else
all: ollama_runner ollama_runner_avx ollama_runner_avx2 ollama_runner_cuda ollama_runner_rocm
endif
%.cuda.$(OBJ_EXT): %.cu %.c %.cpp
nvcc -c $(CUDA_FLAGS) -o $@ $<
%.cuda.$(OBJ_EXT): %.cu
$(NVCC) -c $(CUDA_FLAGS) -o $@ $<
%.hip.$(OBJ_EXT): %.cu %.c %.cpp
$(HIPCC) -c $(HIP_FLAGS) -o $@ $<
%.cuda.$(OBJ_EXT): %.c
$(NVCC) -c $(CFLAGS) -o $@ $<
%.cuda.$(OBJ_EXT): %.cpp
$(NVCC) -c $(CXXFLAGS) -o $@ $<
ggml_cuda.$(SHARED_EXT): $(CUDA_OBJS)
nvcc --shared -lcuda -lcublas -lcudart -lcublasLt $(CUDA_FLAGS) $(CUDA_OBJS) -o $@
%.hip.$(OBJ_EXT): %.cu
$(HIPCC) -c $(HIP_FLAGS) -o $@ $<
%.hip.$(OBJ_EXT): %.c
$(HIPCC) -c $(CFLAGS) -o $@ $<
%.hip.$(OBJ_EXT): %.cpp
$(HIPCC) -c $(CXXFLAGS) -o $@ $<
ggml_hipblas.$(SHARED_EXT): $(HIP_OBJS)
$(HIPCC) --shared -lhipblas -lamdhip64 -lrocblas $(HIP_OBJS) -o $@
@ -135,4 +143,4 @@ ollama_runner_rocm: ggml_hipblas.dll
clean:
rm -f $(CUDA_OBJS) $(HIP_OBJS) ggml_cuda.$(SHARED_EXT) ggml_cuda.* ggml_hipblas.* ollama_runner*
.PHONY: all clean ollama_runner_cpu ollama_runner_cpu_avx ollama_runner_cpu_avx2 ollama_runner_cuda ollama_runner_rocm
.PHONY: all clean ollama_runner ollama_runner_avx ollama_runner_avx2 ollama_runner_cuda ollama_runner_rocm

View File

@ -1,6 +1,6 @@
package llama
// #cgo CFLAGS: -std=c11 -DNDEBUG -DLOG_DISABLE_LOGS
// #cgo CFLAGS: -std=c11 -DNDEBUG -DLOG_DISABLE_LOGS -Wno-discarded-qualifiers
// #cgo CXXFLAGS: -std=c++11 -DNDEBUG -DLOG_DISABLE_LOGS
// #cgo darwin,arm64 CFLAGS: -DGGML_USE_METAL -DGGML_USE_ACCELERATE -DACCELERATE_NEW_LAPACK -DACCELERATE_LAPACK_ILP64
// #cgo darwin,arm64 CXXFLAGS: -DGGML_USE_METAL -DGGML_USE_ACCELERATE -DACCELERATE_NEW_LAPACK -DACCELERATE_LAPACK_ILP64