# ollama/llama/hipblas.sh
# 2024-09-03 21:15:12 -04:00
#
# 92 lines
# 2.5 KiB
# Bash

# Compile the ggml CUDA sources with hipcc into the shared library
# ggml-hipblas.dll.
#
# Optional environment overrides; when unset, the defaults reproduce the
# previously hard-coded values:
#   HIPBLAS_OFFLOAD_ARCHS  whitespace-separated GPU targets; each becomes one
#                          --offload-arch flag (default: gfx1100)
#   HIPBLAS_PARALLEL_JOBS  value passed to -parallel-jobs (default: 12)
hipblas_jobs=${HIPBLAS_PARALLEL_JOBS:-12}
case "$hipblas_jobs" in
  '' | *[!0-9]*)
    printf 'error: HIPBLAS_PARALLEL_JOBS must be an unsigned integer, got "%s"\n' \
      "$hipblas_jobs" >&2
    exit 2
    ;;
esac

# Split the target list on whitespace and turn every entry into its own flag.
read -r -a hipblas_archs <<<"${HIPBLAS_OFFLOAD_ARCHS:-gfx1100}"
hipblas_arch_flags=()
for hipblas_arch in "${hipblas_archs[@]}"; do
  hipblas_arch_flags+=("--offload-arch=${hipblas_arch}")
done
if ((${#hipblas_arch_flags[@]} == 0)); then
  printf 'error: HIPBLAS_OFFLOAD_ARCHS contains no GPU targets\n' >&2
  exit 2
fi

# Arguments are kept in the same order as the original single-command form.
hipblas_args=(
  "-parallel-jobs=${hipblas_jobs}"
  -O3
  "${hipblas_arch_flags[@]}"

  # Preprocessor definitions.
  -DGGML_USE_CUDA
  -DGGML_BUILD=1
  -DGGML_SHARED=1
  -DGGML_CUDA_DMMV_X=32
  -DGGML_CUDA_MMV_Y=1
  -DGGML_SCHED_MAX_COPIES=4
  -DGGML_USE_HIPBLAS
  -DGGML_USE_LLAMAFILE
  -DK_QUANTS_PER_ITERATION=2
  -D_CRT_SECURE_NO_WARNINGS

  # msvcrt dependent-lib directive and console-subsystem linker option.
  -Xclang --dependent-lib=msvcrt -Wl,/subsystem:console

  # Warning suppressions.
  -Wno-expansion-to-defined
  -Wno-invalid-noreturn
  -Wno-ignored-attributes
  -Wno-pass-failed
  -Wno-deprecated-declarations

  # Include path, libraries, and output.
  -I.
  -lhipblas -lamdhip64 -lrocblas
  -shared
  -o ggml-hipblas.dll

  # Sources; the glob is deliberately unquoted so the shell expands it.
  ggml-cuda.cu ggml-cuda/*.cu ggml.c ggml-backend.c ggml-alloc.c ggml-quants.c
)

hipcc "${hipblas_args[@]}"
# Other --offload-arch targets that can be passed to hipcc:
# --offload-arch=gfx900 \
# --offload-arch=gfx906:xnack- \
# --offload-arch=gfx908:xnack- \
# --offload-arch=gfx90a:xnack+ \
# --offload-arch=gfx90a:xnack- \
# --offload-arch=gfx940 \
# --offload-arch=gfx941 \
# --offload-arch=gfx942 \
# --offload-arch=gfx1010 \
# --offload-arch=gfx1012 \
# --offload-arch=gfx1030 \
# --offload-arch=gfx1100 \
# --offload-arch=gfx1101 \
# --offload-arch=gfx1102 \
# Disabled alternative invocation (writes ggml-cuda.dll), kept for reference:
# hipcc \
# -v \
# -parallel-jobs=12 \
# --offload-arch=gfx900 \
# --offload-arch=gfx940 \
# --offload-arch=gfx941 \
# --offload-arch=gfx942 \
# --offload-arch=gfx1010 \
# --offload-arch=gfx1012 \
# --offload-arch=gfx1030 \
# --offload-arch=gfx1100 \
# --offload-arch=gfx1101 \
# --offload-arch=gfx1102 \
# -DLLAMA_BUILD \
# -DLLAMA_SHARED \
# -DK_QUANTS_PER_ITERATION=2 \
# -DGGML_USE_CUDA=1 \
# -DGGML_USE_HIPBLAS \
# -DGGML_CUDA_DMMV_X=32 \
# -DGGML_CUDA_MMV_Y=1 \
# -DGGML_CUDA_FORCE_DMMV \
# -DNDEBUG \
# -D_DLL \
# -D_MT \
# -D_XOPEN_SOURCE=600 \
# -D_CRT_SECURE_NO_WARNINGS \
# -Xclang \
# --dependent-lib=msvcrt \
# -std=gnu++14 \
# -Wmissing-declarations \
# -Wmissing-noreturn \
# -Wall \
# -Wextra \
# -Wpedantic \
# -Wcast-qual \
# -Wno-unused-function \
# -Wunreachable-code-break \
# -Wunreachable-code-return \
# -Wmissing-prototypes \
# -Wextra-semi \
# -Wno-cast-qual \
# -I. \
# -lhipblas -lamdhip64 -lrocblas \
# -Wno-expansion-to-defined \
# -Wno-invalid-noreturn \
# -Wno-deprecated-declarations \
# -mllvm \
# -x hip \
# -shared -o ggml-cuda.dll \
# ggml-cuda.cu ggml-cuda/*.cu ggml.c ggml-backend.c ggml-alloc.c ggml-quants.c