# karrelin's picture
# Upload folder using huggingface_hub
# 6b67641 verified
# CMAKE generated file: DO NOT EDIT!
# Generated by "Unix Makefiles" Generator, CMake Version 3.31
# compile C with /usr/bin/cc
# compile CUDA with /usr/local/cuda/bin/nvcc
# compile CXX with /usr/bin/c++
# ---- C translation units ----------------------------------------------------
# NOTE: this file is marked as CMake-generated ("DO NOT EDIT"); manual changes
# are presumably overwritten on the next CMake regeneration -- change the
# CMake configuration instead.
#
# C_DEFINES: preprocessor macros (-D) for C sources. Sets the GGML_CUDA_*
# tuning values (DMMV_X=32, MIN_BATCH_OFFLOAD=32, MMV_Y=1,
# PEER_MAX_BATCH_SIZE=128), GGML_SCHED_MAX_COPIES=4, K_QUANTS_PER_ITERATION=2,
# and defines the GGML_USE_* / GGML_IQK_FLASH_ATTENTION / GGML_CUDA_USE_GRAPHS
# feature macros, plus NDEBUG, _GNU_SOURCE and _XOPEN_SOURCE=600.
# The value is the same as CUDA_DEFINES and CXX_DEFINES in this file.
C_DEFINES = -DGGML_CUDA_DMMV_X=32 -DGGML_CUDA_MIN_BATCH_OFFLOAD=32 -DGGML_CUDA_MMV_Y=1 -DGGML_CUDA_PEER_MAX_BATCH_SIZE=128 -DGGML_CUDA_USE_GRAPHS -DGGML_IQK_FLASH_ATTENTION -DGGML_SCHED_MAX_COPIES=4 -DGGML_USE_CUDA -DGGML_USE_IQK_MULMAT -DGGML_USE_LLAMAFILE -DGGML_USE_OPENMP -DK_QUANTS_PER_ITERATION=2 -DNDEBUG -D_GNU_SOURCE -D_XOPEN_SOURCE=600
# C_INCLUDES: header search paths. The two -I entries point at the ggml
# include/ and src/ directories; the CUDA toolkit headers are added with
# -isystem rather than -I. All paths are absolute (/content/tmp/...,
# /usr/local/cuda/...), so they are only valid on a machine with this layout.
C_INCLUDES = -I/content/tmp/ggml/src/../include -I/content/tmp/ggml/src/. -isystem /usr/local/cuda/targets/x86_64-linux/include
# C_FLAGS: optimisation level (-O3), language standard (gnu11), the warning
# set, and OpenMP (-fopenmp). Implicit int and implicit function declarations
# are promoted to errors via -Werror=. -DNDEBUG is repeated here although
# C_DEFINES already carries it. -march=native targets the CPU of the machine
# doing the compile, so the resulting objects may not run on other CPUs.
C_FLAGS = -O3 -DNDEBUG -std=gnu11 -Wshadow -Wstrict-prototypes -Wpointer-arith -Wmissing-prototypes -Werror=implicit-int -Werror=implicit-function-declaration -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wdouble-promotion -march=native -fopenmp
# ---- CUDA translation units -------------------------------------------------
# CUDA_DEFINES: preprocessor macros (-D) for CUDA sources; the value is the
# same macro list as C_DEFINES and CXX_DEFINES in this file.
CUDA_DEFINES = -DGGML_CUDA_DMMV_X=32 -DGGML_CUDA_MIN_BATCH_OFFLOAD=32 -DGGML_CUDA_MMV_Y=1 -DGGML_CUDA_PEER_MAX_BATCH_SIZE=128 -DGGML_CUDA_USE_GRAPHS -DGGML_IQK_FLASH_ATTENTION -DGGML_SCHED_MAX_COPIES=4 -DGGML_USE_CUDA -DGGML_USE_IQK_MULMAT -DGGML_USE_LLAMAFILE -DGGML_USE_OPENMP -DK_QUANTS_PER_ITERATION=2 -DNDEBUG -D_GNU_SOURCE -D_XOPEN_SOURCE=600
# CUDA_INCLUDES: same absolute header search paths as C_INCLUDES / CXX_INCLUDES
# (ggml include/ and src/ via -I, CUDA toolkit headers via -isystem).
CUDA_INCLUDES = -I/content/tmp/ggml/src/../include -I/content/tmp/ggml/src/. -isystem /usr/local/cuda/targets/x86_64-linux/include
# CUDA_FLAGS: options for the CUDA compiler.
#   * --generate-code targets only compute capability 7.5 (compute_75 / sm_75);
#     no other GPU architecture is listed.
#   * -use_fast_math and -extended-lambda are enabled.
#   * Everything inside the quoted -Xcompiler argument is handed to the host
#     C++ compiler. That list contains -Wpedantic followed later by
#     -Wno-pedantic. NOTE(review): presumably the later flag wins and pedantic
#     warnings end up disabled for host code in CUDA sources -- confirm.
#   * -march=native inside -Xcompiler ties host code to the build machine CPU.
# The double quotes are part of the value and are interpreted by the shell that
# runs the compile command; keep them intact.
CUDA_FLAGS = -O3 -DNDEBUG -std=c++17 "--generate-code=arch=compute_75,code=[compute_75,sm_75]" -use_fast_math -extended-lambda -Xcompiler "-Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wno-array-bounds -Wno-format-truncation -Wextra-semi -Wno-pedantic -march=native"
# ---- C++ translation units --------------------------------------------------
# CXX_DEFINES: preprocessor macros (-D) for C++ sources; the value is the same
# macro list as C_DEFINES and CUDA_DEFINES in this file.
CXX_DEFINES = -DGGML_CUDA_DMMV_X=32 -DGGML_CUDA_MIN_BATCH_OFFLOAD=32 -DGGML_CUDA_MMV_Y=1 -DGGML_CUDA_PEER_MAX_BATCH_SIZE=128 -DGGML_CUDA_USE_GRAPHS -DGGML_IQK_FLASH_ATTENTION -DGGML_SCHED_MAX_COPIES=4 -DGGML_USE_CUDA -DGGML_USE_IQK_MULMAT -DGGML_USE_LLAMAFILE -DGGML_USE_OPENMP -DK_QUANTS_PER_ITERATION=2 -DNDEBUG -D_GNU_SOURCE -D_XOPEN_SOURCE=600
# CXX_INCLUDES: same absolute header search paths as C_INCLUDES / CUDA_INCLUDES
# (ggml include/ and src/ via -I, CUDA toolkit headers via -isystem).
CXX_INCLUDES = -I/content/tmp/ggml/src/../include -I/content/tmp/ggml/src/. -isystem /usr/local/cuda/targets/x86_64-linux/include
# CXX_FLAGS: optimisation level (-O3), language standard (gnu++17), the warning
# set, and OpenMP (-fopenmp). The warning options match the list given to
# -Xcompiler in CUDA_FLAGS except that -Wno-pedantic is absent here.
# -DNDEBUG is repeated although CXX_DEFINES already carries it.
# -march=native targets the CPU of the machine doing the compile.
CXX_FLAGS = -O3 -DNDEBUG -std=gnu++17 -Wmissing-declarations -Wmissing-noreturn -Wall -Wextra -Wpedantic -Wcast-qual -Wno-unused-function -Wno-array-bounds -Wno-format-truncation -Wextra-semi -march=native -fopenmp