1
1
default: koboldcpp_default koboldcpp_failsafe koboldcpp_openblas koboldcpp_noavx2 koboldcpp_clblast koboldcpp_clblast_noavx2 koboldcpp_cublas koboldcpp_hipblas koboldcpp_vulkan koboldcpp_vulkan_noavx2
2
- tools: quantize_gpt2 quantize_gptj quantize_llama quantize_neox quantize_mpt
2
+ tools: quantize_gpt2 quantize_gptj quantize_gguf quantize_neox quantize_mpt quantize_clip
3
3
dev: koboldcpp_openblas
4
4
dev2: koboldcpp_clblast
5
5
@@ -507,7 +507,7 @@ gpttype_adapter_vulkan_noavx2.o: $(GPTTYPE_ADAPTER)
507
507
$(CXX) $(CXXFLAGS) $(FAILSAFE_FLAGS) $(VULKAN_FLAGS) -c $< -o $@
508
508
509
509
clean:
510
- rm -vf *.o main sdmain quantize_llama quantize_gpt2 quantize_gptj quantize_neox quantize_mpt quantize-stats perplexity embedding benchmark-matmult save-load-state gguf imatrix imatrix.exe gguf.exe main.exe quantize_llama.exe quantize_gptj.exe quantize_gpt2.exe quantize_neox.exe quantize_mpt.exe koboldcpp_default.dll koboldcpp_openblas.dll koboldcpp_failsafe.dll koboldcpp_noavx2.dll koboldcpp_clblast.dll koboldcpp_clblast_noavx2.dll koboldcpp_cublas.dll koboldcpp_hipblas.dll koboldcpp_vulkan.dll koboldcpp_vulkan_noavx2.dll koboldcpp_default.so koboldcpp_openblas.so koboldcpp_failsafe.so koboldcpp_noavx2.so koboldcpp_clblast.so koboldcpp_clblast_noavx2.so koboldcpp_cublas.so koboldcpp_hipblas.so koboldcpp_vulkan.so koboldcpp_vulkan_noavx2.so
510
+ rm -vf *.o main sdmain quantize_gguf quantize_clip quantize_gpt2 quantize_gptj quantize_neox quantize_mpt quantize-stats perplexity embedding benchmark-matmult save-load-state gguf imatrix imatrix.exe gguf.exe main.exe quantize_clip.exe quantize_gguf.exe quantize_gptj.exe quantize_gpt2.exe quantize_neox.exe quantize_mpt.exe koboldcpp_default.dll koboldcpp_openblas.dll koboldcpp_failsafe.dll koboldcpp_noavx2.dll koboldcpp_clblast.dll koboldcpp_clblast_noavx2.dll koboldcpp_cublas.dll koboldcpp_hipblas.dll koboldcpp_vulkan.dll koboldcpp_vulkan_noavx2.dll koboldcpp_default.so koboldcpp_openblas.so koboldcpp_failsafe.so koboldcpp_noavx2.so koboldcpp_clblast.so koboldcpp_clblast_noavx2.so koboldcpp_cublas.so koboldcpp_hipblas.so koboldcpp_vulkan.so koboldcpp_vulkan_noavx2.so
511
511
512
512
# useful tools
513
513
main: examples/main/main.cpp common/sampling.cpp build-info.h ggml.o ggml-quants.o ggml-alloc.o ggml-backend.o llama.o common.o console.o grammar-parser.o $(OBJS)
@@ -600,7 +600,7 @@ koboldcpp_vulkan_noavx2:
600
600
endif
601
601
602
602
# tools
603
- quantize_llama: examples/quantize/quantize.cpp ggml.o llama.o ggml-quants.o ggml-alloc.o ggml-backend.o
603
+ quantize_gguf: examples/quantize/quantize.cpp ggml.o llama.o ggml-quants.o ggml-alloc.o ggml-backend.o
604
604
$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
605
605
quantize_gptj: ggml.o llama.o ggml-quants.o ggml-alloc.o ggml-backend.o otherarch/tools/gptj_quantize.cpp otherarch/tools/common-ggml.cpp
606
606
$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
@@ -610,6 +610,8 @@ quantize_neox: ggml.o llama.o ggml-quants.o ggml-alloc.o ggml-backend.o otherarc
610
610
$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
611
611
quantize_mpt: ggml.o llama.o ggml-quants.o ggml-alloc.o ggml-backend.o otherarch/tools/mpt_quantize.cpp otherarch/tools/common-ggml.cpp
612
612
$(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
613
+ quantize_clip: ggml.o llama.o ggml-quants.o ggml-alloc.o ggml-backend.o examples/llava/clip.cpp examples/llava/clip.h examples/llava/quantclip.cpp
614
+ $(CXX) $(CXXFLAGS) $^ -o $@ $(LDFLAGS)
613
615
614
616
# window simple clinfo
615
617
simpleclinfo: simpleclinfo.cpp
0 commit comments