llama_cpp 0.12.4 → 0.12.5
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/CHANGELOG.md +4 -0
- data/lib/llama_cpp/version.rb +2 -2
- data/vendor/tmp/llama.cpp/Makefile +138 -53
- data/vendor/tmp/llama.cpp/ggml-cuda.cu +688 -270
- data/vendor/tmp/llama.cpp/ggml-impl.h +2 -0
- data/vendor/tmp/llama.cpp/ggml-quants.c +39 -94
- data/vendor/tmp/llama.cpp/ggml-quants.h +68 -59
- data/vendor/tmp/llama.cpp/ggml-sycl.cpp +131 -90
- data/vendor/tmp/llama.cpp/ggml-vulkan-shaders.hpp +1516 -10656
- data/vendor/tmp/llama.cpp/ggml-vulkan.cpp +1697 -1241
- data/vendor/tmp/llama.cpp/ggml-vulkan.h +14 -9
- data/vendor/tmp/llama.cpp/ggml.c +13 -10
- data/vendor/tmp/llama.cpp/llama.cpp +266 -43
- data/vendor/tmp/llama.cpp/llama.h +1 -1
- metadata +2 -2
checksums.yaml
CHANGED
@@ -1,7 +1,7 @@
|
|
1
1
|
---
|
2
2
|
SHA256:
|
3
|
-
metadata.gz:
|
4
|
-
data.tar.gz:
|
3
|
+
metadata.gz: 143fb1bb108c9cc679ed6eddaaca4cb8a52a5321ee4ffd965440a2c92aeeb99e
|
4
|
+
data.tar.gz: f522cbf943f82143d1a4eae679473468a9920a6ef6fe6cf88147b82bc6a1f279
|
5
5
|
SHA512:
|
6
|
-
metadata.gz:
|
7
|
-
data.tar.gz:
|
6
|
+
metadata.gz: 1646833e8e1ffd6dd22d809ce2c4f2b0f3de78d84504713da4e8d5ab1c2b466c5cbc47a3c787297753f6d56656635e12cf522acffbe37253bdae0c57f8cc51c9
|
7
|
+
data.tar.gz: fbbf0372d52ba8862dcc4ff61f590f634cdcde039dc31f09a93ac6cd8e112c34a1c6d567d54a9ec2d0679e1c4ec8c2e8153071c6952f67af34fa0c4ccf49ac76
|
data/CHANGELOG.md
CHANGED
@@ -1,3 +1,7 @@
|
|
1
|
+
## [[0.12.5](https://github.com/yoshoku/llama_cpp.rb/compare/v0.12.4...v0.12.5)] - 2024-02-09
|
2
|
+
|
3
|
+
- Bump bundled llama.cpp from b2047 to b2106.
|
4
|
+
|
1
5
|
## [[0.12.4](https://github.com/yoshoku/llama_cpp.rb/compare/v0.12.3...v0.12.4)] - 2024-02-03
|
2
6
|
|
3
7
|
- Bump bundled llama.cpp from b1971 to b2047.
|
data/lib/llama_cpp/version.rb
CHANGED
@@ -3,8 +3,8 @@
|
|
3
3
|
# llama_cpp.rb provides Ruby bindings for the llama.cpp.
|
4
4
|
module LLaMACpp
|
5
5
|
# The version of llama_cpp.rb you install.
|
6
|
-
VERSION = '0.12.4'
|
6
|
+
VERSION = '0.12.5'
|
7
7
|
|
8
8
|
# The version of llama.cpp bundled with llama_cpp.rb.
|
9
|
-
LLAMA_CPP_VERSION = 'b2047'
|
9
|
+
LLAMA_CPP_VERSION = 'b2106'
|
10
10
|
end
|
@@ -109,8 +109,21 @@ MK_NVCCFLAGS += -O3
|
|
109
109
|
else
|
110
110
|
MK_CFLAGS += -O3
|
111
111
|
MK_CXXFLAGS += -O3
|
112
|
+
MK_NVCCFLAGS += -O3
|
112
113
|
endif
|
113
114
|
|
115
|
+
ifndef LLAMA_NO_CCACHE
|
116
|
+
CCACHE := $(shell which ccache)
|
117
|
+
ifdef CCACHE
|
118
|
+
export CCACHE_SLOPPINESS = time_macros
|
119
|
+
$(info I ccache found, compilation results will be cached. Disable with LLAMA_NO_CCACHE.)
|
120
|
+
CC := $(CCACHE) $(CC)
|
121
|
+
CXX := $(CCACHE) $(CXX)
|
122
|
+
else
|
123
|
+
$(info I ccache not found. Consider installing it for faster compilation.)
|
124
|
+
endif # CCACHE
|
125
|
+
endif # LLAMA_NO_CCACHE
|
126
|
+
|
114
127
|
# clock_gettime came in POSIX.1b (1993)
|
115
128
|
# CLOCK_MONOTONIC came in POSIX.1-2001 / SUSv3 as optional
|
116
129
|
# posix_memalign came in POSIX.1-2001 / SUSv3
|
@@ -367,7 +380,7 @@ ifdef LLAMA_CUBLAS
|
|
367
380
|
MK_CPPFLAGS += -DGGML_USE_CUBLAS -I/usr/local/cuda/include -I/opt/cuda/include -I$(CUDA_PATH)/targets/x86_64-linux/include -I/usr/local/cuda/targets/aarch64-linux/include
|
368
381
|
MK_LDFLAGS += -lcuda -lcublas -lculibos -lcudart -lcublasLt -lpthread -ldl -lrt -L/usr/local/cuda/lib64 -L/opt/cuda/lib64 -L$(CUDA_PATH)/targets/x86_64-linux/lib -L/usr/local/cuda/targets/aarch64-linux/lib -L/usr/lib/wsl/lib
|
369
382
|
OBJS += ggml-cuda.o
|
370
|
-
MK_NVCCFLAGS
|
383
|
+
MK_NVCCFLAGS += -use_fast_math
|
371
384
|
ifndef JETSON_EOL_MODULE_DETECT
|
372
385
|
MK_NVCCFLAGS += --forward-unknown-to-host-compiler
|
373
386
|
endif # JETSON_EOL_MODULE_DETECT
|
@@ -375,9 +388,9 @@ ifdef LLAMA_DEBUG
|
|
375
388
|
MK_NVCCFLAGS += -lineinfo
|
376
389
|
endif # LLAMA_DEBUG
|
377
390
|
ifdef LLAMA_CUDA_NVCC
|
378
|
-
NVCC = $(LLAMA_CUDA_NVCC)
|
391
|
+
NVCC = $(CCACHE) $(LLAMA_CUDA_NVCC)
|
379
392
|
else
|
380
|
-
NVCC = nvcc
|
393
|
+
NVCC = $(CCACHE) nvcc
|
381
394
|
endif #LLAMA_CUDA_NVCC
|
382
395
|
ifdef CUDA_DOCKER_ARCH
|
383
396
|
MK_NVCCFLAGS += -Wno-deprecated-gpu-targets -arch=$(CUDA_DOCKER_ARCH)
|
@@ -459,6 +472,18 @@ ifdef LLAMA_VULKAN_CHECK_RESULTS
|
|
459
472
|
MK_CPPFLAGS += -DGGML_VULKAN_CHECK_RESULTS
|
460
473
|
endif
|
461
474
|
|
475
|
+
ifdef LLAMA_VULKAN_DEBUG
|
476
|
+
MK_CPPFLAGS += -DGGML_VULKAN_DEBUG
|
477
|
+
endif
|
478
|
+
|
479
|
+
ifdef LLAMA_VULKAN_VALIDATE
|
480
|
+
MK_CPPFLAGS += -DGGML_VULKAN_VALIDATE
|
481
|
+
endif
|
482
|
+
|
483
|
+
ifdef LLAMA_VULKAN_RUN_TESTS
|
484
|
+
MK_CPPFLAGS += -DGGML_VULKAN_RUN_TESTS
|
485
|
+
endif
|
486
|
+
|
462
487
|
ggml-vulkan.o: ggml-vulkan.cpp ggml-vulkan.h
|
463
488
|
$(CXX) $(CXXFLAGS) -c $< -o $@
|
464
489
|
endif # LLAMA_VULKAN
|
@@ -472,7 +497,7 @@ ifdef LLAMA_HIPBLAS
|
|
472
497
|
ROCM_PATH ?= /opt/rocm
|
473
498
|
GPU_TARGETS ?= $(shell $(ROCM_PATH)/llvm/bin/amdgpu-arch)
|
474
499
|
endif
|
475
|
-
HIPCC ?= $(ROCM_PATH)/bin/hipcc
|
500
|
+
HIPCC ?= $(CCACHE) $(ROCM_PATH)/bin/hipcc
|
476
501
|
LLAMA_CUDA_DMMV_X ?= 32
|
477
502
|
LLAMA_CUDA_MMV_Y ?= 1
|
478
503
|
LLAMA_CUDA_KQUANTS_ITER ?= 2
|
@@ -542,8 +567,11 @@ $(info I CFLAGS: $(CFLAGS))
|
|
542
567
|
$(info I CXXFLAGS: $(CXXFLAGS))
|
543
568
|
$(info I NVCCFLAGS: $(NVCCFLAGS))
|
544
569
|
$(info I LDFLAGS: $(LDFLAGS))
|
545
|
-
$(info I CC: $(shell $(CC)
|
546
|
-
$(info I CXX: $(shell $(CXX)
|
570
|
+
$(info I CC: $(shell $(CC) --version | head -n 1))
|
571
|
+
$(info I CXX: $(shell $(CXX) --version | head -n 1))
|
572
|
+
ifdef LLAMA_CUBLAS
|
573
|
+
$(info I NVCC: $(shell $(NVCC) --version | tail -n 1))
|
574
|
+
endif # LLAMA_CUBLAS
|
547
575
|
$(info )
|
548
576
|
|
549
577
|
#
|
@@ -597,97 +625,135 @@ lib: llama.o ggml.o $(OBJS)
|
|
597
625
|
|
598
626
|
clean:
|
599
627
|
rm -vrf *.o tests/*.o *.so *.a *.dll *.dylib benchmark-matmult common/build-info.cpp *.dot $(COV_TARGETS) $(BUILD_TARGETS) $(TEST_TARGETS)
|
628
|
+
find examples pocs -type f -name "*.o" -delete
|
600
629
|
|
601
630
|
#
|
602
631
|
# Examples
|
603
632
|
#
|
604
633
|
|
634
|
+
# $< is the first prerequisite, i.e. the source file.
|
635
|
+
# Explicitly compile this to an object file so that it can be cached with ccache.
|
636
|
+
# The source file is then filtered out from $^ (the list of all prerequisites) and the object file is added instead.
|
637
|
+
|
638
|
+
# Helper function that replaces .c, .cpp, and .cu file endings with .o:
|
639
|
+
GET_OBJ_FILE = $(patsubst %.c,%.o,$(patsubst %.cpp,%.o,$(patsubst %.cu,%.o,$(1))))
|
640
|
+
|
605
641
|
main: examples/main/main.cpp ggml.o llama.o $(COMMON_DEPS) console.o grammar-parser.o $(OBJS)
|
606
|
-
$(CXX) $(CXXFLAGS)
|
642
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
643
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
607
644
|
@echo
|
608
645
|
@echo '==== Run ./main -h for help. ===='
|
609
646
|
@echo
|
610
647
|
|
611
648
|
infill: examples/infill/infill.cpp ggml.o llama.o $(COMMON_DEPS) console.o grammar-parser.o $(OBJS)
|
612
|
-
$(CXX) $(CXXFLAGS)
|
649
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
650
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
613
651
|
|
614
652
|
simple: examples/simple/simple.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
615
|
-
$(CXX) $(CXXFLAGS)
|
653
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
654
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
616
655
|
|
617
656
|
tokenize: examples/tokenize/tokenize.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
618
|
-
$(CXX) $(CXXFLAGS)
|
657
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
658
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
619
659
|
|
620
660
|
batched: examples/batched/batched.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
621
|
-
$(CXX) $(CXXFLAGS)
|
661
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
662
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
622
663
|
|
623
664
|
batched-bench: examples/batched-bench/batched-bench.cpp build-info.o ggml.o llama.o common.o $(OBJS)
|
624
|
-
$(CXX) $(CXXFLAGS)
|
665
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
666
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
625
667
|
|
626
668
|
quantize: examples/quantize/quantize.cpp build-info.o ggml.o llama.o $(OBJS)
|
627
|
-
$(CXX) $(CXXFLAGS)
|
669
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
670
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
628
671
|
|
629
672
|
quantize-stats: examples/quantize-stats/quantize-stats.cpp build-info.o ggml.o llama.o $(OBJS)
|
630
|
-
$(CXX) $(CXXFLAGS)
|
673
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
674
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
631
675
|
|
632
676
|
perplexity: examples/perplexity/perplexity.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
633
|
-
$(CXX) $(CXXFLAGS)
|
677
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
678
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
634
679
|
|
635
680
|
imatrix: examples/imatrix/imatrix.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
636
|
-
$(CXX) $(CXXFLAGS)
|
681
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
682
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
637
683
|
|
638
684
|
embedding: examples/embedding/embedding.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
639
|
-
$(CXX) $(CXXFLAGS)
|
685
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
686
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
640
687
|
|
641
688
|
save-load-state: examples/save-load-state/save-load-state.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
642
|
-
$(CXX) $(CXXFLAGS)
|
689
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
690
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
643
691
|
|
644
692
|
server: examples/server/server.cpp examples/server/oai.hpp examples/server/utils.hpp examples/server/httplib.h examples/server/json.hpp examples/server/index.html.hpp examples/server/index.js.hpp examples/server/completion.js.hpp examples/llava/clip.cpp examples/llava/clip.h common/stb_image.h ggml.o llama.o $(COMMON_DEPS) grammar-parser.o $(OBJS)
|
645
|
-
$(CXX) $(CXXFLAGS) -
|
693
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
694
|
+
$(CXX) $(CXXFLAGS) -c examples/llava/clip.cpp -o $(call GET_OBJ_FILE, examples/llava/clip.cpp) -Wno-cast-qual
|
695
|
+
$(CXX) $(CXXFLAGS) -Iexamples/server $(filter-out %.h %.hpp $< examples/llava/clip.cpp,$^) $(call GET_OBJ_FILE, $<) $(call GET_OBJ_FILE, examples/llava/clip.cpp) -o $@ $(LDFLAGS) $(LWINSOCK2)
|
646
696
|
|
647
697
|
gguf: examples/gguf/gguf.cpp ggml.o $(OBJS)
|
648
|
-
$(CXX) $(CXXFLAGS)
|
698
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
699
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
649
700
|
|
650
701
|
train-text-from-scratch: examples/train-text-from-scratch/train-text-from-scratch.cpp ggml.o llama.o $(COMMON_DEPS) train.o $(OBJS)
|
651
|
-
$(CXX) $(CXXFLAGS)
|
702
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
703
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
652
704
|
|
653
705
|
convert-llama2c-to-ggml: examples/convert-llama2c-to-ggml/convert-llama2c-to-ggml.cpp ggml.o llama.o $(OBJS)
|
654
|
-
$(CXX) $(CXXFLAGS)
|
706
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
707
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
655
708
|
|
656
709
|
llama-bench: examples/llama-bench/llama-bench.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
657
|
-
$(CXX) $(CXXFLAGS)
|
710
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
711
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
658
712
|
|
659
713
|
libllava.a: examples/llava/llava.cpp examples/llava/llava.h examples/llava/clip.cpp examples/llava/clip.h common/stb_image.h common/base64.hpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
660
714
|
$(CXX) $(CXXFLAGS) -static -fPIC -c $< -o $@ -Wno-cast-qual
|
661
715
|
|
662
716
|
llava-cli: examples/llava/llava-cli.cpp examples/llava/clip.h examples/llava/clip.cpp examples/llava/llava.h examples/llava/llava.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
663
|
-
$(CXX) $(CXXFLAGS)
|
717
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
718
|
+
$(CXX) $(CXXFLAGS) -c examples/llava/clip.cpp -o $(call GET_OBJ_FILE, examples/llava/clip.cpp) -Wno-cast-qual
|
719
|
+
$(CXX) $(CXXFLAGS) -c examples/llava/llava.cpp -o $(call GET_OBJ_FILE, examples/llava/llava.cpp)
|
720
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $< examples/llava/clip.cpp examples/llava/llava.cpp,$^) $(call GET_OBJ_FILE, $<) $(call GET_OBJ_FILE, examples/llava/clip.cpp) $(call GET_OBJ_FILE, examples/llava/llava.cpp) -o $@ $(LDFLAGS)
|
664
721
|
|
665
722
|
baby-llama: examples/baby-llama/baby-llama.cpp ggml.o llama.o $(COMMON_DEPS) train.o $(OBJS)
|
666
|
-
$(CXX) $(CXXFLAGS)
|
723
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
724
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
667
725
|
|
668
726
|
beam-search: examples/beam-search/beam-search.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
669
|
-
$(CXX) $(CXXFLAGS)
|
727
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
728
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
670
729
|
|
671
730
|
finetune: examples/finetune/finetune.cpp ggml.o llama.o $(COMMON_DEPS) train.o $(OBJS)
|
672
|
-
$(CXX) $(CXXFLAGS)
|
731
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
732
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
673
733
|
|
674
734
|
export-lora: examples/export-lora/export-lora.cpp ggml.o common/common.h $(OBJS)
|
675
|
-
$(CXX) $(CXXFLAGS)
|
735
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
736
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
676
737
|
|
677
738
|
speculative: examples/speculative/speculative.cpp ggml.o llama.o $(COMMON_DEPS) grammar-parser.o $(OBJS)
|
678
|
-
$(CXX) $(CXXFLAGS)
|
739
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
740
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
679
741
|
|
680
742
|
parallel: examples/parallel/parallel.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
681
|
-
$(CXX) $(CXXFLAGS)
|
743
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
744
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
682
745
|
|
683
746
|
lookahead: examples/lookahead/lookahead.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
684
|
-
$(CXX) $(CXXFLAGS)
|
747
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
748
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
685
749
|
|
686
750
|
lookup: examples/lookup/lookup.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
687
|
-
$(CXX) $(CXXFLAGS)
|
751
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
752
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
688
753
|
|
689
754
|
passkey: examples/passkey/passkey.cpp ggml.o llama.o $(COMMON_DEPS) $(OBJS)
|
690
|
-
$(CXX) $(CXXFLAGS)
|
755
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
756
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
691
757
|
|
692
758
|
ifeq ($(UNAME_S),Darwin)
|
693
759
|
swift: examples/batched.swift
|
@@ -695,7 +761,7 @@ swift: examples/batched.swift
|
|
695
761
|
endif
|
696
762
|
|
697
763
|
common/build-info.cpp: $(wildcard .git/index) scripts/build-info.sh
|
698
|
-
@sh scripts/build-info.sh $(CC) > $@.tmp
|
764
|
+
@sh scripts/build-info.sh "$(CC)" > $@.tmp
|
699
765
|
@if ! cmp -s $@.tmp $@; then \
|
700
766
|
mv $@.tmp $@; \
|
701
767
|
else \
|
@@ -712,7 +778,8 @@ build-info.o: common/build-info.cpp
|
|
712
778
|
tests: $(TEST_TARGETS)
|
713
779
|
|
714
780
|
benchmark-matmult: examples/benchmark/benchmark-matmult.cpp build-info.o ggml.o $(OBJS)
|
715
|
-
$(CXX) $(CXXFLAGS)
|
781
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
782
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
716
783
|
|
717
784
|
run-benchmark-matmult: benchmark-matmult
|
718
785
|
./$@
|
@@ -720,58 +787,76 @@ run-benchmark-matmult: benchmark-matmult
|
|
720
787
|
.PHONY: run-benchmark-matmult swift
|
721
788
|
|
722
789
|
vdot: pocs/vdot/vdot.cpp ggml.o $(OBJS)
|
723
|
-
$(CXX) $(CXXFLAGS)
|
790
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
791
|
+
$(CXX) $(CXXFLAGS) $(filter-out $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
724
792
|
|
725
793
|
q8dot: pocs/vdot/q8dot.cpp ggml.o $(OBJS)
|
726
|
-
$(CXX) $(CXXFLAGS)
|
794
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
795
|
+
$(CXX) $(CXXFLAGS) $(filter-out $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
727
796
|
|
728
797
|
tests/test-llama-grammar: tests/test-llama-grammar.cpp ggml.o grammar-parser.o $(OBJS)
|
729
|
-
$(CXX) $(CXXFLAGS)
|
798
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
799
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
730
800
|
|
731
801
|
tests/test-grammar-parser: tests/test-grammar-parser.cpp ggml.o llama.o grammar-parser.o $(OBJS)
|
732
|
-
$(CXX) $(CXXFLAGS)
|
802
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
803
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
733
804
|
|
734
805
|
tests/test-double-float: tests/test-double-float.cpp ggml.o $(OBJS)
|
735
|
-
$(CXX) $(CXXFLAGS)
|
806
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
807
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
736
808
|
|
737
809
|
tests/test-grad0: tests/test-grad0.cpp ggml.o $(OBJS)
|
738
|
-
$(CXX) $(CXXFLAGS)
|
810
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
811
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
739
812
|
|
740
813
|
tests/test-opt: tests/test-opt.cpp ggml.o $(OBJS)
|
741
|
-
$(CXX) $(CXXFLAGS)
|
814
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
815
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
742
816
|
|
743
817
|
tests/test-quantize-fns: tests/test-quantize-fns.cpp ggml.o $(OBJS)
|
744
|
-
$(CXX) $(CXXFLAGS)
|
818
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
819
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
745
820
|
|
746
821
|
tests/test-quantize-perf: tests/test-quantize-perf.cpp ggml.o $(OBJS)
|
747
|
-
$(CXX) $(CXXFLAGS)
|
822
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
823
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
748
824
|
|
749
825
|
tests/test-sampling: tests/test-sampling.cpp ggml.o llama.o $(OBJS)
|
750
|
-
$(CXX) $(CXXFLAGS)
|
826
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
827
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
751
828
|
|
752
829
|
tests/test-tokenizer-0-falcon: tests/test-tokenizer-0-falcon.cpp ggml.o llama.o $(COMMON_DEPS) console.o $(OBJS)
|
753
|
-
$(CXX) $(CXXFLAGS)
|
830
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
831
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
754
832
|
|
755
833
|
tests/test-tokenizer-0-llama: tests/test-tokenizer-0-llama.cpp ggml.o llama.o $(COMMON_DEPS) console.o $(OBJS)
|
756
|
-
$(CXX) $(CXXFLAGS)
|
834
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
835
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
757
836
|
|
758
837
|
tests/test-tokenizer-1-bpe: tests/test-tokenizer-1-bpe.cpp ggml.o llama.o $(COMMON_DEPS) console.o $(OBJS)
|
759
|
-
$(CXX) $(CXXFLAGS)
|
838
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
839
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
760
840
|
|
761
841
|
tests/test-tokenizer-1-llama: tests/test-tokenizer-1-llama.cpp ggml.o llama.o $(COMMON_DEPS) console.o $(OBJS)
|
762
|
-
$(CXX) $(CXXFLAGS)
|
842
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
843
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
763
844
|
|
764
845
|
tests/test-rope: tests/test-rope.cpp ggml.o $(OBJS)
|
765
|
-
$(CXX) $(CXXFLAGS)
|
846
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
847
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
766
848
|
|
767
849
|
tests/test-c.o: tests/test-c.c llama.h
|
768
850
|
$(CC) $(CFLAGS) -c $(filter-out %.h,$^) -o $@
|
769
851
|
|
770
852
|
tests/test-backend-ops: tests/test-backend-ops.cpp ggml.o $(OBJS)
|
771
|
-
$(CXX) $(CXXFLAGS)
|
853
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
854
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
772
855
|
|
773
856
|
tests/test-model-load-cancel: tests/test-model-load-cancel.cpp ggml.o llama.o tests/get-model.cpp $(COMMON_DEPS) $(OBJS)
|
774
|
-
$(CXX) $(CXXFLAGS)
|
857
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
858
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|
775
859
|
|
776
860
|
tests/test-autorelease: tests/test-autorelease.cpp ggml.o llama.o tests/get-model.cpp $(COMMON_DEPS) $(OBJS)
|
777
|
-
$(CXX) $(CXXFLAGS)
|
861
|
+
$(CXX) $(CXXFLAGS) -c $< -o $(call GET_OBJ_FILE, $<)
|
862
|
+
$(CXX) $(CXXFLAGS) $(filter-out %.h $<,$^) $(call GET_OBJ_FILE, $<) -o $@ $(LDFLAGS)
|