tokenize example: Respect the model's normal add-BOS-token behavior (#4126)

Allow building the tokenize example with the Makefile
author: Kerfuffle <44031344+KerfuffleV2@users.noreply.github.com> 2023-11-18 14:48:17 -0700
committer: GitHub <noreply@github.com> 2023-11-18 14:48:17 -0700
commit: 28a2e6e7d476717881be6eb9e2d3331342cec57b (patch)
tree: 19c9ea98490818264fd3c585492002eaca9eadae
parent: 0b5c3b04572a05f80163a365070fb377a837ac27 (diff)
2 files changed, 5 insertions, 2 deletions
diff --git a/Makefile b/Makefile
index 7150dbaf..a6d2c2ec 100644
--- a/Makefile
+++ b/Makefile
@@ -2,7 +2,7 @@
 BUILD_TARGETS = \
 	main quantize quantize-stats perplexity embedding vdot q8dot train-text-from-scratch convert-llama2c-to-ggml \
 	simple batched batched-bench save-load-state server gguf llama-bench libllava.a llava-cli baby-llama beam-search  \
-	speculative infill benchmark-matmult parallel finetune export-lora tests/test-c.o
+	speculative infill tokenize benchmark-matmult parallel finetune export-lora tests/test-c.o
 
 # Binaries only useful for tests
 TEST_TARGETS = \
@@ -594,6 +594,9 @@ infill: examples/infill/infill.cpp                            ggml.o llama.o $(C
 simple: examples/simple/simple.cpp                            ggml.o llama.o $(COMMON_DEPS) $(OBJS)
 	$(CXX) $(CXXFLAGS) $(filter-out %.h,$^) -o $@ $(LDFLAGS)
 
+tokenize: examples/tokenize/tokenize.cpp                      ggml.o llama.o $(COMMON_DEPS) $(OBJS)
+	$(CXX) $(CXXFLAGS) $(filter-out %.h,$^) -o $@ $(LDFLAGS)
+
 batched: examples/batched/batched.cpp                         ggml.o llama.o $(COMMON_DEPS) $(OBJS)
 	$(CXX) $(CXXFLAGS) $(filter-out %.h,$^) -o $@ $(LDFLAGS)
 
diff --git a/examples/tokenize/tokenize.cpp b/examples/tokenize/tokenize.cpp
index 17166836..4ff8e3fa 100644
--- a/examples/tokenize/tokenize.cpp
+++ b/examples/tokenize/tokenize.cpp
@@ -26,7 +26,7 @@ int main(int argc, char ** argv) {
     llama_context_params ctx_params = llama_context_default_params();
     llama_context * ctx = llama_new_context_with_model(model, ctx_params);
 
-    const bool add_bos = true;
+    const bool add_bos = llama_should_add_bos_token(model);
 
     std::vector<llama_token> tokens;
author	Kerfuffle <44031344+KerfuffleV2@users.noreply.github.com>	2023-11-18 14:48:17 -0700
committer	GitHub <noreply@github.com>	2023-11-18 14:48:17 -0700
commit	28a2e6e7d476717881be6eb9e2d3331342cec57b (patch)
tree	19c9ea98490818264fd3c585492002eaca9eadae
parent	0b5c3b04572a05f80163a365070fb377a837ac27 (diff)