author    Marcus Dunn <51931484+MarcusDunn@users.noreply.github.com>  2023-10-23 12:40:03 -0700
committer GitHub <noreply@github.com>                                 2023-10-23 22:40:03 +0300
commit    5be6c803fa5378f62a1590f3ad8c6b64c7c0c2ce (patch)
tree      190868e0431070686d797c3c2d86da857b8ba55f /examples/llama-bench/llama-bench.cpp
parent    6336701c9378c23c85d1c0e464b663ca2bbb8e60 (diff)
llama : remove token functions with `context` args in favor of `model` (#3720)
* added `llama_model_token_*` variants to all the `llama_token_*` functions
* added `LLAMA_API`
* formatting
* removed old `llama_token` functions
* changed 3 more functions to take in model:
  - `llama_token_get_text`
  - `llama_token_get_score`
  - `llama_token_get_type`
* added back docs
* fixed main.cpp
* changed token functions to use new model variants

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
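For orientation, here is a minimal before/after sketch of the call-site migration this commit implies. The wrapper function get_bos_token is hypothetical and not part of the patch; only llama_get_model and the model-based llama_token_bos come from the API itself:

    #include "llama.h"

    // Hypothetical helper illustrating the migration: the context-based
    // overload was removed, so callers holding only a llama_context must
    // recover the model first.
    static llama_token get_bos_token(llama_context * ctx) {
        // before this commit: return llama_token_bos(ctx);
        const llama_model * model = llama_get_model(ctx);  // fetch the owning model
        return llama_token_bos(model);                      // model-based variant
    }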
Diffstat (limited to 'examples/llama-bench/llama-bench.cpp')
-rw-r--r--  examples/llama-bench/llama-bench.cpp  |  4
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/examples/llama-bench/llama-bench.cpp b/examples/llama-bench/llama-bench.cpp
index a04115c9..20767d55 100644
--- a/examples/llama-bench/llama-bench.cpp
+++ b/examples/llama-bench/llama-bench.cpp
@@ -933,7 +933,7 @@ struct sql_printer : public printer {
 };
 
 static void test_prompt(llama_context * ctx, int n_prompt, int n_past, int n_batch, int n_threads) {
-    std::vector<llama_token> tokens(n_batch, llama_token_bos(ctx));
+    std::vector<llama_token> tokens(n_batch, llama_token_bos(llama_get_model(ctx)));
     int n_processed = 0;
 
     llama_set_n_threads(ctx, n_threads, n_threads);
@@ -946,7 +946,7 @@ static void test_prompt(llama_context * ctx, int n_prompt, int n_past, int n_bat
 }
 
 static void test_gen(llama_context * ctx, int n_gen, int n_past, int n_threads) {
-    llama_token token = llama_token_bos(ctx);
+    llama_token token = llama_token_bos(llama_get_model(ctx));
 
     llama_set_n_threads(ctx, n_threads, n_threads);
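The hunks above resolve the model inline via llama_get_model(ctx) at each call site. As a hedged sketch, the same pattern applies to the three getters the commit message lists, with the lookup hoisted so it happens once; the function print_token_info and its output format are illustrative only, not code from this patch:

    #include <cstdio>
    #include "llama.h"

    // Illustrative use of the model-based getters named in the commit message.
    static void print_token_info(llama_context * ctx, llama_token id) {
        const llama_model * model = llama_get_model(ctx);  // look up once, reuse
        printf("text=%s score=%f type=%d\n",
               llama_token_get_text(model, id),
               llama_token_get_score(model, id),
               (int) llama_token_get_type(model, id));
    }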