gguf : make token scores and types optional (#3347)

author: Cebtenzzre <cebtenzzre@gmail.com> 2023-09-28 14:30:15 -0400
committer: GitHub <noreply@github.com> 2023-09-28 14:30:15 -0400
commit: ecf90b1a5114034bc0939b3968f549fe4d63cf6d (patch)
tree: edd1cbfc46d4be6484b77e22a27210cfedaf146a /llama.cpp
parent: 2619109ad57d7a75388a9cce51e5da645410d92e (diff)
1 files changed, 8 insertions, 10 deletions
diff --git a/llama.cpp b/llama.cpp
index 14053355..15de7600 100644
--- a/llama.cpp
+++ b/llama.cpp
@@ -1931,20 +1931,18 @@ static void llm_load_vocab(
         throw std::runtime_error("cannot find tokenizer vocab in model file\n");
     }
 
+    const float * scores = nullptr;
     const int score_idx = gguf_find_key(ctx, kv(LLM_KV_TOKENIZER_SCORES).c_str());
-    if (score_idx == -1) {
-        throw std::runtime_error("cannot find tokenizer scores in model file\n");
+    if (score_idx != -1) {
+        scores = (const float * ) gguf_get_arr_data(ctx, score_idx);
     }
 
-    const float * scores = (const float * ) gguf_get_arr_data(ctx, score_idx);
-
+    const int * toktypes = nullptr;
     const int toktype_idx = gguf_find_key(ctx, kv(LLM_KV_TOKENIZER_TOKEN_TYPE).c_str());
-    if (toktype_idx == -1) {
-        throw std::runtime_error("cannot find token type list in GGUF file\n");
+    if (toktype_idx != -1) {
+        toktypes = (const int * ) gguf_get_arr_data(ctx, toktype_idx);
     }
 
-    const int * toktypes = (const int * ) gguf_get_arr_data(ctx, toktype_idx);
-
     // determine vocab type
     {
         std::string tokenizer_name;
@@ -2012,8 +2010,8 @@ static void llm_load_vocab(
 
         auto & token_data = vocab.id_to_token[i];
         token_data.text  = std::move(word);
-        token_data.score = scores[i];
-        token_data.type  = (llama_token_type) toktypes[i];
+        token_data.score = scores ? scores[i] : 0.0f;
+        token_data.type  = toktypes ? (llama_token_type) toktypes[i] : LLAMA_TOKEN_TYPE_NORMAL;
     }
 
     // determine the newline token: LLaMA "<0x0A>" == 10 == '\n', Falcon 193 == '\n'
author	Cebtenzzre <cebtenzzre@gmail.com>	2023-09-28 14:30:15 -0400
committer	GitHub <noreply@github.com>	2023-09-28 14:30:15 -0400
commit	ecf90b1a5114034bc0939b3968f549fe4d63cf6d (patch)
tree	edd1cbfc46d4be6484b77e22a27210cfedaf146a /llama.cpp
parent	2619109ad57d7a75388a9cce51e5da645410d92e (diff)