llama : support Llama 3 HF conversion (#6745)

* Support Llama 3 conversion

  The tokenizer is BPE.

* style

* Accept suggestion

  Co-authored-by: Sourab Mangrulkar <13534540+pacman100@users.noreply.github.com>

* llama : add llama_token_is_eog()

  ggml-ci

* llama : auto-detect more EOT tokens when missing in KV data

* convert : replacing EOS token is a hack

* llama : fix codegemma EOT token + add TODOs

* llama : fix model type string for 8B model

---------

Co-authored-by: Sourab Mangrulkar <13534540+pacman100@users.noreply.github.com>
Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
author: Pedro Cuenca <pedro@huggingface.co> 2024-04-21 13:50:41 +0200
committer: GitHub <noreply@github.com> 2024-04-21 14:50:41 +0300
commit: b97bc3966e852adb626c90be64fd48282800f504 (patch)
tree: 178656d15821205889fa03ec603c7327facbb265 /llama.h
parent: b8109bc0139f15a5b321909f47510b89dca47ffc (diff)
1 files changed, 4 insertions, 1 deletions
diff --git a/llama.h b/llama.h
index b5da686f..5bed97ad 100644
--- a/llama.h
+++ b/llama.h
@@ -783,6 +783,9 @@ extern "C" {
 
     LLAMA_API enum llama_token_type llama_token_get_type(const struct llama_model * model, llama_token token);
 
+    // Check if the token is supposed to end generation (end-of-generation, eg. EOS, EOT, etc.)
+    LLAMA_API bool llama_token_is_eog(const struct llama_model * model, llama_token token);
+
     // Special tokens
     LLAMA_API llama_token llama_token_bos(const struct llama_model * model); // beginning-of-sentence
     LLAMA_API llama_token llama_token_eos(const struct llama_model * model); // end-of-sentence
@@ -796,7 +799,7 @@ extern "C" {
     // Returns -1 if unknown, 1 for true or 0 for false.
     LLAMA_API int32_t         llama_add_eos_token(const struct llama_model * model);
 
-    // codellama infill tokens
+    // Codellama infill tokens
     LLAMA_API llama_token llama_token_prefix(const struct llama_model * model); // Beginning of infill prefix
     LLAMA_API llama_token llama_token_middle(const struct llama_model * model); // Beginning of infill middle
     LLAMA_API llama_token llama_token_suffix(const struct llama_model * model); // Beginning of infill suffix
author	Pedro Cuenca <pedro@huggingface.co>	2024-04-21 13:50:41 +0200
committer	GitHub <noreply@github.com>	2024-04-21 14:50:41 +0300
commit	b97bc3966e852adb626c90be64fd48282800f504 (patch)
tree	178656d15821205889fa03ec603c7327facbb265 /llama.h
parent	b8109bc0139f15a5b321909f47510b89dca47ffc (diff)