author    Georgi Gerganov <ggerganov@gmail.com>  2023-07-18 14:24:43 +0300
committer GitHub <noreply@github.com>            2023-07-18 14:24:43 +0300
commit    d01bccde9f759b24449fdaa16306b406a50eb367 (patch)
tree      a1c351c6732f399f540a1e91f957eb61db535bbc /examples/perplexity/perplexity.cpp
parent    6cbf9dfb32f0e23ed3afd02d30ab066ed53e2c4d (diff)
ci : integrate with ggml-org/ci (#2250)
* ci : run ctest ggml-ci
* ci : add open llama 3B-v2 tests ggml-ci
* ci : disable wget progress output ggml-ci
* ci : add open llama 3B-v2 tg tests for q4 and q5 quantizations ggml-ci
* tests : try to fix tail free sampling test ggml-ci
* ci : add K-quants ggml-ci
* ci : add short perplexity tests ggml-ci
* ci : add README.md
* ppl : add --chunks argument to limit max number of chunks ggml-ci
* ci : update README
Diffstat (limited to 'examples/perplexity/perplexity.cpp')
-rw-r--r--   examples/perplexity/perplexity.cpp   6
1 file changed, 4 insertions, 2 deletions
diff --git a/examples/perplexity/perplexity.cpp b/examples/perplexity/perplexity.cpp
index 7e120ff1..bfad9993 100644
--- a/examples/perplexity/perplexity.cpp
+++ b/examples/perplexity/perplexity.cpp
@@ -32,13 +32,15 @@ void perplexity(llama_context * ctx, const gpt_params & params) {
     // BOS tokens will be added for each chunk before eval
     auto tokens = ::llama_tokenize(ctx, params.prompt, true);
-    int count = 0;
+    const int n_chunk_max = tokens.size() / params.n_ctx;
-    const int n_chunk = tokens.size() / params.n_ctx;
+    const int n_chunk = params.n_chunks < 0 ? n_chunk_max : std::min(params.n_chunks, n_chunk_max);
     const int n_vocab = llama_n_vocab(ctx);
     const int n_batch = params.n_batch;
+    int count = 0;
     double nll = 0.0;
+
     fprintf(stderr, "%s: calculating perplexity over %d chunks, batch_size=%d\n", __func__, n_chunk, n_batch);
     for (int i = 0; i < n_chunk; ++i) {
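
For context, the change above caps the number of evaluated chunks when the new --chunks argument is supplied (a negative value keeps the previous behavior of evaluating every full chunk of the prompt). Below is a minimal standalone sketch of that clamping logic; the concrete numbers (context size, prompt length, and the --chunks value) are stand-ins for illustration, not values taken from the commit.

#include <algorithm>
#include <cstdio>

int main() {
    // Stand-in values (assumptions): in the real code these come from
    // gpt_params and the tokenized prompt.
    const int n_ctx      = 512;   // tokens per chunk
    const int n_tokens   = 4096;  // length of the tokenized prompt
    const int n_chunks_arg = 3;   // value passed via --chunks; < 0 means "no limit"

    // Maximum number of full chunks the prompt can provide.
    const int n_chunk_max = n_tokens / n_ctx;

    // Clamp to the user-requested limit, mirroring the ternary in the diff.
    const int n_chunk = n_chunks_arg < 0 ? n_chunk_max
                                         : std::min(n_chunks_arg, n_chunk_max);

    printf("evaluating %d of %d possible chunks\n", n_chunk, n_chunk_max);
    return 0;
}

With the stand-in numbers this prints "evaluating 3 of 8 possible chunks"; passing a negative --chunks value would leave all 8 chunks in play, which is why the short CI perplexity tests mentioned in the commit message can run on just a few chunks.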