summary | refs | log | tree | commit | diff
path: root/utils.h
diff options
context:
space:
mode:
author: anzz1 <anzz1@live.com> 2023-03-21 17:42:43 +0200
committer: GitHub <noreply@github.com> 2023-03-21 17:42:43 +0200
commit: 975d2cebf97ce888fa0aeee6f5ac774d7135891f (patch)
tree: e578d57ca7ccef7851e1f02dfe15887ff829aec4 /utils.h
parent: e0ffc861fae5ac8b40ce973f822d03db02929d36 (diff)
cmdline option for custom amount of model parts (--n_parts N) (#348)
* cmdline option for custom amount of model parts (--n_parts N)
* Update main.cpp

---------

Co-authored-by: Georgi Gerganov <ggerganov@gmail.com>
Diffstat (limited to 'utils.h')
-rw-r--r-- utils.h 3
1 files changed, 2 insertions, 1 deletions
diff --git a/utils.h b/utils.h
index 4aa7c63b..c7fce964 100644
--- a/utils.h
+++ b/utils.h
@@ -13,10 +13,11 @@
//
struct gpt_params {
- int32_t seed = -1; // RNG seed
+ int32_t seed = -1; // RNG seed
int32_t n_threads = std::min(4, (int32_t) std::thread::hardware_concurrency());
int32_t n_predict = 128; // new tokens to predict
int32_t repeat_last_n = 64; // last n tokens to penalize
+ int32_t n_parts = -1; // amount of model parts (-1 = determine from model dimensions)
int32_t n_ctx = 512; //context size
// sampling parameters