diff options
author | Georgi Gerganov <ggerganov@gmail.com> | 2023-07-22 21:17:57 +0300 |
---|---|---|
committer | GitHub <noreply@github.com> | 2023-07-22 21:17:57 +0300 |
commit | b47b8a9cfeb439d271bf997fb985fd6d82b3af5e (patch) | |
tree | e5e2c0b5fc8839d2497e14b4c073964bc541707e /examples/common.cpp | |
parent | b5fe67f8c69113bd9354bc1adcfe2df6be323740 (diff) |
llama : optimize memory buffers (#2325)
Diffstat (limited to 'examples/common.cpp')
-rw-r--r-- | examples/common.cpp | 24 |
1 file changed, 12 insertions, 12 deletions
diff --git a/examples/common.cpp b/examples/common.cpp index 730b28bd..2dc6654d 100644 --- a/examples/common.cpp +++ b/examples/common.cpp @@ -578,18 +578,18 @@ std::vector<llama_token> llama_tokenize(struct llama_context * ctx, const std::s struct llama_context_params llama_context_params_from_gpt_params(const gpt_params & params) { auto lparams = llama_context_default_params(); - lparams.n_ctx = params.n_ctx; - lparams.n_batch = params.n_batch; - lparams.n_gpu_layers = params.n_gpu_layers; - lparams.main_gpu = params.main_gpu; - lparams.tensor_split = params.tensor_split; - lparams.low_vram = params.low_vram; - lparams.seed = params.seed; - lparams.f16_kv = params.memory_f16; - lparams.use_mmap = params.use_mmap; - lparams.use_mlock = params.use_mlock; - lparams.logits_all = params.perplexity; - lparams.embedding = params.embedding; + lparams.n_ctx = params.n_ctx; + lparams.n_batch = params.n_batch; + lparams.n_gpu_layers = params.n_gpu_layers; + lparams.main_gpu = params.main_gpu; + lparams.tensor_split = params.tensor_split; + lparams.low_vram = params.low_vram; + lparams.seed = params.seed; + lparams.f16_kv = params.memory_f16; + lparams.use_mmap = params.use_mmap; + lparams.use_mlock = params.use_mlock; + lparams.logits_all = params.perplexity; + lparams.embedding = params.embedding; lparams.rope_freq_base = params.rope_freq_base; lparams.rope_freq_scale = params.rope_freq_scale; |