summaryrefslogtreecommitdiff
path: root/common/common.cpp
diff options
context:
space:
mode:
author: Iwan Kawrakow <iwan.kawrakow@gmail.com> 2024-06-26 17:38:18 +0300
committer: Iwan Kawrakow <iwan.kawrakow@gmail.com> 2024-06-26 17:38:18 +0300
commit: 0a3a2c4cd47943dc4c3c43be75728402584a3732 (patch)
tree: 9e3b58646f002f023de8991dc8b30f2d0251796a /common/common.cpp
parent: 71725a918f9edee559a978397779486dce7c703a (diff)
imatrix: be able to specify the name of the output tensor
For some models the same tensor is used for token embeddings and output. This tensor tends to be named token_embedding.weight rather than output.weight, which prevents us from collecting imatrix data for this tensor. With this commit we can pass the name of the output tensor to the imatrix tool via the --output-tensor-name argument.
Diffstat (limited to 'common/common.cpp')
-rw-r--r--common/common.cpp8
1 files changed, 8 insertions, 0 deletions
diff --git a/common/common.cpp b/common/common.cpp
index 64f160af..8eb23ade 100644
--- a/common/common.cpp
+++ b/common/common.cpp
@@ -1599,6 +1599,14 @@ bool gpt_params_find_arg(int argc, char ** argv, const std::string & arg, gpt_pa
params.process_output = true;
return true;
}
+ if (arg == "--output-tensor-name") {
+ if (++i >= argc) {
+ invalid_param = true;
+ return true;
+ }
+ params.output_tensor_name = argv[i];
+ return true;
+ }
if (arg == "--no-ppl") {
params.compute_ppl = false;
return true;