diff options
author | Daniel Bevenius <daniel.bevenius@gmail.com> | 2024-01-16 18:54:24 +0100 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-01-16 19:54:24 +0200 |
commit | cec8a4847062fbd76253e3b085683f39d91e80d3 (patch) | |
tree | 9effcb2bbe2dbe449cdaa38dff8647a705035b4f | |
parent | 334a835a1ccc8106a5fa355683a965efb1bfa24b (diff) |
finetune : add training data file to log message (#4979)
This commit adds the name of the training data file to the log message
printed when the training data is tokenized.
The motivation for this change is that it can be useful to show which
file is being tokenized when running the finetune example.
Signed-off-by: Daniel Bevenius <daniel.bevenius@gmail.com>
-rw-r--r-- | examples/finetune/finetune.cpp | 2 |
1 file changed, 1 insertion, 1 deletion
diff --git a/examples/finetune/finetune.cpp b/examples/finetune/finetune.cpp
index a6620fd7..11fcbf44 100644
--- a/examples/finetune/finetune.cpp
+++ b/examples/finetune/finetune.cpp
@@ -1799,7 +1799,7 @@ int main(int argc, char ** argv) {
     std::vector<llama_token> train_tokens;
     std::vector<size_t> train_samples_begin;
     std::vector<size_t> train_samples_size;
-    printf("%s: tokenize training data\n", __func__);
+    printf("%s: tokenize training data from %s\n", __func__, params.common.fn_train_data);
     tokenize_file(lctx,
             params.common.fn_train_data,
             params.common.sample_start,