diff options
author | Xuan Son Nguyen <thichthat@gmail.com> | 2024-05-04 18:56:22 +0200 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-05-04 18:56:22 +0200 |
commit | 842500144ee02c8b0a46d2cc43880f8d80998fa5 (patch) | |
tree | 2f80ab4903dc5b618e51fb92af968f601a4369d3 /examples/gguf-split/tests.sh | |
parent | cf768b7e71cbcc9886c753ae963c2b68893d02e4 (diff) |
gguf-split: add --no-tensor-first-split (#7072)
Diffstat (limited to 'examples/gguf-split/tests.sh')
-rwxr-xr-x | examples/gguf-split/tests.sh | 14 |
1 files changed, 7 insertions, 7 deletions
diff --git a/examples/gguf-split/tests.sh b/examples/gguf-split/tests.sh
index 57588204..7ca6fa7f 100755
--- a/examples/gguf-split/tests.sh
+++ b/examples/gguf-split/tests.sh
@@ -55,15 +55,15 @@ $MAIN --model $WORK_PATH/ggml-model-merge.gguf --random-prompt --n-predict 32
 echo PASS
 echo
 
-# 4. Split with no tensor in metadata
-#$SPLIT --split-max-tensors 32 --no-tensor-in-metadata $WORK_PATH/ggml-model-merge.gguf $WORK_PATH/ggml-model-split-32-tensors
-#echo PASS
-#echo
+# 4. Split with no tensors in the first split
+$SPLIT --split-max-tensors 32 --no-tensor-first-split $WORK_PATH/ggml-model-merge.gguf $WORK_PATH/ggml-model-split-32-tensors
+echo PASS
+echo
 
 # 4b. Test the sharded model is loading properly
-#$MAIN --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00006.gguf --random-prompt --n-predict 32
-#echo PASS
-#echo
+$MAIN --model $WORK_PATH/ggml-model-split-32-tensors-00001-of-00007.gguf --random-prompt --n-predict 32
+echo PASS
+echo
 
 # 5. Merge
 #$SPLIT --merge $WORK_PATH/ggml-model-split-32-tensors-00001-of-00006.gguf $WORK_PATH/ggml-model-merge-2.gguf