diff options
| | | |
|---|---|---|
| author | manikbhandari <mbbhandarimanik2@gmail.com> | 2023-12-28 09:03:57 -0500 |
| committer | GitHub <noreply@github.com> | 2023-12-28 15:03:57 +0100 |
| commit | ea5497df5d138c83b2b0ca70aefdc4b1175c1001 (patch) | |
| tree | c66c6a7c29c8a60c5758ef534aec46bd792175a9 /gguf-py/gguf/constants.py | |
| parent | f6793491b5af6da75edad34d6f503ef86d31b09f (diff) | |
gpt2 : Add gpt2 architecture integration (#4555)
Diffstat (limited to 'gguf-py/gguf/constants.py')
-rw-r--r-- | gguf-py/gguf/constants.py | 11 |
1 file changed, 10 insertions, 1 deletion
```diff
diff --git a/gguf-py/gguf/constants.py b/gguf-py/gguf/constants.py
index c9be2111..ae62cc57 100644
--- a/gguf-py/gguf/constants.py
+++ b/gguf-py/gguf/constants.py
@@ -370,7 +370,16 @@ MODEL_TENSORS: dict[MODEL_ARCH, list[MODEL_TENSOR]] = {
         MODEL_TENSOR.FFN_UP,
     ],
     MODEL_ARCH.GPT2: [
-        # TODO
+        MODEL_TENSOR.TOKEN_EMBD,
+        MODEL_TENSOR.POS_EMBD,
+        MODEL_TENSOR.OUTPUT_NORM,
+        MODEL_TENSOR.OUTPUT,
+        MODEL_TENSOR.ATTN_NORM,
+        MODEL_TENSOR.ATTN_QKV,
+        MODEL_TENSOR.ATTN_OUT,
+        MODEL_TENSOR.FFN_NORM,
+        MODEL_TENSOR.FFN_DOWN,
+        MODEL_TENSOR.FFN_UP,
     ],
     MODEL_ARCH.PHI2: [
         MODEL_TENSOR.TOKEN_EMBD,
```