From e53d44c0bbd1bc993ee5929653ad765f2347ce0f Mon Sep 17 00:00:00 2001 From: teleprint-me <77757836+teleprint-me@users.noreply.github.com> Date: Wed, 20 Dec 2023 15:15:35 -0500 Subject: [PATCH] Consolidate PHI and PHI2 architectures in gguf constants Signed-off-by: teleprint-me <77757836+teleprint-me@users.noreply.github.com> --- gguf-py/gguf/constants.py | 8 ++------ 1 file changed, 2 insertions(+), 6 deletions(-) diff --git a/gguf-py/gguf/constants.py b/gguf-py/gguf/constants.py index 46cc6a143..d99616d30 100644 --- a/gguf-py/gguf/constants.py +++ b/gguf-py/gguf/constants.py @@ -95,7 +95,6 @@ class MODEL_ARCH(IntEnum): BLOOM = auto() STABLELM = auto() QWEN = auto() - PHI2 = auto() PHI = auto() @@ -142,7 +141,7 @@ MODEL_ARCH_NAMES: dict[MODEL_ARCH, str] = { MODEL_ARCH.BLOOM: "bloom", MODEL_ARCH.STABLELM: "stablelm", MODEL_ARCH.QWEN: "qwen", - MODEL_ARCH.PHI2: "phi2", + MODEL_ARCH.PHI: "phi", } TENSOR_NAMES: dict[MODEL_TENSOR, str] = { @@ -353,7 +352,7 @@ MODEL_TENSORS: dict[MODEL_ARCH, list[MODEL_TENSOR]] = { MODEL_ARCH.GPT2: [ # TODO ], - MODEL_ARCH.PHI2: [ + MODEL_ARCH.PHI: [ MODEL_TENSOR.TOKEN_EMBD, MODEL_TENSOR.OUTPUT_NORM, MODEL_TENSOR.OUTPUT, @@ -364,9 +363,6 @@ MODEL_TENSORS: dict[MODEL_ARCH, list[MODEL_TENSOR]] = { MODEL_TENSOR.FFN_DOWN, MODEL_TENSOR.FFN_UP, ] - MODEL_ARCH.PHI: [ - # TODO - ], # TODO }