Skip to content

Commit 30e85cb

Browse files
ngxson authored and danbev committed
use id for mmproj tensors
1 parent 84d22b1 commit 30e85cb

File tree

3 files changed

+10
-16
lines changed

3 files changed

+10
-16
lines changed

gguf-py/gguf/constants.py

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -438,8 +438,7 @@ class MODEL_TENSOR(IntEnum):
438438
POSNET_ATTN_V = auto()
439439
POSNET_ATTN_OUT = auto()
440440
# vision
441-
V_MMPROJ_A = auto()
442-
V_MMPROJ_B = auto()
441+
V_MMPROJ = auto()
443442
V_ENC_EMBD_CLS = auto()
444443
V_ENC_EMBD_PATCH = auto()
445444
V_ENC_EMBD_POS = auto()
@@ -643,8 +642,7 @@ class MODEL_TENSOR(IntEnum):
643642
MODEL_TENSOR.POSNET_ATTN_V: "posnet.{bid}.attn_v",
644643
MODEL_TENSOR.POSNET_ATTN_OUT: "posnet.{bid}.attn_output",
645644
# vision
646-
MODEL_TENSOR.V_MMPROJ_A: "v.mmproj_a",
647-
MODEL_TENSOR.V_MMPROJ_B: "v.mmproj_b",
645+
MODEL_TENSOR.V_MMPROJ: "v.mmproj_{bid}",
648646
MODEL_TENSOR.V_ENC_EMBD_CLS: "v.enc.embd.cls",
649647
MODEL_TENSOR.V_ENC_EMBD_PATCH: "v.enc.embd.patch",
650648
MODEL_TENSOR.V_ENC_EMBD_POS: "v.enc.embd.pos",
@@ -1600,8 +1598,7 @@ class MODEL_TENSOR(IntEnum):
16001598
MODEL_TENSOR.POSNET_ATTN_OUT,
16011599
],
16021600
MODEL_ARCH.LLAVA_VISION: [
1603-
MODEL_TENSOR.V_MMPROJ_A,
1604-
MODEL_TENSOR.V_MMPROJ_B,
1601+
MODEL_TENSOR.V_MMPROJ,
16051602
MODEL_TENSOR.V_ENC_EMBD_CLS,
16061603
MODEL_TENSOR.V_ENC_EMBD_PATCH,
16071604
MODEL_TENSOR.V_ENC_EMBD_POS,

gguf-py/gguf/tensor_mapping.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -726,12 +726,12 @@ class TensorNameMap:
726726
MODEL_TENSOR.CLS_OUT: (
727727
"classifier.out_proj", # roberta
728728

729-
MODEL_TENSOR.V_MMPROJ_A: (
730-
"multi_modal_projector.linear_1",
729+
MODEL_TENSOR.V_MMPROJ: (
730+
"multi_modal_projector.linear_{bid}",
731731
),
732732

733-
MODEL_TENSOR.V_MMPROJ_B: (
734-
"multi_modal_projector.linear_2",
733+
MODEL_TENSOR.V_MMPROJ: (
734+
"multi_modal_projector.linear_{bid}",
735735
),
736736

737737
MODEL_TENSOR.V_ENC_EMBD_CLS: (

src/llama-arch.h

Lines changed: 3 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -1420,8 +1420,7 @@ static const std::map<llm_arch, std::map<llm_tensor, std::string>> LLM_TENSOR_NA
14201420

14211421

14221422
enum vision_tensor {
1423-
VISION_TENSOR_MMPROJ_A,
1424-
VISION_TENSOR_MMPROJ_B,
1423+
VISION_TENSOR_MMPROJ,
14251424
VISION_TENSOR_ENC_EMBD_CLS,
14261425
VISION_TENSOR_ENC_EMBD_PATCH,
14271426
VISION_TENSOR_ENC_EMBD_POS,
@@ -1441,8 +1440,7 @@ static const std::map<vision_arch, std::map<vision_tensor, std::string>> VISION_
14411440
{
14421441
VISION_ARCH_LLAVA,
14431442
{
1444-
{ VISION_TENSOR_MMPROJ_A, "v.mmproj_a" },
1445-
{ VISION_TENSOR_MMPROJ_B, "v.mmproj_b" },
1443+
{ VISION_TENSOR_MMPROJ, "v.mmproj" },
14461444
{ VISION_TENSOR_ENC_EMBD_CLS, "v.enc.embd.cls" },
14471445
{ VISION_TENSOR_ENC_EMBD_PATCH, "v.enc.embd.patch" },
14481446
{ VISION_TENSOR_ENC_EMBD_POS, "v.enc.embd.pos" },
@@ -1472,8 +1470,7 @@ struct llm_tensor_info {
14721470
};
14731471

14741472
static const std::map<vision_tensor, llm_tensor_info> vision_tensor_info_mapping = {
1475-
{VISION_TENSOR_MMPROJ_A, {LLM_TENSOR_LAYER_INPUT, GGML_OP_GET_ROWS}},
1476-
{VISION_TENSOR_MMPROJ_B, {LLM_TENSOR_LAYER_INPUT, GGML_OP_GET_ROWS}},
1473+
{VISION_TENSOR_MMPROJ, {LLM_TENSOR_LAYER_INPUT, GGML_OP_GET_ROWS}},
14771474
{VISION_TENSOR_ENC_EMBD_CLS, {LLM_TENSOR_LAYER_INPUT, GGML_OP_GET_ROWS}},
14781475
{VISION_TENSOR_ENC_EMBD_PATCH, {LLM_TENSOR_LAYER_INPUT, GGML_OP_GET_ROWS}},
14791476
{VISION_TENSOR_ENC_EMBD_POS, {LLM_TENSOR_LAYER_INPUT, GGML_OP_GET_ROWS}},

0 commit comments

Comments (0)