Skip to content

Commit 0d4c4a7

Browse files
authored
Support BailingMoE
1 parent b1b9222 commit 0d4c4a7

File tree

2 files changed, with 28 additions and 0 deletions.

gguf-py/gguf/constants.py

Lines changed: 27 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -287,6 +287,7 @@ class MODEL_ARCH(IntEnum):
287 287
CHAMELEON = auto()
288 288
WAVTOKENIZER_DEC = auto()
289 289
PLM = auto()
290+
BAILINGMOE = auto()
290 291

291 292

292 293
class MODEL_TENSOR(IntEnum):
@@ -490,6 +491,7 @@ class MODEL_TENSOR(IntEnum):
490 491
MODEL_ARCH.CHAMELEON: "chameleon",
491 492
MODEL_ARCH.WAVTOKENIZER_DEC: "wavtokenizer-dec",
492 493
MODEL_ARCH.PLM: "plm",
494+
MODEL_ARCH.BAILINGMOE: "bailingmoe",
493 495
}
494 496

495 497
TENSOR_NAMES: dict[MODEL_TENSOR, str] = {
@@ -1667,6 +1669,28 @@ class MODEL_TENSOR(IntEnum):
1667 1669
MODEL_TENSOR.POSNET_ATTN_V,
1668 1670
MODEL_TENSOR.POSNET_ATTN_OUT,
1669 1671
],
1672+
MODEL_ARCH.BAILINGMOE: [
1673+
MODEL_TENSOR.TOKEN_EMBD,
1674+
MODEL_TENSOR.OUTPUT_NORM,
1675+
MODEL_TENSOR.OUTPUT,
1676+
MODEL_TENSOR.ROPE_FREQS,
1677+
MODEL_TENSOR.ATTN_NORM,
1678+
MODEL_TENSOR.ATTN_Q,
1679+
MODEL_TENSOR.ATTN_K,
1680+
MODEL_TENSOR.ATTN_V,
1681+
MODEL_TENSOR.ATTN_OUT,
1682+
MODEL_TENSOR.FFN_GATE_INP,
1683+
MODEL_TENSOR.FFN_NORM,
1684+
MODEL_TENSOR.FFN_GATE,
1685+
MODEL_TENSOR.FFN_DOWN,
1686+
MODEL_TENSOR.FFN_UP,
1687+
MODEL_TENSOR.FFN_GATE_EXP,
1688+
MODEL_TENSOR.FFN_DOWN_EXP,
1689+
MODEL_TENSOR.FFN_UP_EXP,
1690+
MODEL_TENSOR.FFN_GATE_SHEXP,
1691+
MODEL_TENSOR.FFN_DOWN_SHEXP,
1692+
MODEL_TENSOR.FFN_UP_SHEXP,
1693+
],
1670 1694
# TODO
1671 1695
}
1672 1696

@@ -1719,6 +1743,9 @@ class MODEL_TENSOR(IntEnum):
1719 1743
MODEL_TENSOR.ROPE_FREQS,
1720 1744
MODEL_TENSOR.ATTN_ROT_EMBD,
1721 1745
],
1746+
MODEL_ARCH.BAILINGMOE: [
1747+
MODEL_TENSOR.ROPE_FREQS,
1748+
],
1722 1749
}
1723 1750

1724 1751
#

gguf-py/gguf/tensor_mapping.py

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -29,6 +29,7 @@ class TensorNameMap:
29 29
"shared", # t5
30 30
"rwkv.embeddings", # rwkv6
31 31
"model.embeddings", # rwkv7
32+
"model.word_embeddings", # bailingmoe
32 33
),
33 34

34 35
# Token type embeddings

0 commit comments

Comments
 (0)