We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ee9f077 commit 3b0e720 — Copy full SHA for 3b0e720
mergekit/architecture/__init__.py
@@ -41,12 +41,14 @@ def arch_info_for_config(config: PretrainedConfig) -> Optional[ModelArchitecture
41
return ModelArchitecture(
42
modules={"default": ModuleDefinition(architecture=module)},
43
architectures=[arch_name],
44
+ model_type="mixtral",
45
)
46
elif arch_name == Qwen3MoeModuleArchitecture.ARCHITECTURE_NAME:
47
module = Qwen3MoeModuleArchitecture.from_config(config)
48
49
50
51
+ model_type="qwen3_moe",
52
53
elif arch_name in NAME_TO_ARCH:
54
candidates = list(NAME_TO_ARCH[arch_name])
0 commit comments