mirror of
https://github.com/hiyouga/LlamaFactory.git
synced 2026-03-24 19:17:45 +08:00
[model] support Qwen3.5 liger kernel (#10313)
This commit is contained in:
@@ -79,6 +79,8 @@ def apply_liger_kernel(
|
|||||||
from liger_kernel.transformers import apply_liger_kernel_to_qwen3_moe as apply_liger_kernel
|
from liger_kernel.transformers import apply_liger_kernel_to_qwen3_moe as apply_liger_kernel
|
||||||
elif model_type == "qwen3_next":
|
elif model_type == "qwen3_next":
|
||||||
from liger_kernel.transformers import apply_liger_kernel_to_qwen3_next as apply_liger_kernel
|
from liger_kernel.transformers import apply_liger_kernel_to_qwen3_next as apply_liger_kernel
|
||||||
|
elif model_type == "qwen3_5":
|
||||||
|
from liger_kernel.transformers import apply_liger_kernel_to_qwen3_5 as apply_liger_kernel
|
||||||
elif model_type == "gpt_oss":
|
elif model_type == "gpt_oss":
|
||||||
try:
|
try:
|
||||||
from liger_kernel.transformers import apply_liger_kernel_to_gpt_oss as apply_liger_kernel
|
from liger_kernel.transformers import apply_liger_kernel_to_gpt_oss as apply_liger_kernel
|
||||||
|
|||||||
Reference in New Issue
Block a user