From 2e118e9d3d2ed37281f1bdc36563dc3eff63b3a3 Mon Sep 17 00:00:00 2001
From: jingyaogong
Date: Sun, 27 Apr 2025 15:44:40 +0800
Subject: [PATCH] update convert script

---
 scripts/convert_model.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/scripts/convert_model.py b/scripts/convert_model.py
index 685cf9e..a6e22f8 100644
--- a/scripts/convert_model.py
+++ b/scripts/convert_model.py
@@ -62,11 +62,11 @@ def convert_transformers2torch(transformers_path, torch_path):
 
 
 if __name__ == '__main__':
-    lm_config = MiniMindConfig(hidden_size=768, num_hidden_layers=16, max_seq_len=8192, use_moe=True)
+    lm_config = MiniMindConfig(hidden_size=768, num_hidden_layers=16, max_seq_len=8192, use_moe=False)
 
     torch_path = f"../out/full_sft_{lm_config.hidden_size}{'_moe' if lm_config.use_moe else ''}.pth"
 
-    transformers_path = '../MiniMind2-MoE'
+    transformers_path = '../MiniMind2'
 
     convert_torch2transformers_minimind(torch_path, transformers_path)
 