[update] default model

2026-04-23 15:58:15 +08:00 · 2026-03-31 13:40:16 +08:00 · 2026-03-31 13:40:16 +08:00 · b7e0ae21d6
commit b7e0ae21d6
parent b1865f75c2
1 changed file with 2 additions and 2 deletions
--- a/scripts/convert_model.py
+++ b/scripts/convert_model.py
@@ -126,10 +126,10 @@ def convert_json_to_jinja(json_file_path, output_path):


 if __name__ == '__main__':
-    lm_config = MiniMindConfig(hidden_size=768, num_hidden_layers=8, max_seq_len=8192, use_moe=True)
+    lm_config = MiniMindConfig(hidden_size=768, num_hidden_layers=8, max_seq_len=8192, use_moe=False)
    # convert torch to transformers
    torch_path = f"../out/full_sft_{lm_config.hidden_size}{'_moe' if lm_config.use_moe else ''}.pth"
-    transformers_path = '../minimind-3-moe'
+    transformers_path = '../minimind-3'
    convert_torch2transformers(torch_path, transformers_path)

    # # merge lora