minimind/trainer
2026-04-09 16:36:48 +08:00
..
rollout_engine.py [update] minimind-3 2026-03-25 23:57:45 +08:00
train_agent.py [update] minimind-3 2026-03-25 23:57:45 +08:00
train_distillation.py [update] minimind-3 2026-03-25 23:57:45 +08:00
train_dpo.py [update] minimind-3 2026-03-25 23:57:45 +08:00
train_full_sft.py [update] change default seq_len 2026-03-26 10:09:06 +08:00
train_grpo.py [update] minimind-3 2026-03-25 23:57:45 +08:00
train_lora.py [fix] lora moe 2026-04-09 16:36:48 +08:00
train_ppo.py [update] minimind-3 2026-03-25 23:57:45 +08:00
train_pretrain.py [update] minimind-3 2026-03-25 23:57:45 +08:00
train_tokenizer.py [update] minimind-3 2026-03-25 23:57:45 +08:00
trainer_utils.py [update] minimind-3 2026-03-25 23:57:45 +08:00