minimind/trainer
2025-11-15 18:25:37 +08:00
..
train_distill_reason.py [feat] clear cache 2025-11-06 13:12:28 +08:00
train_distillation.py [feat] clear cache 2025-11-06 13:12:28 +08:00
train_dpo.py [feat] clear cache 2025-11-06 13:12:28 +08:00
train_full_sft.py [feat] clear cache 2025-11-06 13:12:28 +08:00
train_grpo.py [feat] clear cache 2025-11-06 13:12:28 +08:00
train_lora.py [feat] clear cache 2025-11-06 13:12:28 +08:00
train_ppo.py [fix] prompt length calculate 2025-11-15 18:25:37 +08:00
train_pretrain.py [feat] clear cache 2025-11-06 13:12:28 +08:00
train_spo.py [feat] clear cache 2025-11-06 13:12:28 +08:00
trainer_utils.py [feat] update import 2025-10-31 23:45:55 +08:00