|
1-wiki.png
|
update images
|
2024-09-13 10:23:36 +08:00 |
|
2-wiki.png
|
update images
|
2024-09-13 10:23:36 +08:00 |
|
3-wiki.png
|
update images
|
2024-09-13 10:23:36 +08:00 |
|
4-wiki.png
|
update images
|
2024-09-13 10:23:36 +08:00 |
|
5-wiki.png
|
update images
|
2024-09-13 10:23:36 +08:00 |
|
and_huggingface.png
|
update readme
|
2025-02-10 13:30:55 +08:00 |
|
and_modelscope.png
|
update readme
|
2025-02-10 13:30:55 +08:00 |
|
compare_radar.png
|
[fix] model-name
|
2025-11-07 19:38:20 +08:00 |
|
dataset.jpg
|
add minimind2
|
2025-02-09 23:49:47 +08:00 |
|
gpt3_config.png
|
MiniMind first open source
|
2024-08-28 16:41:44 +08:00 |
|
LLM-structure-moe.png
|
update structure figure
|
2025-02-18 23:24:51 +08:00 |
|
LLM-structure.png
|
update structure image
|
2025-04-01 16:15:26 +08:00 |
|
logo2.png
|
update readme
|
2025-02-10 11:14:52 +08:00 |
|
logo.png
|
update readme
|
2025-02-10 22:22:35 +08:00 |
|
minimind2.gif
|
update images
|
2025-02-19 22:54:57 +08:00 |
|
pre_512_loss.png
|
add minimind2
|
2025-02-09 23:49:47 +08:00 |
|
pre_768_loss.png
|
add minimind2
|
2025-02-09 23:49:47 +08:00 |
|
rope_ppl.png
|
[feat] update yarn
|
2025-12-01 16:15:05 +08:00 |
|
sft_512_loss.png
|
add minimind2
|
2025-02-09 23:49:47 +08:00 |
|
sft_768_loss.png
|
add minimind2
|
2025-02-09 23:49:47 +08:00 |
|
train_grpo_512.png
|
[feat] minimind-2510
|
2025-10-21 21:19:47 +08:00 |
|
train_grpo_768.png
|
[feat] minimind-2510
|
2025-10-21 21:19:47 +08:00 |
|
train_ppo_512.png
|
[feat] minimind-2510
|
2025-10-21 21:19:47 +08:00 |
|
train_ppo_768.png
|
[feat] minimind-2510
|
2025-10-21 21:19:47 +08:00 |
|
train_spo_768.png
|
[feat] minimind-2510
|
2025-10-21 21:19:47 +08:00 |