jingyaogong
|
cc81925ecc
|
[feat] update readme
|
2025-10-26 18:52:50 +08:00 |
|
jingyaogong
|
35bed8936d
|
[feat] update eval-llm
|
2025-10-26 18:52:01 +08:00 |
|
jingyaogong
|
e8484874f5
|
[feat] pause-training
|
2025-10-26 18:49:52 +08:00 |
|
jingyaogong
|
6efba3249a
|
[feat] update readme
|
2025-10-24 01:18:33 +08:00 |
|
jingyaogong
|
ea2abb5fb3
|
[feat] update readme
|
2025-10-24 00:45:11 +08:00 |
|
jingyaogong
|
c4e9789d7e
|
[feat] update requirements
|
2025-10-23 23:54:55 +08:00 |
|
jingyaogong
|
4276f8a72f
|
[feat] update requirements
|
2025-10-23 23:50:21 +08:00 |
|
jingyaogong
|
d762926f48
|
[feat] update readme
|
2025-10-23 23:23:52 +08:00 |
|
jingyaogong
|
09be7dba11
|
[feat] update readme
|
2025-10-23 20:23:46 +08:00 |
|
jingyaogong
|
fa6df82ff8
|
[feat] repetition-penalty
|
2025-10-23 20:23:25 +08:00 |
|
jingyaogong
|
28cc44579a
|
[feat] convert2llama
|
2025-10-23 20:22:42 +08:00 |
|
jingyaogong
|
a82526da11
|
[feat] shuffle data
|
2025-10-23 20:13:28 +08:00 |
|
jingyaogong
|
805744e60a
|
[fix] loss-issues-430
|
2025-10-23 19:08:42 +08:00 |
|
jingyaogong
|
4014e62cdf
|
[fix] restore
|
2025-10-23 19:00:06 +08:00 |
|
jingyaogong
|
557bcc018d
|
[fix] issue-431
|
2025-10-23 18:56:30 +08:00 |
|
jingyaogong
|
463044e92a
|
[fix] sampler-ddp
|
2025-10-23 15:03:19 +08:00 |
|
jingyaogong
|
fa7dff8291
|
[fix] graph-oom & ddp-pos_cis
|
2025-10-23 14:22:13 +08:00 |
|
jingyaogong
|
ce693f8e7f
|
[fix] git track
|
2025-10-21 23:09:00 +08:00 |
|
jingyaogong
|
d8bf813eac
|
[feat] update readme
|
2025-10-21 23:02:16 +08:00 |
|
jingyaogong
|
7d877db79b
|
[feat] minimind-2510
|
2025-10-21 21:19:47 +08:00 |
|
jingyaogong
|
3812a16d20
|
[feat] update eval
|
2025-10-18 00:24:36 +08:00 |
|
jingyaogong
|
0682134e21
|
[feat] update requirements
|
2025-10-17 00:14:37 +08:00 |
|
jingyaogong
|
b8adffbe89
|
[fix] update model
|
2025-10-17 00:11:08 +08:00 |
|
jingyaogong
|
4e35fb9da8
|
[fix] update model
|
2025-10-17 00:09:32 +08:00 |
|
jingyaogong
|
36159fb2ab
|
update app
|
2025-10-16 23:33:35 +08:00 |
|
jingyaogong
|
561979c7e3
|
update torch version
|
2025-04-30 16:47:26 +08:00 |
|
jingyaogong
|
caae54a89e
|
fix bugs
|
2025-04-29 20:45:39 +08:00 |
|
jingyaogong
|
5ffde04b7c
|
update lora
|
2025-04-27 15:45:06 +08:00 |
|
jingyaogong
|
2e118e9d3d
|
update convert script
|
2025-04-27 15:44:40 +08:00 |
|
jingyaogong
|
29454c31af
|
fix bugs
|
2025-04-27 09:56:49 +08:00 |
|
jingyaogong
|
765c79c7a2
|
update readme
|
2025-04-26 10:37:46 +08:00 |
|
jingyaogong
|
00d145c481
|
update readme
|
2025-04-26 10:21:34 +08:00 |
|
jingyaogong
|
274483cb1b
|
250426
|
2025-04-26 10:07:55 +08:00 |
|
jingyaogong
|
a62faf34bd
|
250426
|
2025-04-26 10:05:47 +08:00 |
|
jingyaogong
|
7da201a944
|
update chat-openai-api
|
2025-04-18 12:43:57 +08:00 |
|
jingyaogong
|
d9453ed9a3
|
update moe note
|
2025-04-09 17:38:31 +08:00 |
|
jingyaogong
|
d503093ec4
|
update eval
|
2025-04-09 16:56:57 +08:00 |
|
jingyaogong
|
4a758564e4
|
fix top_p float bug
|
2025-04-09 16:52:20 +08:00 |
|
jingyaogong
|
4a7c1c49e8
|
update rlaif
|
2025-04-05 16:06:08 +08:00 |
|
jingyaogong
|
9e67798397
|
update generate
|
2025-04-05 15:53:55 +08:00 |
|
jingyaogong
|
399d526fbd
|
add hidden state
|
2025-04-05 14:39:56 +08:00 |
|
jingyaogong
|
885661f47d
|
update inference
|
2025-04-05 12:04:38 +08:00 |
|
jingyaogong
|
ed01c5d84a
|
update inference
|
2025-04-05 12:03:04 +08:00 |
|
jingyaogong
|
7fcc46b39a
|
update seed set
|
2025-04-04 11:39:41 +08:00 |
|
jingyaogong
|
08e9a22a25
|
update web_demo
|
2025-04-04 11:25:40 +08:00 |
|
jingyaogong
|
278ec760a1
|
update dpo_loss
|
2025-04-01 17:32:50 +08:00 |
|
jingyaogong
|
4f95e23a98
|
update structure image
|
2025-04-01 16:15:26 +08:00 |
|
jingyaogong
|
edc8d26189
|
update structure image
|
2025-04-01 16:11:54 +08:00 |
|
jingyaogong
|
bf81fd5f5e
|
rmsnorm float convert
|
2025-04-01 16:03:44 +08:00 |
|
jingyaogong
|
e369b33265
|
fix chat mask bug
|
2025-04-01 13:44:55 +08:00 |
|