jingyaogong
|
d8ac558ce2
|
[feat] update readme
|
2025-10-30 23:30:12 +08:00 |
|
jingyaogong
|
e4807a5214
|
[feat] update readme
|
2025-10-30 23:27:15 +08:00 |
|
jingyaogong
|
de23e1ea39
|
[feat] update datasets
|
2025-10-30 11:08:13 +08:00 |
|
jingyaogong
|
08ce3da228
|
[feat] update args
|
2025-10-30 10:48:31 +08:00 |
|
jingyaogong
|
bf123b585d
|
[feat] add args
|
2025-10-30 10:05:12 +08:00 |
|
jingyaogong
|
800fed4639
|
[feat] update readme
|
2025-10-29 12:13:25 +08:00 |
|
jingyaogong
|
1713c24114
|
[fix] model device
|
2025-10-29 10:36:28 +08:00 |
|
jingyaogong
|
acd5925193
|
[feat] update trainer
|
2025-10-29 00:52:37 +08:00 |
|
jingyaogong
|
8f7e07b8ef
|
[feat] update trainer
|
2025-10-28 23:30:10 +08:00 |
|
jingyaogong
|
eb96113cd4
|
[feat] update readme
|
2025-10-27 16:31:40 +08:00 |
|
jingyaogong
|
cc81925ecc
|
[feat] update readme
|
2025-10-26 18:52:50 +08:00 |
|
jingyaogong
|
35bed8936d
|
[feat] update eval-llm
|
2025-10-26 18:52:01 +08:00 |
|
jingyaogong
|
e8484874f5
|
[feat] pause-training
|
2025-10-26 18:49:52 +08:00 |
|
jingyaogong
|
6efba3249a
|
[feat] update readme
|
2025-10-24 01:18:33 +08:00 |
|
jingyaogong
|
ea2abb5fb3
|
[feat] update readme
|
2025-10-24 00:45:11 +08:00 |
|
jingyaogong
|
c4e9789d7e
|
[feat] update requirements
|
2025-10-23 23:54:55 +08:00 |
|
jingyaogong
|
4276f8a72f
|
[feat] update requirements
|
2025-10-23 23:50:21 +08:00 |
|
jingyaogong
|
d762926f48
|
[feat] update readme
|
2025-10-23 23:23:52 +08:00 |
|
jingyaogong
|
09be7dba11
|
[feat] update readme
|
2025-10-23 20:23:46 +08:00 |
|
jingyaogong
|
fa6df82ff8
|
[feat] repetition-penalty
|
2025-10-23 20:23:25 +08:00 |
|
jingyaogong
|
28cc44579a
|
[feat] convert2llama
|
2025-10-23 20:22:42 +08:00 |
|
jingyaogong
|
a82526da11
|
[feat] shuffle data
|
2025-10-23 20:13:28 +08:00 |
|
jingyaogong
|
805744e60a
|
[fix] loss-issues-430
|
2025-10-23 19:08:42 +08:00 |
|
jingyaogong
|
4014e62cdf
|
[fix] restore
|
2025-10-23 19:00:06 +08:00 |
|
jingyaogong
|
557bcc018d
|
[fix] issue-431
|
2025-10-23 18:56:30 +08:00 |
|
jingyaogong
|
463044e92a
|
[fix] sampler-ddp
|
2025-10-23 15:03:19 +08:00 |
|
jingyaogong
|
fa7dff8291
|
[fix] graph-oom & ddp-pos_cis
|
2025-10-23 14:22:13 +08:00 |
|
jingyaogong
|
ce693f8e7f
|
[fix] git track
|
2025-10-21 23:09:00 +08:00 |
|
jingyaogong
|
d8bf813eac
|
[feat] update readme
|
2025-10-21 23:02:16 +08:00 |
|
jingyaogong
|
7d877db79b
|
[feat] minimind-2510
|
2025-10-21 21:19:47 +08:00 |
|
jingyaogong
|
3812a16d20
|
[feat] update eval
|
2025-10-18 00:24:36 +08:00 |
|
jingyaogong
|
0682134e21
|
[feat] update requirements
|
2025-10-17 00:14:37 +08:00 |
|
jingyaogong
|
b8adffbe89
|
[fix] update model
|
2025-10-17 00:11:08 +08:00 |
|
jingyaogong
|
4e35fb9da8
|
[fix] update model
|
2025-10-17 00:09:32 +08:00 |
|
jingyaogong
|
36159fb2ab
|
update app
|
2025-10-16 23:33:35 +08:00 |
|
jingyaogong
|
561979c7e3
|
update torch version
|
2025-04-30 16:47:26 +08:00 |
|
jingyaogong
|
caae54a89e
|
fix bugs
|
2025-04-29 20:45:39 +08:00 |
|
jingyaogong
|
5ffde04b7c
|
update lora
|
2025-04-27 15:45:06 +08:00 |
|
jingyaogong
|
2e118e9d3d
|
update convert script
|
2025-04-27 15:44:40 +08:00 |
|
jingyaogong
|
29454c31af
|
fix bugs
|
2025-04-27 09:56:49 +08:00 |
|
jingyaogong
|
765c79c7a2
|
update readme
|
2025-04-26 10:37:46 +08:00 |
|
jingyaogong
|
00d145c481
|
update readme
|
2025-04-26 10:21:34 +08:00 |
|
jingyaogong
|
274483cb1b
|
250426
|
2025-04-26 10:07:55 +08:00 |
|
jingyaogong
|
a62faf34bd
|
250426
|
2025-04-26 10:05:47 +08:00 |
|
jingyaogong
|
7da201a944
|
update chat-openai-api
|
2025-04-18 12:43:57 +08:00 |
|
jingyaogong
|
d9453ed9a3
|
update moe note
|
2025-04-09 17:38:31 +08:00 |
|
jingyaogong
|
d503093ec4
|
update eval
|
2025-04-09 16:56:57 +08:00 |
|
jingyaogong
|
4a758564e4
|
fix top_p float bug
|
2025-04-09 16:52:20 +08:00 |
|
jingyaogong
|
4a7c1c49e8
|
update rlaif
|
2025-04-05 16:06:08 +08:00 |
|
jingyaogong
|
9e67798397
|
update generate
|
2025-04-05 15:53:55 +08:00 |
|