hiyouga
|
c0658711ca
|
fix tokenizer padding side in evaluate.py
Former-commit-id: bcb43ff8ba1946c1f7e7865c9d0fb47ba276935d
|
2023-10-21 00:30:04 +08:00 |
|
hiyouga
|
d602f06882
|
fix #1232
Former-commit-id: 49975755d47344e362145c52548fdda8783f2c0c
|
2023-10-20 23:28:52 +08:00 |
|
hiyouga
|
1cb9a38ac2
|
fix #1215
Former-commit-id: d91b43a8afbea4859357f2224e3d9b9d71160e6d
|
2023-10-19 16:19:21 +08:00 |
|
hiyouga
|
47a1f73d0f
|
fix #1218
Former-commit-id: b301f35bd4a3bf368159c8f5fb4e2736f922115b
|
2023-10-19 16:17:41 +08:00 |
|
hiyouga
|
142dd63b47
|
fix #1228
Former-commit-id: e4e0cae3f55da2f1b566c97dbfdd7fc5b7b728a4
|
2023-10-19 15:54:10 +08:00 |
|
hiyouga
|
b1bd8370c2
|
fix #1217
Former-commit-id: 065fc0a6f3f005bb87e1c5c126c8b6bb470ce700
|
2023-10-19 15:52:24 +08:00 |
|
hiyouga
|
215660c8da
|
rename webui
Former-commit-id: 26feaf80fff6177d9eb4e28ad18feb6d34d3ea27
|
2023-10-16 15:16:24 +08:00 |
|
hiyouga
|
0cafe67efe
|
fix #1197
Former-commit-id: 00100e23fcfef9587fda4cf01c62599d996e1176
|
2023-10-16 15:13:46 +08:00 |
|
hiyouga
|
d627ab4855
|
release v0.2.0
Former-commit-id: 7f941c1ab6c52915aa2675fa77cae5efc530fdd9
|
2023-10-15 20:49:43 +08:00 |
|
hiyouga
|
a6f800b741
|
fix config, #1191
Former-commit-id: 5dbc9b355e85b203cb43ff72589374f0e04be391
|
2023-10-15 18:28:45 +08:00 |
|
hiyouga
|
a003d1fa1e
|
disable tqdm in webui mode
Former-commit-id: 832be571bec2eefb79ea88f110b7827f5c1249e6
|
2023-10-15 16:18:25 +08:00 |
|
hiyouga
|
c2e84d4558
|
refactor export, fix #1190
Former-commit-id: 30e60e37023a7c4a2db033ffec0542efa3d5cdfb
|
2023-10-15 16:01:48 +08:00 |
|
hiyouga
|
68330eab2a
|
fix eval resuming in webui
Former-commit-id: b28b53cd06777f213ef7b925a914ff5fd357ade1
|
2023-10-15 15:45:38 +08:00 |
|
hiyouga
|
7070f3969d
|
tiny fix
Former-commit-id: 47b7b34357708a5354d542ddc239146c6417d718
|
2023-10-15 05:02:48 +08:00 |
|
hiyouga
|
e4727ab155
|
fix callback
Former-commit-id: 51208655a8c1d66551b7b644247321a3583debdc
|
2023-10-15 04:59:44 +08:00 |
|
hiyouga
|
31e3805fb8
|
implement webui resuming training
Former-commit-id: 2d41672ef52414c56c50c8b4fdc442797ba682e9
|
2023-10-15 04:52:19 +08:00 |
|
hiyouga
|
ef248dbe15
|
fix bugs in webui
Former-commit-id: 4befa74ea630d90e4d7a1f7d7c34d39257717ec1
|
2023-10-15 03:41:58 +08:00 |
|
hiyouga
|
6a61b4b638
|
refactor webui
Former-commit-id: 813ecd8e51949c21ab6fbaa51cc2b1a84ee07952
|
2023-10-15 03:06:21 +08:00 |
|
hiyouga
|
4b1473502f
|
fix loading dtype
Former-commit-id: d54a356128f7e335c12089702cf3de7f5b4baf16
|
2023-10-14 20:15:24 +08:00 |
|
hiyouga
|
bf211d818d
|
fix #1176 #1177
Former-commit-id: 5627a2b57c270a78095a32083e2dc7aa02162875
|
2023-10-14 20:00:17 +08:00 |
|
hiyouga
|
27dd87c890
|
fix #1184
Former-commit-id: 5b069a967823e659dbc70b0d50361b3ad248087e
|
2023-10-14 19:20:11 +08:00 |
|
hiyouga
|
8659084ab0
|
fix webui
Former-commit-id: a0fe43aac968d9f6ca4724b8d718b45c03063b91
|
2023-10-13 16:27:59 +08:00 |
|
hiyouga
|
97b74d328b
|
fix ppo args
Former-commit-id: 0f12899951808f53a482082eb116bda309775930
|
2023-10-11 23:40:50 +08:00 |
|
hiyouga
|
3198a7e5f4
|
refactor model_dtype, fix PPO trainer
Former-commit-id: 3e17ee5afbcb823a7c9a2f91864b3750cd79edb4
|
2023-10-11 23:16:01 +08:00 |
|
hiyouga
|
a2d08ce961
|
add averaging in evaluation
Former-commit-id: b39d6e0b8658e1c69bbaf6bcb6cfaa8f7af30110
|
2023-10-10 23:16:31 +08:00 |
|
hiyouga
|
bd8ea09479
|
fix aquila template, repair sft packing mechanism
Former-commit-id: 8c82cfa5dd4bec957426b5bf176d242c77552ab0
|
2023-10-10 18:49:55 +08:00 |
|
hiyouga
|
6d0d46c7fb
|
tiny fix
Former-commit-id: 31ccd3329ac634b239c43d60bd955cd95670df16
|
2023-10-10 17:41:13 +08:00 |
|
hiyouga
|
f74d600497
|
fix flash shift short attention
Former-commit-id: e44ad23eafa39b3ac0400b6f97cd440106a87f44
|
2023-10-09 17:54:48 +08:00 |
|
hiyouga
|
94fec9f50e
|
fix webui args
Former-commit-id: 64aa75c8cd7c84ab4a0f1dbaf4763765ba973f54
|
2023-10-09 17:13:57 +08:00 |
|
hiyouga
|
e387a50475
|
fix shift short attention
Former-commit-id: 9a49cce8e6f6b222f74a07bdab40efee6a77b0f1
|
2023-10-09 17:07:46 +08:00 |
|
hiyouga
|
5c4248a29c
|
update webui #1086
Former-commit-id: 65a48bc398f18f71f5f2659b2070e3b9593af243
|
2023-10-09 14:50:14 +08:00 |
|
hiyouga
|
f22886e2b6
|
fix #1097
Former-commit-id: c5b8796322d9d48e815038f9fecf0ce39036a4ee
|
2023-10-08 22:29:26 +08:00 |
|
hiyouga
|
33af3cbf37
|
add llamafy_qwen.py
Former-commit-id: 6cdc91543c022edcc98076488f06e809fde9bad7
|
2023-10-08 22:05:36 +08:00 |
|
hiyouga
|
728dfb1be7
|
fix #1068 #1074
Former-commit-id: 26c6bfd21de06cc56be9a58e2ef69045ea70cc14
|
2023-09-28 14:39:16 +08:00 |
|
hiyouga
|
e49f7f1afe
|
fix bug in packed sft dataset
Former-commit-id: 51d26b2af6612e65a91c576da5270028da27b322
|
2023-09-28 01:16:46 +08:00 |
|
hiyouga
|
21a454fa6c
|
tiny fix
Former-commit-id: 35b355b76d2a8f8adf3750a905224e52d03d218f
|
2023-09-28 01:03:04 +08:00 |
|
hiyouga
|
22c6c27f78
|
tiny fix
Former-commit-id: 7451b2ae7e58d0f1857f01a037672a8c53b1bd0d
|
2023-09-28 01:02:11 +08:00 |
|
hiyouga
|
aecbb43096
|
fix #1064
Former-commit-id: fd4660aa72d981d7efdad465f24a59358626c975
|
2023-09-28 00:53:29 +08:00 |
|
hiyouga
|
fa53fd2db2
|
fix bug in pretraining
Former-commit-id: 18a2d90bd6e7c3e1e3513e6f9d895e4048b35b04
|
2023-09-28 00:45:20 +08:00 |
|
hiyouga
|
1c150995ae
|
fix layer norm dtype
Former-commit-id: 67af21961b68d9b54d07b09e444c7140869f26da
|
2023-09-28 00:25:55 +08:00 |
|
hiyouga
|
6c5d8f089e
|
fix #1026
Former-commit-id: d0940d0dbd03d4bbcc955304566b0d5507edf9e6
|
2023-09-27 22:57:09 +08:00 |
|
hiyouga
|
dd623325e8
|
fix #424
Former-commit-id: daaf89f1126112a73b9f115b0f5617a8cd974a3e
|
2023-09-27 22:49:43 +08:00 |
|
hiyouga
|
e8a375c8f2
|
fix #1032
Former-commit-id: 1235b2da5a79ffefd1342054ea8e7dabf47398c1
|
2023-09-27 22:42:16 +08:00 |
|
hiyouga
|
386d85ae72
|
refactor finetuning Args
Former-commit-id: be425a70a4c8f051717cf1e4464dbd79dae4c0b5
|
2023-09-27 22:28:06 +08:00 |
|
hiyouga
|
20130b486c
|
support LongLoRA
Former-commit-id: 0832ed37e7947d699f17375648a52f80752c2b6b
|
2023-09-27 21:55:50 +08:00 |
|
hiyouga
|
73c48d0463
|
add CMMLU, update eval script
Former-commit-id: 47f31f06a946eefa5a972e4a566cf3ce05e1e111
|
2023-09-23 21:10:17 +08:00 |
|
hiyouga
|
f7cecd20e3
|
update evaluate
Former-commit-id: 288137a76ed1528faa39b467da22f6468ba368ee
|
2023-09-23 11:55:31 +08:00 |
|
hiyouga
|
2bc64a7636
|
move file
Former-commit-id: 8711ca9b5421f971ee4cb2fada23832f1021577c
|
2023-09-23 11:52:12 +08:00 |
|
hiyouga
|
35d1921081
|
add MMLU and C-Eval script
Former-commit-id: 3403f876127b4b99c5e3edb2834cc3b9a3a0063f
|
2023-09-23 00:34:17 +08:00 |
|
hiyouga
|
4fbdf18c70
|
fix #1000
Former-commit-id: 85de2d0a99e4a81fae890a963ccbb5c6142d52d4
|
2023-09-22 15:00:48 +08:00 |
|