mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-10-14 15:52:49 +08:00
Commit Graph
Select branches
Hide Pull Requests
main
#1
#1059
#11
#1186
#119
#1252
#1326
#1348
#1353
#1375
#1436
#145
#1454
#1486
#1525
#1544
#1553
#156
#158
#1624
#1689
#1690
#1695
#1699
#1700
#171
#179
#1796
#1800
#1802
#1861
#1864
#1868
#1918
#1932
#1946
#1947
#1953
#1954
#200
#2007
#2019
#2100
#2117
#213
#2163
#2194
#22
#2201
#221
#2226
#2262
#2264
#2266
#2283
#2285
#2319
#2350
#2411
#2423
#2426
#2435
#2445
#2462
#2469
#2474
#2514
#2519
#2525
#2531
#2568
#2570
#2572
#2575
#258
#26
#2608
#2683
#2689
#2730
#2739
#2743
#2746
#2764
#2766
#2830
#2845
#2849
#2872
#2903
#2905
#2919
#2944
#2945
#2963
#2967
#2993
#3004
#3046
#3053
#3057
#306
#3066
#307
#3083
#3103
#3103
#3158
#3159
#3160
#3161
#3201
#3226
#3254
#3256
#3261
#3263
#3267
#3275
#3276
#3287
#3288
#3291
#33
#3332
#3338
#3357
#3371
#3383
#3394
#3412
#3423
#3435
#3449
#3450
#3454
#3471
#3484
#3487
#3490
#3498
#3511
#3513
#3527
#3532
#356
#3578
#3584
#3588
#3596
#3601
#3604
#3651
#3654
#3655
#3661
#3683
#3692
#3702
#3741
#3746
#3748
#3755
#3756
#3785
#3792
#3794
#3799
#3804
#3812
#382
#3829
#3835
#387
#3876
#3921
#3923
#3925
#3930
#3941
#395
#3958
#3976
#3987
#4003
#4006
#4007
#4009
#4011
#4015
#4029
#4043
#4045
#4053
#4066
#4080
#4082
#4083
#4098
#4099
#4119
#4136
#4166
#4167
#4173
#4191
#4204
#4224
#4227
#4234
#4237
#4245
#4246
#4307
#4309
#4314
#4321
#4329
#4334
#434
#4342
#4347
#4348
#4352
#4355
#4377
#4382
#4409
#4417
#4445
#4446
#4461
#451
#4544
#4561
#4580
#4589
#4590
#4636
#4651
#4662
#4663
#4673
#4680
#4680
#4686
#4687
#4691
#4692
#4700
#4706
#4724
#4733
#4746
#4781
#479
#4793
#4804
#4821
#4822
#4877
#4878
#4892
#4939
#4950
#4957
#4961
#4970
#4995
#4996
#5010
#5019
#5032
#5037
#5068
#5072
#5095
#51
#5109
#511
#5111
#5112
#5115
#5118
#5156
#516
#5163
#5170
#5185
#5188
#5193
#5208
#5226
#5230
#5233
#5237
#5242
#5278
#5290
#5317
#5323
#5326
#5339
#5343
#5346
#5365
#5372
#5388
#5405
#5424
#5427
#5438
#5445
#5451
#5458
#5473
#5475
#5480
#5483
#5486
#5507
#5522
#5532
#5533
#5536
#5546
#5547
#5555
#5563
#5574
#5580
#5581
#5585
#5606
#5615
#5639
#5642
#5653
#5665
#5673
#5746
#5752
#5752
#5758
#5781
#5799
#5801
#5816
#5819
#5839
#5852
#5856
#5857
#5871
#5873
#5880
#5889
#5895
#5897
#5901
#5906
#5907
#5909
#5910
#5912
#5913
#5914
#5920
#5922
#5924
#5926
#5927
#5929
#5933
#596
#5970
#5971
#5973
#598
#5982
#5984
#599
#5990
#5993
#6010
#6022
#6046
#6052
#6065
#6078
#6083
#6098
#6103
#6120
#6121
#6123
#6124
#6125
#6126
#6127
#6128
#6129
#6137
#6138
#6140
#6141
#6151
#6152
#6156
#6157
#6160
#6170
#6175
#619
#6190
#6192
#6204
#6224
#6226
#6233
#6238
#6242
#6246
#6251
#6253
#6265
#6275
#629
#6310
#6313
#6317
#6334
#6359
#6362
#6363
#6364
#6365
#6367
#6368
#6369
#6379
#6384
#6388
#6395
#6396
#6401
#6416
#6418
#6420
#6426
#6430
#644
#6441
#6443
#6444
#6457
#6462
#6465
#6471
#6478
#6483
#6492
#6493
#6498
#6503
#6506
#651
#6512
#6513
#6514
#6515
#6524
#6527
#6528
#6542
#6547
#6564
#6565
#657
#6585
#6588
#6597
#6598
#6600
#6601
#6617
#6620
#6624
#6625
#6626
#6628
#6629
#6631
#6632
#6637
#6640
#6641
#6642
#6645
#6648
#6653
#6657
#6684
#6688
#6689
#6690
#6691
#6692
#6693
#6698
#6701
#6710
#6722
#6753
#6767
#6771
#6778
#6779
#678
#6786
#6787
#6788
#6796
#6797
#68
#6801
#6810
#6814
#6830
#6831
#6834
#6843
#6854
#6855
#6857
#6865
#6866
#6868
#6874
#6879
#6890
#6892
#6895
#6896
#6899
#6901
#6902
#6903
#6904
#6905
#6906
#6907
#6913
#6916
#6917
#6918
#6920
#6930
#6931
#6944
#6946
#6954
#6963
#6972
#6975
#6976
#6977
#6982
#6983
#6985
#6998
#7019
#7051
#7053
#7054
#7058
#7060
#7061
#7067
#7074
#7077
#7089
#7106
#7108
#7117
#7120
#7126
#7142
#7143
#7161
#7166
#7174
#7176
#7179
#7181
#7183
#7190
#7193
#7201
#7204
#7205
#7206
#7207
#7209
#7211
#7219
#7229
#7230
#7231
#7235
#7241
#7242
#7244
#7247
#7253
#7254
#7255
#7256
#7257
#7258
#7259
#7264
#7272
#7273
#7275
#7277
#7278
#7287
#7288
#7294
#7295
#7304
#7308
#7312
#7317
#7318
#7330
#7332
#7338
#7340
#7343
#7345
#7347
#7349
#7351
#7361
#7378
#7381
#7395
#7404
#741
#7413
#7419
#7420
#7432
#7436
#7437
#7440
#7441
#7442
#7445
#7448
#7449
#7453
#7455
#7456
#7462
#7466
#7469
#7471
#7481
#7500
#7505
#7509
#7519
#7523
#7530
#7537
#7546
#7553
#7564
#7566
#7567
#7570
#7573
#7576
#7578
#7594
#7609
#7611
#7612
#7623
#7625
#7635
#7638
#7639
#7644
#7645
#7646
#7647
#7654
#7655
#7657
#766
#7660
#7674
#7686
#7694
#7695
#7700
#7704
#7714
#7715
#7719
#7724
#7725
#7728
#7732
#7739
#7740
#7744
#7745
#7746
#7747
#7748
#7749
#7754
#7765
#7786
#7792
#7793
#7794
#7795
#7797
#7801
#7803
#7804
#7808
#7810
#7817
#7826
#7830
#7840
#7854
#786
#7867
#7870
#7872
#7875
#7879
#7883
#7885
#7887
#7910
#7911
#7912
#7913
#7923
#7924
#7928
#7945
#7946
#7958
#7962
#7964
#7966
#7974
#7988
#7992
#8000
#8015
#8039
#8042
#8050
#8051
#8057
#8067
#8077
#8078
#8095
#8099
#8101
#8103
#8108
#8109
#8110
#8124
#8125
#8128
#8129
#8130
#8156
#8159
#8161
#8162
#8167
#8176
#8178
#8179
#8180
#8181
#8183
#8195
#8196
#8197
#8201
#8202
#8203
#8215
#8220
#8227
#8235
#8245
#8248
#8249
#8258
#8264
#8270
#8276
#8286
#8288
#8291
#8293
#8298
#83
#8303
#8311
#8312
#8314
#8325
#8327
#8328
#8333
#8335
#8348
#8362
#8367
#8385
#8386
#8387
#8388
#8389
#8390
#8396
#84
#8403
#8414
#8421
#8422
#8423
#8432
#8433
#8438
#844
#8441
#8448
#8449
#8457
#8458
#8460
#8461
#8462
#8480
#8481
#8505
#8509
#8517
#8519
#8529
#8530
#8532
#8535
#8538
#8539
#8542
#8543
#8546
#8547
#8548
#8554
#8556
#8557
#8559
#8564
#8565
#8567
#8569
#8571
#8587
#86
#8614
#8623
#8627
#8637
#8651
#8680
#8685
#8689
#8721
#8722
#8731
#8736
#8739
#8750
#8752
#8762
#8770
#8773
#8774
#8776
#8783
#8784
#8787
#8788
#8795
#8812
#8813
#8818
#8823
#8826
#8827
#8829
#8839
#8842
#8845
#8851
#8861
#8863
#8866
#8869
#8875
#8876
#8887
#8899
#8906
#8917
#8930
#8960
#8961
#8962
#8970
#8972
#8975
#8976
#8978
#8985
#8992
#900
#9000
#9008
#9018
#9022
#9024
#9028
#9029
#9046
#9071
#9077
#9078
#9086
#9086
#9112
#9117
#9124
#9128
#9129
#9130
#9137
#9143
#9165
#9176
#9177
#9183
#9188
#9196
#9198
#9204
#9215
#9217
#9219
#9221
#9223
#9224
#9225
#9226
#9227
#9229
#9230
#9231
#9232
#9236
#9237
#9243
#9248
#9249
#9259
#9262
#9263
#9265
#975
v0.0.9
v0.1.0
v0.1.1
v0.1.2
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.2.0
v0.2.1
v0.2.2
v0.3.0
v0.3.2
v0.3.3
v0.4.0
v0.5.0
v0.5.2
v0.5.3
v0.6.0
v0.6.1
v0.6.2
v0.6.3
v0.7.0
v0.7.1
v0.8.0
v0.8.1
v0.8.2
v0.8.3
v0.9.0
v0.9.1
v0.9.2
v0.9.3
Select branches
Hide Pull Requests
main
#1
#1059
#11
#1186
#119
#1252
#1326
#1348
#1353
#1375
#1436
#145
#1454
#1486
#1525
#1544
#1553
#156
#158
#1624
#1689
#1690
#1695
#1699
#1700
#171
#179
#1796
#1800
#1802
#1861
#1864
#1868
#1918
#1932
#1946
#1947
#1953
#1954
#200
#2007
#2019
#2100
#2117
#213
#2163
#2194
#22
#2201
#221
#2226
#2262
#2264
#2266
#2283
#2285
#2319
#2350
#2411
#2423
#2426
#2435
#2445
#2462
#2469
#2474
#2514
#2519
#2525
#2531
#2568
#2570
#2572
#2575
#258
#26
#2608
#2683
#2689
#2730
#2739
#2743
#2746
#2764
#2766
#2830
#2845
#2849
#2872
#2903
#2905
#2919
#2944
#2945
#2963
#2967
#2993
#3004
#3046
#3053
#3057
#306
#3066
#307
#3083
#3103
#3103
#3158
#3159
#3160
#3161
#3201
#3226
#3254
#3256
#3261
#3263
#3267
#3275
#3276
#3287
#3288
#3291
#33
#3332
#3338
#3357
#3371
#3383
#3394
#3412
#3423
#3435
#3449
#3450
#3454
#3471
#3484
#3487
#3490
#3498
#3511
#3513
#3527
#3532
#356
#3578
#3584
#3588
#3596
#3601
#3604
#3651
#3654
#3655
#3661
#3683
#3692
#3702
#3741
#3746
#3748
#3755
#3756
#3785
#3792
#3794
#3799
#3804
#3812
#382
#3829
#3835
#387
#3876
#3921
#3923
#3925
#3930
#3941
#395
#3958
#3976
#3987
#4003
#4006
#4007
#4009
#4011
#4015
#4029
#4043
#4045
#4053
#4066
#4080
#4082
#4083
#4098
#4099
#4119
#4136
#4166
#4167
#4173
#4191
#4204
#4224
#4227
#4234
#4237
#4245
#4246
#4307
#4309
#4314
#4321
#4329
#4334
#434
#4342
#4347
#4348
#4352
#4355
#4377
#4382
#4409
#4417
#4445
#4446
#4461
#451
#4544
#4561
#4580
#4589
#4590
#4636
#4651
#4662
#4663
#4673
#4680
#4680
#4686
#4687
#4691
#4692
#4700
#4706
#4724
#4733
#4746
#4781
#479
#4793
#4804
#4821
#4822
#4877
#4878
#4892
#4939
#4950
#4957
#4961
#4970
#4995
#4996
#5010
#5019
#5032
#5037
#5068
#5072
#5095
#51
#5109
#511
#5111
#5112
#5115
#5118
#5156
#516
#5163
#5170
#5185
#5188
#5193
#5208
#5226
#5230
#5233
#5237
#5242
#5278
#5290
#5317
#5323
#5326
#5339
#5343
#5346
#5365
#5372
#5388
#5405
#5424
#5427
#5438
#5445
#5451
#5458
#5473
#5475
#5480
#5483
#5486
#5507
#5522
#5532
#5533
#5536
#5546
#5547
#5555
#5563
#5574
#5580
#5581
#5585
#5606
#5615
#5639
#5642
#5653
#5665
#5673
#5746
#5752
#5752
#5758
#5781
#5799
#5801
#5816
#5819
#5839
#5852
#5856
#5857
#5871
#5873
#5880
#5889
#5895
#5897
#5901
#5906
#5907
#5909
#5910
#5912
#5913
#5914
#5920
#5922
#5924
#5926
#5927
#5929
#5933
#596
#5970
#5971
#5973
#598
#5982
#5984
#599
#5990
#5993
#6010
#6022
#6046
#6052
#6065
#6078
#6083
#6098
#6103
#6120
#6121
#6123
#6124
#6125
#6126
#6127
#6128
#6129
#6137
#6138
#6140
#6141
#6151
#6152
#6156
#6157
#6160
#6170
#6175
#619
#6190
#6192
#6204
#6224
#6226
#6233
#6238
#6242
#6246
#6251
#6253
#6265
#6275
#629
#6310
#6313
#6317
#6334
#6359
#6362
#6363
#6364
#6365
#6367
#6368
#6369
#6379
#6384
#6388
#6395
#6396
#6401
#6416
#6418
#6420
#6426
#6430
#644
#6441
#6443
#6444
#6457
#6462
#6465
#6471
#6478
#6483
#6492
#6493
#6498
#6503
#6506
#651
#6512
#6513
#6514
#6515
#6524
#6527
#6528
#6542
#6547
#6564
#6565
#657
#6585
#6588
#6597
#6598
#6600
#6601
#6617
#6620
#6624
#6625
#6626
#6628
#6629
#6631
#6632
#6637
#6640
#6641
#6642
#6645
#6648
#6653
#6657
#6684
#6688
#6689
#6690
#6691
#6692
#6693
#6698
#6701
#6710
#6722
#6753
#6767
#6771
#6778
#6779
#678
#6786
#6787
#6788
#6796
#6797
#68
#6801
#6810
#6814
#6830
#6831
#6834
#6843
#6854
#6855
#6857
#6865
#6866
#6868
#6874
#6879
#6890
#6892
#6895
#6896
#6899
#6901
#6902
#6903
#6904
#6905
#6906
#6907
#6913
#6916
#6917
#6918
#6920
#6930
#6931
#6944
#6946
#6954
#6963
#6972
#6975
#6976
#6977
#6982
#6983
#6985
#6998
#7019
#7051
#7053
#7054
#7058
#7060
#7061
#7067
#7074
#7077
#7089
#7106
#7108
#7117
#7120
#7126
#7142
#7143
#7161
#7166
#7174
#7176
#7179
#7181
#7183
#7190
#7193
#7201
#7204
#7205
#7206
#7207
#7209
#7211
#7219
#7229
#7230
#7231
#7235
#7241
#7242
#7244
#7247
#7253
#7254
#7255
#7256
#7257
#7258
#7259
#7264
#7272
#7273
#7275
#7277
#7278
#7287
#7288
#7294
#7295
#7304
#7308
#7312
#7317
#7318
#7330
#7332
#7338
#7340
#7343
#7345
#7347
#7349
#7351
#7361
#7378
#7381
#7395
#7404
#741
#7413
#7419
#7420
#7432
#7436
#7437
#7440
#7441
#7442
#7445
#7448
#7449
#7453
#7455
#7456
#7462
#7466
#7469
#7471
#7481
#7500
#7505
#7509
#7519
#7523
#7530
#7537
#7546
#7553
#7564
#7566
#7567
#7570
#7573
#7576
#7578
#7594
#7609
#7611
#7612
#7623
#7625
#7635
#7638
#7639
#7644
#7645
#7646
#7647
#7654
#7655
#7657
#766
#7660
#7674
#7686
#7694
#7695
#7700
#7704
#7714
#7715
#7719
#7724
#7725
#7728
#7732
#7739
#7740
#7744
#7745
#7746
#7747
#7748
#7749
#7754
#7765
#7786
#7792
#7793
#7794
#7795
#7797
#7801
#7803
#7804
#7808
#7810
#7817
#7826
#7830
#7840
#7854
#786
#7867
#7870
#7872
#7875
#7879
#7883
#7885
#7887
#7910
#7911
#7912
#7913
#7923
#7924
#7928
#7945
#7946
#7958
#7962
#7964
#7966
#7974
#7988
#7992
#8000
#8015
#8039
#8042
#8050
#8051
#8057
#8067
#8077
#8078
#8095
#8099
#8101
#8103
#8108
#8109
#8110
#8124
#8125
#8128
#8129
#8130
#8156
#8159
#8161
#8162
#8167
#8176
#8178
#8179
#8180
#8181
#8183
#8195
#8196
#8197
#8201
#8202
#8203
#8215
#8220
#8227
#8235
#8245
#8248
#8249
#8258
#8264
#8270
#8276
#8286
#8288
#8291
#8293
#8298
#83
#8303
#8311
#8312
#8314
#8325
#8327
#8328
#8333
#8335
#8348
#8362
#8367
#8385
#8386
#8387
#8388
#8389
#8390
#8396
#84
#8403
#8414
#8421
#8422
#8423
#8432
#8433
#8438
#844
#8441
#8448
#8449
#8457
#8458
#8460
#8461
#8462
#8480
#8481
#8505
#8509
#8517
#8519
#8529
#8530
#8532
#8535
#8538
#8539
#8542
#8543
#8546
#8547
#8548
#8554
#8556
#8557
#8559
#8564
#8565
#8567
#8569
#8571
#8587
#86
#8614
#8623
#8627
#8637
#8651
#8680
#8685
#8689
#8721
#8722
#8731
#8736
#8739
#8750
#8752
#8762
#8770
#8773
#8774
#8776
#8783
#8784
#8787
#8788
#8795
#8812
#8813
#8818
#8823
#8826
#8827
#8829
#8839
#8842
#8845
#8851
#8861
#8863
#8866
#8869
#8875
#8876
#8887
#8899
#8906
#8917
#8930
#8960
#8961
#8962
#8970
#8972
#8975
#8976
#8978
#8985
#8992
#900
#9000
#9008
#9018
#9022
#9024
#9028
#9029
#9046
#9071
#9077
#9078
#9086
#9086
#9112
#9117
#9124
#9128
#9129
#9130
#9137
#9143
#9165
#9176
#9177
#9183
#9188
#9196
#9198
#9204
#9215
#9217
#9219
#9221
#9223
#9224
#9225
#9226
#9227
#9229
#9230
#9231
#9232
#9236
#9237
#9243
#9248
#9249
#9259
#9262
#9263
#9265
#975
v0.0.9
v0.1.0
v0.1.1
v0.1.2
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.2.0
v0.2.1
v0.2.2
v0.3.0
v0.3.2
v0.3.3
v0.4.0
v0.5.0
v0.5.2
v0.5.3
v0.6.0
v0.6.1
v0.6.2
v0.6.3
v0.7.0
v0.7.1
v0.8.0
v0.8.1
v0.8.2
v0.8.3
v0.9.0
v0.9.1
v0.9.2
v0.9.3
-
7500e761d3
[misc] update internvl constants (#7801)
Kingsley
2025-04-22 15:53:08 +08:00 -
fddcd43c88
[trainer] support early stop (#7797)
hoshi-hiyouga
2025-04-22 01:59:33 +08:00 -
0e4ce039ee
[data] improve mmplugin (#7795)
hoshi-hiyouga
2025-04-22 01:25:33 +08:00 -
b07628dea5
[example] add bash usage (#7794)
hoshi-hiyouga
2025-04-22 00:25:51 +08:00 -
12ada72ed4
[trainer] Add Muon Optimizer (#7749)
Juanxi Tian
2025-04-21 23:38:37 +08:00 -
416853dd25
[parser] support omegaconf (#7793)
hoshi-hiyouga
2025-04-21 23:30:30 +08:00 -
bd7bc31c79
[data] Fix wrong position ids with packed attention masks (#7754)
Changrui Chen
2025-04-21 16:19:36 +01:00 -
0ac641326b
[misc] fix new tokens adding (#7253)
flashJd
2025-04-21 23:19:02 +08:00 -
c5ba9106ec
[model] fix gemma3 export (#7786)
ddddng
2025-04-21 23:07:11 +08:00 -
3b2d3794a5
[misc] fix bug in constant (#7765)
Sachin Beldona
2025-04-21 10:06:31 -05:00 -
b605c20768
[assets] update wechat (#7792)
hoshi-hiyouga
2025-04-21 21:29:42 +08:00 -
39169986ef
[trainer] fix pt loss (#7748)
hoshi-hiyouga
2025-04-17 03:15:35 +08:00 -
86ebb219d6
[breaking] bump transformers to 4.45.0 & improve ci (#7746)
hoshi-hiyouga
2025-04-17 02:36:48 +08:00 -
d222f63cb7
[infer] set env for vllm ascend (#7745)
hoshi-hiyouga
2025-04-17 01:08:55 +08:00 -
2e518f255f
[model] support intern-VL 2.5-3 series (#7258)
Kingsley
2025-04-17 00:31:30 +08:00 -
8f88a4e6a4
[misc] improve entrypoint (#7345)
ENg-122
2025-04-16 21:48:23 +08:00 -
b9263ff5ac
[infer] support vllm-ascend (#7739)
leo-pony
2025-04-16 20:06:47 +08:00 -
ee2ab093a7
[api] fix chat messages (#7732)
hoshi-hiyouga
2025-04-15 16:39:08 +08:00 -
3df021d4d7
[deps] upgrade vllm (#7728)
hoshi-hiyouga
2025-04-15 14:57:40 +08:00 -
e252abf051
[docker] patch docker-rocm (#7725)
Joe Schoonover
2025-04-15 01:36:39 -04:00 -
1134baeedd
[assets] update model readme (#7724)
hoshi-hiyouga
2025-04-15 00:41:09 +08:00 -
2101399c94
[model] Support Kimi_VL thinking/instruct (#7719)
Kingsley
2025-04-15 00:21:58 +08:00 -
3f91a95250
[misc] fix env vars (#7715)
hoshi-hiyouga
2025-04-14 16:04:04 +08:00 -
7c61b35106
[misc] upgrade cli (#7714)
hoshi-hiyouga
2025-04-14 15:41:22 +08:00 -
f518bfba5b
[deps] upgrade transformers (#7704)
hoshi-hiyouga
2025-04-13 18:11:34 +08:00 -
8162f94db5
[model] add GLM-4-0414 (#7695)
Yuxuan Zhang
2025-04-13 17:10:45 +08:00 -
1f0c52b73c
[deps] fix uv conflicts (#7686)
hoshi-hiyouga
2025-04-11 18:02:24 +08:00 -
a8caf09c7f
[data] support for specifying a dataset in cloud storage (#7567)
Eric Tang
2025-04-09 20:31:35 -07:00 -
bb8d79bae2
[ray] allow for specifying ray.init kwargs (i.e. runtime_env) (#7647)
Eric Tang
2025-04-09 20:31:05 -07:00 -
1c436c9f25
[bugfix] enable_gemma_liger_kernel (#7660)
Dain Kim
2025-04-10 12:27:30 +09:00 -
1b0934bccb
[misc] fix cuda warn on intel GPU (#7655)
jilongW
2025-04-09 21:37:54 +08:00 -
4eec541857
[data] add coig-p dataset (#7657)
hoshi-hiyouga
2025-04-09 21:18:25 +08:00 -
89a4f9ec7f
[assets] update readme (#7654)
hoshi-hiyouga
2025-04-09 18:27:38 +08:00 -
1abd71b551
[assets] update readme (#7644)
hoshi-hiyouga
2025-04-09 01:06:06 +08:00 -
349c56c51c
[data] Fix bugs of `use_audio_in_video` in Qwen2.5 Omni (#7638)
Kingsley
2025-04-08 18:40:10 +08:00 -
acb09fa3a3
[trainer] fix key error (#7635)
Shawn Tao
2025-04-08 18:39:50 +08:00 -
f75b91077b
[sglang] support transformers 4.51.0 (#7639)
Adarsh Shirawalmath
2025-04-08 16:09:23 +05:30 -
c3c0efbaa0
[misc] fix packing and eval plot (#7623)
hoshi-hiyouga
2025-04-07 18:20:57 +08:00 -
5115dc8c7f
[assets] update readme (#7612)
hoshi-hiyouga
2025-04-06 13:58:49 +08:00 -
831e7f1cfd
[model] add llama4 (#7611)
hoshi-hiyouga
2025-04-06 13:42:31 +08:00 -
d4cfa9507e
[data] fix qwen2.5 omni plugin (#7578)
Kingsley
2025-04-02 23:58:39 +08:00 -
d32c6c014d
[data] fix qwen2.5 omni plugin (#7573)
Kingsley
2025-04-02 21:28:52 +08:00 -
7b9deb9410
[trainer] fix batch processing in PPO trainer (#7576)
gechengze
2025-04-02 21:17:48 +08:00 -
5e22597ff1
[infer] vllm video/audio inference (#7566)
hoshi-hiyouga
2025-04-02 02:27:04 +08:00 -
2bfcad2394
[model] fix kv cache (#7564)
hoshi-hiyouga
2025-04-01 23:07:46 +08:00 -
a13b1bb49a
[model] fix use_cache patching for gemma3 multimodal (#7500)
Yu Shi Jie
2025-04-01 04:06:48 -04:00 -
d10467d178
[data] specify position_ids in PackedSupervisedDatasetProcessor for neat_packing (#7318)
Ritesh Goru
2025-04-01 13:33:13 +05:30 -
aac70663fd
[webui] fix launch with proxy (#7332)
taoharry
2025-04-01 15:52:56 +08:00 -
00409ff28a
[data] shard the dataset to allow multiprocessing when streaming is enabled (#7530)
Billy Cao
2025-04-01 15:36:23 +08:00 -
d70b3b4bc5
[trainer] new kto mismatch pair creation strategy (#7509)
Hao
2025-04-01 15:21:53 +08:00 -
e76eba051d
[data] fix qwen2.5 omni collator (#7553)
hoshi-hiyouga
2025-04-01 00:15:12 +08:00 -
7eed496336
[model] add Qwen2.5-Omni model (#7537)
Kingsley
2025-03-31 20:39:35 +08:00 -
0f8296626a
[deps] pin pydantic to 2.10.6 (#7546)
hoshi-hiyouga
2025-03-31 14:42:28 +08:00 -
8da1d2fa71
[data] fix pixtral plugin (#7505)
Kingsley
2025-03-27 17:06:40 +08:00 -
b578a7d5b6
[3rdparty] support swanlab lark notification (#7481)
Xu-pixel
2025-03-27 01:52:01 +08:00 -
24afceddb7
[trainer] fix wsd scheduler (#7304)
Kdump
2025-03-26 15:25:02 +08:00 -
0583d06676
[model] add qwen2vl 32b & upgrade peft (#7469)
hoshi-hiyouga
2025-03-25 12:15:58 +08:00 -
ec6a261568
[model] fix lora on quant models (#7456)
GuoCoder
2025-03-25 11:59:46 +08:00 -
6b3b97c738
[misc] update liger-kernel's monkey patch (#7453)
Xiaosu Zhu
2025-03-25 11:58:52 +08:00 -
6d3748f727
[misc] enable liger kernel for gemma3 text and paligemma (#7466)
AbdelKarim ELJANDOUBI
2025-03-25 02:27:43 +01:00 -
7c890170e3
[misc] enable liger kernel for gemma3 (#7462)
Kenny Lam
2025-03-24 11:09:59 +00:00 -
ca42c0c406
[assets] fix gemma3 readme (#7449)
hoshi-hiyouga
2025-03-24 10:31:25 +08:00 -
7203365b80
[trainer] fix vlm loss for transformers 4.49 (#7448)
hoshi-hiyouga
2025-03-24 10:24:05 +08:00 -
3612946dd9
[docker] upgrade to torch 2.6 (#7442)
rumichi
2025-03-23 22:18:08 +09:00 -
3aa4f32e9c
[misc] fix ci (#7441)
hoshi-hiyouga
2025-03-23 21:09:35 +08:00 -
304796b803
[misc] fix license (#7440)
hoshi-hiyouga
2025-03-23 19:31:56 +08:00 -
7cfd6e4bb0
[scripts] support compute score on vllm's predictions (#7419)
SnowFox4004
2025-03-23 19:21:01 +08:00 -
05b19d6952
[deps] upgrade transformers to 4.50.0 (#7437)
hoshi-hiyouga
2025-03-23 17:44:27 +08:00 -
919415dba9
[deps] upgrade vllm to 0.8 (#7436)
hoshi-hiyouga
2025-03-23 14:32:22 +08:00 -
a959c2a509
[misc] fix sglang deps (#7432)
Guo, Quan
2025-03-23 14:07:10 +08:00 -
db0a08db6f
[3rdparty] fix redundant process group destroy for ray (#7395)
Eric Tang
2025-03-20 19:56:47 -07:00 -
a306f0f5a2
[version] fix minicpmo (#7378)
hoshi-hiyouga
2025-03-20 16:59:31 +08:00 -
63752fccf7
[assets] update wechat (#7361)
hoshi-hiyouga
2025-03-18 21:31:09 +08:00 -
1f9773395b
[misc] set dev version (#7351)
hoshi-hiyouga
2025-03-18 00:10:53 +08:00 -
128b5b12b3
[data] fix template (#7349)
hoshi-hiyouga
2025-03-17 23:45:20 +08:00 -
d5915a7dd7
[assets] update videos (#7340)
hoshi-hiyouga
2025-03-17 15:48:02 +08:00 -
ec1154662b
[model] support hunyuan 7b (#7317)
Hertz
2025-03-15 20:55:24 +08:00 -
a44a53ebec
[inference] support sglang backend (#7278)
Qiaolin Yu
2025-03-14 16:37:58 -04:00 -
93e6184cbe
[data] gemma3 plugin pan and scan (#7294)
hoshi-hiyouga
2025-03-13 23:29:23 +08:00 -
0be0d7796a
[assets] update video (#7287)
hoshi-hiyouga
2025-03-13 18:45:47 +08:00 -
480369a9f2
[data] efficient 4d_attention_mask creation in neat_packing (#7272)
Ritesh Goru
2025-03-13 01:01:12 +05:30 -
650a9a9057
[misc] update format (#7277)
hoshi-hiyouga
2025-03-13 02:53:08 +08:00 -
4b9d8da5a4
[model] support gemma3 (#7273)
hoshi-hiyouga
2025-03-13 01:35:23 +08:00 -
e6159ad730
[misc] upgrade deps (#7257)
hoshi-hiyouga
2025-03-12 00:33:47 +08:00 -
264538cb26
[misc] upgrade format to py39 (#7256)
hoshi-hiyouga
2025-03-12 00:08:41 +08:00 -
5995800bce
[ci] update workflow (#7255)
hoshi-hiyouga
2025-03-11 22:57:49 +08:00 -
bf8b483186
[core] release v0.9.2 (#7254)
hoshi-hiyouga
2025-03-11 22:42:23 +08:00 -
e2299e261b
Merge pull request #7242 from hiyouga/hiyouga/release
v0.9.2
hoshi-hiyouga
2025-03-11 15:28:45 +08:00 -
8a44dce326
Merge pull request #7247 from hiyouga/hiyouga/commit
hoshi-hiyouga
2025-03-11 15:28:04 +08:00 -
6d9233833b
Merge pull request #7244 from hiyouga/hiyouga/token
hoshi-hiyouga
2025-03-11 15:17:15 +08:00 -
d019603835
support commit info
hiyouga
2025-03-11 15:13:59 +08:00 -
478e8194d9
remove exit in preprocess
hiyouga
2025-03-11 15:06:17 +08:00 -
1890d3dafe
release v0.9.2
hiyouga
2025-03-11 14:48:22 +08:00 -
522a3e8493
[infer] fix vllm args (#7235)
hoshi-hiyouga
2025-03-11 01:15:35 +08:00 -
18968405d0
[tracking] add swanlab_logdir param (#7219)
Ze-Yi LIN
2025-03-11 00:53:07 +08:00 -
71a1c1321a
[config] update args (#7231)
hoshi-hiyouga
2025-03-10 23:04:43 +08:00 -
cf58a6d860
[config] fix export max len (#7230)
hoshi-hiyouga
2025-03-10 16:46:08 +08:00 -
9adc0a2c3f
[assets] update readme (#7209)
hoshi-hiyouga
2025-03-07 17:27:49 +08:00 -
16419b2834
[data] fix loader (#7207)
hoshi-hiyouga
2025-03-07 17:20:46 +08:00 -
82a2bac866
[misc] fix ds config (#7205)
hoshi-hiyouga
2025-03-07 15:21:28 +08:00