mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-10-14 15:52:49 +08:00
Commit Graph
Select branches
Hide Pull Requests
main
#1
#1059
#11
#1186
#119
#1252
#1326
#1348
#1353
#1375
#1436
#145
#1454
#1486
#1525
#1544
#1553
#156
#158
#1624
#1689
#1690
#1695
#1699
#1700
#171
#179
#1796
#1800
#1802
#1861
#1864
#1868
#1918
#1932
#1946
#1947
#1953
#1954
#200
#2007
#2019
#2100
#2117
#213
#2163
#2194
#22
#2201
#221
#2226
#2262
#2264
#2266
#2283
#2285
#2319
#2350
#2411
#2423
#2426
#2435
#2445
#2462
#2469
#2474
#2514
#2519
#2525
#2531
#2568
#2570
#2572
#2575
#258
#26
#2608
#2683
#2689
#2730
#2739
#2743
#2746
#2764
#2766
#2830
#2845
#2849
#2872
#2903
#2905
#2919
#2944
#2945
#2963
#2967
#2993
#3004
#3046
#3053
#3057
#306
#3066
#307
#3083
#3103
#3103
#3158
#3159
#3160
#3161
#3201
#3226
#3254
#3256
#3261
#3263
#3267
#3275
#3276
#3287
#3288
#3291
#33
#3332
#3338
#3357
#3371
#3383
#3394
#3412
#3423
#3435
#3449
#3450
#3454
#3471
#3484
#3487
#3490
#3498
#3511
#3513
#3527
#3532
#356
#3578
#3584
#3588
#3596
#3601
#3604
#3651
#3654
#3655
#3661
#3683
#3692
#3702
#3741
#3746
#3748
#3755
#3756
#3785
#3792
#3794
#3799
#3804
#3812
#382
#3829
#3835
#387
#3876
#3921
#3923
#3925
#3930
#3941
#395
#3958
#3976
#3987
#4003
#4006
#4007
#4009
#4011
#4015
#4029
#4043
#4045
#4053
#4066
#4080
#4082
#4083
#4098
#4099
#4119
#4136
#4166
#4167
#4173
#4191
#4204
#4224
#4227
#4234
#4237
#4245
#4246
#4307
#4309
#4314
#4321
#4329
#4334
#434
#4342
#4347
#4348
#4352
#4355
#4377
#4382
#4409
#4417
#4445
#4446
#4461
#451
#4544
#4561
#4580
#4589
#4590
#4636
#4651
#4662
#4663
#4673
#4680
#4680
#4686
#4687
#4691
#4692
#4700
#4706
#4724
#4733
#4746
#4781
#479
#4793
#4804
#4821
#4822
#4877
#4878
#4892
#4939
#4950
#4957
#4961
#4970
#4995
#4996
#5010
#5019
#5032
#5037
#5068
#5072
#5095
#51
#5109
#511
#5111
#5112
#5115
#5118
#5156
#516
#5163
#5170
#5185
#5188
#5193
#5208
#5226
#5230
#5233
#5237
#5242
#5278
#5290
#5317
#5323
#5326
#5339
#5343
#5346
#5365
#5372
#5388
#5405
#5424
#5427
#5438
#5445
#5451
#5458
#5473
#5475
#5480
#5483
#5486
#5507
#5522
#5532
#5533
#5536
#5546
#5547
#5555
#5563
#5574
#5580
#5581
#5585
#5606
#5615
#5639
#5642
#5653
#5665
#5673
#5746
#5752
#5752
#5758
#5781
#5799
#5801
#5816
#5819
#5839
#5852
#5856
#5857
#5871
#5873
#5880
#5889
#5895
#5897
#5901
#5906
#5907
#5909
#5910
#5912
#5913
#5914
#5920
#5922
#5924
#5926
#5927
#5929
#5933
#596
#5970
#5971
#5973
#598
#5982
#5984
#599
#5990
#5993
#6010
#6022
#6046
#6052
#6065
#6078
#6083
#6098
#6103
#6120
#6121
#6123
#6124
#6125
#6126
#6127
#6128
#6129
#6137
#6138
#6140
#6141
#6151
#6152
#6156
#6157
#6160
#6170
#6175
#619
#6190
#6192
#6204
#6224
#6226
#6233
#6238
#6242
#6246
#6251
#6253
#6265
#6275
#629
#6310
#6313
#6317
#6334
#6359
#6362
#6363
#6364
#6365
#6367
#6368
#6369
#6379
#6384
#6388
#6395
#6396
#6401
#6416
#6418
#6420
#6426
#6430
#644
#6441
#6443
#6444
#6457
#6462
#6465
#6471
#6478
#6483
#6492
#6493
#6498
#6503
#6506
#651
#6512
#6513
#6514
#6515
#6524
#6527
#6528
#6542
#6547
#6564
#6565
#657
#6585
#6588
#6597
#6598
#6600
#6601
#6617
#6620
#6624
#6625
#6626
#6628
#6629
#6631
#6632
#6637
#6640
#6641
#6642
#6645
#6648
#6653
#6657
#6684
#6688
#6689
#6690
#6691
#6692
#6693
#6698
#6701
#6710
#6722
#6753
#6767
#6771
#6778
#6779
#678
#6786
#6787
#6788
#6796
#6797
#68
#6801
#6810
#6814
#6830
#6831
#6834
#6843
#6854
#6855
#6857
#6865
#6866
#6868
#6874
#6879
#6890
#6892
#6895
#6896
#6899
#6901
#6902
#6903
#6904
#6905
#6906
#6907
#6913
#6916
#6917
#6918
#6920
#6930
#6931
#6944
#6946
#6954
#6963
#6972
#6975
#6976
#6977
#6982
#6983
#6985
#6998
#7019
#7051
#7053
#7054
#7058
#7060
#7061
#7067
#7074
#7077
#7089
#7106
#7108
#7117
#7120
#7126
#7142
#7143
#7161
#7166
#7174
#7176
#7179
#7181
#7183
#7190
#7193
#7201
#7204
#7205
#7206
#7207
#7209
#7211
#7219
#7229
#7230
#7231
#7235
#7241
#7242
#7244
#7247
#7253
#7254
#7255
#7256
#7257
#7258
#7259
#7264
#7272
#7273
#7275
#7277
#7278
#7287
#7288
#7294
#7295
#7304
#7308
#7312
#7317
#7318
#7330
#7332
#7338
#7340
#7343
#7345
#7347
#7349
#7351
#7361
#7378
#7381
#7395
#7404
#741
#7413
#7419
#7420
#7432
#7436
#7437
#7440
#7441
#7442
#7445
#7448
#7449
#7453
#7455
#7456
#7462
#7466
#7469
#7471
#7481
#7500
#7505
#7509
#7519
#7523
#7530
#7537
#7546
#7553
#7564
#7566
#7567
#7570
#7573
#7576
#7578
#7594
#7609
#7611
#7612
#7623
#7625
#7635
#7638
#7639
#7644
#7645
#7646
#7647
#7654
#7655
#7657
#766
#7660
#7674
#7686
#7694
#7695
#7700
#7704
#7714
#7715
#7719
#7724
#7725
#7728
#7732
#7739
#7740
#7744
#7745
#7746
#7747
#7748
#7749
#7754
#7765
#7786
#7792
#7793
#7794
#7795
#7797
#7801
#7803
#7804
#7808
#7810
#7817
#7826
#7830
#7840
#7854
#786
#7867
#7870
#7872
#7875
#7879
#7883
#7885
#7887
#7910
#7911
#7912
#7913
#7923
#7924
#7928
#7945
#7946
#7958
#7962
#7964
#7966
#7974
#7988
#7992
#8000
#8015
#8039
#8042
#8050
#8051
#8057
#8067
#8077
#8078
#8095
#8099
#8101
#8103
#8108
#8109
#8110
#8124
#8125
#8128
#8129
#8130
#8156
#8159
#8161
#8162
#8167
#8176
#8178
#8179
#8180
#8181
#8183
#8195
#8196
#8197
#8201
#8202
#8203
#8215
#8220
#8227
#8235
#8245
#8248
#8249
#8258
#8264
#8270
#8276
#8286
#8288
#8291
#8293
#8298
#83
#8303
#8311
#8312
#8314
#8325
#8327
#8328
#8333
#8335
#8348
#8362
#8367
#8385
#8386
#8387
#8388
#8389
#8390
#8396
#84
#8403
#8414
#8421
#8422
#8423
#8432
#8433
#8438
#844
#8441
#8448
#8449
#8457
#8458
#8460
#8461
#8462
#8480
#8481
#8505
#8509
#8517
#8519
#8529
#8530
#8532
#8535
#8538
#8539
#8542
#8543
#8546
#8547
#8548
#8554
#8556
#8557
#8559
#8564
#8565
#8567
#8569
#8571
#8587
#86
#8614
#8623
#8627
#8637
#8651
#8680
#8685
#8689
#8721
#8722
#8731
#8736
#8739
#8750
#8752
#8762
#8770
#8773
#8774
#8776
#8783
#8784
#8787
#8788
#8795
#8812
#8813
#8818
#8823
#8826
#8827
#8829
#8839
#8842
#8845
#8851
#8861
#8863
#8866
#8869
#8875
#8876
#8887
#8899
#8906
#8917
#8930
#8960
#8961
#8962
#8970
#8972
#8975
#8976
#8978
#8985
#8992
#900
#9000
#9008
#9018
#9022
#9024
#9028
#9029
#9046
#9071
#9077
#9078
#9086
#9086
#9112
#9117
#9124
#9128
#9129
#9130
#9137
#9143
#9165
#9176
#9177
#9183
#9188
#9196
#9198
#9204
#9215
#9217
#9219
#9221
#9223
#9224
#9225
#9226
#9227
#9229
#9230
#9231
#9232
#9236
#9237
#9243
#9248
#9249
#9259
#9262
#9263
#9265
#975
v0.0.9
v0.1.0
v0.1.1
v0.1.2
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.2.0
v0.2.1
v0.2.2
v0.3.0
v0.3.2
v0.3.3
v0.4.0
v0.5.0
v0.5.2
v0.5.3
v0.6.0
v0.6.1
v0.6.2
v0.6.3
v0.7.0
v0.7.1
v0.8.0
v0.8.1
v0.8.2
v0.8.3
v0.9.0
v0.9.1
v0.9.2
v0.9.3
Select branches
Hide Pull Requests
main
#1
#1059
#11
#1186
#119
#1252
#1326
#1348
#1353
#1375
#1436
#145
#1454
#1486
#1525
#1544
#1553
#156
#158
#1624
#1689
#1690
#1695
#1699
#1700
#171
#179
#1796
#1800
#1802
#1861
#1864
#1868
#1918
#1932
#1946
#1947
#1953
#1954
#200
#2007
#2019
#2100
#2117
#213
#2163
#2194
#22
#2201
#221
#2226
#2262
#2264
#2266
#2283
#2285
#2319
#2350
#2411
#2423
#2426
#2435
#2445
#2462
#2469
#2474
#2514
#2519
#2525
#2531
#2568
#2570
#2572
#2575
#258
#26
#2608
#2683
#2689
#2730
#2739
#2743
#2746
#2764
#2766
#2830
#2845
#2849
#2872
#2903
#2905
#2919
#2944
#2945
#2963
#2967
#2993
#3004
#3046
#3053
#3057
#306
#3066
#307
#3083
#3103
#3103
#3158
#3159
#3160
#3161
#3201
#3226
#3254
#3256
#3261
#3263
#3267
#3275
#3276
#3287
#3288
#3291
#33
#3332
#3338
#3357
#3371
#3383
#3394
#3412
#3423
#3435
#3449
#3450
#3454
#3471
#3484
#3487
#3490
#3498
#3511
#3513
#3527
#3532
#356
#3578
#3584
#3588
#3596
#3601
#3604
#3651
#3654
#3655
#3661
#3683
#3692
#3702
#3741
#3746
#3748
#3755
#3756
#3785
#3792
#3794
#3799
#3804
#3812
#382
#3829
#3835
#387
#3876
#3921
#3923
#3925
#3930
#3941
#395
#3958
#3976
#3987
#4003
#4006
#4007
#4009
#4011
#4015
#4029
#4043
#4045
#4053
#4066
#4080
#4082
#4083
#4098
#4099
#4119
#4136
#4166
#4167
#4173
#4191
#4204
#4224
#4227
#4234
#4237
#4245
#4246
#4307
#4309
#4314
#4321
#4329
#4334
#434
#4342
#4347
#4348
#4352
#4355
#4377
#4382
#4409
#4417
#4445
#4446
#4461
#451
#4544
#4561
#4580
#4589
#4590
#4636
#4651
#4662
#4663
#4673
#4680
#4680
#4686
#4687
#4691
#4692
#4700
#4706
#4724
#4733
#4746
#4781
#479
#4793
#4804
#4821
#4822
#4877
#4878
#4892
#4939
#4950
#4957
#4961
#4970
#4995
#4996
#5010
#5019
#5032
#5037
#5068
#5072
#5095
#51
#5109
#511
#5111
#5112
#5115
#5118
#5156
#516
#5163
#5170
#5185
#5188
#5193
#5208
#5226
#5230
#5233
#5237
#5242
#5278
#5290
#5317
#5323
#5326
#5339
#5343
#5346
#5365
#5372
#5388
#5405
#5424
#5427
#5438
#5445
#5451
#5458
#5473
#5475
#5480
#5483
#5486
#5507
#5522
#5532
#5533
#5536
#5546
#5547
#5555
#5563
#5574
#5580
#5581
#5585
#5606
#5615
#5639
#5642
#5653
#5665
#5673
#5746
#5752
#5752
#5758
#5781
#5799
#5801
#5816
#5819
#5839
#5852
#5856
#5857
#5871
#5873
#5880
#5889
#5895
#5897
#5901
#5906
#5907
#5909
#5910
#5912
#5913
#5914
#5920
#5922
#5924
#5926
#5927
#5929
#5933
#596
#5970
#5971
#5973
#598
#5982
#5984
#599
#5990
#5993
#6010
#6022
#6046
#6052
#6065
#6078
#6083
#6098
#6103
#6120
#6121
#6123
#6124
#6125
#6126
#6127
#6128
#6129
#6137
#6138
#6140
#6141
#6151
#6152
#6156
#6157
#6160
#6170
#6175
#619
#6190
#6192
#6204
#6224
#6226
#6233
#6238
#6242
#6246
#6251
#6253
#6265
#6275
#629
#6310
#6313
#6317
#6334
#6359
#6362
#6363
#6364
#6365
#6367
#6368
#6369
#6379
#6384
#6388
#6395
#6396
#6401
#6416
#6418
#6420
#6426
#6430
#644
#6441
#6443
#6444
#6457
#6462
#6465
#6471
#6478
#6483
#6492
#6493
#6498
#6503
#6506
#651
#6512
#6513
#6514
#6515
#6524
#6527
#6528
#6542
#6547
#6564
#6565
#657
#6585
#6588
#6597
#6598
#6600
#6601
#6617
#6620
#6624
#6625
#6626
#6628
#6629
#6631
#6632
#6637
#6640
#6641
#6642
#6645
#6648
#6653
#6657
#6684
#6688
#6689
#6690
#6691
#6692
#6693
#6698
#6701
#6710
#6722
#6753
#6767
#6771
#6778
#6779
#678
#6786
#6787
#6788
#6796
#6797
#68
#6801
#6810
#6814
#6830
#6831
#6834
#6843
#6854
#6855
#6857
#6865
#6866
#6868
#6874
#6879
#6890
#6892
#6895
#6896
#6899
#6901
#6902
#6903
#6904
#6905
#6906
#6907
#6913
#6916
#6917
#6918
#6920
#6930
#6931
#6944
#6946
#6954
#6963
#6972
#6975
#6976
#6977
#6982
#6983
#6985
#6998
#7019
#7051
#7053
#7054
#7058
#7060
#7061
#7067
#7074
#7077
#7089
#7106
#7108
#7117
#7120
#7126
#7142
#7143
#7161
#7166
#7174
#7176
#7179
#7181
#7183
#7190
#7193
#7201
#7204
#7205
#7206
#7207
#7209
#7211
#7219
#7229
#7230
#7231
#7235
#7241
#7242
#7244
#7247
#7253
#7254
#7255
#7256
#7257
#7258
#7259
#7264
#7272
#7273
#7275
#7277
#7278
#7287
#7288
#7294
#7295
#7304
#7308
#7312
#7317
#7318
#7330
#7332
#7338
#7340
#7343
#7345
#7347
#7349
#7351
#7361
#7378
#7381
#7395
#7404
#741
#7413
#7419
#7420
#7432
#7436
#7437
#7440
#7441
#7442
#7445
#7448
#7449
#7453
#7455
#7456
#7462
#7466
#7469
#7471
#7481
#7500
#7505
#7509
#7519
#7523
#7530
#7537
#7546
#7553
#7564
#7566
#7567
#7570
#7573
#7576
#7578
#7594
#7609
#7611
#7612
#7623
#7625
#7635
#7638
#7639
#7644
#7645
#7646
#7647
#7654
#7655
#7657
#766
#7660
#7674
#7686
#7694
#7695
#7700
#7704
#7714
#7715
#7719
#7724
#7725
#7728
#7732
#7739
#7740
#7744
#7745
#7746
#7747
#7748
#7749
#7754
#7765
#7786
#7792
#7793
#7794
#7795
#7797
#7801
#7803
#7804
#7808
#7810
#7817
#7826
#7830
#7840
#7854
#786
#7867
#7870
#7872
#7875
#7879
#7883
#7885
#7887
#7910
#7911
#7912
#7913
#7923
#7924
#7928
#7945
#7946
#7958
#7962
#7964
#7966
#7974
#7988
#7992
#8000
#8015
#8039
#8042
#8050
#8051
#8057
#8067
#8077
#8078
#8095
#8099
#8101
#8103
#8108
#8109
#8110
#8124
#8125
#8128
#8129
#8130
#8156
#8159
#8161
#8162
#8167
#8176
#8178
#8179
#8180
#8181
#8183
#8195
#8196
#8197
#8201
#8202
#8203
#8215
#8220
#8227
#8235
#8245
#8248
#8249
#8258
#8264
#8270
#8276
#8286
#8288
#8291
#8293
#8298
#83
#8303
#8311
#8312
#8314
#8325
#8327
#8328
#8333
#8335
#8348
#8362
#8367
#8385
#8386
#8387
#8388
#8389
#8390
#8396
#84
#8403
#8414
#8421
#8422
#8423
#8432
#8433
#8438
#844
#8441
#8448
#8449
#8457
#8458
#8460
#8461
#8462
#8480
#8481
#8505
#8509
#8517
#8519
#8529
#8530
#8532
#8535
#8538
#8539
#8542
#8543
#8546
#8547
#8548
#8554
#8556
#8557
#8559
#8564
#8565
#8567
#8569
#8571
#8587
#86
#8614
#8623
#8627
#8637
#8651
#8680
#8685
#8689
#8721
#8722
#8731
#8736
#8739
#8750
#8752
#8762
#8770
#8773
#8774
#8776
#8783
#8784
#8787
#8788
#8795
#8812
#8813
#8818
#8823
#8826
#8827
#8829
#8839
#8842
#8845
#8851
#8861
#8863
#8866
#8869
#8875
#8876
#8887
#8899
#8906
#8917
#8930
#8960
#8961
#8962
#8970
#8972
#8975
#8976
#8978
#8985
#8992
#900
#9000
#9008
#9018
#9022
#9024
#9028
#9029
#9046
#9071
#9077
#9078
#9086
#9086
#9112
#9117
#9124
#9128
#9129
#9130
#9137
#9143
#9165
#9176
#9177
#9183
#9188
#9196
#9198
#9204
#9215
#9217
#9219
#9221
#9223
#9224
#9225
#9226
#9227
#9229
#9230
#9231
#9232
#9236
#9237
#9243
#9248
#9249
#9259
#9262
#9263
#9265
#975
v0.0.9
v0.1.0
v0.1.1
v0.1.2
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.2.0
v0.2.1
v0.2.2
v0.3.0
v0.3.2
v0.3.3
v0.4.0
v0.5.0
v0.5.2
v0.5.3
v0.6.0
v0.6.1
v0.6.2
v0.6.3
v0.7.0
v0.7.1
v0.8.0
v0.8.1
v0.8.2
v0.8.3
v0.9.0
v0.9.1
v0.9.2
v0.9.3
-
9cd81aa424
[misc] fix ci (#8441)
Yaowei Zheng
2025-06-24 16:37:32 +08:00 -
ecbccb4c5d
[model] Add mistral-small 3.2 & kimi-dev (#8433)
Kingsley
2025-06-24 14:59:47 +08:00 -
9af7915f7b
[model] add kimi vl 2506 (#8432)
Yaowei Zheng
2025-06-23 17:56:48 +08:00 -
7b252b2368
[model] unsloth resume from checkpoint bug (#8423)
Vivek Iyer
2025-06-23 04:43:54 -04:00 -
88a92be808
[model] add support for Falcon H1 (#8403)
Dhia Eddine Rhaiem
2025-06-18 12:51:23 +04:00 -
c6c764388c
[assets] update readme (#8396)
Yaowei Zheng
2025-06-17 16:15:20 +08:00 -
3e392473d1
[misc] set dev version (#8389)
Yaowei Zheng
2025-06-17 01:39:25 +08:00 -
ad345ec054
[ci] add docker version (#8390)
Yaowei Zheng
2025-06-17 01:37:47 +08:00 -
ca75f1edf3
[model] fix vlm utils (#8388)
v0.9.3
Yaowei Zheng
2025-06-17 01:08:49 +08:00 -
3a3bae1cfe
[data] fix qwen2vl pos ids (#8387)
Yaowei Zheng
2025-06-17 00:48:54 +08:00 -
31874e4f62
[version] release v0.9.3 (#8386)
Yaowei Zheng
2025-06-16 19:21:32 +08:00 -
9a2d1dec62
[assets] update wechat (#8385)
Yaowei Zheng
2025-06-16 18:23:22 +08:00 -
8e4ac78607
[trainer] Add LD-DPO objective (#8362)
Aman Gupta
2025-06-12 01:10:38 -07:00 -
44f1b9b5ad
[misc] tiny fixes (#8348)
Yaowei Zheng
2025-06-10 15:30:58 +08:00 -
b41697c9b6
[model] support MiniCPM4 (#8314)
阿丹(adan)
2025-06-10 14:38:39 +08:00 -
31bca4d172
[model] support Mistral3.1 small 2503 (#8335)
Kingsley
2025-06-09 10:37:42 +08:00 -
fa4360dca7
[assets] Add awesome works used LLaMA-Factory (#8333)
Chenhao Zhang
2025-06-09 10:21:17 +08:00 -
9acab4949d
[model] fix model generate (#8327)
Yaowei Zheng
2025-06-07 08:47:50 +08:00 -
32b4574094
[model] pushing FFT with unsloth (#8325)
Vivek Iyer
2025-06-06 20:20:58 -04:00 -
03a93ec513
[data] fix empty template (#8312)
Yaowei Zheng
2025-06-06 13:50:50 +08:00 -
bcb6b94658
[setup] fix uv (#8311)
Yaowei Zheng
2025-06-06 11:54:15 +08:00 -
c0710be6d7
[assets] update readme (#8303)
Yaowei Zheng
2025-06-05 23:23:15 +08:00 -
212a8006dc
[tests] add visual model save test (#8248)
Kingsley
2025-06-05 20:38:01 +08:00 -
ed70f8d5a2
[assets] fix npu docker (#8298)
Yaowei Zheng
2025-06-05 19:09:20 +08:00 -
1a33d65a56
[launcher] Add elastic and fault-tolerant training support (#8286)
Butui Hu
2025-06-05 16:40:03 +08:00 -
69c9e379d5
[script] add Script description for qwen_omni_merge (#8293)
Kingsley
2025-06-05 13:22:01 +08:00 -
e9fe9cee29
[assets] update docker files (#8291)
Yaowei Zheng
2025-06-04 23:30:46 +08:00 -
cb7ab69783
[assets] update readme (#8288)
Yaowei Zheng
2025-06-04 17:46:12 +08:00 -
c1ed76e109
[assets] add icon (#8276)
Yaowei Zheng
2025-06-03 20:36:21 +08:00 -
c224d17cb2
[data] support nested images input for videos (#8264)
Kingsley
2025-06-03 20:26:29 +08:00 -
c4e51d40e0
[tracking] swanlab add llamafactory tag (#8258)
Ze-Yi LIN
2025-06-03 18:42:29 +08:00 -
554e89ff02
[model] add MIMO_VL (#8249)
Kingsley
2025-06-01 03:54:54 +08:00 -
fee2122f09
[deps] upgrade transformers to 4.52.4 (#8245)
Yaowei Zheng
2025-05-31 16:51:40 +08:00 -
c7e63bead7
[model] add smollm2 support (#8220)
Akshat Sehgal
2025-05-31 01:29:01 -07:00 -
3e1a7fcb9c
[assets] update readme (#8235)
hoshi-hiyouga
2025-05-30 16:52:12 +08:00 -
2aaede8ef4
[scripts] specify model class for qwen_omni merge (#8227)
Kingsley
2025-05-30 14:20:12 +08:00 -
42bebc341d
[model] add deepseek 0528 models (#8215)
hoshi-hiyouga
2025-05-29 21:37:07 +08:00 -
83a9ff5853
[assets] fix docker images (#8203)
hoshi-hiyouga
2025-05-28 22:26:05 +08:00 -
519bab86e6
[workflow] auto push docker images (#8181)
yzoaim
2025-05-28 20:21:15 +08:00 -
dbc9f5a5d9
[assets] update Dockerfile (#8201)
hoshi-hiyouga
2025-05-28 20:20:59 +08:00 -
9b152d9cb5
[webui] fix skip args (#8195)
hoshi-hiyouga
2025-05-28 18:11:07 +08:00 -
6c3cd400b5
[data] Reading files from cloud is broken (#8182) (#8183)
Youngwoo Kim
2025-05-28 16:50:44 +09:00 -
4d3ffa2ec4
[assets] fix docker image (#8180)
hoshi-hiyouga
2025-05-27 19:01:31 +08:00 -
2bf8e993ab
[data] fix shared file system (#8179)
hoshi-hiyouga
2025-05-27 18:36:03 +08:00 -
d4a413eb37
[webui] add extra args to export (#8178)
hoshi-hiyouga
2025-05-27 18:25:31 +08:00 -
00974a3169
[assets] update docker files (#8176)
hoshi-hiyouga
2025-05-27 18:15:23 +08:00 -
46ccf84aaa
[webui] add infer extra args (#8167)
hoshi-hiyouga
2025-05-27 12:04:00 +08:00 -
07343ca83d
[webui] fix input args (#8162)
hoshi-hiyouga
2025-05-27 02:05:54 +08:00 -
3c7dc66a92
[model] add smollm2 and medgemma (#8161)
hoshi-hiyouga
2025-05-26 23:19:58 +08:00 -
ba032828e2
[deps] upgrade transformers (#8159)
hoshi-hiyouga
2025-05-26 22:03:58 +08:00 -
501e7d8a8f
feat: add smollm support (#8050)
Akshat Sehgal
2025-05-26 04:47:54 -07:00 -
12292e4283
[api] support repetition_penalty and align presence_penalty with OpenAI Client (#7958)
wangzhan
2025-05-26 18:45:11 +08:00 -
f08b748199
[data] fix internvl plugin when using PIL images (#8129)
Kingsley
2025-05-22 01:32:59 +08:00 -
d2a3036a23
[misc] update data readme (#8128)
hoshi-hiyouga
2025-05-21 22:41:18 +08:00 -
9ae17cd173
[deps] update to transformers 4.52 (#8125)
hoshi-hiyouga
2025-05-21 05:16:18 +08:00 -
56926d76f9
[data] llama3 multi tool support (#8124)
hoshi-hiyouga
2025-05-21 02:01:12 +08:00 -
c2f6f2fa77
[assets] update readme (#8110)
hoshi-hiyouga
2025-05-20 02:44:18 +08:00 -
9b5baa97f0
[data] qwen3 fixes (#8109)
hoshi-hiyouga
2025-05-20 02:00:30 +08:00 -
45030ff803
[model] switch to gptqmodel (#8108)
hoshi-hiyouga
2025-05-19 22:25:40 +08:00 -
bc7f00f2c7
[model] update rope kwargs for yarn (#8101)
piamo
2025-05-19 20:07:54 +08:00 -
beae231af6
[doc] add no build isolation (#8103)
hoshi-hiyouga
2025-05-19 19:25:13 +08:00 -
a0b4b91577
[trainer] fix KeyError at end of pretrain (#8099)
Ma, Xiaochen
2025-05-19 18:01:26 +08:00 -
90492f3582
[misc] fix cli (#8095)
Biao Wang
2025-05-19 17:59:39 +08:00 -
ab41f7956c
[infer] support lora adapter for SGLang backend (#8067)
Saiya
2025-05-16 23:33:47 +08:00 -
52b23f9e56
[data] add forward compatibility for video_utils in Transformers 4.52.0 (#8077)
Kingsley
2025-05-16 17:41:04 +08:00 -
a9aa392ba4
[data] support loading folder from remote (#8078)
Eric Tang
2025-05-16 00:35:38 -07:00 -
0b773234e5
[infer] Modify vllm_infer.py to batch preprocess to avoid too much files opened error (#8051)
Shawn Tao
2025-05-15 10:54:35 +08:00 -
712c57f3b4
[assets] update windows installation (#8042)
hoshi-hiyouga
2025-05-13 17:01:56 +08:00 -
dc080399c6
[model] add seed coder and qwen3 quant models (#8039)
hoshi-hiyouga
2025-05-13 15:59:55 +08:00 -
68fc068cab
[data] fix kimi vl template (#8015)
hoshi-hiyouga
2025-05-11 20:45:19 +08:00 -
9620825892
[scripts] add video params for vllm infer (#7992)
Kingsley
2025-05-09 21:16:52 +08:00 -
26cbb03a5f
[data] Avoid repetitive tool description warp (#8000)
yunhao-tech
2025-05-09 21:16:37 +08:00 -
5f4b793e04
[docs] add GraphGen (#7974)
tpoisonooo
2025-05-07 18:23:11 +08:00 -
994ab6424a
[misc] update liger kernel patch (#7966)
hoshi-hiyouga
2025-05-06 20:32:16 +02:00 -
aa9ed4db59
[example] update examples (#7964)
hoshi-hiyouga
2025-05-06 17:24:25 +02:00 -
ef86a53063
[model] add mimo7b (#7946)
Kingsley
2025-05-06 23:10:30 +08:00 -
bf0286e1e3
[misc] fix qwen2 omni (#7962)
hoshi-hiyouga
2025-05-06 15:39:13 +02:00 -
ce7032e1b3
[model] add qwen2 omni 3b (#7945)
hoshi-hiyouga
2025-05-03 16:36:51 +08:00 -
5763017cea
[assets] Warp Support README Update (#7887)
Eric Chen
2025-05-01 12:08:48 -04:00 -
13b05e74f1
[hparam] add enable think argument (#7928)
hoshi-hiyouga
2025-04-30 17:21:30 +08:00 -
c566e39b7d
[data] fix base plugin (#7924)
hoshi-hiyouga
2025-04-30 16:28:05 +08:00 -
052ca871bd
[data] optimize qwen3 loss computation (#7923)
hoshi-hiyouga
2025-04-30 16:18:00 +08:00 -
73198a6645
[misc] fix uv (#7913)
hoshi-hiyouga
2025-04-30 07:45:03 +08:00 -
d4ee44bdef
[data] add eval_on_each_dataset arg (#7912)
hoshi-hiyouga
2025-04-30 06:56:43 +08:00 -
6d2cde43e7
[data] replace eos token for base models (#7911)
hoshi-hiyouga
2025-04-30 06:52:28 +08:00 -
11295cdea0
[data] improve mm plugin (#7910)
hoshi-hiyouga
2025-04-30 06:34:28 +08:00 -
98f23c6584
[model] add qwen3 (#7885)
hoshi-hiyouga
2025-04-29 09:34:05 +08:00 -
db9559456c
[data] fix qwen2.5 omni template (#7883)
Kingsley
2025-04-29 00:58:23 +08:00 -
3ae5da2a04
[model] fix dsv3 leaf node (#7879)
hoshi-hiyouga
2025-04-28 18:11:09 +08:00 -
d173cb50f5
[data] fix qwen2 omni plugin (#7875)
hoshi-hiyouga
2025-04-28 14:22:41 +08:00 -
df27d7e48a
[trainer] make projector trainable in freeze training (#7872)
zhaop-l
2025-04-28 13:19:37 +08:00 -
bb5b83352b
[data] fix minicpmo vllm infer (#7870)
hoshi-hiyouga
2025-04-28 01:59:53 +08:00 -
1157f4e246
fix attn patch for kimivl (#7867)
Kingsley
2025-04-27 23:12:28 +08:00 -
ef03832cd4
[ray] add storage filesystem to ray config (#7854)
Eric Tang
2025-04-27 07:12:40 -07:00 -
2233b739fa
[model] fix vit gradient checkpointing (#7830)
hoshi-hiyouga
2025-04-23 22:48:48 +08:00 -
091d2539e8
Merge commit from fork
hoshi-hiyouga
2025-04-23 16:38:27 +08:00 -
c1a7f2ebb2
[model] fix moe zero3 (#7826)
hoshi-hiyouga
2025-04-23 15:30:49 +08:00 -
fa0eb91f1f
[data] fix internvl plugin (#7817)
Kingsley
2025-04-23 00:58:22 +08:00 -
49f9ed0232
[assets] update model readme (#7804)
hoshi-hiyouga
2025-04-22 16:43:56 +08:00 -
2a564c25d1
[model] add arch check for InternVL (#7803)
Kingsley
2025-04-22 16:38:05 +08:00