mirror of
https://github.com/hiyouga/LLaMA-Factory.git
synced 2025-12-27 01:00:34 +08:00
Commit Graph
Select branches
Hide Pull Requests
hiyouga/misc
main
#1
#1059
#11
#1186
#119
#1252
#1326
#1348
#1353
#1375
#1436
#145
#1454
#1486
#1525
#1544
#1553
#156
#158
#1624
#1689
#1690
#1695
#1699
#1700
#171
#179
#1796
#1800
#1802
#1861
#1864
#1868
#1918
#1932
#1946
#1947
#1953
#1954
#200
#2007
#2019
#2100
#2117
#213
#2163
#2194
#22
#2201
#221
#2226
#2262
#2264
#2266
#2283
#2285
#2319
#2350
#2411
#2423
#2426
#2435
#2445
#2462
#2469
#2474
#2514
#2519
#2525
#2531
#2568
#2570
#2572
#2575
#258
#26
#2608
#2683
#2689
#2730
#2739
#2743
#2746
#2764
#2766
#2830
#2845
#2849
#2872
#2903
#2905
#2919
#2944
#2945
#2963
#2967
#2993
#3004
#3046
#3053
#3057
#306
#3066
#307
#3083
#3103
#3103
#3158
#3159
#3160
#3161
#3201
#3226
#3254
#3256
#3261
#3263
#3267
#3275
#3276
#3287
#3288
#3291
#33
#3332
#3338
#3357
#3371
#3383
#3394
#3412
#3423
#3435
#3449
#3450
#3454
#3471
#3484
#3487
#3490
#3498
#3511
#3513
#3527
#3532
#356
#3578
#3584
#3588
#3596
#3601
#3604
#3651
#3654
#3655
#3661
#3683
#3692
#3702
#3741
#3746
#3748
#3755
#3756
#3785
#3792
#3794
#3799
#3804
#3812
#382
#3829
#3835
#387
#3876
#3921
#3923
#3925
#3930
#3941
#395
#3958
#3976
#3987
#4003
#4006
#4007
#4009
#4011
#4015
#4029
#4043
#4045
#4053
#4066
#4080
#4082
#4083
#4098
#4099
#4119
#4136
#4166
#4167
#4173
#4191
#4204
#4224
#4227
#4234
#4237
#4245
#4246
#4307
#4309
#4314
#4321
#4329
#4334
#434
#4342
#4347
#4348
#4352
#4355
#4377
#4382
#4409
#4417
#4445
#4446
#4461
#451
#4544
#4561
#4580
#4589
#4590
#4636
#4651
#4662
#4663
#4673
#4680
#4680
#4686
#4687
#4691
#4692
#4700
#4706
#4724
#4733
#4746
#4781
#479
#4793
#4804
#4821
#4822
#4877
#4878
#4892
#4939
#4950
#4957
#4961
#4970
#4995
#4996
#5010
#5019
#5032
#5037
#5068
#5072
#5095
#51
#5109
#511
#5111
#5112
#5115
#5118
#5156
#516
#5163
#5170
#5185
#5188
#5193
#5208
#5226
#5230
#5233
#5237
#5242
#5278
#5290
#5317
#5323
#5326
#5339
#5343
#5346
#5365
#5372
#5388
#5405
#5424
#5427
#5438
#5445
#5451
#5458
#5473
#5475
#5480
#5483
#5486
#5507
#5522
#5532
#5533
#5536
#5546
#5547
#5555
#5563
#5574
#5580
#5581
#5585
#5606
#5615
#5639
#5642
#5653
#5665
#5673
#5746
#5752
#5752
#5758
#5781
#5799
#5801
#5816
#5819
#5839
#5852
#5856
#5857
#5871
#5873
#5880
#5889
#5895
#5897
#5901
#5906
#5907
#5909
#5910
#5912
#5913
#5914
#5920
#5922
#5924
#5926
#5927
#5929
#5933
#596
#5970
#5971
#5973
#598
#5982
#5984
#599
#5990
#5993
#6010
#6022
#6046
#6052
#6065
#6078
#6083
#6098
#6103
#6120
#6121
#6123
#6124
#6125
#6126
#6127
#6128
#6129
#6137
#6138
#6140
#6141
#6151
#6152
#6156
#6157
#6160
#6170
#6175
#619
#6190
#6192
#6204
#6224
#6226
#6233
#6238
#6242
#6246
#6251
#6253
#6265
#6275
#629
#6310
#6313
#6317
#6334
#6359
#6362
#6363
#6364
#6365
#6367
#6368
#6369
#6379
#6384
#6388
#6395
#6396
#6401
#6416
#6418
#6420
#6426
#6430
#644
#6441
#6443
#6444
#6457
#6462
#6465
#6471
#6478
#6483
#6492
#6493
#6498
#6503
#6506
#651
#6512
#6513
#6514
#6515
#6524
#6527
#6528
#6542
#6547
#6564
#6565
#657
#6585
#6588
#6597
#6598
#6600
#6601
#6617
#6620
#6624
#6625
#6626
#6628
#6629
#6631
#6632
#6637
#6640
#6641
#6642
#6645
#6648
#6653
#6657
#6684
#6688
#6689
#6690
#6691
#6692
#6693
#6698
#6701
#6710
#6722
#6753
#6767
#6771
#6778
#6779
#678
#6786
#6787
#6788
#6796
#6797
#68
#6801
#6810
#6814
#6830
#6831
#6834
#6843
#6854
#6855
#6857
#6865
#6866
#6868
#6874
#6879
#6890
#6892
#6895
#6896
#6899
#6901
#6902
#6903
#6904
#6905
#6906
#6907
#6913
#6916
#6917
#6918
#6920
#6930
#6931
#6944
#6946
#6954
#6963
#6972
#6975
#6976
#6977
#6982
#6983
#6985
#6998
#7019
#7051
#7053
#7054
#7058
#7060
#7061
#7067
#7074
#7077
#7089
#7106
#7108
#7117
#7120
#7126
#7142
#7143
#7161
#7166
#7174
#7176
#7179
#7181
#7183
#7190
#7193
#7201
#7204
#7205
#7206
#7207
#7209
#7211
#7219
#7229
#7230
#7231
#7235
#7241
#7242
#7244
#7247
#7253
#7254
#7255
#7256
#7257
#7258
#7259
#7264
#7272
#7273
#7275
#7277
#7278
#7287
#7288
#7294
#7295
#7304
#7308
#7312
#7317
#7318
#7330
#7332
#7338
#7340
#7343
#7345
#7347
#7349
#7351
#7361
#7378
#7381
#7395
#7404
#741
#7413
#7419
#7420
#7432
#7436
#7437
#7440
#7441
#7442
#7445
#7448
#7449
#7453
#7455
#7456
#7462
#7466
#7469
#7471
#7481
#7500
#7505
#7509
#7519
#7523
#7530
#7537
#7546
#7553
#7564
#7566
#7567
#7570
#7573
#7576
#7578
#7594
#7609
#7611
#7612
#7623
#7625
#7635
#7638
#7639
#7644
#7645
#7646
#7647
#7654
#7655
#7657
#766
#7660
#7674
#7686
#7694
#7695
#7700
#7704
#7714
#7715
#7719
#7724
#7725
#7728
#7732
#7739
#7740
#7744
#7745
#7746
#7747
#7748
#7749
#7754
#7765
#7786
#7792
#7793
#7794
#7795
#7797
#7801
#7803
#7804
#7808
#7810
#7817
#7826
#7830
#7840
#7854
#786
#7867
#7870
#7872
#7875
#7879
#7883
#7885
#7887
#7910
#7911
#7912
#7913
#7923
#7924
#7928
#7945
#7946
#7958
#7962
#7964
#7966
#7974
#7988
#7992
#8000
#8015
#8039
#8042
#8050
#8051
#8057
#8067
#8077
#8078
#8095
#8099
#8101
#8103
#8108
#8109
#8110
#8124
#8125
#8128
#8129
#8130
#8156
#8159
#8161
#8162
#8167
#8176
#8178
#8179
#8180
#8181
#8183
#8195
#8196
#8197
#8201
#8202
#8203
#8215
#8220
#8227
#8235
#8245
#8248
#8249
#8258
#8264
#8270
#8276
#8286
#8288
#8291
#8293
#8298
#83
#8303
#8311
#8312
#8314
#8325
#8327
#8328
#8333
#8335
#8348
#8362
#8367
#8385
#8386
#8387
#8388
#8389
#8390
#8396
#84
#8403
#8414
#8421
#8422
#8423
#8432
#8433
#8438
#844
#8441
#8448
#8449
#8457
#8458
#8460
#8461
#8462
#8480
#8481
#8505
#8509
#8517
#8519
#8529
#8530
#8532
#8535
#8538
#8539
#8542
#8543
#8546
#8547
#8548
#8554
#8556
#8557
#8559
#8564
#8565
#8567
#8569
#8571
#8587
#86
#8614
#8623
#8627
#8637
#8651
#8680
#8685
#8689
#8721
#8722
#8731
#8736
#8739
#8750
#8752
#8762
#8770
#8773
#8774
#8776
#8783
#8784
#8787
#8788
#8795
#8812
#8813
#8818
#8823
#8826
#8827
#8829
#8839
#8842
#8845
#8851
#8861
#8863
#8866
#8869
#8875
#8876
#8887
#8899
#8906
#8917
#8930
#8960
#8961
#8962
#8970
#8972
#8975
#8976
#8978
#8985
#8992
#900
#9000
#9008
#9018
#9022
#9024
#9028
#9029
#9046
#9071
#9077
#9078
#9086
#9086
#9112
#9117
#9124
#9128
#9129
#9130
#9137
#9143
#9165
#9176
#9177
#9183
#9188
#9196
#9198
#9204
#9215
#9217
#9219
#9221
#9223
#9224
#9225
#9226
#9227
#9229
#9230
#9231
#9232
#9236
#9237
#9243
#9248
#9249
#9259
#9262
#9263
#9265
#9267
#9274
#9275
#9284
#9293
#9296
#9297
#9299
#9316
#9333
#9337
#9337
#9343
#9351
#9351
#9352
#9354
#9360
#9368
#9370
#9370
#9388
#9391
#9395
#9397
#9399
#9400
#9405
#9406
#9407
#9409
#9449
#9463
#9467
#9477
#9484
#9485
#9486
#9492
#9501
#9504
#9505
#9509
#9511
#9514
#9518
#9520
#9521
#9532
#9536
#9539
#9541
#9543
#9544
#9547
#9549
#9549
#9552
#9557
#9569
#9575
#9579
#9582
#9586
#9587
#9588
#9593
#9595
#9602
#9604
#9607
#9608
#9610
#9611
#9612
#9613
#9615
#9615
#9616
#9617
#9617
#9619
#9621
#9624
#9626
#9627
#9630
#9630
#9632
#9633
#9634
#9636
#9637
#9638
#9640
#9643
#9645
#9649
#9651
#9652
#9654
#9661
#9665
#9669
#9669
#9670
#9673
#9675
#9676
#9676
#975
v0.0.9
v0.1.0
v0.1.1
v0.1.2
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.2.0
v0.2.1
v0.2.2
v0.3.0
v0.3.2
v0.3.3
v0.4.0
v0.5.0
v0.5.2
v0.5.3
v0.6.0
v0.6.1
v0.6.2
v0.6.3
v0.7.0
v0.7.1
v0.8.0
v0.8.1
v0.8.2
v0.8.3
v0.9.0
v0.9.1
v0.9.2
v0.9.3
Select branches
Hide Pull Requests
hiyouga/misc
main
#1
#1059
#11
#1186
#119
#1252
#1326
#1348
#1353
#1375
#1436
#145
#1454
#1486
#1525
#1544
#1553
#156
#158
#1624
#1689
#1690
#1695
#1699
#1700
#171
#179
#1796
#1800
#1802
#1861
#1864
#1868
#1918
#1932
#1946
#1947
#1953
#1954
#200
#2007
#2019
#2100
#2117
#213
#2163
#2194
#22
#2201
#221
#2226
#2262
#2264
#2266
#2283
#2285
#2319
#2350
#2411
#2423
#2426
#2435
#2445
#2462
#2469
#2474
#2514
#2519
#2525
#2531
#2568
#2570
#2572
#2575
#258
#26
#2608
#2683
#2689
#2730
#2739
#2743
#2746
#2764
#2766
#2830
#2845
#2849
#2872
#2903
#2905
#2919
#2944
#2945
#2963
#2967
#2993
#3004
#3046
#3053
#3057
#306
#3066
#307
#3083
#3103
#3103
#3158
#3159
#3160
#3161
#3201
#3226
#3254
#3256
#3261
#3263
#3267
#3275
#3276
#3287
#3288
#3291
#33
#3332
#3338
#3357
#3371
#3383
#3394
#3412
#3423
#3435
#3449
#3450
#3454
#3471
#3484
#3487
#3490
#3498
#3511
#3513
#3527
#3532
#356
#3578
#3584
#3588
#3596
#3601
#3604
#3651
#3654
#3655
#3661
#3683
#3692
#3702
#3741
#3746
#3748
#3755
#3756
#3785
#3792
#3794
#3799
#3804
#3812
#382
#3829
#3835
#387
#3876
#3921
#3923
#3925
#3930
#3941
#395
#3958
#3976
#3987
#4003
#4006
#4007
#4009
#4011
#4015
#4029
#4043
#4045
#4053
#4066
#4080
#4082
#4083
#4098
#4099
#4119
#4136
#4166
#4167
#4173
#4191
#4204
#4224
#4227
#4234
#4237
#4245
#4246
#4307
#4309
#4314
#4321
#4329
#4334
#434
#4342
#4347
#4348
#4352
#4355
#4377
#4382
#4409
#4417
#4445
#4446
#4461
#451
#4544
#4561
#4580
#4589
#4590
#4636
#4651
#4662
#4663
#4673
#4680
#4680
#4686
#4687
#4691
#4692
#4700
#4706
#4724
#4733
#4746
#4781
#479
#4793
#4804
#4821
#4822
#4877
#4878
#4892
#4939
#4950
#4957
#4961
#4970
#4995
#4996
#5010
#5019
#5032
#5037
#5068
#5072
#5095
#51
#5109
#511
#5111
#5112
#5115
#5118
#5156
#516
#5163
#5170
#5185
#5188
#5193
#5208
#5226
#5230
#5233
#5237
#5242
#5278
#5290
#5317
#5323
#5326
#5339
#5343
#5346
#5365
#5372
#5388
#5405
#5424
#5427
#5438
#5445
#5451
#5458
#5473
#5475
#5480
#5483
#5486
#5507
#5522
#5532
#5533
#5536
#5546
#5547
#5555
#5563
#5574
#5580
#5581
#5585
#5606
#5615
#5639
#5642
#5653
#5665
#5673
#5746
#5752
#5752
#5758
#5781
#5799
#5801
#5816
#5819
#5839
#5852
#5856
#5857
#5871
#5873
#5880
#5889
#5895
#5897
#5901
#5906
#5907
#5909
#5910
#5912
#5913
#5914
#5920
#5922
#5924
#5926
#5927
#5929
#5933
#596
#5970
#5971
#5973
#598
#5982
#5984
#599
#5990
#5993
#6010
#6022
#6046
#6052
#6065
#6078
#6083
#6098
#6103
#6120
#6121
#6123
#6124
#6125
#6126
#6127
#6128
#6129
#6137
#6138
#6140
#6141
#6151
#6152
#6156
#6157
#6160
#6170
#6175
#619
#6190
#6192
#6204
#6224
#6226
#6233
#6238
#6242
#6246
#6251
#6253
#6265
#6275
#629
#6310
#6313
#6317
#6334
#6359
#6362
#6363
#6364
#6365
#6367
#6368
#6369
#6379
#6384
#6388
#6395
#6396
#6401
#6416
#6418
#6420
#6426
#6430
#644
#6441
#6443
#6444
#6457
#6462
#6465
#6471
#6478
#6483
#6492
#6493
#6498
#6503
#6506
#651
#6512
#6513
#6514
#6515
#6524
#6527
#6528
#6542
#6547
#6564
#6565
#657
#6585
#6588
#6597
#6598
#6600
#6601
#6617
#6620
#6624
#6625
#6626
#6628
#6629
#6631
#6632
#6637
#6640
#6641
#6642
#6645
#6648
#6653
#6657
#6684
#6688
#6689
#6690
#6691
#6692
#6693
#6698
#6701
#6710
#6722
#6753
#6767
#6771
#6778
#6779
#678
#6786
#6787
#6788
#6796
#6797
#68
#6801
#6810
#6814
#6830
#6831
#6834
#6843
#6854
#6855
#6857
#6865
#6866
#6868
#6874
#6879
#6890
#6892
#6895
#6896
#6899
#6901
#6902
#6903
#6904
#6905
#6906
#6907
#6913
#6916
#6917
#6918
#6920
#6930
#6931
#6944
#6946
#6954
#6963
#6972
#6975
#6976
#6977
#6982
#6983
#6985
#6998
#7019
#7051
#7053
#7054
#7058
#7060
#7061
#7067
#7074
#7077
#7089
#7106
#7108
#7117
#7120
#7126
#7142
#7143
#7161
#7166
#7174
#7176
#7179
#7181
#7183
#7190
#7193
#7201
#7204
#7205
#7206
#7207
#7209
#7211
#7219
#7229
#7230
#7231
#7235
#7241
#7242
#7244
#7247
#7253
#7254
#7255
#7256
#7257
#7258
#7259
#7264
#7272
#7273
#7275
#7277
#7278
#7287
#7288
#7294
#7295
#7304
#7308
#7312
#7317
#7318
#7330
#7332
#7338
#7340
#7343
#7345
#7347
#7349
#7351
#7361
#7378
#7381
#7395
#7404
#741
#7413
#7419
#7420
#7432
#7436
#7437
#7440
#7441
#7442
#7445
#7448
#7449
#7453
#7455
#7456
#7462
#7466
#7469
#7471
#7481
#7500
#7505
#7509
#7519
#7523
#7530
#7537
#7546
#7553
#7564
#7566
#7567
#7570
#7573
#7576
#7578
#7594
#7609
#7611
#7612
#7623
#7625
#7635
#7638
#7639
#7644
#7645
#7646
#7647
#7654
#7655
#7657
#766
#7660
#7674
#7686
#7694
#7695
#7700
#7704
#7714
#7715
#7719
#7724
#7725
#7728
#7732
#7739
#7740
#7744
#7745
#7746
#7747
#7748
#7749
#7754
#7765
#7786
#7792
#7793
#7794
#7795
#7797
#7801
#7803
#7804
#7808
#7810
#7817
#7826
#7830
#7840
#7854
#786
#7867
#7870
#7872
#7875
#7879
#7883
#7885
#7887
#7910
#7911
#7912
#7913
#7923
#7924
#7928
#7945
#7946
#7958
#7962
#7964
#7966
#7974
#7988
#7992
#8000
#8015
#8039
#8042
#8050
#8051
#8057
#8067
#8077
#8078
#8095
#8099
#8101
#8103
#8108
#8109
#8110
#8124
#8125
#8128
#8129
#8130
#8156
#8159
#8161
#8162
#8167
#8176
#8178
#8179
#8180
#8181
#8183
#8195
#8196
#8197
#8201
#8202
#8203
#8215
#8220
#8227
#8235
#8245
#8248
#8249
#8258
#8264
#8270
#8276
#8286
#8288
#8291
#8293
#8298
#83
#8303
#8311
#8312
#8314
#8325
#8327
#8328
#8333
#8335
#8348
#8362
#8367
#8385
#8386
#8387
#8388
#8389
#8390
#8396
#84
#8403
#8414
#8421
#8422
#8423
#8432
#8433
#8438
#844
#8441
#8448
#8449
#8457
#8458
#8460
#8461
#8462
#8480
#8481
#8505
#8509
#8517
#8519
#8529
#8530
#8532
#8535
#8538
#8539
#8542
#8543
#8546
#8547
#8548
#8554
#8556
#8557
#8559
#8564
#8565
#8567
#8569
#8571
#8587
#86
#8614
#8623
#8627
#8637
#8651
#8680
#8685
#8689
#8721
#8722
#8731
#8736
#8739
#8750
#8752
#8762
#8770
#8773
#8774
#8776
#8783
#8784
#8787
#8788
#8795
#8812
#8813
#8818
#8823
#8826
#8827
#8829
#8839
#8842
#8845
#8851
#8861
#8863
#8866
#8869
#8875
#8876
#8887
#8899
#8906
#8917
#8930
#8960
#8961
#8962
#8970
#8972
#8975
#8976
#8978
#8985
#8992
#900
#9000
#9008
#9018
#9022
#9024
#9028
#9029
#9046
#9071
#9077
#9078
#9086
#9086
#9112
#9117
#9124
#9128
#9129
#9130
#9137
#9143
#9165
#9176
#9177
#9183
#9188
#9196
#9198
#9204
#9215
#9217
#9219
#9221
#9223
#9224
#9225
#9226
#9227
#9229
#9230
#9231
#9232
#9236
#9237
#9243
#9248
#9249
#9259
#9262
#9263
#9265
#9267
#9274
#9275
#9284
#9293
#9296
#9297
#9299
#9316
#9333
#9337
#9337
#9343
#9351
#9351
#9352
#9354
#9360
#9368
#9370
#9370
#9388
#9391
#9395
#9397
#9399
#9400
#9405
#9406
#9407
#9409
#9449
#9463
#9467
#9477
#9484
#9485
#9486
#9492
#9501
#9504
#9505
#9509
#9511
#9514
#9518
#9520
#9521
#9532
#9536
#9539
#9541
#9543
#9544
#9547
#9549
#9549
#9552
#9557
#9569
#9575
#9579
#9582
#9586
#9587
#9588
#9593
#9595
#9602
#9604
#9607
#9608
#9610
#9611
#9612
#9613
#9615
#9615
#9616
#9617
#9617
#9619
#9621
#9624
#9626
#9627
#9630
#9630
#9632
#9633
#9634
#9636
#9637
#9638
#9640
#9643
#9645
#9649
#9651
#9652
#9654
#9661
#9665
#9669
#9669
#9670
#9673
#9675
#9676
#9676
#975
v0.0.9
v0.1.0
v0.1.1
v0.1.2
v0.1.3
v0.1.4
v0.1.5
v0.1.6
v0.1.7
v0.1.8
v0.2.0
v0.2.1
v0.2.2
v0.3.0
v0.3.2
v0.3.3
v0.4.0
v0.5.0
v0.5.2
v0.5.3
v0.6.0
v0.6.1
v0.6.2
v0.6.3
v0.7.0
v0.7.1
v0.8.0
v0.8.1
v0.8.2
v0.8.3
v0.9.0
v0.9.1
v0.9.2
v0.9.3
-
4d8c8b2019
fix
hiyouga/misc
hiyouga
2025-12-27 08:49:43 +08:00 -
6cdbfa980e
fix
hiyouga
2025-12-27 08:46:17 +08:00 -
5eea54f888
fix
hiyouga
2025-12-27 08:18:20 +08:00 -
f69c8efd27
fix
hiyouga
2025-12-27 08:15:02 +08:00 -
e374b615f2
fix
hiyouga
2025-12-27 08:08:57 +08:00 -
d7201fd6ae
fix
hiyouga
2025-12-27 08:06:42 +08:00 -
42b436a4fc
fix
hiyouga
2025-12-27 08:05:25 +08:00 -
5f3e5eb5f8
fix
hiyouga
2025-12-27 07:53:52 +08:00 -
6de0c3da9b
fix
hiyouga
2025-12-27 07:50:18 +08:00 -
1622bad7d4
fix
hiyouga
2025-12-27 07:47:43 +08:00 -
c439924e74
fix
hiyouga
2025-12-27 07:38:10 +08:00 -
a24d8cc78c
fix
hiyouga
2025-12-27 07:36:30 +08:00 -
66e6aa8f37
fixup
hiyouga
2025-12-27 07:35:18 +08:00 -
a1b1931b4a
[breaking] migrate from setuptools to uv (#9673)
main
Copilot
2025-12-26 22:47:23 +08:00 -
3c17f2722c
[model] Update ernie_vl to adapt new version (#9665)
Xunpeng Xiao
2025-12-26 19:57:49 +08:00 -
a882e2d5fc
[assets] Add GitHub Copilot instructions for repository (#9675)
Copilot
2025-12-26 17:32:48 +08:00 -
a754604c11
[misc] fix accelerator (#9661)
Yaowei Zheng
2025-12-25 02:11:04 +08:00 -
6a2eafbae3
[feat] Models trained and inferred with Mxfp4 are dequantized by default (#9652)
Xunpeng Xiao
2025-12-24 00:26:40 +08:00 -
84485406b7
[ci] disable pip cache for ci (#9654)
Yaowei Zheng
2025-12-23 18:37:40 +08:00 -
1c8a42d2f8
[v1&WIP] dataloader init (#9645)
Kingsley
2025-12-23 16:29:47 +08:00 -
7901b2f32e
[model] efficient tuning for gpt-oss (#9354)
thulyubh22
2025-12-23 16:28:38 +08:00 -
1f1f5a7d1b
[ci] remove docker cache (#9640)
Yaowei Zheng
2025-12-22 01:03:10 +08:00 -
6ef9854713
[misc] fix cache & pin transformers to 4.57.1 (#9638)
Yaowei Zheng
2025-12-22 00:20:55 +08:00 -
4923f52a28
[model] support MiMo-V2-Flash model (#9637)
Hertz
2025-12-21 14:38:18 +08:00 -
0894b4f37e
[misc] lint (#9636)
Yaowei Zheng
2025-12-20 16:19:39 +08:00 -
b0d49e137f
[misc] Support split eval_dataset when explict set "predict_with_generate" (#9604)
ZIYI ZENG
2025-12-20 01:46:00 +08:00 -
ddd7dcc722
[data] Fix the video frame sampling issue #9620 (#9634)
Xunpeng Xiao
2025-12-19 18:36:31 +08:00 -
5204cd2bca
[misc] add version check for moe (#9633)
浮梦
2025-12-19 14:57:37 +08:00 -
8c74dca76a
[feat] Models trained and inferred with FP8 are dequantized by default (#9627)
Xunpeng Xiao
2025-12-18 22:54:35 +08:00 -
e8deda53a1
[example] add Qwen3 series examples (#9624)
xvxuopop
2025-12-18 21:27:00 +08:00 -
a769fb94b9
[feat] support ktransformers for dpo (#9621)
mrhaoxx
2025-12-18 21:26:25 +08:00 -
964569751f
[kt] refactor ktransformers integration (#9632)
mrhaoxx
2025-12-18 21:26:04 +08:00 -
9fd4b094d4
[model] support VibeThinker models (#9616)
Hertz
2025-12-16 21:50:46 +08:00 -
18c21bce5a
[test] add allreduce test on npu (#9619)
浮梦
2025-12-16 21:33:30 +08:00 -
a0179772ab
[example] add deepspeed autotp config and example (#9602)
sunyi0505
2025-12-15 15:15:26 +08:00 -
aeda079014
[v1] model loader (#9613)
Yaowei Zheng
2025-12-14 11:50:52 +08:00 -
fdd24276ed
[feat] support new function call value (#9610)
Xunpeng Xiao
2025-12-14 00:20:33 +08:00 -
110d21713e
[v1] add dp & mp mesh (#9611)
Yaowei Zheng
2025-12-13 01:44:28 +08:00 -
203069e11c
[v1] add accelerator (#9607)
Yaowei Zheng
2025-12-12 19:22:06 +08:00 -
4fd94141a4
[model] Add Ministral3 (#9582)
tangefly
2025-12-10 15:57:24 +08:00 -
22d6ac29d5
[model] Rename GLMV template (#9595)
Kingsley
2025-12-10 13:27:47 +08:00 -
cff4483392
[config] Fix RoPE scaling patch for resuming from a scaled model (#9588)
DoubleWheat
2025-12-09 20:37:37 +08:00 -
5d56817e2b
[misc] lint (#9593)
Yaowei Zheng
2025-12-09 18:00:35 +08:00 -
1bbb461f76
[assets] update readme (#9587)
Yaowei Zheng
2025-12-09 12:22:54 +08:00 -
c1f5f8fff6
[model] support GLM4.6v (#9586)
Hertz
2025-12-09 11:06:42 +08:00 -
5744f1ea94
[v1] add models & accelerator (#9579)
Yaowei Zheng
2025-12-08 02:30:25 +08:00 -
739954910a
[deps] Update for Transformers v5 (#9569)
tangefly
2025-12-08 01:13:32 +08:00 -
109162dc56
[fix] fix the issue when using fsdp2 with gradient checkpointing. (#9541)
xvxuopop
2025-12-06 16:04:51 +08:00 -
165f3f073a
[examples] add fsdp config for mutiple nodes (#9575)
jiaqiw09
2025-12-05 23:22:48 +08:00 -
efb13b7483
[V1] Refactor ascend MoE kernel patch logic & Support Qwen3-MoE (#9557)
jiaqiw09
2025-12-02 00:22:03 +08:00 -
e43a972b25
[test] add npu test yaml and add ascend a3 docker file (#9547)
Username_Full
2025-11-30 09:37:08 +08:00 -
22be45c78c
[misc] fix omni thinker load (#9552)
Kingsley
2025-11-30 09:36:36 +08:00 -
d1f585f80a
[test] update test cmd (#9544)
浮梦
2025-11-27 17:59:42 +08:00 -
955396e8a5
[example] correct the parameter errors in the examples file. (#9543)
xvxuopop
2025-11-27 17:38:38 +08:00 -
231756a5bf
[chat] fix the error when the vLLM version is greater than 0.10.0 (#9539)
xvxuopop
2025-11-27 02:14:53 +08:00 -
2c4fb3c97e
[v1] Support fused moe kernel for qwen3vlmoe model. (#9532)
xvxuopop
2025-11-27 02:13:33 +08:00 -
2b6f16f261
[model] temporarily support npu fused options on v0, powered by v1 kernels (#9520)
浮梦
2025-11-27 02:08:36 +08:00 -
f17efde693
[v1] support automatic discovery of registered kernels. (#9509)
浮梦
2025-11-27 01:47:22 +08:00 -
591fc9ed02
[model] support ERNIE-4.5-VL Models (#9521)
Hertz
2025-11-24 16:48:06 +08:00 -
3140c242f0
[assets] add README with KT+llamafactory (#9514)
Peilin Li
2025-11-19 16:50:45 +08:00 -
887c562d60
[example] Add KTransformers Qwen3MoE example (#9511)
Peilin Li
2025-11-19 00:53:28 +08:00 -
9779b1f361
[misc] fix typos in some files (#9505)
Edge-Seven
2025-11-18 19:36:01 +07:00 -
45f0437a14
[v1] Add support for ShareGPT format. (#9486)
Yinlei Sun
2025-11-18 13:44:08 +08:00 -
d4e120423d
[data] fix qwen3omni moe model (#9501)
浮梦
2025-11-18 13:43:22 +08:00 -
10a446e373
[model] ktransformers qwen3 support (#9485)
Pory
2025-11-13 20:09:44 +08:00 -
0aa4a051af
[test] support slow skip and device skip in Uts (#9484)
jiaqiw09
2025-11-13 20:08:22 +08:00 -
8173a88a26
[assets] update readme (#9477)
Yaowei Zheng
2025-11-12 16:15:41 +08:00 -
fef86fa7fe
[data] fix qwen3omni audio length calculation (#9467)
Kingsley
2025-11-12 10:37:15 +08:00 -
5afa851f71
[misc] Modify pip install command for huggingface_hub (#9463)
taohongsheng
2025-11-10 23:04:00 +08:00 -
a711bce664
[data] add openai format (#9449)
MyungHa Kwon
2025-11-06 21:10:20 +09:00 -
bd24350cbf
[v1] add pair data converter (#9360)
魅影
2025-11-06 14:05:58 +08:00 -
bd30c0003b
[train] fix denominator of ga in ksft loss (#9409)
Peilin Li
2025-11-05 20:53:23 +08:00 -
8edd2622ce
[docker] update npu dockerfile (#9407)
魅影
2025-11-05 18:28:32 +08:00 -
eaf963f67f
[model] update kt code (#9406)
Yaowei Zheng
2025-11-05 15:27:22 +08:00 -
56f45e826f
[train] fix MPO re-weight (#9405)
Kingsley
2025-11-04 21:10:41 +08:00 -
14abb75126
[model] enable using FA in npu (#9397)
魅影
2025-11-04 19:32:30 +08:00 -
5a9939050e
[model] add deepstack_merger_list to Qwen3-VL vision_model_keys (#9399)
한송민
2025-11-04 20:27:34 +09:00 -
934b3084ee
[train] KTransformers SFT as backend engine for LLaMA-Factory (#9400)
Peilin Li
2025-11-04 15:54:12 +08:00 -
3ae15da9c0
[misc] lint code (#9395)
Yaowei Zheng
2025-11-03 22:08:59 +08:00 -
215580c77d
[data] fix mm pluigin for qwen omni video training (#9388)
魅影
2025-11-03 11:44:27 +08:00 -
767b344fb4
[model] remove npu sdpa patch (#9368)
魅影
2025-10-30 16:26:35 +08:00 -
3057db15c3
[readme] upd mcore readme (#9352)
Kingsley
2025-10-27 21:23:31 +08:00 -
13170577b2
[feat] support megatron-LM training by mcore_adapter (#9237)
Kingsley
2025-10-26 16:21:30 +08:00 -
129e918106
[data] Fix Qwen3VL plugin (#9297)
Xiaosu Zhu
2025-10-26 16:07:04 +08:00 -
9c0d033a15
[model] add qwen3vl 2b & 32b (#9343)
Yaowei Zheng
2025-10-24 13:22:36 +08:00 -
2a822178de
[deps] fix yanked packages (#9333)
Yaowei Zheng
2025-10-22 20:54:51 +08:00 -
b842457ef4
[ci] revert mac os ci setup (#9316)
Kingsley
2025-10-21 18:26:12 +08:00 -
2c6aded5d4
[v1] kernel plugin (#9274)
魅影
2025-10-18 18:02:14 +08:00 -
d9d67ba62d
[misc] fix import error (#9299)
Yaowei Zheng
2025-10-17 17:46:27 +08:00 -
a442fa90ad
[misc] fix import error (#9296)
Yaowei Zheng
2025-10-17 10:54:30 +08:00 -
8c341cbaae
[model] support hunyuan-mt model (#9284)
wyfdgg
2025-10-17 10:33:09 +08:00 -
47a7dc1698
[deps] upgrade vllm (#9293)
Yaowei Zheng
2025-10-16 23:20:26 +08:00 -
1037f63311
[model] add qwen3vl 4b + 8b (#9275)
Yaowei Zheng
2025-10-15 15:00:36 +08:00 -
c867e28093
[model] adds semantic initialization support for special tokens (#9267)
Ximing Xing
2025-10-14 17:00:48 +08:00 -
3dbca4b533
[data] add new reason tool calls demo data (#9249)
Peter-Hamster
2025-10-13 17:16:47 +08:00 -
9d1acbc191
[ci] fix ci (#9265)
Yaowei Zheng
2025-10-13 16:24:40 +08:00 -
52e46e162e
[v1] add data converter (#9263)
Yaowei Zheng
2025-10-13 15:54:47 +08:00 -
48974783da
[model]: add ernie4_5_moe support for DeepSpeed Zero3 training (#9262)
Jiayi Mao
2025-10-13 13:13:31 +08:00 -
575e4099df
[misc] add qwen bench script (#9259)
Yaowei Zheng
2025-10-13 11:45:25 +08:00 -
9687b71d3a
[v1] init data plugins (#9248)
Yaowei Zheng
2025-10-09 22:36:48 +08:00