Yaowei Zheng 
							
						 
					 
					
						
						
							
							
						
						
						
							
						
						
							af8437095a 
							
						 
					 
					
						
						
							
							[ci] Change macOS version ( #9229 )  
						
						 
						
						
						
						
					 
					
						2025-10-05 02:18:30 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Yaowei Zheng 
							
						 
					 
					
						
						
						
						
							
						
						
							6ffebe5ff7 
							
						 
					 
					
						
						
							
							[data] fix qwen omni plugin ( #9204 )  
						
						 
						
						... 
						
						
						
						Co-authored-by: kingsley <kingsleydodonow@gmail.com> 
						
						
					 
					
						2025-09-28 01:02:29 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								xvxuopop 
							
						 
					 
					
						
						
						
						
							
						
						
							0761a4448f 
							
						 
					 
					
						
						
							
							[model] add qwen3-vl/qwen3-omni ( #9196 )  
						
						 
						
						... 
						
						
						
						Co-authored-by: kingsley <kingsleydodonow@gmail.com> 
						
						
					 
					
						2025-09-27 01:21:47 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Kingsley 
							
						 
					 
					
						
						
						
						
							
						
						
							7e710c6d3e 
							
						 
					 
					
						
						
							
							[misc] update InternVL constants ( #9046 )  
						
						 
						
						
						
						
					 
					
						2025-08-29 13:30:28 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Yaowei Zheng 
							
						 
					 
					
						
						
						
						
							
						
						
							4dfad24902 
							
						 
					 
					
						
						
							
							[model] add gpt oss ( #8826 )  
						
						 
						
						
						
						
					 
					
						2025-08-06 05:56:46 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Yaowei Zheng 
							
						 
					 
					
						
						
						
						
							
						
						
							4b0ec83928 
							
						 
					 
					
						
						
							
							[deps] bump transformers to 4.49.0 ( #8564 )  
						
						 
						
						
						
						
					 
					
						2025-07-07 20:31:50 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Yaowei Zheng 
							
						 
					 
					
						
						
						
						
							
						
						
							906b31fd47 
							
						 
					 
					
						
						
							
							[assets] update readme ( #8529 )  
						
						 
						
						
						
						
					 
					
						2025-07-02 17:42:27 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Liu Jiajun 
							
						 
					 
					
						
						
						
						
							
						
						
							4f0da0aec9 
							
						 
					 
					
						
						
							
							[data] fix gemma2 eos token ( #8480 )  
						
						 
						
						... 
						
						
						
						Co-authored-by: Yaowei Zheng <hiyouga@buaa.edu.cn> 
						
						
					 
					
						2025-06-27 18:19:15 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Yaowei Zheng 
							
						 
					 
					
						
						
						
						
							
						
						
							3a3bae1cfe 
							
						 
					 
					
						
						
							
							[data] fix qwen2vl pos ids ( #8387 )  
						
						 
						
						
						
						
					 
					
						2025-06-17 00:48:54 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Kingsley 
							
						 
					 
					
						
						
						
						
							
						
						
							212a8006dc 
							
						 
					 
					
						
						
							
							[tests] add visual model save test ( #8248 )  
						
						 
						
						... 
						
						
						
						Co-authored-by: Yaowei Zheng <hiyouga@buaa.edu.cn> 
						
						
					 
					
						2025-06-05 20:38:01 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							ba032828e2 
							
						 
					 
					
						
						
							
							[deps] upgrade transformers ( #8159 )  
						
						 
						
						
						
						
					 
					
						2025-05-26 22:03:58 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							9ae17cd173 
							
						 
					 
					
						
						
							
							[deps] update to transformers 4.52 ( #8125 )  
						
						 
						
						
						
						
					 
					
						2025-05-21 05:16:18 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							56926d76f9 
							
						 
					 
					
						
						
							
							[data] llama3 multi tool support ( #8124 )  
						
						 
						
						
						
						
					 
					
						2025-05-21 02:01:12 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							9b5baa97f0 
							
						 
					 
					
						
						
							
							[data] qwen3 fixes ( #8109 )  
						
						 
						
						
						
						
					 
					
						2025-05-20 02:00:30 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Saiya 
							
						 
					 
					
						
						
						
						
							
						
						
							ab41f7956c 
							
						 
					 
					
						
						
							
							[infer] support lora adapter for SGLang backend ( #8067 )  
						
						 
						
						
						
						
					 
					
						2025-05-16 23:33:47 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							052ca871bd 
							
						 
					 
					
						
						
							
							[data] optimize qwen3 loss computation ( #7923 )  
						
						 
						
						
						
						
					 
					
						2025-04-30 16:18:00 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							98f23c6584 
							
						 
					 
					
						
						
							
							[model] add qwen3 ( #7885 )  
						
						 
						
						
						
						
					 
					
						2025-04-29 09:34:05 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Kingsley 
							
						 
					 
					
						
						
						
						
							
						
						
							db9559456c 
							
						 
					 
					
						
						
							
							[data] fix qwen2.5 omni template ( #7883 )  
						
						 
						
						
						
						
					 
					
						2025-04-29 00:58:23 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Kingsley 
							
						 
					 
					
						
						
						
						
							
						
						
							fa0eb91f1f 
							
						 
					 
					
						
						
							
							[data] fix internvl plugin ( #7817 )  
						
						 
						
						
						
						
					 
					
						2025-04-23 00:58:22 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Kingsley 
							
						 
					 
					
						
						
						
						
							
						
						
							7500e761d3 
							
						 
					 
					
						
						
							
							[misc] update internvl constants ( #7801 )  
						
						 
						
						
						
						
					 
					
						2025-04-22 15:53:08 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							b07628dea5 
							
						 
					 
					
						
						
							
							[example] add bash usage ( #7794 )  
						
						 
						
						
						
						
					 
					
						2025-04-22 00:25:51 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							416853dd25 
							
						 
					 
					
						
						
							
							[parser] support omegaconf ( #7793 )  
						
						 
						
						
						
						
					 
					
						2025-04-21 23:30:30 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							39169986ef 
							
						 
					 
					
						
						
							
							[trainer] fix pt loss ( #7748 )  
						
						 
						
						... 
						
						
						
						* fix pt loss
* robust
* fix
* test 
						
						
					 
					
						2025-04-17 03:15:35 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							86ebb219d6 
							
						 
					 
					
						
						
							
							[breaking] bump transformers to 4.45.0 & improve ci ( #7746 )  
						
						 
						
						... 
						
						
						
						* update ci
* fix
* fix
* fix
* fix
* fix 
						
						
					 
					
						2025-04-17 02:36:48 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Kingsley 
							
						 
					 
					
						
						
						
						
							
						
						
							2e518f255f 
							
						 
					 
					
						
						
							
							[model] support intern-VL 2.5-3 series ( #7258 )  
						
						 
						
						... 
						
						
						
						* add internvl and rebase
* fix for internvl2&3
* remove lines
* fix video_inputs & lint
* nit
* add constants
* remove lines
* fix
* fix error
* pass ci
* pass ci
* skip internvl & nit 
						
						
					 
					
						2025-04-17 00:31:30 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							c3c0efbaa0 
							
						 
					 
					
						
						
							
							[misc] fix packing and eval plot ( #7623 )  
						
						 
						
						
						
						
					 
					
						2025-04-07 18:20:57 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							831e7f1cfd 
							
						 
					 
					
						
						
							
							[model] add llama4 ( #7611 )  
						
						 
						
						
						
						
					 
					
						2025-04-06 13:42:31 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Kingsley 
							
						 
					 
					
						
						
						
						
							
						
						
							8da1d2fa71 
							
						 
					 
					
						
						
							
							[data] fix pixtral plugin ( #7505 )  
						
						 
						
						... 
						
						
						
						* preserve `image_sizes`
* add comments 
						
						
					 
					
						2025-03-27 17:06:40 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							0583d06676 
							
						 
					 
					
						
						
							
							[model] add qwen2vl 32b & upgrade peft ( #7469 )  
						
						 
						
						... 
						
						
						
						* add qwen2vl 32b
* fix ci
* upgrade peft to 0.15
* fix ci
* fix ci 
						
						
					 
					
						2025-03-25 12:15:58 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							3aa4f32e9c 
							
						 
					 
					
						
						
							
							[misc] fix ci ( #7441 )  
						
						 
						
						... 
						
						
						
						* fix ci
* improve ci 
						
						
					 
					
						2025-03-23 21:09:35 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Qiaolin Yu 
							
						 
					 
					
						
						
						
						
							
						
						
							a44a53ebec 
							
						 
					 
					
						
						
							
							[inference] support sglang backend ( #7278 )  
						
						 
						
						... 
						
						
						
						* Mimic SGLang offline Engine
* Add more tests and args
* Pass all current tests
* Clean Code
* fix sample_params
* clean code
* Fix Stream Chat
* change sglang from engine mode to server mode
* fix
* Fix Review Issues
* Use SGLang Built-In Utilities
* Fix test SGLang
* Some Doc Issue
* fix sglang engine
* add readme
---------
Co-authored-by: Jin Pan <jpan236@wisc.edu>
Co-authored-by: hiyouga <hiyouga@buaa.edu.cn> 
						
						
					 
					
						2025-03-15 04:37:58 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							93e6184cbe 
							
						 
					 
					
						
						
							
							[data] gemma3 plugin pan and scan ( #7294 )  
						
						 
						
						... 
						
						
						
						* gemma3 pan and scan
* add test case
* fix test 
						
						
					 
					
						2025-03-13 23:29:23 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							650a9a9057 
							
						 
					 
					
						
						
							
							[misc] update format ( #7277 )  
						
						 
						
						
						
						
					 
					
						2025-03-13 02:53:08 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							264538cb26 
							
						 
					 
					
						
						
							
							[misc] upgrade format to py39 ( #7256 )  
						
						 
						
						
						
						
					 
					
						2025-03-12 00:08:41 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							71a1c1321a 
							
						 
					 
					
						
						
							
							[config] update args ( #7231 )  
						
						 
						
						... 
						
						
						
						Former-commit-id: f71a901840811bf560df671ec63a146ff99140c6 
						
						
					 
					
						2025-03-10 23:04:43 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							16419b2834 
							
						 
					 
					
						
						
							
							[data] fix loader ( #7207 )  
						
						 
						
						... 
						
						
						
						* fix dataloader
* add test case
* fix type
* fix ci
* fix ci
* fix ci
* disable overwrite cache in ci
Former-commit-id: e84af0e140b1aafd1a6d6fe185a8e41c8fc5f831 
						
						
					 
					
						2025-03-07 17:20:46 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							065f7fb5da 
							
						 
					 
					
						
						
							
							[data] fix mllama ( #7053 )  
						
						 
						
						... 
						
						
						
						* fix mllama
* fix test
Former-commit-id: f5af20a63f3d59a6a68d323a7c6f68e551edb3a3 
						
						
					 
					
						2025-02-24 22:05:38 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							46203856fc 
							
						 
					 
					
						
						
							
							[breaking change] refactor data pipeline ( #6901 )  
						
						 
						
						... 
						
						
						
						* refactor data
* rename file
Former-commit-id: 7a1a4ce6451cb782573d0bd9dd27a5e443e3a18b 
						
						
					 
					
						2025-02-13 00:39:20 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							2581cc844b 
							
						 
					 
					
						
						
							
							[data] feat: auto template ( #6905 )  
						
						 
						
						... 
						
						
						
						* support auto template
* add unittest
Former-commit-id: 0c6c9150db6414a5a05527ea486dce6633dff4b3 
						
						
					 
					
						2025-02-12 00:22:53 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							86063e27ea 
							
						 
					 
					
						
						
							
							[data] fix ollama template ( #6902 )  
						
						 
						
						... 
						
						
						
						* fix ollama template
* add meta info
* use half precision
Former-commit-id: 1304bbea69d8c8ca57140017515dee7ae2ee6536 
						
						
					 
					
						2025-02-11 22:43:09 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							88eafd865b 
							
						 
					 
					
						
						
							
							[misc] support export ollama modelfile ( #6899 )  
						
						 
						
						... 
						
						
						
						* support export ollama modelfile
* update config
* add system and num ctx
Former-commit-id: 8c2af7466f4015f300b51841db11bcd2505ebf20 
						
						
					 
					
						2025-02-11 19:52:25 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							3f7bd98bfa 
							
						 
					 
					
						
						
							
							[data] refactor template ( #6896 )  
						
						 
						
						... 
						
						
						
						Former-commit-id: f78d5a3eca947ed965ca2f6c87d60441b1a59867 
						
						
					 
					
						2025-02-11 17:59:25 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							72d5b06b08 
							
						 
					 
					
						
						
							
							[test] align test cases ( #6865 )  
						
						 
						
						... 
						
						
						
						* align test cases
* fix function formatter
Former-commit-id: a68f5e22d0391c80a9a826dc83967255be572032 
						
						
					 
					
						2025-02-09 01:03:49 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Zhangchi Feng 
							
						 
					 
					
						
						
						
						
							
						
						
							8f401e37f8 
							
						 
					 
					
						
						
							
							[model] support audio ( #6701 )  
						
						 
						
						... 
						
						
						
						* support qwen2_audio
* improve code
* lint
* fix
* fix
* fix
---------
Co-authored-by: hiyouga <hiyouga@buaa.edu.cn>
Former-commit-id: 5eacb5629e4d7733cd992a63747a1335f2c6a929 
						
						
					 
					
						2025-02-05 04:59:09 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							c2022431aa 
							
						 
					 
					
						
						
							
							[misc] update license year & fix llama pro ( #6814 )  
						
						 
						
						... 
						
						
						
						* fix llamapro script
* change year
Former-commit-id: d9ae594178796994d400a5f207d6499712816f89 
						
						
					 
					
						2025-02-05 01:53:33 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Yueqi Song 
							
						 
					 
					
						
						
						
						
							
						
						
							0817c24c04 
							
						 
					 
					
						
						
							
							[data] fix qwen tool template ( #6796 )  
						
						 
						
						... 
						
						
						
						* Update tool_utils.py
* fix unittest
---------
Co-authored-by: hoshi-hiyouga <hiyouga@buaa.edu.cn>
Former-commit-id: 02bb78a792112f5151b3a96ddde2528823855288 
						
						
					 
					
						2025-02-05 00:02:00 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								Zhangchi Feng 
							
						 
					 
					
						
						
						
						
							
						
						
							cfb926fb84 
							
						 
					 
					
						
						
							
							[data] fix minicpmv plugin ( #6801 )  
						
						 
						
						... 
						
						
						
						* fix template name
* tiny fix
* support minicpm-o-2.6
* support inference of minicpmv
* update readme
* support dpo of minicpmv
* update init audio
* update init audio
* [model]fix image process in minicpmo
Former-commit-id: 8f704c8b6228ef50f828014f85dce67fda868660 
						
						
					 
					
						2025-02-04 21:20:15 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							222423bcef 
							
						 
					 
					
						
						
							
							[breaking] support transformers 4.48 ( #6628 )  
						
						 
						
						... 
						
						
						
						Former-commit-id: f154ab175c513a4d7bb866bf2cffc34b77b50508 
						
						
					 
					
						2025-01-31 01:36:33 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hoshi-hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							2a05941b14 
							
						 
					 
					
						
						
							
							[inference] fix stop token for object detection ( #6624 )  
						
						 
						
						... 
						
						
						
						* fix stop token
* update minicpm data pipeline
* fix npu qlora examples
Former-commit-id: 844919fadaa8a61dfae47020971ea80730b2346f 
						
						
					 
					
						2025-01-13 21:34:20 +08:00  
					
					
						 
						
							
							
							 
						
					 
				 
			
				
					
						
							
							
								 
								hiyouga 
							
						 
					 
					
						
						
						
						
							
						
						
							dc65ecdf09 
							
						 
					 
					
						
						
							
							refactor mllm param logic  
						
						 
						
						... 
						
						
						
						Former-commit-id: b895c190945cf5d991cb4e4dea2ae73cc9c8d246 
						
						
					 
					
						2025-01-10 15:45:48 +00:00