[data] Fix minicpmv/o dpo training (#6657)

* fix template name

* tiny fix

* support minicpm-o-2.6

* support inference of minicpmv

* update readme

* support dpo of minicpmv

Former-commit-id: 8d9f47b98047f370637d1c96c2f3440dcc738ef3
This commit is contained in:
Zhangchi Feng 2025-01-15 17:30:37 +08:00 committed by GitHub
parent 0fc2e19279
commit 3607caa2ad

View File

@@ -155,7 +155,7 @@ class MultiModalDataCollatorForSeq2Seq(DataCollatorForSeq2Seq):
if "image_bound" in features: # for minicpmv inputs
bsz, seq_length = features["input_ids"].shape
features["position_ids"] = torch.arange(seq_length).long().repeat(bsz, 1)
- return {"data": features, "labels": features["labels"]}
+ return {"data": features, "input_ids": features["input_ids"], "labels": features["labels"]}
return features