video datasets

Former-commit-id: 8cafc7b055
This commit is contained in:
hiyouga
2024-09-05 02:04:17 +08:00
parent 60d770e4b1
commit 9df7a26e6b
27 changed files with 420 additions and 148 deletions

View File

@@ -100,6 +100,11 @@ def load_tokenizer(model_args: "ModelArguments") -> "TokenizerModule":
setattr(processor, "tokenizer", tokenizer)
setattr(processor, "image_seqlen", get_image_seqlen(config))
setattr(processor, "image_resolution", model_args.image_resolution)
setattr(processor, "video_fps", model_args.video_fps)
if getattr(config, "model_type", None) == "qwen2_vl":
setattr(processor, "video_factor", 2)
else:
setattr(processor, "video_factor", 1)
except Exception:
processor = None