Update for multi-image SFT

This commit is contained in:
qianyu chen
2024-08-13 13:57:48 +08:00
committed by GitHub
parent 61e942ec7c
commit 7842ec1228
5 changed files with 143 additions and 65 deletions

View File

@@ -205,6 +205,7 @@ def train():
tokenizer = AutoTokenizer.from_pretrained(
model_args.model_name_or_path, trust_remote_code=True
)
tokenizer.model_max_length = training_args.model_max_length
if not training_args.tune_vision:
model.vpm.requires_grad_(False)
@@ -276,6 +277,7 @@ def train():
max_length=training_args.model_max_length,
)
training_args.gradient_checkpointing_kwargs={"use_reentrant":False}
trainer = CPMTrainer(
model=model,
tokenizer=tokenizer,