fix: disable checkpoint saving to avoid tensor contiguity error

This commit is contained in:
2026-02-03 02:38:15 +00:00
parent 2680ad5502
commit 0f4858d22f

View File

@@ -103,7 +103,7 @@ def train_ddi_model(job_input: Dict[str, Any]) -> Dict[str, Any]:
warmup_steps=50,
weight_decay=0.01,
logging_steps=10,
-save_strategy='epoch',
+save_strategy='no', # Don't save checkpoints (avoids tensor contiguity issues)
fp16=torch.cuda.is_available(),
report_to='none',
)