Merge pull request #657 from ZGCTroy/main

Fix bug in I2V fine-tuning
This commit is contained in:
OleehyO 2025-01-12 13:55:12 +08:00 committed by GitHub
commit f66f1647e2
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 2 additions and 1 deletion

View File

@@ -148,6 +148,7 @@ class BaseI2VDataset(Dataset):
frames, image = self.preprocess(video, image)
frames = frames.to(self.device)
image = image.to(self.device)
+image = self.image_transform(image)
# Current shape of frames: [F, C, H, W]
frames = self.video_transform(frames)

View File

@@ -526,7 +526,7 @@ class Trainer:
video, self.state.train_frames, self.state.train_height, self.state.train_width
)
# Convert video tensor (F, C, H, W) to list of PIL images
-video = (video * 255).round().clamp(0, 255).to(torch.uint8)
+video = video.round().clamp(0, 255).to(torch.uint8)
video = [Image.fromarray(frame.permute(1, 2, 0).cpu().numpy()) for frame in video]
logger.debug(