Merge pull request #607 from THUDM/CogVideoX_dev

Add resolution warning
This commit is contained in:
OleehyO 2024-12-17 09:58:10 +08:00 committed by GitHub
commit 7add8f8437
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@ -17,6 +17,7 @@ $ python cli_demo.py --prompt "A girl riding a bike." --model_path THUDM/CogVide
Additional options are available to specify the model path, guidance scale, number of inference steps, video generation type, and output paths.
"""
import warnings
import argparse
from typing import Literal
@ -77,6 +78,11 @@ def generate_video(
image = None
video = None
if (width != 1360 or height != 768) and "cogvideox1.5-5b-i2v" in model_path.lower():
warnings.warn(f"The width({width}) and height({height}) are not recommended for CogVideoX1.5-5B-I2V. The best resolution for CogVideoX1.5-5B-I2V is 1360x768.")
elif (width != 720 or height != 480) and "cogvideox-5b-i2v" in model_path.lower():
warnings.warn(f"The width({width}) and height({height}) are not recommended for CogVideo-5B-I2V. The best resolution for CogVideo-5B-I2V is 720x480.")
if generate_type == "i2v":
pipe = CogVideoXImageToVideoPipeline.from_pretrained(model_path, torch_dtype=dtype)
image = load_image(image=image_or_video_path)