diff --git a/README.md b/README.md index 67c6a21..73705cd 100644 --- a/README.md +++ b/README.md @@ -189,7 +189,7 @@ models we currently offer, along with their foundational information. Video Resolution 1360 * 768 - 256 <= W <=1360
256 <= H <=768
W,H % 16 == 0 + Min(W, H) = 768
768 ≤ Max(W, H) ≤ 1360
Max(W, H) % 16 = 0 720 * 480 diff --git a/README_ja.md b/README_ja.md index 375ba03..26b02c1 100644 --- a/README_ja.md +++ b/README_ja.md @@ -181,7 +181,7 @@ CogVideoXは、[清影](https://chatglm.cn/video?fr=osm_cogvideox) と同源の ビデオ解像度 1360 * 768 - 256 <= W <=1360
256 <= H <=768
W,H % 16 == 0 + Min(W, H) = 768
768 ≤ Max(W, H) ≤ 1360
Max(W, H) % 16 = 0 720 * 480 diff --git a/README_zh.md b/README_zh.md index d1ddafc..f456376 100644 --- a/README_zh.md +++ b/README_zh.md @@ -171,7 +171,7 @@ CogVideoX是 [清影](https://chatglm.cn/video?fr=osm_cogvideox) 同源的开源 视频分辨率 1360 * 768 - 256 <= W <=1360
256 <= H <=768
W,H % 16 == 0 + Min(W, H) = 768
768 ≤ Max(W, H) ≤ 1360
Max(W, H) % 16 = 0 720 * 480 diff --git a/tools/parallel_inference/parallel_inference_xdit.py b/tools/parallel_inference/parallel_inference_xdit.py index 03bc268..d0b8029 100644 --- a/tools/parallel_inference/parallel_inference_xdit.py +++ b/tools/parallel_inference/parallel_inference_xdit.py @@ -78,8 +78,9 @@ def main(): num_frames=input_config.num_frames, prompt=input_config.prompt, num_inference_steps=input_config.num_inference_steps, - generator=torch.Generator(device="cuda").manual_seed(input_config.seed), + generator=torch.Generator().manual_seed(input_config.seed), guidance_scale=6, + use_dynamic_cfg=True, ).frames[0] end_time = time.time()