From eb5998479aead1781ef20d5f0e1694f0ea957e71 Mon Sep 17 00:00:00 2001 From: SHYuanBest Date: Wed, 25 Dec 2024 22:31:40 +0800 Subject: [PATCH] update --- TeaCache4ConsisID/teacache_sample_video.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/TeaCache4ConsisID/teacache_sample_video.py b/TeaCache4ConsisID/teacache_sample_video.py index 78c4d50..25fd5de 100644 --- a/TeaCache4ConsisID/teacache_sample_video.py +++ b/TeaCache4ConsisID/teacache_sample_video.py @@ -198,8 +198,9 @@ def main(args): seed = args.seed num_infer_steps = args.num_infer_steps output_path = args.output_path - rel_l1_thresh = args.rel_l1_thresh # higher speedup will cause to worse quality -- 0.1 for 1.6x speedup -- 0.15 for 2.1x speedup -- 0.2 for 2.5x speedup ckpts_path = args.ckpts_path + # higher speedup will cause to worse quality -- 0.1 for 1.6x speedup -- 0.15 for 2.1x speedup -- 0.2 for 2.5x speedup + rel_l1_thresh = args.rel_l1_thresh # ConsisID works well with long and well-described prompts. Make sure the face in the image is clearly visible (e.g., preferably half-body or full-body). prompt = args.prompt image = args.image @@ -255,7 +256,7 @@ def main(args): generator=torch.Generator("cuda").manual_seed(seed), ) file_count = len([f for f in os.listdir(output_path) if os.path.isfile(os.path.join(output_path, f))]) - video_path = f"{output_path}/{seed}_{file_count:04d}.mp4" + video_path = f"{output_path}/{seed}_{rel_l1_thresh}_{file_count:04d}.mp4" export_to_video(video.frames[0], video_path, fps=8) @@ -265,9 +266,9 @@ if __name__ == "__main__": parser.add_argument('--seed', type=int, default=42, help='Random seed') parser.add_argument('--num_infer_steps', type=int, default=50, help='Number of inference steps') parser.add_argument("--output_path", type=str, default="./teacache_results", help="The path where the generated video will be saved") + parser.add_argument('--ckpts_path', type=str, default="BestWishYsh/ConsisID-preview", help='Path to checkpoint') # higher speedup will cause to worse quality -- 0.1 for 1.6x speedup -- 0.15 for 2.1x speedup -- 0.2 for 2.5x speedup parser.add_argument('--rel_l1_thresh', type=float, default=0.1, help='Higher speedup will cause to worse quality -- 0.1 for 1.6x speedup -- 0.15 for 2.1x speedup -- 0.2 for 2.5x speedup') - parser.add_argument('--ckpts_path', type=str, default="BestWishYsh/ConsisID-preview", help='Path to checkpoint') # ConsisID works well with long and well-described prompts. Make sure the face in the image is clearly visible (e.g., preferably half-body or full-body). parser.add_argument('--prompt', type=str, default="The video captures a boy walking along a city street, filmed in black and white on a classic 35mm camera. His expression is thoughtful, his brow slightly furrowed as if he's lost in contemplation. The film grain adds a textured, timeless quality to the image, evoking a sense of nostalgia. Around him, the cityscape is filled with vintage buildings, cobblestone sidewalks, and softly blurred figures passing by, their outlines faint and indistinct. Streetlights cast a gentle glow, while shadows play across the boy\'s path, adding depth to the scene. The lighting highlights the boy\'s subtle smile, hinting at a fleeting moment of curiosity. The overall cinematic atmosphere, complete with classic film still aesthetics and dramatic contrasts, gives the scene an evocative and introspective feel.", help='Description of the video for the model to generate') parser.add_argument('--image', type=str, default="https://github.com/PKU-YuanGroup/ConsisID/blob/main/asserts/example_images/2.png?raw=true", help='URL or path to input image')