From 9f42a31908676d266f0dc50057da245f45dbad5f Mon Sep 17 00:00:00 2001 From: kijai <40791699+kijai@users.noreply.github.com> Date: Wed, 18 Sep 2024 21:13:24 +0300 Subject: [PATCH] Create cogvideox_I2V_example_01.json --- examples/cogvideox_I2V_example_01.json | 633 +++++++++++++++++++++++++ 1 file changed, 633 insertions(+) create mode 100644 examples/cogvideox_I2V_example_01.json diff --git a/examples/cogvideox_I2V_example_01.json b/examples/cogvideox_I2V_example_01.json new file mode 100644 index 0000000..b9c6e28 --- /dev/null +++ b/examples/cogvideox_I2V_example_01.json @@ -0,0 +1,633 @@ +{ + "last_node_id": 58, + "last_link_id": 129, + "nodes": [ + { + "id": 20, + "type": "CLIPLoader", + "pos": { + "0": -26, + "1": 400 + }, + "size": { + "0": 451.30548095703125, + "1": 82 + }, + "flags": {}, + "order": 0, + "mode": 0, + "inputs": [], + "outputs": [ + { + "name": "CLIP", + "type": "CLIP", + "links": [ + 54, + 56 + ], + "slot_index": 0, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "CLIPLoader" + }, + "widgets_values": [ + "t5\\google_t5-v1_1-xxl_encoderonly-fp8_e4m3fn.safetensors", + "sd3" + ] + }, + { + "id": 31, + "type": "CogVideoTextEncode", + "pos": { + "0": 497, + "1": 520 + }, + "size": { + "0": 463.01251220703125, + "1": 98.10446166992188 + }, + "flags": {}, + "order": 4, + "mode": 0, + "inputs": [ + { + "name": "clip", + "type": "CLIP", + "link": 56 + } + ], + "outputs": [ + { + "name": "conditioning", + "type": "CONDITIONING", + "links": [ + 123 + ], + "slot_index": 0, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "CogVideoTextEncode" + }, + "widgets_values": [ + "The video is not of a high quality, it has a low resolution. Watermark present in each frame. Strange motion trajectory. " + ] + }, + { + "id": 30, + "type": "CogVideoTextEncode", + "pos": { + "0": 493, + "1": 303 + }, + "size": { + "0": 471.90142822265625, + "1": 168.08047485351562 + }, + "flags": {}, + "order": 3, + "mode": 0, + "inputs": [ + { + "name": "clip", + "type": "CLIP", + "link": 54 + } + ], + "outputs": [ + { + "name": "conditioning", + "type": "CONDITIONING", + "links": [ + 122 + ], + "slot_index": 0, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "CogVideoTextEncode" + }, + "widgets_values": [ + "a majestic stag is grazing in an enhanced forest, basking in the setting sun filtered by the trees" + ] + }, + { + "id": 1, + "type": "DownloadAndLoadCogVideoModel", + "pos": { + "0": 642, + "1": 90 + }, + "size": { + "0": 337.8885192871094, + "1": 154 + }, + "flags": {}, + "order": 1, + "mode": 0, + "inputs": [], + "outputs": [ + { + "name": "cogvideo_pipe", + "type": "COGVIDEOPIPE", + "links": [ + 121, + 124 + ], + "slot_index": 0, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "DownloadAndLoadCogVideoModel" + }, + "widgets_values": [ + "THUDM/CogVideoX-5b-I2V", + "bf16", + "disabled", + "disabled", + false + ] + }, + { + "id": 57, + "type": "CogVideoSampler", + "pos": { + "0": 1138, + "1": 150 + }, + "size": { + "0": 405.5999755859375, + "1": 378 + }, + "flags": {}, + "order": 7, + "mode": 0, + "inputs": [ + { + "name": "pipeline", + "type": "COGVIDEOPIPE", + "link": 121 + }, + { + "name": "positive", + "type": "CONDITIONING", + "link": 122 + }, + { + "name": "negative", + "type": "CONDITIONING", + "link": 123 + }, + { + "name": "samples", + "type": "LATENT", + "link": null + }, + { + "name": "image_cond_latents", + "type": "LATENT", + "link": 129 + } + ], + "outputs": [ + { + "name": "cogvideo_pipe", + "type": "COGVIDEOPIPE", + "links": [ + 128 + ], + "slot_index": 0, + "shape": 3 + }, + { + "name": "samples", + "type": "LATENT", + "links": [ + 127 + ], + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "CogVideoSampler" + }, + "widgets_values": [ + 480, + 720, + 49, + 50, + 6, + 65334758276105, + "fixed", + "DPM", + 16, + 8, + 1 + ] + }, + { + "id": 37, + "type": "ImageResizeKJ", + "pos": { + "0": 809, + "1": 684 + }, + "size": { + "0": 315, + "1": 266 + }, + "flags": {}, + "order": 5, + "mode": 0, + "inputs": [ + { + "name": "image", + "type": "IMAGE", + "link": 71 + }, + { + "name": "get_image_size", + "type": "IMAGE", + "link": null + }, + { + "name": "width_input", + "type": "INT", + "link": null, + "widget": { + "name": "width_input" + } + }, + { + "name": "height_input", + "type": "INT", + "link": null, + "widget": { + "name": "height_input" + } + } + ], + "outputs": [ + { + "name": "IMAGE", + "type": "IMAGE", + "links": [ + 125 + ], + "slot_index": 0, + "shape": 3 + }, + { + "name": "width", + "type": "INT", + "links": null, + "shape": 3 + }, + { + "name": "height", + "type": "INT", + "links": null, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "ImageResizeKJ" + }, + "widgets_values": [ + 720, + 480, + "lanczos", + false, + 16, + 0, + 0, + "disabled" + ] + }, + { + "id": 58, + "type": "CogVideoImageEncode", + "pos": { + "0": 1156, + "1": 650 + }, + "size": { + "0": 315, + "1": 122 + }, + "flags": {}, + "order": 6, + "mode": 0, + "inputs": [ + { + "name": "pipeline", + "type": "COGVIDEOPIPE", + "link": 124 + }, + { + "name": "image", + "type": "IMAGE", + "link": 125 + }, + { + "name": "mask", + "type": "MASK", + "link": null + } + ], + "outputs": [ + { + "name": "samples", + "type": "LATENT", + "links": [ + 129 + ], + "slot_index": 0, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "CogVideoImageEncode" + }, + "widgets_values": [ + 16, + true + ] + }, + { + "id": 56, + "type": "CogVideoDecode", + "pos": { + "0": 1581, + "1": 148 + }, + "size": { + "0": 300.396484375, + "1": 198 + }, + "flags": {}, + "order": 8, + "mode": 0, + "inputs": [ + { + "name": "pipeline", + "type": "COGVIDEOPIPE", + "link": 128 + }, + { + "name": "samples", + "type": "LATENT", + "link": 127 + } + ], + "outputs": [ + { + "name": "images", + "type": "IMAGE", + "links": [ + 118 + ], + "slot_index": 0, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "CogVideoDecode" + }, + "widgets_values": [ + false, + 96, + 96, + 0.083, + 0.083, + true + ] + }, + { + "id": 44, + "type": "VHS_VideoCombine", + "pos": { + "0": 1927, + "1": 146 + }, + "size": [ + 605.3909912109375, + 714.2606608072917 + ], + "flags": {}, + "order": 9, + "mode": 0, + "inputs": [ + { + "name": "images", + "type": "IMAGE", + "link": 118 + }, + { + "name": "audio", + "type": "AUDIO", + "link": null + }, + { + "name": "meta_batch", + "type": "VHS_BatchManager", + "link": null + }, + { + "name": "vae", + "type": "VAE", + "link": null + } + ], + "outputs": [ + { + "name": "Filenames", + "type": "VHS_FILENAMES", + "links": null, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "VHS_VideoCombine" + }, + "widgets_values": { + "frame_rate": 8, + "loop_count": 0, + "filename_prefix": "CogVideoX-I2V", + "format": "video/h264-mp4", + "pix_fmt": "yuv420p", + "crf": 19, + "save_metadata": true, + "pingpong": false, + "save_output": false, + "videopreview": { + "hidden": false, + "paused": false, + "params": { + "filename": "CogVideoX-I2V_00001.mp4", + "subfolder": "", + "type": "temp", + "format": "video/h264-mp4", + "frame_rate": 8 + }, + "muted": false + } + } + }, + { + "id": 36, + "type": "LoadImage", + "pos": { + "0": 365, + "1": 685 + }, + "size": [ + 402.0635467506413, + 396.62260382077534 + ], + "flags": {}, + "order": 2, + "mode": 0, + "inputs": [], + "outputs": [ + { + "name": "IMAGE", + "type": "IMAGE", + "links": [ + 71 + ], + "slot_index": 0, + "shape": 3 + }, + { + "name": "MASK", + "type": "MASK", + "links": null, + "shape": 3 + } + ], + "properties": { + "Node name for S&R": "LoadImage" + }, + "widgets_values": [ + "sd3stag.png", + "image" + ] + } + ], + "links": [ + [ + 54, + 20, + 0, + 30, + 0, + "CLIP" + ], + [ + 56, + 20, + 0, + 31, + 0, + "CLIP" + ], + [ + 71, + 36, + 0, + 37, + 0, + "IMAGE" + ], + [ + 118, + 56, + 0, + 44, + 0, + "IMAGE" + ], + [ + 121, + 1, + 0, + 57, + 0, + "COGVIDEOPIPE" + ], + [ + 122, + 30, + 0, + 57, + 1, + "CONDITIONING" + ], + [ + 123, + 31, + 0, + 57, + 2, + "CONDITIONING" + ], + [ + 124, + 1, + 0, + 58, + 0, + "COGVIDEOPIPE" + ], + [ + 125, + 37, + 0, + 58, + 1, + "IMAGE" + ], + [ + 127, + 57, + 1, + 56, + 1, + "LATENT" + ], + [ + 128, + 57, + 0, + 56, + 0, + "COGVIDEOPIPE" + ], + [ + 129, + 58, + 0, + 57, + 4, + "LATENT" + ] + ], + "groups": [], + "config": {}, + "extra": { + "ds": { + "scale": 0.7513148009015778, + "offset": [ + 153.9884532493587, + 111.86149660036742 + ] + } + }, + "version": 0.4 +} \ No newline at end of file