ComfyUI-CogVideoXWrapper/examples/cogvideox_fun_pose_example_01.json

1045 lines
18 KiB
JSON

{
"last_node_id": 82,
"last_link_id": 182,
"nodes": [
{
"id": 31,
"type": "CogVideoTextEncode",
"pos": {
"0": 497,
"1": 520
},
"size": {
"0": 501.0985412597656,
"1": 138.65379333496094
},
"flags": {},
"order": 4,
"mode": 0,
"inputs": [
{
"name": "clip",
"type": "CLIP",
"link": 56
}
],
"outputs": [
{
"name": "conditioning",
"type": "CONDITIONING",
"links": [
179
],
"slot_index": 0,
"shape": 3
}
],
"properties": {
"Node name for S&R": "CogVideoTextEncode"
},
"widgets_values": [
"The video is not of a high quality, it has a low resolution. Watermark present in each frame. Strange motion trajectory. Character is speaking",
1,
true
]
},
{
"id": 60,
"type": "WidgetToString",
"pos": {
"0": 1084,
"1": 76
},
"size": {
"0": 315,
"1": 130
},
"flags": {},
"order": 6,
"mode": 0,
"inputs": [
{
"name": "any_input",
"type": "*",
"link": 128
}
],
"outputs": [
{
"name": "STRING",
"type": "STRING",
"links": [
129
],
"slot_index": 0,
"shape": 3
}
],
"properties": {
"Node name for S&R": "WidgetToString"
},
"widgets_values": [
0,
"prompt",
false,
""
]
},
{
"id": 59,
"type": "AddLabel",
"pos": {
"0": 1466,
"1": -5
},
"size": {
"0": 315,
"1": 274
},
"flags": {},
"order": 14,
"mode": 0,
"inputs": [
{
"name": "image",
"type": "IMAGE",
"link": 126
},
{
"name": "caption",
"type": "STRING",
"link": null,
"widget": {
"name": "caption"
}
},
{
"name": "text",
"type": "STRING",
"link": 129,
"widget": {
"name": "text"
}
}
],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"links": [
150
],
"slot_index": 0,
"shape": 3
}
],
"properties": {
"Node name for S&R": "AddLabel"
},
"widgets_values": [
10,
2,
48,
12,
"white",
"black",
"FreeMono.ttf",
"Text",
"up",
""
]
},
{
"id": 11,
"type": "CogVideoDecode",
"pos": {
"0": 1451,
"1": 363
},
"size": {
"0": 282.7455749511719,
"1": 198
},
"flags": {},
"order": 12,
"mode": 0,
"inputs": [
{
"name": "pipeline",
"type": "COGVIDEOPIPE",
"link": 180
},
{
"name": "samples",
"type": "LATENT",
"link": 181
}
],
"outputs": [
{
"name": "images",
"type": "IMAGE",
"links": [
124
],
"slot_index": 0,
"shape": 3
}
],
"properties": {
"Node name for S&R": "CogVideoDecode"
},
"widgets_values": [
true,
240,
360,
0.2,
0.2,
true
]
},
{
"id": 30,
"type": "CogVideoTextEncode",
"pos": {
"0": 513,
"1": 286
},
"size": {
"0": 471.90142822265625,
"1": 168.08047485351562
},
"flags": {},
"order": 3,
"mode": 0,
"inputs": [
{
"name": "clip",
"type": "CLIP",
"link": 54
}
],
"outputs": [
{
"name": "conditioning",
"type": "CONDITIONING",
"links": [
128,
178
],
"slot_index": 0,
"shape": 3
}
],
"properties": {
"Node name for S&R": "CogVideoTextEncode"
},
"widgets_values": [
"a brown bear is dancing in a forest, in front of a waterfall",
1,
true
]
},
{
"id": 65,
"type": "VHS_LoadVideo",
"pos": {
"0": -191,
"1": 564
},
"size": [
390.1356201171875,
910.0188802083334
],
"flags": {},
"order": 5,
"mode": 0,
"inputs": [
{
"name": "meta_batch",
"type": "VHS_BatchManager",
"link": null
},
{
"name": "vae",
"type": "VAE",
"link": null
},
{
"name": "frame_load_cap",
"type": "INT",
"link": 152,
"widget": {
"name": "frame_load_cap"
}
}
],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"links": [
173
],
"slot_index": 0,
"shape": 3
},
{
"name": "frame_count",
"type": "INT",
"links": null,
"shape": 3
},
{
"name": "audio",
"type": "AUDIO",
"links": null,
"shape": 3
},
{
"name": "video_info",
"type": "VHS_VIDEOINFO",
"links": [],
"slot_index": 3,
"shape": 3
}
],
"properties": {
"Node name for S&R": "VHS_LoadVideo"
},
"widgets_values": {
"video": "01.mp4",
"force_rate": 0,
"force_size": "Disabled",
"custom_width": 512,
"custom_height": 512,
"frame_load_cap": 17,
"skip_first_frames": 0,
"select_every_nth": 1,
"choose video to upload": "image",
"videopreview": {
"hidden": false,
"paused": false,
"params": {
"frame_load_cap": 17,
"skip_first_frames": 0,
"force_rate": 0,
"filename": "01.mp4",
"type": "input",
"format": "video/mp4",
"select_every_nth": 1
},
"muted": false
}
}
},
{
"id": 20,
"type": "CLIPLoader",
"pos": {
"0": 2,
"1": 412
},
"size": {
"0": 451.30548095703125,
"1": 82
},
"flags": {},
"order": 0,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "CLIP",
"type": "CLIP",
"links": [
54,
56
],
"slot_index": 0,
"shape": 3
}
],
"properties": {
"Node name for S&R": "CLIPLoader"
},
"widgets_values": [
"t5\\clip\\google_t5-v1_1-xxl_encoderonly-fp8_e4m3fn.safetensors",
"sd3"
]
},
{
"id": 80,
"type": "DWPreprocessor",
"pos": {
"0": 260,
"1": 742
},
"size": {
"0": 364.7358703613281,
"1": 198
},
"flags": {},
"order": 7,
"mode": 0,
"inputs": [
{
"name": "image",
"type": "IMAGE",
"link": 173
}
],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"links": [
174
],
"slot_index": 0,
"shape": 3
},
{
"name": "POSE_KEYPOINT",
"type": "POSE_KEYPOINT",
"links": null,
"shape": 3
}
],
"properties": {
"Node name for S&R": "DWPreprocessor"
},
"widgets_values": [
"enable",
"enable",
"enable",
512,
"yolox_l.torchscript.pt",
"dw-ll_ucoco_384_bs5.torchscript.pt"
]
},
{
"id": 44,
"type": "VHS_VideoCombine",
"pos": {
"0": 1842,
"1": -5
},
"size": [
1186.0863037109375,
310
],
"flags": {},
"order": 15,
"mode": 0,
"inputs": [
{
"name": "images",
"type": "IMAGE",
"link": 150
},
{
"name": "audio",
"type": "AUDIO",
"link": null
},
{
"name": "meta_batch",
"type": "VHS_BatchManager",
"link": null
},
{
"name": "vae",
"type": "VAE",
"link": null
}
],
"outputs": [
{
"name": "Filenames",
"type": "VHS_FILENAMES",
"links": null,
"shape": 3
}
],
"properties": {
"Node name for S&R": "VHS_VideoCombine"
},
"widgets_values": {
"frame_rate": 8,
"loop_count": 0,
"filename_prefix": "CogVideoX_Fun_Pose",
"format": "video/h264-mp4",
"pix_fmt": "yuv420p",
"crf": 19,
"save_metadata": true,
"pingpong": false,
"save_output": false,
"videopreview": {
"hidden": false,
"paused": false,
"params": {
"filename": "CogVideoX_Fun_Pose_00004.mp4",
"subfolder": "",
"type": "temp",
"format": "video/h264-mp4",
"frame_rate": 8
},
"muted": false
}
}
},
{
"id": 37,
"type": "ImageResizeKJ",
"pos": {
"0": 292,
"1": 1004
},
"size": {
"0": 315,
"1": 266
},
"flags": {},
"order": 8,
"mode": 0,
"inputs": [
{
"name": "image",
"type": "IMAGE",
"link": 174
},
{
"name": "get_image_size",
"type": "IMAGE",
"link": null
},
{
"name": "width_input",
"type": "INT",
"link": null,
"widget": {
"name": "width_input"
}
},
{
"name": "height_input",
"type": "INT",
"link": null,
"widget": {
"name": "height_input"
}
}
],
"outputs": [
{
"name": "IMAGE",
"type": "IMAGE",
"links": [
130
],
"slot_index": 0,
"shape": 3
},
{
"name": "width",
"type": "INT",
"links": null,
"shape": 3
},
{
"name": "height",
"type": "INT",
"links": null,
"shape": 3
}
],
"properties": {
"Node name for S&R": "ImageResizeKJ"
},
"widgets_values": [
512,
512,
"lanczos",
true,
16,
0,
0,
"disabled"
]
},
{
"id": 61,
"type": "GetImageSizeAndCount",
"pos": {
"0": 645,
"1": 1000
},
"size": {
"0": 277.20001220703125,
"1": 86
},
"flags": {},
"order": 9,
"mode": 0,
"inputs": [
{
"name": "image",
"type": "IMAGE",
"link": 130
}
],
"outputs": [
{
"name": "image",
"type": "IMAGE",
"links": [
135,
175
],
"slot_index": 0,
"shape": 3
},
{
"name": "288 width",
"type": "INT",
"links": null,
"shape": 3
},
{
"name": "512 height",
"type": "INT",
"links": null,
"shape": 3
},
{
"name": "49 count",
"type": "INT",
"links": null,
"shape": 3
}
],
"properties": {
"Node name for S&R": "GetImageSizeAndCount"
},
"widgets_values": []
},
{
"id": 71,
"type": "DownloadAndLoadCogVideoGGUFModel",
"pos": {
"0": 515,
"1": 35
},
"size": {
"0": 466.3737487792969,
"1": 174
},
"flags": {},
"order": 1,
"mode": 0,
"inputs": [
{
"name": "pab_config",
"type": "PAB_CONFIG",
"link": null
},
{
"name": "block_edit",
"type": "TRANSFORMERBLOCKS",
"link": null
}
],
"outputs": [
{
"name": "cogvideo_pipe",
"type": "COGVIDEOPIPE",
"links": [
176,
177
],
"slot_index": 0,
"shape": 3
}
],
"properties": {
"Node name for S&R": "DownloadAndLoadCogVideoGGUFModel"
},
"widgets_values": [
"CogVideoX_5b_fun_1_1_Pose_GGUF_Q4_0.safetensors",
"bf16",
false,
"main_device",
false
]
},
{
"id": 81,
"type": "CogVideoControlImageEncode",
"pos": {
"0": 859,
"1": 769
},
"size": {
"0": 367.79998779296875,
"1": 102
},
"flags": {},
"order": 10,
"mode": 0,
"inputs": [
{
"name": "pipeline",
"type": "COGVIDEOPIPE",
"link": 176
},
{
"name": "control_video",
"type": "IMAGE",
"link": 175
}
],
"outputs": [
{
"name": "control_latents",
"type": "COGCONTROL_LATENTS",
"links": [
182
],
"shape": 3,
"slot_index": 0
}
],
"properties": {
"Node name for S&R": "CogVideoControlImageEncode"
},
"widgets_values": [
512,
false
]
},
{
"id": 82,
"type": "CogVideoXFunControlSampler",
"pos": {
"0": 1085,
"1": 312
},
"size": [
311.22059416191496,
286
],
"flags": {},
"order": 11,
"mode": 0,
"inputs": [
{
"name": "pipeline",
"type": "COGVIDEOPIPE",
"link": 177
},
{
"name": "positive",
"type": "CONDITIONING",
"link": 178
},
{
"name": "negative",
"type": "CONDITIONING",
"link": 179
},
{
"name": "control_latents",
"type": "COGCONTROL_LATENTS",
"link": 182
}
],
"outputs": [
{
"name": "cogvideo_pipe",
"type": "COGVIDEOPIPE",
"links": [
180
],
"shape": 3
},
{
"name": "samples",
"type": "LATENT",
"links": [
181
],
"shape": 3
}
],
"properties": {
"Node name for S&R": "CogVideoXFunControlSampler"
},
"widgets_values": [
42,
"fixed",
25,
6,
"CogVideoXDPMScheduler",
0.7000000000000001,
0,
1
]
},
{
"id": 58,
"type": "ImageConcatMulti",
"pos": {
"0": 1472,
"1": 649
},
"size": {
"0": 210,
"1": 150
},
"flags": {},
"order": 13,
"mode": 0,
"inputs": [
{
"name": "image_1",
"type": "IMAGE",
"link": 135
},
{
"name": "image_2",
"type": "IMAGE",
"link": 124
}
],
"outputs": [
{
"name": "images",
"type": "IMAGE",
"links": [
126
],
"slot_index": 0,
"shape": 3
}
],
"properties": {},
"widgets_values": [
2,
"right",
true,
null
]
},
{
"id": 72,
"type": "INTConstant",
"pos": {
"0": -198,
"1": 260
},
"size": {
"0": 210,
"1": 58
},
"flags": {},
"order": 2,
"mode": 0,
"inputs": [],
"outputs": [
{
"name": "value",
"type": "INT",
"links": [
152
],
"slot_index": 0,
"shape": 3
}
],
"title": "Frames",
"properties": {
"Node name for S&R": "INTConstant"
},
"widgets_values": [
49
],
"color": "#1b4669",
"bgcolor": "#29699c"
}
],
"links": [
[
54,
20,
0,
30,
0,
"CLIP"
],
[
56,
20,
0,
31,
0,
"CLIP"
],
[
124,
11,
0,
58,
1,
"IMAGE"
],
[
126,
58,
0,
59,
0,
"IMAGE"
],
[
128,
30,
0,
60,
0,
"*"
],
[
129,
60,
0,
59,
2,
"STRING"
],
[
130,
37,
0,
61,
0,
"IMAGE"
],
[
135,
61,
0,
58,
0,
"IMAGE"
],
[
150,
59,
0,
44,
0,
"IMAGE"
],
[
152,
72,
0,
65,
2,
"INT"
],
[
173,
65,
0,
80,
0,
"IMAGE"
],
[
174,
80,
0,
37,
0,
"IMAGE"
],
[
175,
61,
0,
81,
1,
"IMAGE"
],
[
176,
71,
0,
81,
0,
"COGVIDEOPIPE"
],
[
177,
71,
0,
82,
0,
"COGVIDEOPIPE"
],
[
178,
30,
0,
82,
1,
"CONDITIONING"
],
[
179,
31,
0,
82,
2,
"CONDITIONING"
],
[
180,
82,
0,
11,
0,
"COGVIDEOPIPE"
],
[
181,
82,
1,
11,
1,
"LATENT"
],
[
182,
81,
0,
82,
3,
"COGCONTROL_LATENTS"
]
],
"groups": [],
"config": {},
"extra": {
"ds": {
"scale": 0.6934334949441758,
"offset": [
364.1021432696588,
27.28260472943026
]
}
},
"version": 0.4
}