denk committed on
Commit
4914467
1 Parent(s): 5e88780

added comfyui example

Browse files
README.md CHANGED
@@ -13,6 +13,15 @@ tags:
13
 
14
  <video controls autoplay src="https://cdn-uploads.huggingface.co/production/uploads/63fde49f6315a264aba6a7ed/8vOYgS-Wm51BgOKv4Jnpp.mp4"></video>
15
 
 
 
 
 
 
 
 
 
 
16
  ### How to
17
  Clone repo
18
  ```bash
 
13
 
14
  <video controls autoplay src="https://cdn-uploads.huggingface.co/production/uploads/63fde49f6315a264aba6a7ed/8vOYgS-Wm51BgOKv4Jnpp.mp4"></video>
15
 
16
+ ### ComfyUI Example
17
+ <p>
18
+ <img src="cogvideox-2b-img2vid-workflow.png" width="800" height="400" title="preview"/>
19
+ </p>
20
+ <p>
21
+ <a href="cogvideox-2b-img2vid-workflow.json">JSON Workflow Example</a>
22
+ </p>
23
+ The ComfyUI custom node can be found <a href="https://github.com/Nim-Video/ComfyUI-CogVideoXWrapper">here</a>.
24
+
25
  ### How to
26
  Clone repo
27
  ```bash
cogvideox-2b-img2vid-workflow.json ADDED
@@ -0,0 +1,679 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "last_node_id": 58,
3
+ "last_link_id": 129,
4
+ "nodes": [
5
+ {
6
+ "id": 31,
7
+ "type": "CogVideoTextEncode",
8
+ "pos": {
9
+ "0": 497,
10
+ "1": 520
11
+ },
12
+ "size": {
13
+ "0": 463.01251220703125,
14
+ "1": 124
15
+ },
16
+ "flags": {},
17
+ "order": 4,
18
+ "mode": 0,
19
+ "inputs": [
20
+ {
21
+ "name": "clip",
22
+ "type": "CLIP",
23
+ "link": 56
24
+ }
25
+ ],
26
+ "outputs": [
27
+ {
28
+ "name": "conditioning",
29
+ "type": "CONDITIONING",
30
+ "links": [
31
+ 123
32
+ ],
33
+ "slot_index": 0,
34
+ "shape": 3
35
+ }
36
+ ],
37
+ "properties": {
38
+ "Node name for S&R": "CogVideoTextEncode"
39
+ },
40
+ "widgets_values": [
41
+ "The video is not of a high quality, it has a low resolution. Watermark present in each frame. Strange motion trajectory. ",
42
+ 1,
43
+ true
44
+ ]
45
+ },
46
+ {
47
+ "id": 37,
48
+ "type": "ImageResizeKJ",
49
+ "pos": {
50
+ "0": 809,
51
+ "1": 684
52
+ },
53
+ "size": {
54
+ "0": 315,
55
+ "1": 266
56
+ },
57
+ "flags": {},
58
+ "order": 5,
59
+ "mode": 0,
60
+ "inputs": [
61
+ {
62
+ "name": "image",
63
+ "type": "IMAGE",
64
+ "link": 71
65
+ },
66
+ {
67
+ "name": "get_image_size",
68
+ "type": "IMAGE",
69
+ "link": null,
70
+ "shape": 7
71
+ },
72
+ {
73
+ "name": "width_input",
74
+ "type": "INT",
75
+ "link": null,
76
+ "widget": {
77
+ "name": "width_input"
78
+ }
79
+ },
80
+ {
81
+ "name": "height_input",
82
+ "type": "INT",
83
+ "link": null,
84
+ "widget": {
85
+ "name": "height_input"
86
+ }
87
+ }
88
+ ],
89
+ "outputs": [
90
+ {
91
+ "name": "IMAGE",
92
+ "type": "IMAGE",
93
+ "links": [
94
+ 125
95
+ ],
96
+ "slot_index": 0,
97
+ "shape": 3
98
+ },
99
+ {
100
+ "name": "width",
101
+ "type": "INT",
102
+ "links": null,
103
+ "shape": 3
104
+ },
105
+ {
106
+ "name": "height",
107
+ "type": "INT",
108
+ "links": null,
109
+ "shape": 3
110
+ }
111
+ ],
112
+ "properties": {
113
+ "Node name for S&R": "ImageResizeKJ"
114
+ },
115
+ "widgets_values": [
116
+ 720,
117
+ 480,
118
+ "lanczos",
119
+ false,
120
+ 16,
121
+ 0,
122
+ 0,
123
+ "disabled"
124
+ ]
125
+ },
126
+ {
127
+ "id": 58,
128
+ "type": "CogVideoImageEncode",
129
+ "pos": {
130
+ "0": 1156,
131
+ "1": 650
132
+ },
133
+ "size": {
134
+ "0": 315,
135
+ "1": 122
136
+ },
137
+ "flags": {},
138
+ "order": 6,
139
+ "mode": 0,
140
+ "inputs": [
141
+ {
142
+ "name": "pipeline",
143
+ "type": "COGVIDEOPIPE",
144
+ "link": 124
145
+ },
146
+ {
147
+ "name": "image",
148
+ "type": "IMAGE",
149
+ "link": 125
150
+ },
151
+ {
152
+ "name": "mask",
153
+ "type": "MASK",
154
+ "link": null,
155
+ "shape": 7
156
+ }
157
+ ],
158
+ "outputs": [
159
+ {
160
+ "name": "samples",
161
+ "type": "LATENT",
162
+ "links": [
163
+ 129
164
+ ],
165
+ "slot_index": 0,
166
+ "shape": 3
167
+ }
168
+ ],
169
+ "properties": {
170
+ "Node name for S&R": "CogVideoImageEncode"
171
+ },
172
+ "widgets_values": [
173
+ 16,
174
+ true
175
+ ]
176
+ },
177
+ {
178
+ "id": 56,
179
+ "type": "CogVideoDecode",
180
+ "pos": {
181
+ "0": 1581,
182
+ "1": 148
183
+ },
184
+ "size": {
185
+ "0": 300.396484375,
186
+ "1": 198
187
+ },
188
+ "flags": {},
189
+ "order": 8,
190
+ "mode": 0,
191
+ "inputs": [
192
+ {
193
+ "name": "pipeline",
194
+ "type": "COGVIDEOPIPE",
195
+ "link": 128
196
+ },
197
+ {
198
+ "name": "samples",
199
+ "type": "LATENT",
200
+ "link": 127
201
+ }
202
+ ],
203
+ "outputs": [
204
+ {
205
+ "name": "images",
206
+ "type": "IMAGE",
207
+ "links": [
208
+ 118
209
+ ],
210
+ "slot_index": 0,
211
+ "shape": 3
212
+ }
213
+ ],
214
+ "properties": {
215
+ "Node name for S&R": "CogVideoDecode"
216
+ },
217
+ "widgets_values": [
218
+ false,
219
+ 240,
220
+ 360,
221
+ 0.2,
222
+ 0.2,
223
+ true
224
+ ]
225
+ },
226
+ {
227
+ "id": 20,
228
+ "type": "CLIPLoader",
229
+ "pos": {
230
+ "0": -26,
231
+ "1": 400
232
+ },
233
+ "size": {
234
+ "0": 451.30548095703125,
235
+ "1": 82
236
+ },
237
+ "flags": {},
238
+ "order": 0,
239
+ "mode": 0,
240
+ "inputs": [],
241
+ "outputs": [
242
+ {
243
+ "name": "CLIP",
244
+ "type": "CLIP",
245
+ "links": [
246
+ 54,
247
+ 56
248
+ ],
249
+ "slot_index": 0,
250
+ "shape": 3
251
+ }
252
+ ],
253
+ "properties": {
254
+ "Node name for S&R": "CLIPLoader"
255
+ },
256
+ "widgets_values": [
257
+ "t5/google_t5-v1_1-xxl_encoderonly-fp8_e4m3fn.safetensors",
258
+ "sd3"
259
+ ]
260
+ },
261
+ {
262
+ "id": 30,
263
+ "type": "CogVideoTextEncode",
264
+ "pos": {
265
+ "0": 493,
266
+ "1": 303
267
+ },
268
+ "size": {
269
+ "0": 471.90142822265625,
270
+ "1": 168.08047485351562
271
+ },
272
+ "flags": {},
273
+ "order": 3,
274
+ "mode": 0,
275
+ "inputs": [
276
+ {
277
+ "name": "clip",
278
+ "type": "CLIP",
279
+ "link": 54
280
+ }
281
+ ],
282
+ "outputs": [
283
+ {
284
+ "name": "conditioning",
285
+ "type": "CONDITIONING",
286
+ "links": [
287
+ 122
288
+ ],
289
+ "slot_index": 0,
290
+ "shape": 3
291
+ }
292
+ ],
293
+ "properties": {
294
+ "Node name for S&R": "CogVideoTextEncode"
295
+ },
296
+ "widgets_values": [
297
+ "The camera follows before the truck. ",
298
+ 1,
299
+ true
300
+ ]
301
+ },
302
+ {
303
+ "id": 1,
304
+ "type": "DownloadAndLoadCogVideoModel",
305
+ "pos": {
306
+ "0": 633,
307
+ "1": 44
308
+ },
309
+ "size": {
310
+ "0": 337.8885192871094,
311
+ "1": 194
312
+ },
313
+ "flags": {},
314
+ "order": 1,
315
+ "mode": 0,
316
+ "inputs": [
317
+ {
318
+ "name": "pab_config",
319
+ "type": "PAB_CONFIG",
320
+ "link": null,
321
+ "shape": 7
322
+ },
323
+ {
324
+ "name": "block_edit",
325
+ "type": "TRANSFORMERBLOCKS",
326
+ "link": null,
327
+ "shape": 7
328
+ },
329
+ {
330
+ "name": "lora",
331
+ "type": "COGLORA",
332
+ "link": null,
333
+ "shape": 7
334
+ }
335
+ ],
336
+ "outputs": [
337
+ {
338
+ "name": "cogvideo_pipe",
339
+ "type": "COGVIDEOPIPE",
340
+ "links": [
341
+ 121,
342
+ 124
343
+ ],
344
+ "slot_index": 0,
345
+ "shape": 3
346
+ }
347
+ ],
348
+ "properties": {
349
+ "Node name for S&R": "DownloadAndLoadCogVideoModel"
350
+ },
351
+ "widgets_values": [
352
+ "NimVideo/cogvideox-2b-img2vid",
353
+ "fp16",
354
+ "disabled",
355
+ "disabled",
356
+ false
357
+ ]
358
+ },
359
+ {
360
+ "id": 57,
361
+ "type": "CogVideoSampler",
362
+ "pos": {
363
+ "0": 1138,
364
+ "1": 150
365
+ },
366
+ "size": {
367
+ "0": 399.8780822753906,
368
+ "1": 390
369
+ },
370
+ "flags": {},
371
+ "order": 7,
372
+ "mode": 0,
373
+ "inputs": [
374
+ {
375
+ "name": "pipeline",
376
+ "type": "COGVIDEOPIPE",
377
+ "link": 121
378
+ },
379
+ {
380
+ "name": "positive",
381
+ "type": "CONDITIONING",
382
+ "link": 122
383
+ },
384
+ {
385
+ "name": "negative",
386
+ "type": "CONDITIONING",
387
+ "link": 123
388
+ },
389
+ {
390
+ "name": "samples",
391
+ "type": "LATENT",
392
+ "link": null,
393
+ "shape": 7
394
+ },
395
+ {
396
+ "name": "image_cond_latents",
397
+ "type": "LATENT",
398
+ "link": 129,
399
+ "shape": 7
400
+ },
401
+ {
402
+ "name": "context_options",
403
+ "type": "COGCONTEXT",
404
+ "link": null,
405
+ "shape": 7
406
+ },
407
+ {
408
+ "name": "controlnet",
409
+ "type": "COGVIDECONTROLNET",
410
+ "link": null,
411
+ "shape": 7
412
+ },
413
+ {
414
+ "name": "tora_trajectory",
415
+ "type": "TORAFEATURES",
416
+ "link": null,
417
+ "shape": 7
418
+ }
419
+ ],
420
+ "outputs": [
421
+ {
422
+ "name": "cogvideo_pipe",
423
+ "type": "COGVIDEOPIPE",
424
+ "links": [
425
+ 128
426
+ ],
427
+ "slot_index": 0,
428
+ "shape": 3
429
+ },
430
+ {
431
+ "name": "samples",
432
+ "type": "LATENT",
433
+ "links": [
434
+ 127
435
+ ],
436
+ "shape": 3
437
+ }
438
+ ],
439
+ "properties": {
440
+ "Node name for S&R": "CogVideoSampler"
441
+ },
442
+ "widgets_values": [
443
+ 480,
444
+ 720,
445
+ 49,
446
+ 20,
447
+ 6,
448
+ 65334758276105,
449
+ "fixed",
450
+ "CogVideoXDDIM",
451
+ 1
452
+ ]
453
+ },
454
+ {
455
+ "id": 44,
456
+ "type": "VHS_VideoCombine",
457
+ "pos": {
458
+ "0": 1927,
459
+ "1": 146
460
+ },
461
+ "size": [
462
+ 605.3909912109375,
463
+ 714.2606608072917
464
+ ],
465
+ "flags": {},
466
+ "order": 9,
467
+ "mode": 0,
468
+ "inputs": [
469
+ {
470
+ "name": "images",
471
+ "type": "IMAGE",
472
+ "link": 118
473
+ },
474
+ {
475
+ "name": "audio",
476
+ "type": "AUDIO",
477
+ "link": null,
478
+ "shape": 7
479
+ },
480
+ {
481
+ "name": "meta_batch",
482
+ "type": "VHS_BatchManager",
483
+ "link": null,
484
+ "shape": 7
485
+ },
486
+ {
487
+ "name": "vae",
488
+ "type": "VAE",
489
+ "link": null,
490
+ "shape": 7
491
+ }
492
+ ],
493
+ "outputs": [
494
+ {
495
+ "name": "Filenames",
496
+ "type": "VHS_FILENAMES",
497
+ "links": null,
498
+ "shape": 3
499
+ }
500
+ ],
501
+ "properties": {
502
+ "Node name for S&R": "VHS_VideoCombine"
503
+ },
504
+ "widgets_values": {
505
+ "frame_rate": 8,
506
+ "loop_count": 0,
507
+ "filename_prefix": "CogVideoX-2b-I2V",
508
+ "format": "video/h264-mp4",
509
+ "pix_fmt": "yuv420p",
510
+ "crf": 19,
511
+ "save_metadata": true,
512
+ "pingpong": false,
513
+ "save_output": false,
514
+ "videopreview": {
515
+ "hidden": false,
516
+ "paused": false,
517
+ "params": {
518
+ "filename": "CogVideoX-2b-I2V_00001.mp4",
519
+ "subfolder": "",
520
+ "type": "temp",
521
+ "format": "video/h264-mp4",
522
+ "frame_rate": 8
523
+ },
524
+ "muted": false
525
+ }
526
+ }
527
+ },
528
+ {
529
+ "id": 36,
530
+ "type": "LoadImage",
531
+ "pos": {
532
+ "0": 365,
533
+ "1": 685
534
+ },
535
+ "size": {
536
+ "0": 402.06353759765625,
537
+ "1": 396.6225891113281
538
+ },
539
+ "flags": {},
540
+ "order": 2,
541
+ "mode": 0,
542
+ "inputs": [],
543
+ "outputs": [
544
+ {
545
+ "name": "IMAGE",
546
+ "type": "IMAGE",
547
+ "links": [
548
+ 71
549
+ ],
550
+ "slot_index": 0,
551
+ "shape": 3
552
+ },
553
+ {
554
+ "name": "MASK",
555
+ "type": "MASK",
556
+ "links": null,
557
+ "shape": 3
558
+ }
559
+ ],
560
+ "properties": {
561
+ "Node name for S&R": "LoadImage"
562
+ },
563
+ "widgets_values": [
564
+ "truck.jpg",
565
+ "image"
566
+ ]
567
+ }
568
+ ],
569
+ "links": [
570
+ [
571
+ 54,
572
+ 20,
573
+ 0,
574
+ 30,
575
+ 0,
576
+ "CLIP"
577
+ ],
578
+ [
579
+ 56,
580
+ 20,
581
+ 0,
582
+ 31,
583
+ 0,
584
+ "CLIP"
585
+ ],
586
+ [
587
+ 71,
588
+ 36,
589
+ 0,
590
+ 37,
591
+ 0,
592
+ "IMAGE"
593
+ ],
594
+ [
595
+ 118,
596
+ 56,
597
+ 0,
598
+ 44,
599
+ 0,
600
+ "IMAGE"
601
+ ],
602
+ [
603
+ 121,
604
+ 1,
605
+ 0,
606
+ 57,
607
+ 0,
608
+ "COGVIDEOPIPE"
609
+ ],
610
+ [
611
+ 122,
612
+ 30,
613
+ 0,
614
+ 57,
615
+ 1,
616
+ "CONDITIONING"
617
+ ],
618
+ [
619
+ 123,
620
+ 31,
621
+ 0,
622
+ 57,
623
+ 2,
624
+ "CONDITIONING"
625
+ ],
626
+ [
627
+ 124,
628
+ 1,
629
+ 0,
630
+ 58,
631
+ 0,
632
+ "COGVIDEOPIPE"
633
+ ],
634
+ [
635
+ 125,
636
+ 37,
637
+ 0,
638
+ 58,
639
+ 1,
640
+ "IMAGE"
641
+ ],
642
+ [
643
+ 127,
644
+ 57,
645
+ 1,
646
+ 56,
647
+ 1,
648
+ "LATENT"
649
+ ],
650
+ [
651
+ 128,
652
+ 57,
653
+ 0,
654
+ 56,
655
+ 0,
656
+ "COGVIDEOPIPE"
657
+ ],
658
+ [
659
+ 129,
660
+ 58,
661
+ 0,
662
+ 57,
663
+ 4,
664
+ "LATENT"
665
+ ]
666
+ ],
667
+ "groups": [],
668
+ "config": {},
669
+ "extra": {
670
+ "ds": {
671
+ "scale": 0.6830134553650714,
672
+ "offset": [
673
+ 73.42422056322742,
674
+ 83.67389678726582
675
+ ]
676
+ }
677
+ },
678
+ "version": 0.4
679
+ }
cogvideox-2b-img2vid-workflow.png ADDED