fix: rebuild SVD workflow with correct node types

- Replace DiffusersLoader with ImageOnlyCheckpointLoader
- Replace SVDSampler with SVD_img2vid_Conditioning + KSampler
- Add VideoLinearCFGGuidance for temporal consistency
- Add all node connections in links array
- Configure VHS_VideoCombine with H.264 parameters

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-Authored-By: Claude <noreply@anthropic.com>
2025-11-23 10:10:38 +01:00
parent 22afe18957
commit 764cb5d2d7
1 changed file with 345 additions and 106 deletions
--- a/comfyui/workflows/image-to-video/svd-i2v-production-v1.json
+++ b/comfyui/workflows/image-to-video/svd-i2v-production-v1.json
@@ -1,18 +1,13 @@
 {
-  "last_node_id": 8,
+  "last_node_id": 7,
  "last_link_id": 10,
  "nodes": [
    {
      "id": 1,
      "type": "LoadImage",
-      "pos": [
+      "pos": [50, 100],
-        50,
+      "size": [315, 314],
-        100
+      "widgets_values": ["input_frame.png", "image"],
      ],
      "widgets_values": [
        "input_frame.png",
        "image"
      ],
      "title": "API Input Image",
      "flags": {},
      "order": 0,
@@ -20,157 +15,401 @@
      "properties": {
        "Node name for S&R": "LoadImage"
      },
-      "size": {
+      "outputs": [
-        "0": 350,
+        {
-        "1": 100
+          "name": "IMAGE",
-      }
+          "type": "IMAGE",
          "links": [1],
          "slot_index": 0
        },
        {
          "name": "MASK",
          "type": "MASK",
          "links": null
        }
      ]
    },
    {
      "id": 2,
-      "type": "DiffusersLoader",
+      "type": "ImageOnlyCheckpointLoader",
-      "pos": [
+      "pos": [50, 500],
-        50,
+      "size": [350, 100],
-        400
+      "widgets_values": ["svd_xt.safetensors"],
-      ],
+      "title": "SVD-XT Model Loader",
      "widgets_values": [
        "diffusion_models/stable-video-diffusion-img2vid"
      ],
      "title": "SVD Model Loader",
      "flags": {},
      "order": 1,
      "mode": 0,
      "properties": {
-        "Node name for S&R": "DiffusersLoader"
+        "Node name for S&R": "ImageOnlyCheckpointLoader"
      },
-      "size": {
+      "outputs": [
-        "0": 350,
+        {
-        "1": 100
+          "name": "MODEL",
-      }
+          "type": "MODEL",
          "links": [2],
          "slot_index": 0
        },
        {
          "name": "CLIP_VISION",
          "type": "CLIP_VISION",
          "links": [3],
          "slot_index": 1
        },
        {
          "name": "VAE",
          "type": "VAE",
          "links": [4, 5],
          "slot_index": 2
        }
      ]
    },
    {
      "id": 3,
-      "type": "SVDSampler",
+      "type": "VideoLinearCFGGuidance",
-      "pos": [
+      "pos": [450, 500],
-        450,
+      "size": [315, 100],
-        100
+      "widgets_values": [1.0],
-      ],
+      "title": "Linear CFG Guidance",
      "widgets_values": [
        42,
        "fixed",
        25,
        14,
        127,
        0.02
      ],
      "title": "SVD Sampler (14 frames)",
      "flags": {},
      "order": 2,
      "mode": 0,
      "properties": {
-        "Node name for S&R": "SVDSampler"
+        "Node name for S&R": "VideoLinearCFGGuidance"
      },
-      "size": {
+      "inputs": [
-        "0": 315,
+        {
-        "1": 474
+          "name": "model",
-      }
+          "type": "MODEL",
          "link": 2
        }
      ],
      "outputs": [
        {
          "name": "MODEL",
          "type": "MODEL",
          "links": [6],
          "slot_index": 0
        }
      ]
    },
    {
      "id": 4,
-      "type": "VAEDecode",
+      "type": "SVD_img2vid_Conditioning",
-      "pos": [
+      "pos": [450, 100],
-        800,
+      "size": [315, 350],
-        100
+      "widgets_values": [1024, 576, 14, 127, 6, 0.0],
-      ],
+      "title": "SVD Image-to-Video Conditioning",
      "title": "VAE Decode Video",
      "flags": {},
      "order": 3,
      "mode": 0,
      "properties": {
-        "Node name for S&R": "VAEDecode"
+        "Node name for S&R": "SVD_img2vid_Conditioning"
      },
-      "size": {
+      "inputs": [
-        "0": 315,
+        {
-        "1": 100
+          "name": "clip_vision",
-      }
+          "type": "CLIP_VISION",
          "link": 3
        },
        {
          "name": "init_image",
          "type": "IMAGE",
          "link": 1
        },
        {
          "name": "vae",
          "type": "VAE",
          "link": 4
        }
      ],
      "outputs": [
        {
          "name": "positive",
          "type": "CONDITIONING",
          "links": [7],
          "slot_index": 0
        },
        {
          "name": "negative",
          "type": "CONDITIONING",
          "links": [8],
          "slot_index": 1
        },
        {
          "name": "latent",
          "type": "LATENT",
          "links": [9],
          "slot_index": 2
        }
      ]
    },
    {
      "id": 5,
-      "type": "VHS_VideoCombine",
+      "type": "KSampler",
-      "pos": [
+      "pos": [800, 100],
-        1100,
+      "size": [315, 474],
-        100
+      "widgets_values": [42, "fixed", 25, 6.0, "euler", "karras", 1.0],
-      ],
+      "title": "KSampler (25 steps)",
      "widgets_values": [
        6,
        0,
        "svd_output",
        "video/h264-mp4"
      ],
      "title": "Combine Frames",
      "flags": {},
      "order": 4,
      "mode": 0,
      "properties": {
        "Node name for S&R": "KSampler"
      },
      "inputs": [
        {
          "name": "model",
          "type": "MODEL",
          "link": 6
        },
        {
          "name": "positive",
          "type": "CONDITIONING",
          "link": 7
        },
        {
          "name": "negative",
          "type": "CONDITIONING",
          "link": 8
        },
        {
          "name": "latent_image",
          "type": "LATENT",
          "link": 9
        }
      ],
      "outputs": [
        {
          "name": "LATENT",
          "type": "LATENT",
          "links": [10],
          "slot_index": 0
        }
      ]
    },
    {
      "id": 6,
      "type": "VAEDecode",
      "pos": [1150, 100],
      "size": [210, 46],
      "widgets_values": [],
      "title": "VAE Decode Video Frames",
      "flags": {},
      "order": 5,
      "mode": 0,
      "properties": {
        "Node name for S&R": "VAEDecode"
      },
      "inputs": [
        {
          "name": "samples",
          "type": "LATENT",
          "link": 10
        },
        {
          "name": "vae",
          "type": "VAE",
          "link": 5
        }
      ],
      "outputs": [
        {
          "name": "IMAGE",
          "type": "IMAGE",
          "links": [11],
          "slot_index": 0
        }
      ]
    },
    {
      "id": 7,
      "type": "VHS_VideoCombine",
      "pos": [1400, 100],
      "size": [315, 200],
      "widgets_values": [6, 0, "svd_output", "video/h264-mp4", "yuv420p", 19, true, false],
      "title": "Combine Video Frames",
      "flags": {},
      "order": 6,
      "mode": 0,
      "properties": {
        "Node name for S&R": "VHS_VideoCombine"
      },
-      "size": {
+      "inputs": [
-        "0": 315,
+        {
-        "1": 100
+          "name": "images",
-      }
+          "type": "IMAGE",
          "link": 11
        }
      ],
      "outputs": [
        {
          "name": "Filenames",
          "type": "VHS_FILENAMES",
          "links": null
        }
      ]
    }
  ],
-  "links": [],
+  "links": [
    [1, 1, 0, 4, 1, "IMAGE"],
    [2, 2, 0, 3, 0, "MODEL"],
    [3, 2, 1, 4, 0, "CLIP_VISION"],
    [4, 2, 2, 4, 2, "VAE"],
    [5, 2, 2, 6, 1, "VAE"],
    [6, 3, 0, 5, 0, "MODEL"],
    [7, 4, 0, 5, 1, "CONDITIONING"],
    [8, 4, 1, 5, 2, "CONDITIONING"],
    [9, 4, 2, 5, 3, "LATENT"],
    [10, 5, 0, 6, 0, "LATENT"],
    [11, 6, 0, 7, 0, "IMAGE"]
  ],
  "groups": [],
  "config": {},
  "extra": {
    "workflow_info": {
      "name": "Stable Video Diffusion Image-to-Video Production",
-      "version": "1.0.0",
+      "version": "1.2.0",
-      "description": "Quick animation using SVD. Generate 14-frame video from single image with motion and camera movement.",
+      "description": "Quick animation using SVD-XT. Generate 14-frame video from single image with motion and camera movement.",
      "category": "image-to-video",
-      "tags": [
+      "tags": ["svd", "svd-xt", "stable-video-diffusion", "i2v", "animation", "production"],
        "svd",
        "stable-video-diffusion",
        "i2v",
        "animation",
        "production"
      ],
      "requirements": {
-        "models": [
+        "models": ["SVD-XT"],
-          "stable-video-diffusion-img2vid"
+        "custom_nodes": ["ComfyUI-VideoHelperSuite"],
-        ],
+        "vram_min": "16GB",
-        "custom_nodes": [
+        "vram_recommended": "20GB"
          "ComfyUI-VideoHelperSuite"
        ],
        "vram_min": "16GB"
      },
      "parameters": {
        "input_image": {
          "node_id": 1,
          "widget_index": 0,
          "type": "image",
-          "required": true
+          "required": true,
          "description": "Starting frame for video generation (1024x576 recommended)"
        },
        "width": {
          "node_id": 4,
          "widget_index": 0,
          "type": "integer",
          "required": false,
          "default": 1024,
          "min": 16,
          "max": 16384,
          "description": "Output video width"
        },
        "height": {
          "node_id": 4,
          "widget_index": 1,
          "type": "integer",
          "required": false,
          "default": 576,
          "min": 16,
          "max": 16384,
          "description": "Output video height"
        },
        "video_frames": {
          "node_id": 4,
          "widget_index": 2,
          "type": "integer",
          "required": false,
          "default": 14,
          "min": 1,
          "max": 4096,
          "description": "Number of frames to generate (14 or 25 for SVD/SVD-XT)"
        },
        "motion_bucket_id": {
          "node_id": 4,
          "widget_index": 3,
          "type": "integer",
          "required": false,
          "default": 127,
          "min": 1,
          "max": 1023,
          "description": "Motion amount (higher = more motion)"
        },
        "fps": {
          "node_id": 4,
          "widget_index": 4,
          "type": "integer",
          "required": false,
          "default": 6,
          "min": 1,
          "max": 1024,
          "description": "Frames per second for conditioning"
        },
        "augmentation_level": {
          "node_id": 4,
          "widget_index": 5,
          "type": "float",
          "required": false,
          "default": 0.0,
          "min": 0.0,
          "max": 10.0,
          "description": "Noise augmentation level"
        },
        "steps": {
-          "node_id": 3,
+          "node_id": 5,
          "widget_index": 2,
          "type": "integer",
-          "default": 25
+          "required": false,
          "default": 25,
          "min": 1,
          "max": 150,
          "description": "Sampling steps (25 recommended)"
        },
-        "frames": {
+        "cfg": {
-          "node_id": 3,
+          "node_id": 5,
-          "type": "integer",
+          "widget_index": 3,
-          "default": 14,
+          "type": "float",
-          "description": "Number of output frames"
+          "required": false,
          "default": 6.0,
          "min": 0.0,
          "max": 30.0,
          "description": "Classifier-free guidance scale"
        },
-        "motion_bucket": {
+        "seed": {
-          "node_id": 3,
+          "node_id": 5,
          "widget_index": 0,
          "type": "integer",
-          "default": 127,
+          "required": false,
-          "description": "Motion amount (0-255)"
+          "default": 42,
          "description": "Random seed for reproducibility"
        },
        "output_fps": {
          "node_id": 7,
          "widget_index": 0,
          "type": "integer",
          "required": false,
          "default": 6,
          "description": "Output video framerate"
        }
      },
      "outputs": {
        "video": {
          "node_id": 7,
          "type": "video",
          "format": "MP4 (H.264)",
          "resolution": "1024x576 (configurable)",
          "duration": "~2.3 seconds @ 6fps (14 frames)"
        }
      },
      "performance": {
        "avg_generation_time": "25-35 seconds",
-        "vram_usage": "~14-16GB",
+        "vram_usage": "~16-18GB",
-        "output": "14 frames (~2.3s @ 6fps)"
+        "gpu_utilization": "95-100%"
-      }
+      },
      "use_cases": [
        "Animate static images with natural motion",
        "Create short video loops from single frames",
        "Add subtle camera movements to still images",
        "Generate product animation previews"
      ],
      "notes": [
        "SVD-XT extends frame count from 14 to 25 frames",
        "Model auto-downloads on first use (~9GB)",
        "Recommended resolution: 1024x576 (16:9)",
        "Higher motion_bucket_id = more movement",
        "Linear CFG guidance improves temporal consistency"
      ]
    }
  },
  "version": 0.4