{ "last_node_id": 3, "last_link_id": 2, "nodes": [ { "id": 1, "type": "DiffRhythmTextToMusic", "pos": [100, 100], "size": [400, 300], "flags": {}, "order": 0, "mode": 0, "outputs": [ { "name": "AUDIO", "type": "AUDIO", "links": [1, 2] } ], "properties": {}, "widgets_values": [ "Upbeat electronic dance music with energetic beats and synthesizer melodies", 95.0, 4.0, 42, "cfm_model_v1_2", "auto" ], "title": "DiffRhythm Text-to-Music (95s)" }, { "id": 2, "type": "PreviewAudio", "pos": [600, 100], "size": [300, 100], "flags": {}, "order": 1, "mode": 0, "inputs": [ { "name": "audio", "type": "AUDIO", "link": 1 } ], "properties": {}, "title": "Preview Audio" }, { "id": 3, "type": "SaveAudio", "pos": [600, 250], "size": [300, 100], "flags": {}, "order": 2, "mode": 0, "inputs": [ { "name": "audio", "type": "AUDIO", "link": 2 } ], "properties": {}, "widgets_values": [ "diffrhythm_output" ], "title": "Save Audio" } ], "links": [ [1, 1, 0, 2, 0, "AUDIO"], [2, 1, 0, 3, 0, "AUDIO"] ], "groups": [], "config": {}, "extra": { "workflow_info": { "name": "DiffRhythm Simple Text-to-Music v1", "description": "Basic text-to-music generation using DiffRhythm 1.2 (95 seconds)", "version": "1.0.0", "author": "valknar@pivoine.art", "category": "text-to-music", "tags": ["diffrhythm", "music-generation", "text-to-music", "95s"], "requirements": { "custom_nodes": ["ComfyUI_DiffRhythm"], "models": ["ASLP-lab/DiffRhythm-1_2", "ASLP-lab/DiffRhythm-vae", "OpenMuQ/MuQ-MuLan-large", "OpenMuQ/MuQ-large-msd-iter", "FacebookAI/xlm-roberta-base"], "vram_min": "12GB", "vram_recommended": "16GB", "system_deps": ["espeak-ng"] }, "usage": { "prompt": "Text description of the desired music style, mood, and instruments", "duration": "Fixed at 95 seconds for DiffRhythm 1.2 model", "guidance_scale": "Controls how closely the output follows the prompt (1.0-10.0, default: 4.0)", "seed": "Random seed for reproducibility (default: 42)", "model": "cfm_model_v1_2 (DiffRhythm 1.2 - 95s generation)", "device": "auto (automatic GPU selection)" }, "notes": [ "This workflow uses DiffRhythm 1.2 for 95-second music generation", "All parameters are optional - can generate music randomly without inputs", "Supports English and Chinese text prompts", "Generation time: ~30-60 seconds on RTX 4090", "PLACEHOLDER: Actual node names and parameters need to be updated after ComfyUI_DiffRhythm installation" ] } }, "version": 0.4 }