Initial implementation of AudioCraft Studio

Complete web interface for Meta's AudioCraft AI audio generation: - Gradio UI with tabs for all 5 model families (MusicGen, AudioGen, MAGNeT, MusicGen Style, JASCO) - REST API with FastAPI, OpenAPI docs, and API key auth - VRAM management with ComfyUI coexistence support - SQLite database for project/generation history - Batch processing queue for async generation - Docker deployment optimized for RunPod with RTX 4090 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com>
2025-11-25 19:34:27 +01:00
commit ffbf02b12c
67 changed files with 12032 additions and 0 deletions
--- a/scripts/download_models.py
+++ b/scripts/download_models.py
@@ -0,0 +1,116 @@
+#!/usr/bin/env python3
+"""Pre-download AudioCraft models for faster startup."""
+
+import argparse
+import os
+from pathlib import Path
+
+
+def download_musicgen_models(variants: list[str] = None):
+    """Download MusicGen models."""
+    from audiocraft.models import MusicGen
+
+    variants = variants or ["small", "medium", "large", "melody"]
+
+    for variant in variants:
+        print(f"Downloading MusicGen {variant}...")
+        try:
+            model = MusicGen.get_pretrained(f"facebook/musicgen-{variant}")
+            del model
+            print(f"  ✓ MusicGen {variant} downloaded")
+        except Exception as e:
+            print(f"  ✗ Failed to download MusicGen {variant}: {e}")
+
+
+def download_audiogen_models():
+    """Download AudioGen models."""
+    from audiocraft.models import AudioGen
+
+    print("Downloading AudioGen medium...")
+    try:
+        model = AudioGen.get_pretrained("facebook/audiogen-medium")
+        del model
+        print("  ✓ AudioGen medium downloaded")
+    except Exception as e:
+        print(f"  ✗ Failed to download AudioGen: {e}")
+
+
+def download_magnet_models(variants: list[str] = None):
+    """Download MAGNeT models."""
+    from audiocraft.models import MAGNeT
+
+    variants = variants or ["small", "medium", "audio-small-10secs", "audio-medium-10secs"]
+
+    for variant in variants:
+        print(f"Downloading MAGNeT {variant}...")
+        try:
+            model = MAGNeT.get_pretrained(f"facebook/magnet-{variant}")
+            del model
+            print(f"  ✓ MAGNeT {variant} downloaded")
+        except Exception as e:
+            print(f"  ✗ Failed to download MAGNeT {variant}: {e}")
+
+
+def main():
+    parser = argparse.ArgumentParser(description="Pre-download AudioCraft models")
+    parser.add_argument(
+        "--models",
+        nargs="+",
+        choices=["musicgen", "audiogen", "magnet", "all"],
+        default=["all"],
+        help="Models to download",
+    )
+    parser.add_argument(
+        "--musicgen-variants",
+        nargs="+",
+        default=["small", "medium"],
+        help="MusicGen variants to download",
+    )
+    parser.add_argument(
+        "--magnet-variants",
+        nargs="+",
+        default=["small", "medium"],
+        help="MAGNeT variants to download",
+    )
+    parser.add_argument(
+        "--cache-dir",
+        type=str,
+        default=None,
+        help="Model cache directory",
+    )
+
+    args = parser.parse_args()
+
+    # Set cache directory
+    if args.cache_dir:
+        os.environ["HF_HOME"] = args.cache_dir
+        os.environ["TORCH_HOME"] = args.cache_dir
+        Path(args.cache_dir).mkdir(parents=True, exist_ok=True)
+
+    models = args.models
+    if "all" in models:
+        models = ["musicgen", "audiogen", "magnet"]
+
+    print("=" * 50)
+    print("AudioCraft Model Downloader")
+    print("=" * 50)
+    print(f"Cache directory: {os.environ.get('HF_HOME', 'default')}")
+    print(f"Models to download: {models}")
+    print("=" * 50)
+
+    if "musicgen" in models:
+        download_musicgen_models(args.musicgen_variants)
+
+    if "audiogen" in models:
+        download_audiogen_models()
+
+    if "magnet" in models:
+        download_magnet_models(args.magnet_variants)
+
+    print("=" * 50)
+    print("Download complete!")
+    print("=" * 50)
+
+
+if __name__ == "__main__":
+    main()
--- a/scripts/start.sh
+++ b/scripts/start.sh
@@ -0,0 +1,55 @@
+#!/bin/bash
+# Startup script for AudioCraft Studio
+# Used in Docker container and RunPod
+
+set -e
+
+echo "=========================================="
+echo "  AudioCraft Studio"
+echo "=========================================="
+
+# Create directories if they don't exist
+mkdir -p "${AUDIOCRAFT_OUTPUT_DIR:-/workspace/outputs}"
+mkdir -p "${AUDIOCRAFT_DATA_DIR:-/workspace/data}"
+mkdir -p "${AUDIOCRAFT_MODEL_CACHE:-/workspace/models}"
+
+# Check GPU availability
+echo "Checking GPU..."
+if command -v nvidia-smi &> /dev/null; then
+    nvidia-smi --query-gpu=name,memory.total,memory.free --format=csv
+else
+    echo "Warning: nvidia-smi not found"
+fi
+
+# Check Python and dependencies
+echo "Python version:"
+python --version
+
+echo "PyTorch version:"
+python -c "import torch; print(f'PyTorch: {torch.__version__}, CUDA: {torch.cuda.is_available()}')"
+
+# Check AudioCraft installation
+echo "AudioCraft version:"
+python -c "import audiocraft; print(audiocraft.__version__)" 2>/dev/null || echo "AudioCraft installed from source"
+
+# Generate API key if not exists
+if [ ! -f "${AUDIOCRAFT_DATA_DIR:-/workspace/data}/.api_key" ]; then
+    echo "Generating API key..."
+    python -c "
+from src.api.auth import get_key_manager
+km = get_key_manager()
+if not km.has_key():
+    key = km.generate_new_key()
+    print(f'Generated API key: {key}')
+    print('Store this key securely - it will not be shown again!')
+"
+fi
+
+# Start the application
+echo "Starting AudioCraft Studio..."
+echo "Gradio UI: http://0.0.0.0:${AUDIOCRAFT_GRADIO_PORT:-7860}"
+echo "REST API:  http://0.0.0.0:${AUDIOCRAFT_API_PORT:-8000}"
+echo "API Docs:  http://0.0.0.0:${AUDIOCRAFT_API_PORT:-8000}/api/docs"
+echo "=========================================="
+
+exec python main.py "$@"