From ad30ba98a69dd6ca74d63d9379e387239ad210fc Mon Sep 17 00:00:00 2001 From: Claude Date: Wed, 4 Feb 2026 04:10:24 +0000 Subject: [PATCH 01/33] Add multi-provider support and local file media provider Major features: - Add local file media provider that scans directories for audio files using MP3 tags for metadata (ID3, Vorbis comments, etc.) - Introduce multi-provider architecture with database schema for tracking providers, tracks, and cross-provider linking - Add GUI setup wizard for configuring providers and settings - Simplify Docker deployment to 2 unified files (CPU/NVIDIA) Database changes: - New tables: provider, track, provider_track, app_settings - Add file_path and track_id columns to score table for linking - All changes are migration-safe with ON CONFLICT handling Key implementation details: - File path hash (SHA-256) used as stable identifier for local files - Providers can be tested before saving configuration - Existing installations auto-migrate with default provider from env - Analysis pipeline updated to store file_path for track linking Files added: - tasks/mediaserver_localfiles.py - Local file provider implementation - app_setup.py - Setup wizard API endpoints - templates/setup.html - Setup wizard UI - deployment/docker-compose-unified.yaml - Simplified CPU deployment - deployment/docker-compose-unified-nvidia.yaml - Simplified GPU deployment - docs/MULTI_PROVIDER_ARCHITECTURE.md - Architecture documentation https://claude.ai/code/session_011AebTWAucDafK4m6uoSSNg --- app.py | 2 + app_helper.py | 144 ++- app_setup.py | 682 +++++++++++ config.py | 10 +- deployment/.env.example | 102 +- deployment/docker-compose-unified-nvidia.yaml | 210 ++++ deployment/docker-compose-unified.yaml | 188 +++ docs/MULTI_PROVIDER_ARCHITECTURE.md | 323 ++++++ tasks/analysis.py | 10 +- tasks/mediaserver.py | 257 ++++- tasks/mediaserver_localfiles.py | 604 ++++++++++ templates/setup.html | 1028 +++++++++++++++++ templates/sidebar_navi.html | 1 + 13 files changed, 3511 
insertions(+), 50 deletions(-) create mode 100644 app_setup.py create mode 100644 deployment/docker-compose-unified-nvidia.yaml create mode 100644 deployment/docker-compose-unified.yaml create mode 100644 docs/MULTI_PROVIDER_ARCHITECTURE.md create mode 100644 tasks/mediaserver_localfiles.py create mode 100644 templates/setup.html diff --git a/app.py b/app.py index 4d4a5136..0b630480 100644 --- a/app.py +++ b/app.py @@ -598,6 +598,7 @@ def listen_for_index_reloads(): from app_artist_similarity import artist_similarity_bp from app_clap_search import clap_search_bp from app_mulan_search import mulan_search_bp +from app_setup import setup_bp # Setup wizard and provider configuration app.register_blueprint(chat_bp, url_prefix='/chat') app.register_blueprint(clustering_bp) @@ -614,6 +615,7 @@ def listen_for_index_reloads(): app.register_blueprint(artist_similarity_bp) app.register_blueprint(clap_search_bp) app.register_blueprint(mulan_search_bp) +app.register_blueprint(setup_bp) # Setup wizard if __name__ == '__main__': os.makedirs(TEMP_DIR, exist_ok=True) diff --git a/app_helper.py b/app_helper.py index 7afbd822..25a47f90 100644 --- a/app_helper.py +++ b/app_helper.py @@ -212,7 +212,100 @@ def init_db(): """, (query, 1.0, rank)) logger.info(f"Inserted {len(default_queries)} default CLAP search queries") - + + # ================================================================= + # MULTI-PROVIDER SUPPORT TABLES + # ================================================================= + + # Create 'provider' table - Registry of configured media providers + cur.execute(""" + CREATE TABLE IF NOT EXISTS provider ( + id SERIAL PRIMARY KEY, + provider_type VARCHAR(50) NOT NULL, + name VARCHAR(255) NOT NULL, + config JSONB NOT NULL DEFAULT '{}', + enabled BOOLEAN DEFAULT TRUE, + priority INTEGER DEFAULT 0, + created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + UNIQUE(provider_type, name) + ) + """) + + # Create 'track' table - Stable 
track identity based on file path + cur.execute(""" + CREATE TABLE IF NOT EXISTS track ( + id SERIAL PRIMARY KEY, + file_path_hash VARCHAR(64) NOT NULL UNIQUE, + file_path TEXT NOT NULL, + file_size BIGINT, + file_modified TIMESTAMP, + created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP + ) + """) + cur.execute("CREATE INDEX IF NOT EXISTS idx_track_file_path_hash ON track(file_path_hash)") + + # Create 'provider_track' table - Links provider item_ids to tracks + cur.execute(""" + CREATE TABLE IF NOT EXISTS provider_track ( + id SERIAL PRIMARY KEY, + provider_id INTEGER NOT NULL REFERENCES provider(id) ON DELETE CASCADE, + track_id INTEGER NOT NULL REFERENCES track(id) ON DELETE CASCADE, + item_id TEXT NOT NULL, + title TEXT, + artist TEXT, + album TEXT, + last_synced TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + UNIQUE(provider_id, item_id), + UNIQUE(provider_id, track_id) + ) + """) + cur.execute("CREATE INDEX IF NOT EXISTS idx_provider_track_item_id ON provider_track(item_id)") + cur.execute("CREATE INDEX IF NOT EXISTS idx_provider_track_track_id ON provider_track(track_id)") + + # Create 'app_settings' table - Application configuration storage + cur.execute(""" + CREATE TABLE IF NOT EXISTS app_settings ( + key VARCHAR(255) PRIMARY KEY, + value JSONB NOT NULL, + category VARCHAR(100), + description TEXT, + updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP + ) + """) + + # Add 'track_id' column to 'score' table if not exists (for multi-provider linking) + cur.execute("SELECT EXISTS (SELECT 1 FROM information_schema.columns WHERE table_name = 'score' AND column_name = 'track_id')") + if not cur.fetchone()[0]: + logger.info("Adding 'track_id' column to 'score' table for multi-provider support.") + cur.execute("ALTER TABLE score ADD COLUMN track_id INTEGER REFERENCES track(id)") + cur.execute("CREATE INDEX IF NOT EXISTS idx_score_track_id ON score(track_id)") + + # Add 'file_path' column to 'score' table if not exists (for file 
identification) + cur.execute("SELECT EXISTS (SELECT 1 FROM information_schema.columns WHERE table_name = 'score' AND column_name = 'file_path')") + if not cur.fetchone()[0]: + logger.info("Adding 'file_path' column to 'score' table.") + cur.execute("ALTER TABLE score ADD COLUMN file_path TEXT") + cur.execute("CREATE INDEX IF NOT EXISTS idx_score_file_path ON score(file_path)") + + # Insert default settings if app_settings is empty + cur.execute("SELECT COUNT(*) FROM app_settings") + if cur.fetchone()[0] == 0: + default_settings = [ + ('setup_completed', 'false', 'system', 'Whether the setup wizard has been completed'), + ('setup_version', '"1.0"', 'system', 'Version of the setup wizard last completed'), + ('multi_provider_enabled', 'false', 'providers', 'Whether multi-provider mode is enabled'), + ('primary_provider_id', 'null', 'providers', 'ID of the primary provider for playlist creation'), + ] + for key, value, category, description in default_settings: + cur.execute(""" + INSERT INTO app_settings (key, value, category, description) + VALUES (%s, %s::jsonb, %s, %s) + ON CONFLICT (key) DO NOTHING + """, (key, value, category, description)) + logger.info("Inserted default app settings") + db.commit() # --- Status Constants --- @@ -427,14 +520,29 @@ def track_exists(item_id): cur.close() return row is not None -def save_track_analysis_and_embedding(item_id, title, author, tempo, key, scale, moods, embedding_vector, energy=None, other_features=None, album=None): - """Saves track analysis and embedding in a single transaction.""" - +def save_track_analysis_and_embedding(item_id, title, author, tempo, key, scale, moods, embedding_vector, energy=None, other_features=None, album=None, file_path=None): + """Saves track analysis and embedding in a single transaction. 
+ + Args: + item_id: Provider-specific track identifier + title: Track title + author: Artist name + tempo: BPM + key: Musical key + scale: Major/Minor scale + moods: Dict of mood labels and scores + embedding_vector: numpy array of embeddings + energy: Energy level (0.01-0.15) + other_features: JSON string of additional features + album: Album name + file_path: Full path to the audio file (for multi-provider track linking) + """ + def _sanitize_string(s, max_length=1000, field_name="field"): """Sanitize string for PostgreSQL insertion.""" if s is None: return None - + # Ensure it's a string if not isinstance(s, str): try: @@ -442,25 +550,25 @@ def _sanitize_string(s, max_length=1000, field_name="field"): except Exception: logger.warning(f"Could not convert {field_name} to string, using empty string") return "" - + # Remove problematic characters # NUL byte (0x00) - PostgreSQL cannot store s = s.replace('\x00', '') - + # Remove other control characters that could cause issues # Keep only printable ASCII, space, tab, newline, and common Unicode s = ''.join(char for char in s if char.isprintable() or char in '\n\t ') - + # Truncate to max length to prevent overly long strings if len(s) > max_length: logger.warning(f"{field_name} truncated from {len(s)} to {max_length} characters") s = s[:max_length] - + # Strip leading/trailing whitespace s = s.strip() - + return s - + # Sanitize all string inputs with field-specific limits title = _sanitize_string(title, max_length=500, field_name="title") author = _sanitize_string(author, max_length=200, field_name="author") @@ -468,16 +576,17 @@ def _sanitize_string(s, max_length=1000, field_name="field"): key = _sanitize_string(key, max_length=10, field_name="key") scale = _sanitize_string(scale, max_length=10, field_name="scale") other_features = _sanitize_string(other_features, max_length=2000, field_name="other_features") + file_path = _sanitize_string(file_path, max_length=2000, field_name="file_path") mood_str = 
','.join(f"{k}:{v:.3f}" for k, v in moods.items()) - + conn = get_db() # This now calls the function within this file cur = conn.cursor() try: - # Save analysis to score table + # Save analysis to score table (includes file_path for multi-provider linking) cur.execute(""" - INSERT INTO score (item_id, title, author, tempo, key, scale, mood_vector, energy, other_features, album) - VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s) + INSERT INTO score (item_id, title, author, tempo, key, scale, mood_vector, energy, other_features, album, file_path) + VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s, %s, %s) ON CONFLICT (item_id) DO UPDATE SET title = EXCLUDED.title, author = EXCLUDED.author, @@ -487,8 +596,9 @@ def _sanitize_string(s, max_length=1000, field_name="field"): mood_vector = EXCLUDED.mood_vector, energy = EXCLUDED.energy, other_features = EXCLUDED.other_features, - album = EXCLUDED.album - """, (item_id, title, author, tempo, key, scale, mood_str, energy, other_features, album)) + album = EXCLUDED.album, + file_path = EXCLUDED.file_path + """, (item_id, title, author, tempo, key, scale, mood_str, energy, other_features, album, file_path)) # Save embedding if isinstance(embedding_vector, np.ndarray) and embedding_vector.size > 0: diff --git a/app_setup.py b/app_setup.py new file mode 100644 index 00000000..db895861 --- /dev/null +++ b/app_setup.py @@ -0,0 +1,682 @@ +# app_setup.py +""" +Setup Wizard API for AudioMuse-AI + +This module provides the backend API for the setup wizard and provider configuration. 
+It handles: +- Initial setup detection +- Provider configuration (add, update, delete, test) +- Application settings management +- Multi-provider mode enablement +""" + +import logging +import json +from datetime import datetime +from flask import Blueprint, jsonify, request, render_template, redirect, url_for, g +from functools import wraps + +from app_helper import get_db +from tasks.mediaserver import ( + get_available_provider_types, + get_provider_info, + test_provider_connection, + PROVIDER_TYPES +) +import config + +logger = logging.getLogger(__name__) + +setup_bp = Blueprint('setup', __name__) + + +# ############################################################################## +# HELPER FUNCTIONS +# ############################################################################## + +def get_setting(key, default=None): + """Get a setting value from the database.""" + db = get_db() + with db.cursor() as cur: + cur.execute("SELECT value FROM app_settings WHERE key = %s", (key,)) + row = cur.fetchone() + if row: + return row[0] + return default + + +def set_setting(key, value, category=None, description=None): + """Set a setting value in the database.""" + db = get_db() + with db.cursor() as cur: + cur.execute(""" + INSERT INTO app_settings (key, value, category, description, updated_at) + VALUES (%s, %s, %s, %s, NOW()) + ON CONFLICT (key) DO UPDATE SET + value = EXCLUDED.value, + category = COALESCE(EXCLUDED.category, app_settings.category), + description = COALESCE(EXCLUDED.description, app_settings.description), + updated_at = NOW() + """, (key, json.dumps(value), category, description)) + db.commit() + + +def get_all_settings(): + """Get all settings grouped by category.""" + db = get_db() + with db.cursor() as cur: + cur.execute("SELECT key, value, category, description FROM app_settings ORDER BY category, key") + rows = cur.fetchall() + settings = {} + for row in rows: + key, value, category, description = row + if category not in settings: + 
settings[category] = {} + settings[category][key] = { + 'value': value, + 'description': description + } + return settings + + +def is_setup_completed(): + """Check if initial setup has been completed.""" + result = get_setting('setup_completed') + return result is True or result == 'true' or result == True + + +def is_multi_provider_enabled(): + """Check if multi-provider mode is enabled.""" + result = get_setting('multi_provider_enabled') + return result is True or result == 'true' or result == True + + +# ############################################################################## +# PROVIDER MANAGEMENT +# ############################################################################## + +def get_providers(): + """Get all configured providers.""" + db = get_db() + with db.cursor() as cur: + cur.execute(""" + SELECT id, provider_type, name, config, enabled, priority, created_at, updated_at + FROM provider + ORDER BY priority DESC, created_at ASC + """) + rows = cur.fetchall() + providers = [] + for row in rows: + provider = { + 'id': row[0], + 'provider_type': row[1], + 'name': row[2], + 'config': row[3], # JSONB is automatically parsed + 'enabled': row[4], + 'priority': row[5], + 'created_at': row[6].isoformat() if row[6] else None, + 'updated_at': row[7].isoformat() if row[7] else None, + } + # Don't expose sensitive config values + if provider['config']: + safe_config = {} + for k, v in provider['config'].items(): + if k in ('password', 'token', 'api_key'): + safe_config[k] = '********' if v else None + else: + safe_config[k] = v + provider['config_display'] = safe_config + providers.append(provider) + return providers + + +def get_provider_by_id(provider_id): + """Get a provider by ID.""" + db = get_db() + with db.cursor() as cur: + cur.execute(""" + SELECT id, provider_type, name, config, enabled, priority + FROM provider WHERE id = %s + """, (provider_id,)) + row = cur.fetchone() + if row: + return { + 'id': row[0], + 'provider_type': row[1], + 'name': 
row[2], + 'config': row[3], + 'enabled': row[4], + 'priority': row[5], + } + return None + + +def add_provider(provider_type, name, config_data, enabled=True, priority=0): + """Add a new provider configuration.""" + db = get_db() + with db.cursor() as cur: + cur.execute(""" + INSERT INTO provider (provider_type, name, config, enabled, priority) + VALUES (%s, %s, %s, %s, %s) + RETURNING id + """, (provider_type, name, json.dumps(config_data), enabled, priority)) + provider_id = cur.fetchone()[0] + db.commit() + return provider_id + + +def update_provider(provider_id, name=None, config_data=None, enabled=None, priority=None): + """Update an existing provider configuration.""" + db = get_db() + updates = [] + values = [] + + if name is not None: + updates.append("name = %s") + values.append(name) + if config_data is not None: + updates.append("config = %s") + values.append(json.dumps(config_data)) + if enabled is not None: + updates.append("enabled = %s") + values.append(enabled) + if priority is not None: + updates.append("priority = %s") + values.append(priority) + + if not updates: + return False + + updates.append("updated_at = NOW()") + values.append(provider_id) + + with db.cursor() as cur: + cur.execute(f""" + UPDATE provider SET {', '.join(updates)} + WHERE id = %s + """, values) + db.commit() + return cur.rowcount > 0 + + +def delete_provider(provider_id): + """Delete a provider configuration.""" + db = get_db() + with db.cursor() as cur: + cur.execute("DELETE FROM provider WHERE id = %s", (provider_id,)) + db.commit() + return cur.rowcount > 0 + + +def create_default_provider_from_env(): + """ + Create a default provider from environment variables if no providers exist. + This enables backward compatibility with existing installations. 
+ """ + existing = get_providers() + if existing: + return None # Providers already exist + + provider_type = config.MEDIASERVER_TYPE + if provider_type not in PROVIDER_TYPES: + logger.warning(f"Unknown provider type from env: {provider_type}") + return None + + # Build config from environment variables + config_data = {} + + if provider_type == 'jellyfin': + config_data = { + 'url': config.JELLYFIN_URL, + 'user_id': config.JELLYFIN_USER_ID, + 'token': config.JELLYFIN_TOKEN, + } + elif provider_type == 'navidrome': + config_data = { + 'url': config.NAVIDROME_URL, + 'user': config.NAVIDROME_USER, + 'password': config.NAVIDROME_PASSWORD, + } + elif provider_type == 'lyrion': + config_data = { + 'url': config.LYRION_URL, + } + elif provider_type == 'mpd': + config_data = { + 'host': config.MPD_HOST, + 'port': config.MPD_PORT, + 'password': config.MPD_PASSWORD, + 'music_directory': config.MPD_MUSIC_DIRECTORY, + } + elif provider_type == 'emby': + config_data = { + 'url': config.EMBY_URL, + 'user_id': config.EMBY_USER_ID, + 'token': config.EMBY_TOKEN, + } + elif provider_type == 'localfiles': + config_data = { + 'music_directory': config.LOCALFILES_MUSIC_DIRECTORY, + 'supported_formats': config.LOCALFILES_FORMATS, + 'scan_subdirectories': config.LOCALFILES_SCAN_SUBDIRS, + 'playlist_directory': config.LOCALFILES_PLAYLIST_DIR, + } + + name = f"{PROVIDER_TYPES[provider_type]['name']} (Default)" + provider_id = add_provider(provider_type, name, config_data, enabled=True, priority=100) + logger.info(f"Created default provider from environment: {provider_type} (id={provider_id})") + return provider_id + + +# ############################################################################## +# API ENDPOINTS +# ############################################################################## + +@setup_bp.route('/setup') +def setup_page(): + """Render the setup wizard page.""" + return render_template('setup.html', title='AudioMuse-AI - Setup', active='setup') + + 
+@setup_bp.route('/api/setup/status', methods=['GET']) +def get_setup_status(): + """ + Get the current setup status. + --- + tags: + - Setup + responses: + 200: + description: Setup status information + """ + completed = is_setup_completed() + multi_provider = is_multi_provider_enabled() + providers = get_providers() + + # Check if we need to create default provider from env + if not providers: + create_default_provider_from_env() + providers = get_providers() + + return jsonify({ + 'setup_completed': completed, + 'multi_provider_enabled': multi_provider, + 'provider_count': len(providers), + 'providers': providers, + 'current_mediaserver_type': config.MEDIASERVER_TYPE, + 'app_version': config.APP_VERSION, + }) + + +@setup_bp.route('/api/setup/providers/types', methods=['GET']) +def get_provider_types(): + """ + Get available provider types with their configuration fields. + --- + tags: + - Setup + responses: + 200: + description: List of provider types + """ + types = get_available_provider_types() + result = [] + for ptype, info in types.items(): + provider_info = get_provider_info(ptype) + result.append({ + 'type': ptype, + 'name': info['name'], + 'description': info['description'], + 'supports_user_auth': info['supports_user_auth'], + 'supports_play_history': info['supports_play_history'], + 'config_fields': provider_info.get('config_fields', []) if provider_info else [], + }) + return jsonify(result) + + +@setup_bp.route('/api/setup/providers', methods=['GET']) +def list_providers(): + """ + List all configured providers. + --- + tags: + - Setup + responses: + 200: + description: List of providers + """ + providers = get_providers() + return jsonify(providers) + + +@setup_bp.route('/api/setup/providers', methods=['POST']) +def create_provider(): + """ + Add a new provider configuration. 
+ --- + tags: + - Setup + requestBody: + required: true + content: + application/json: + schema: + type: object + properties: + provider_type: + type: string + name: + type: string + config: + type: object + enabled: + type: boolean + priority: + type: integer + responses: + 201: + description: Provider created + 400: + description: Invalid request + """ + data = request.get_json() + if not data: + return jsonify({'error': 'No data provided'}), 400 + + provider_type = data.get('provider_type') + name = data.get('name') + config_data = data.get('config', {}) + enabled = data.get('enabled', True) + priority = data.get('priority', 0) + + if not provider_type: + return jsonify({'error': 'provider_type is required'}), 400 + if not name: + return jsonify({'error': 'name is required'}), 400 + if provider_type not in PROVIDER_TYPES: + return jsonify({'error': f'Unknown provider type: {provider_type}'}), 400 + + try: + provider_id = add_provider(provider_type, name, config_data, enabled, priority) + return jsonify({'id': provider_id, 'message': 'Provider created'}), 201 + except Exception as e: + logger.error(f"Error creating provider: {e}") + return jsonify({'error': str(e)}), 500 + + +@setup_bp.route('/api/setup/providers/', methods=['PUT']) +def update_provider_endpoint(provider_id): + """ + Update an existing provider configuration. 
+ --- + tags: + - Setup + parameters: + - name: provider_id + in: path + required: true + schema: + type: integer + responses: + 200: + description: Provider updated + 404: + description: Provider not found + """ + provider = get_provider_by_id(provider_id) + if not provider: + return jsonify({'error': 'Provider not found'}), 404 + + data = request.get_json() + if not data: + return jsonify({'error': 'No data provided'}), 400 + + # Merge config if partial update + config_data = data.get('config') + if config_data and isinstance(config_data, dict): + # Don't allow updating password fields with '********' + for key in list(config_data.keys()): + if config_data[key] == '********': + config_data[key] = provider['config'].get(key) + + success = update_provider( + provider_id, + name=data.get('name'), + config_data=config_data, + enabled=data.get('enabled'), + priority=data.get('priority') + ) + + if success: + return jsonify({'message': 'Provider updated'}) + return jsonify({'error': 'Update failed'}), 500 + + +@setup_bp.route('/api/setup/providers/', methods=['DELETE']) +def delete_provider_endpoint(provider_id): + """ + Delete a provider configuration. + --- + tags: + - Setup + parameters: + - name: provider_id + in: path + required: true + schema: + type: integer + responses: + 200: + description: Provider deleted + 404: + description: Provider not found + """ + success = delete_provider(provider_id) + if success: + return jsonify({'message': 'Provider deleted'}) + return jsonify({'error': 'Provider not found'}), 404 + + +@setup_bp.route('/api/setup/providers//test', methods=['POST']) +def test_provider_endpoint(provider_id): + """ + Test connection to a provider. 
+ --- + tags: + - Setup + parameters: + - name: provider_id + in: path + required: true + schema: + type: integer + responses: + 200: + description: Connection test result + """ + provider = get_provider_by_id(provider_id) + if not provider: + return jsonify({'error': 'Provider not found'}), 404 + + success, message = test_provider_connection( + provider['provider_type'], + provider['config'] + ) + + return jsonify({ + 'success': success, + 'message': message, + 'provider_id': provider_id, + 'provider_type': provider['provider_type'], + }) + + +@setup_bp.route('/api/setup/providers/test', methods=['POST']) +def test_provider_config(): + """ + Test connection with provided configuration (without saving). + --- + tags: + - Setup + requestBody: + required: true + content: + application/json: + schema: + type: object + properties: + provider_type: + type: string + config: + type: object + responses: + 200: + description: Connection test result + """ + data = request.get_json() + if not data: + return jsonify({'error': 'No data provided'}), 400 + + provider_type = data.get('provider_type') + config_data = data.get('config', {}) + + if not provider_type: + return jsonify({'error': 'provider_type is required'}), 400 + + success, message = test_provider_connection(provider_type, config_data) + + return jsonify({ + 'success': success, + 'message': message, + 'provider_type': provider_type, + }) + + +@setup_bp.route('/api/setup/settings', methods=['GET']) +def get_settings(): + """ + Get all application settings. + --- + tags: + - Setup + responses: + 200: + description: All settings grouped by category + """ + settings = get_all_settings() + return jsonify(settings) + + +@setup_bp.route('/api/setup/settings', methods=['PUT']) +def update_settings(): + """ + Update application settings. 
+ --- + tags: + - Setup + requestBody: + required: true + content: + application/json: + schema: + type: object + additionalProperties: true + responses: + 200: + description: Settings updated + """ + data = request.get_json() + if not data: + return jsonify({'error': 'No data provided'}), 400 + + for key, value in data.items(): + set_setting(key, value) + + return jsonify({'message': 'Settings updated'}) + + +@setup_bp.route('/api/setup/complete', methods=['POST']) +def complete_setup(): + """ + Mark the setup as complete. + --- + tags: + - Setup + responses: + 200: + description: Setup marked as complete + """ + set_setting('setup_completed', True, 'system', 'Whether the setup wizard has been completed') + set_setting('setup_version', config.APP_VERSION, 'system', 'Version of the setup wizard last completed') + return jsonify({'message': 'Setup completed', 'setup_completed': True}) + + +@setup_bp.route('/api/setup/multi-provider', methods=['POST']) +def enable_multi_provider(): + """ + Enable or disable multi-provider mode. + --- + tags: + - Setup + requestBody: + required: true + content: + application/json: + schema: + type: object + properties: + enabled: + type: boolean + responses: + 200: + description: Multi-provider mode updated + """ + data = request.get_json() + if not data: + return jsonify({'error': 'No data provided'}), 400 + + enabled = data.get('enabled', False) + set_setting('multi_provider_enabled', enabled, 'providers', 'Whether multi-provider mode is enabled') + + return jsonify({ + 'message': f"Multi-provider mode {'enabled' if enabled else 'disabled'}", + 'multi_provider_enabled': enabled + }) + + +@setup_bp.route('/api/setup/primary-provider', methods=['PUT']) +def set_primary_provider(): + """ + Set the primary provider for playlist creation. 
+ --- + tags: + - Setup + requestBody: + required: true + content: + application/json: + schema: + type: object + properties: + provider_id: + type: integer + responses: + 200: + description: Primary provider set + """ + data = request.get_json() + if not data: + return jsonify({'error': 'No data provided'}), 400 + + provider_id = data.get('provider_id') + if provider_id is not None: + provider = get_provider_by_id(provider_id) + if not provider: + return jsonify({'error': 'Provider not found'}), 404 + + set_setting('primary_provider_id', provider_id, 'providers', 'ID of the primary provider for playlist creation') + + return jsonify({ + 'message': 'Primary provider set', + 'primary_provider_id': provider_id + }) diff --git a/config.py b/config.py index 9e9dec46..334bd411 100644 --- a/config.py +++ b/config.py @@ -2,7 +2,7 @@ import os # --- Media Server Type --- -MEDIASERVER_TYPE = os.environ.get("MEDIASERVER_TYPE", "jellyfin").lower() # Possible values: jellyfin, navidrome, lyrion, mpd, emby +MEDIASERVER_TYPE = os.environ.get("MEDIASERVER_TYPE", "jellyfin").lower() # Possible values: jellyfin, navidrome, lyrion, mpd, emby, localfiles # --- Jellyfin and DB Constants (Read from Environment Variables first) --- @@ -49,6 +49,14 @@ MPD_PASSWORD = os.environ.get("MPD_PASSWORD", "") # Optional password, leave empty if none MPD_MUSIC_DIRECTORY = os.environ.get("MPD_MUSIC_DIRECTORY", "/var/lib/mpd/music") # Path to MPD's music directory for file access +# --- Local Files Provider Constants --- +# These are used only if MEDIASERVER_TYPE is "localfiles". 
+LOCALFILES_MUSIC_DIRECTORY = os.environ.get("LOCALFILES_MUSIC_DIRECTORY", "/music") # Path to local music directory +LOCALFILES_FORMATS = os.environ.get("LOCALFILES_FORMATS", ".mp3,.flac,.ogg,.m4a,.mp4,.wav,.wma,.aac,.opus") # Supported audio formats +LOCALFILES_SCAN_SUBDIRS = os.environ.get("LOCALFILES_SCAN_SUBDIRS", "true").lower() == "true" # Scan subdirectories +LOCALFILES_USE_METADATA = os.environ.get("LOCALFILES_USE_METADATA", "true").lower() == "true" # Use embedded metadata +LOCALFILES_PLAYLIST_DIR = os.environ.get("LOCALFILES_PLAYLIST_DIR", "/music/playlists") # Where to save M3U playlists + # --- General Constants (Read from Environment Variables where applicable) --- APP_VERSION = "v0.8.8" diff --git a/deployment/.env.example b/deployment/.env.example index 0ec06cb6..d7e7db62 100644 --- a/deployment/.env.example +++ b/deployment/.env.example @@ -1,7 +1,16 @@ +# ============================================================================= +# AudioMuse-AI Configuration +# ============================================================================= # Copy this file to `.env` and fill in the values that match your setup. # Docker Compose files under deployment/ read these variables to keep settings in one place. # -# IMPORTANT: +# QUICK START: +# 1. Copy this file: cp .env.example .env +# 2. Set your media provider settings below (Jellyfin, Navidrome, etc.) +# 3. Start the containers: docker-compose -f docker-compose-unified.yaml up -d +# 4. Open http://localhost:8000 and complete the setup wizard +# +# IMPORTANT: # 1. This file must be named exactly ".env" (not .env.txt or .env.example) # 2. It must be in the SAME directory as your docker-compose-*.yaml file # 3. 
Do NOT use spaces around the = sign @@ -24,41 +33,90 @@ # - Restart containers after changing this file # If all else fails, try hardcoding the value directly in docker-compose-*.yaml to isolate the issue +# ============================================================================= +# MEDIA SERVER PROVIDER +# ============================================================================= +# Choose your primary media provider. Additional providers can be configured +# via the web-based setup wizard at http://localhost:8000/setup +# +# Options: jellyfin, navidrome, lyrion, mpd, emby, localfiles +# Default: localfiles (scans local music directory) +MEDIASERVER_TYPE=localfiles + +# --- Local Files Provider --- +# Path to your music library (mounted into the container as /music) +MUSIC_PATH=/path/to/your/music +LOCALFILES_MUSIC_DIRECTORY=/music +LOCALFILES_PLAYLIST_DIR=/music/playlists +# Supported formats (comma-separated, including the dot) +LOCALFILES_FORMATS=.mp3,.flac,.ogg,.m4a,.mp4,.wav,.wma,.aac,.opus +# Scan subdirectories for music files +LOCALFILES_SCAN_SUBDIRS=true + # --- Jellyfin --- +JELLYFIN_URL=http://jellyfin.example.com:8096 JELLYFIN_USER_ID=YOUR_JELLYFIN_USER_ID JELLYFIN_TOKEN=YOUR_JELLYFIN_API_TOKEN -JELLYFIN_URL=http://jellyfin.example.com:8096 # --- Emby --- +EMBY_URL= EMBY_USER_ID= EMBY_TOKEN= -EMBY_URL= # --- Navidrome --- NAVIDROME_URL= NAVIDROME_USER= NAVIDROME_PASSWORD= -# --- Lyrion --- -LYRION_URL=http://lyrion.example.com +# --- Lyrion (formerly LMS) --- +LYRION_URL=http://lyrion.example.com:9000 + +# --- MPD (Music Player Daemon) --- +MPD_HOST=localhost +MPD_PORT=6600 +MPD_PASSWORD= +MPD_MUSIC_DIRECTORY=/var/lib/mpd/music -# --- Shared backend configuration --- +# ============================================================================= +# DATABASE & INFRASTRUCTURE +# ============================================================================= POSTGRES_USER=audiomuse POSTGRES_PASSWORD=audiomusepassword POSTGRES_DB=audiomusedb 
POSTGRES_PORT=5432 POSTGRES_HOST=postgres -REDIS_URL=redis://redis:6379/0 # /!\ change port adress if you change REDIS_PORT below -# --- Timezone (optional) --- -# Set container timezone using TZ (examples: UTC, Europe/Berlin, America/Los_Angeles) -# If omitted, default is UTC. Containers read this env var and apply it at startup. -TZ=UTC +REDIS_URL=redis://redis:6379/0 REDIS_PORT=6379 + +# ============================================================================= +# WEB SERVER +# ============================================================================= FRONTEND_PORT=8000 WORKER_PORT=8029 +# Timezone (examples: UTC, Europe/Berlin, America/Los_Angeles) +TZ=UTC + +# ============================================================================= +# NVIDIA GPU (for docker-compose-unified-nvidia.yaml) +# ============================================================================= +# GPU device ID (usually 0 for single GPU systems) +NVIDIA_GPU_ID=0 +# Enable GPU-accelerated clustering using RAPIDS cuML +# Automatically falls back to CPU if GPU is unavailable +USE_GPU_CLUSTERING=false + +# ============================================================================= +# ML FEATURES +# ============================================================================= +# CLAP Text Search - natural language music search +# Allows queries like "upbeat summer songs" or "relaxing piano music" +# Disable to save memory (~750MB) on systems with limited RAM +CLAP_ENABLED=true -# --- AI Model Configuration --- -# Choose your AI provider: NONE, OLLAMA, OPENAI, GEMINI, OPENAI, or MISTRAL +# ============================================================================= +# AI PLAYLIST NAMING (Optional) +# ============================================================================= +# Choose an AI provider for creative playlist names: NONE, OLLAMA, OPENAI, GEMINI, MISTRAL AI_MODEL_PROVIDER=NONE # --- OpenAI / OpenRouter Configuration --- @@ -71,25 +129,9 @@ AI_MODEL_PROVIDER=NONE 
OPENAI_API_KEY= OPENAI_SERVER_URL=https://openrouter.ai/api/v1/chat/completions OPENAI_MODEL_NAME= -# Optional: Delay between API calls to respect rate limits (default: 7 seconds) +# Delay between API calls to respect rate limits (default: 7 seconds) OPENAI_API_CALL_DELAY_SECONDS=7 # --- Other AI Provider API Keys --- GEMINI_API_KEY= MISTRAL_API_KEY= - -# --- GPU Acceleration for Clustering --- -# Enable GPU-accelerated clustering using RAPIDS cuML (requires NVIDIA GPU) -# Set to true to use GPU for KMeans, DBSCAN, and PCA in clustering tasks -# Automatically falls back to CPU if GPU is unavailable -# Default: false (CPU only) -USE_GPU_CLUSTERING=false - -# --- CLAP Text Search Configuration --- -# Enable CLAP (Contrastive Language-Audio Pretraining) for natural language music search -# CLAP allows searching your music collection using text queries like "upbeat summer songs" or "relaxing piano music" -# Set to false to disable CLAP and save memory/CPU on slower systems -# WARNING: If disabled, text search functionality will not work (only similarity search will be available) -# Models: Audio model (~268MB) for analysis, Text model (~478MB) for search -# Default: true -CLAP_ENABLED=true diff --git a/deployment/docker-compose-unified-nvidia.yaml b/deployment/docker-compose-unified-nvidia.yaml new file mode 100644 index 00000000..b355eb1b --- /dev/null +++ b/deployment/docker-compose-unified-nvidia.yaml @@ -0,0 +1,210 @@ +# AudioMuse-AI Unified Docker Compose - NVIDIA GPU Edition +# ============================================================================= +# This deployment file includes NVIDIA GPU acceleration support. +# For CPU-only systems, use docker-compose-unified.yaml +# +# Requirements: +# - NVIDIA GPU with CUDA support +# - NVIDIA Container Toolkit installed +# - nvidia-docker2 or Docker 19.03+ with nvidia runtime +# +# Quick Start: +# 1. Copy .env.example to .env and configure your settings +# 2. 
Run: docker-compose -f docker-compose-unified-nvidia.yaml up -d +# 3. Open http://localhost:8000 and complete the setup wizard +# +# All provider-specific settings are now configured via the GUI setup wizard +# or the .env file. No need to use different docker-compose files for different +# media servers! +# ============================================================================= + +version: '3.8' + +services: + # --------------------------------------------------------------------------- + # Redis - Task Queue + # --------------------------------------------------------------------------- + redis: + image: redis:7-alpine + container_name: audiomuse-redis + ports: + - "${REDIS_PORT:-6379}:6379" + volumes: + - redis-data:/data + restart: unless-stopped + healthcheck: + test: ["CMD", "redis-cli", "ping"] + interval: 30s + timeout: 10s + retries: 3 + + # --------------------------------------------------------------------------- + # PostgreSQL - Database + # --------------------------------------------------------------------------- + postgres: + image: postgres:15-alpine + container_name: audiomuse-postgres + environment: + POSTGRES_USER: ${POSTGRES_USER:-audiomuse} + POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} + POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} + ports: + - "${POSTGRES_PORT:-5432}:5432" + volumes: + - postgres-data:/var/lib/postgresql/data + restart: unless-stopped + healthcheck: + test: ["CMD-SHELL", "pg_isready -U ${POSTGRES_USER:-audiomuse}"] + interval: 30s + timeout: 10s + retries: 3 + + # --------------------------------------------------------------------------- + # AudioMuse-AI Flask Application (Web UI & API) - NVIDIA GPU + # --------------------------------------------------------------------------- + audiomuse-ai-flask: + image: ghcr.io/neptunehub/audiomuse-ai:latest-nvidia + container_name: audiomuse-ai-flask-app + ports: + - "${FRONTEND_PORT:-8000}:8000" + environment: + SERVICE_TYPE: "flask" + TZ: "${TZ:-UTC}" + # Media 
Server Configuration + # Configure via GUI setup wizard or set here for legacy support + MEDIASERVER_TYPE: "${MEDIASERVER_TYPE:-localfiles}" + # Jellyfin (if using) + JELLYFIN_URL: "${JELLYFIN_URL:-}" + JELLYFIN_USER_ID: "${JELLYFIN_USER_ID:-}" + JELLYFIN_TOKEN: "${JELLYFIN_TOKEN:-}" + # Navidrome (if using) + NAVIDROME_URL: "${NAVIDROME_URL:-}" + NAVIDROME_USER: "${NAVIDROME_USER:-}" + NAVIDROME_PASSWORD: "${NAVIDROME_PASSWORD:-}" + # Lyrion (if using) + LYRION_URL: "${LYRION_URL:-}" + # MPD (if using) + MPD_HOST: "${MPD_HOST:-}" + MPD_PORT: "${MPD_PORT:-6600}" + MPD_PASSWORD: "${MPD_PASSWORD:-}" + MPD_MUSIC_DIRECTORY: "${MPD_MUSIC_DIRECTORY:-/music}" + # Emby (if using) + EMBY_URL: "${EMBY_URL:-}" + EMBY_USER_ID: "${EMBY_USER_ID:-}" + EMBY_TOKEN: "${EMBY_TOKEN:-}" + # Local Files Provider (default) + LOCALFILES_MUSIC_DIRECTORY: "${LOCALFILES_MUSIC_DIRECTORY:-/music}" + LOCALFILES_PLAYLIST_DIR: "${LOCALFILES_PLAYLIST_DIR:-/music/playlists}" + # Database Configuration + POSTGRES_USER: ${POSTGRES_USER:-audiomuse} + POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} + POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} + POSTGRES_HOST: "postgres" + POSTGRES_PORT: "${POSTGRES_PORT:-5432}" + REDIS_URL: "${REDIS_URL:-redis://redis:6379/0}" + # AI Configuration + AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER:-NONE}" + OPENAI_API_KEY: "${OPENAI_API_KEY:-}" + OPENAI_SERVER_URL: "${OPENAI_SERVER_URL:-}" + OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME:-}" + GEMINI_API_KEY: "${GEMINI_API_KEY:-}" + MISTRAL_API_KEY: "${MISTRAL_API_KEY:-}" + # Features + CLAP_ENABLED: "${CLAP_ENABLED:-true}" + TEMP_DIR: "/app/temp_audio" + volumes: + - temp-audio-flask:/app/temp_audio + # Mount music directory for local files provider + - ${MUSIC_PATH:-./music}:/music:ro + depends_on: + redis: + condition: service_healthy + postgres: + condition: service_healthy + restart: unless-stopped + deploy: + resources: + reservations: + devices: + - driver: nvidia + device_ids: ["${NVIDIA_GPU_ID:-0}"] + capabilities: 
[gpu] + + # --------------------------------------------------------------------------- + # AudioMuse-AI Worker (Background Tasks & ML Analysis) - NVIDIA GPU + # --------------------------------------------------------------------------- + audiomuse-ai-worker: + image: ghcr.io/neptunehub/audiomuse-ai:latest-nvidia + container_name: audiomuse-ai-worker-instance + environment: + SERVICE_TYPE: "worker" + TZ: "${TZ:-UTC}" + # NVIDIA GPU Settings + NVIDIA_VISIBLE_DEVICES: "${NVIDIA_GPU_ID:-0}" + NVIDIA_DRIVER_CAPABILITIES: "compute,utility" + # Media Server Configuration (same as flask service) + MEDIASERVER_TYPE: "${MEDIASERVER_TYPE:-localfiles}" + JELLYFIN_URL: "${JELLYFIN_URL:-}" + JELLYFIN_USER_ID: "${JELLYFIN_USER_ID:-}" + JELLYFIN_TOKEN: "${JELLYFIN_TOKEN:-}" + NAVIDROME_URL: "${NAVIDROME_URL:-}" + NAVIDROME_USER: "${NAVIDROME_USER:-}" + NAVIDROME_PASSWORD: "${NAVIDROME_PASSWORD:-}" + LYRION_URL: "${LYRION_URL:-}" + MPD_HOST: "${MPD_HOST:-}" + MPD_PORT: "${MPD_PORT:-6600}" + MPD_PASSWORD: "${MPD_PASSWORD:-}" + MPD_MUSIC_DIRECTORY: "${MPD_MUSIC_DIRECTORY:-/music}" + EMBY_URL: "${EMBY_URL:-}" + EMBY_USER_ID: "${EMBY_USER_ID:-}" + EMBY_TOKEN: "${EMBY_TOKEN:-}" + LOCALFILES_MUSIC_DIRECTORY: "${LOCALFILES_MUSIC_DIRECTORY:-/music}" + LOCALFILES_PLAYLIST_DIR: "${LOCALFILES_PLAYLIST_DIR:-/music/playlists}" + # Database Configuration + POSTGRES_USER: ${POSTGRES_USER:-audiomuse} + POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} + POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} + POSTGRES_HOST: "postgres" + POSTGRES_PORT: "${POSTGRES_PORT:-5432}" + REDIS_URL: "${REDIS_URL:-redis://redis:6379/0}" + # AI Configuration + AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER:-NONE}" + OPENAI_API_KEY: "${OPENAI_API_KEY:-}" + OPENAI_SERVER_URL: "${OPENAI_SERVER_URL:-}" + OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME:-}" + GEMINI_API_KEY: "${GEMINI_API_KEY:-}" + MISTRAL_API_KEY: "${MISTRAL_API_KEY:-}" + # Features - Enable GPU clustering for NVIDIA + CLAP_ENABLED: "${CLAP_ENABLED:-true}" + 
USE_GPU_CLUSTERING: "${USE_GPU_CLUSTERING:-true}" + TEMP_DIR: "/app/temp_audio" + volumes: + - temp-audio-worker:/app/temp_audio + # Mount music directory for local files provider + - ${MUSIC_PATH:-./music}:/music:ro + depends_on: + redis: + condition: service_healthy + postgres: + condition: service_healthy + restart: unless-stopped + deploy: + resources: + reservations: + devices: + - driver: nvidia + device_ids: ["${NVIDIA_GPU_ID:-0}"] + capabilities: [gpu] + +# ============================================================================= +# Volumes +# ============================================================================= +volumes: + redis-data: + name: audiomuse-redis-data + postgres-data: + name: audiomuse-postgres-data + temp-audio-flask: + name: audiomuse-temp-flask + temp-audio-worker: + name: audiomuse-temp-worker diff --git a/deployment/docker-compose-unified.yaml b/deployment/docker-compose-unified.yaml new file mode 100644 index 00000000..bdb8be31 --- /dev/null +++ b/deployment/docker-compose-unified.yaml @@ -0,0 +1,188 @@ +# AudioMuse-AI Unified Docker Compose +# ============================================================================= +# This is the unified deployment file for CPU-only systems. +# For NVIDIA GPU acceleration, use docker-compose-unified-nvidia.yaml +# +# Quick Start: +# 1. Copy .env.example to .env and configure your settings +# 2. Run: docker-compose -f docker-compose-unified.yaml up -d +# 3. Open http://localhost:8000 and complete the setup wizard +# +# All provider-specific settings are now configured via the GUI setup wizard +# or the .env file. No need to use different docker-compose files for different +# media servers! 
+# ============================================================================= + +version: '3.8' + +services: + # --------------------------------------------------------------------------- + # Redis - Task Queue + # --------------------------------------------------------------------------- + redis: + image: redis:7-alpine + container_name: audiomuse-redis + ports: + - "${REDIS_PORT:-6379}:6379" + volumes: + - redis-data:/data + restart: unless-stopped + healthcheck: + test: ["CMD", "redis-cli", "ping"] + interval: 30s + timeout: 10s + retries: 3 + + # --------------------------------------------------------------------------- + # PostgreSQL - Database + # --------------------------------------------------------------------------- + postgres: + image: postgres:15-alpine + container_name: audiomuse-postgres + environment: + POSTGRES_USER: ${POSTGRES_USER:-audiomuse} + POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} + POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} + ports: + - "${POSTGRES_PORT:-5432}:5432" + volumes: + - postgres-data:/var/lib/postgresql/data + restart: unless-stopped + healthcheck: + test: ["CMD-SHELL", "pg_isready -U ${POSTGRES_USER:-audiomuse}"] + interval: 30s + timeout: 10s + retries: 3 + + # --------------------------------------------------------------------------- + # AudioMuse-AI Flask Application (Web UI & API) + # --------------------------------------------------------------------------- + audiomuse-ai-flask: + image: ghcr.io/neptunehub/audiomuse-ai:latest + container_name: audiomuse-ai-flask-app + ports: + - "${FRONTEND_PORT:-8000}:8000" + environment: + SERVICE_TYPE: "flask" + TZ: "${TZ:-UTC}" + # Media Server Configuration + # Configure via GUI setup wizard or set here for legacy support + MEDIASERVER_TYPE: "${MEDIASERVER_TYPE:-localfiles}" + # Jellyfin (if using) + JELLYFIN_URL: "${JELLYFIN_URL:-}" + JELLYFIN_USER_ID: "${JELLYFIN_USER_ID:-}" + JELLYFIN_TOKEN: "${JELLYFIN_TOKEN:-}" + # Navidrome (if using) + NAVIDROME_URL: 
"${NAVIDROME_URL:-}" + NAVIDROME_USER: "${NAVIDROME_USER:-}" + NAVIDROME_PASSWORD: "${NAVIDROME_PASSWORD:-}" + # Lyrion (if using) + LYRION_URL: "${LYRION_URL:-}" + # MPD (if using) + MPD_HOST: "${MPD_HOST:-}" + MPD_PORT: "${MPD_PORT:-6600}" + MPD_PASSWORD: "${MPD_PASSWORD:-}" + MPD_MUSIC_DIRECTORY: "${MPD_MUSIC_DIRECTORY:-/music}" + # Emby (if using) + EMBY_URL: "${EMBY_URL:-}" + EMBY_USER_ID: "${EMBY_USER_ID:-}" + EMBY_TOKEN: "${EMBY_TOKEN:-}" + # Local Files Provider (default) + LOCALFILES_MUSIC_DIRECTORY: "${LOCALFILES_MUSIC_DIRECTORY:-/music}" + LOCALFILES_PLAYLIST_DIR: "${LOCALFILES_PLAYLIST_DIR:-/music/playlists}" + # Database Configuration + POSTGRES_USER: ${POSTGRES_USER:-audiomuse} + POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} + POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} + POSTGRES_HOST: "postgres" + POSTGRES_PORT: "${POSTGRES_PORT:-5432}" + REDIS_URL: "${REDIS_URL:-redis://redis:6379/0}" + # AI Configuration + AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER:-NONE}" + OPENAI_API_KEY: "${OPENAI_API_KEY:-}" + OPENAI_SERVER_URL: "${OPENAI_SERVER_URL:-}" + OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME:-}" + GEMINI_API_KEY: "${GEMINI_API_KEY:-}" + MISTRAL_API_KEY: "${MISTRAL_API_KEY:-}" + # Features + CLAP_ENABLED: "${CLAP_ENABLED:-true}" + TEMP_DIR: "/app/temp_audio" + volumes: + - temp-audio-flask:/app/temp_audio + # Mount music directory for local files provider + - ${MUSIC_PATH:-./music}:/music:ro + depends_on: + redis: + condition: service_healthy + postgres: + condition: service_healthy + restart: unless-stopped + + # --------------------------------------------------------------------------- + # AudioMuse-AI Worker (Background Tasks & ML Analysis) + # --------------------------------------------------------------------------- + audiomuse-ai-worker: + image: ghcr.io/neptunehub/audiomuse-ai:latest + container_name: audiomuse-ai-worker-instance + environment: + SERVICE_TYPE: "worker" + TZ: "${TZ:-UTC}" + # Media Server Configuration (same as flask service) 
+ MEDIASERVER_TYPE: "${MEDIASERVER_TYPE:-localfiles}" + JELLYFIN_URL: "${JELLYFIN_URL:-}" + JELLYFIN_USER_ID: "${JELLYFIN_USER_ID:-}" + JELLYFIN_TOKEN: "${JELLYFIN_TOKEN:-}" + NAVIDROME_URL: "${NAVIDROME_URL:-}" + NAVIDROME_USER: "${NAVIDROME_USER:-}" + NAVIDROME_PASSWORD: "${NAVIDROME_PASSWORD:-}" + LYRION_URL: "${LYRION_URL:-}" + MPD_HOST: "${MPD_HOST:-}" + MPD_PORT: "${MPD_PORT:-6600}" + MPD_PASSWORD: "${MPD_PASSWORD:-}" + MPD_MUSIC_DIRECTORY: "${MPD_MUSIC_DIRECTORY:-/music}" + EMBY_URL: "${EMBY_URL:-}" + EMBY_USER_ID: "${EMBY_USER_ID:-}" + EMBY_TOKEN: "${EMBY_TOKEN:-}" + LOCALFILES_MUSIC_DIRECTORY: "${LOCALFILES_MUSIC_DIRECTORY:-/music}" + LOCALFILES_PLAYLIST_DIR: "${LOCALFILES_PLAYLIST_DIR:-/music/playlists}" + # Database Configuration + POSTGRES_USER: ${POSTGRES_USER:-audiomuse} + POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} + POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} + POSTGRES_HOST: "postgres" + POSTGRES_PORT: "${POSTGRES_PORT:-5432}" + REDIS_URL: "${REDIS_URL:-redis://redis:6379/0}" + # AI Configuration + AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER:-NONE}" + OPENAI_API_KEY: "${OPENAI_API_KEY:-}" + OPENAI_SERVER_URL: "${OPENAI_SERVER_URL:-}" + OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME:-}" + GEMINI_API_KEY: "${GEMINI_API_KEY:-}" + MISTRAL_API_KEY: "${MISTRAL_API_KEY:-}" + # Features + CLAP_ENABLED: "${CLAP_ENABLED:-true}" + USE_GPU_CLUSTERING: "false" + TEMP_DIR: "/app/temp_audio" + volumes: + - temp-audio-worker:/app/temp_audio + # Mount music directory for local files provider + - ${MUSIC_PATH:-./music}:/music:ro + depends_on: + redis: + condition: service_healthy + postgres: + condition: service_healthy + restart: unless-stopped + +# ============================================================================= +# Volumes +# ============================================================================= +volumes: + redis-data: + name: audiomuse-redis-data + postgres-data: + name: audiomuse-postgres-data + temp-audio-flask: + name: audiomuse-temp-flask 
+ temp-audio-worker: + name: audiomuse-temp-worker diff --git a/docs/MULTI_PROVIDER_ARCHITECTURE.md b/docs/MULTI_PROVIDER_ARCHITECTURE.md new file mode 100644 index 00000000..83f5ebc3 --- /dev/null +++ b/docs/MULTI_PROVIDER_ARCHITECTURE.md @@ -0,0 +1,323 @@ +# Multi-Provider Architecture Design + +## Overview + +This document outlines the architecture for supporting multiple media providers simultaneously in AudioMuse-AI without requiring re-analysis of tracks. The design ensures: + +1. **No re-analysis required** when adding new providers +2. **Seamless migration** for existing installations +3. **Future-proof** extensibility for new providers +4. **Minimal schema changes** to existing tables + +## Key Design Decisions + +### 1. Primary Key Strategy for Local File Provider + +**Decision: Use normalized file path as the stable identifier** + +Rationale: +- File paths are unique within a music library +- Content hashes would require reading entire files (slow for large libraries) +- File path changes are rare and can be handled via re-scan +- Consistent with MPD provider which already uses file paths + +For the local file provider: +- `item_id` = SHA-256 hash of the normalized relative file path +- This creates a stable, predictable ID that won't change unless the file moves + +### 2. Linking Tracks Across Providers + +**Decision: Use file path as the universal linking key** + +The key insight is that most providers ultimately point to the same physical files: +- Jellyfin, Navidrome, Lyrion, Emby all index local music directories +- Local file provider scans the same directories +- The file path (relative to the music library root) is the common denominator + +### 3. Database Schema Design + +#### New Tables + +```sql +-- Provider configuration storage +CREATE TABLE provider ( + id SERIAL PRIMARY KEY, + provider_type VARCHAR(50) NOT NULL, -- jellyfin, navidrome, localfiles, etc. 
+ name VARCHAR(255) NOT NULL, -- User-friendly name + config JSONB NOT NULL, -- Provider-specific configuration + enabled BOOLEAN DEFAULT TRUE, + priority INTEGER DEFAULT 0, -- For ordering when same track in multiple providers + created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + UNIQUE(provider_type, name) +); + +-- Track identity table - links analysis to file paths +CREATE TABLE track ( + id SERIAL PRIMARY KEY, + file_path_hash VARCHAR(64) NOT NULL UNIQUE, -- SHA-256 of normalized relative path + file_path TEXT NOT NULL, -- Original file path for display + file_size BIGINT, -- For change detection + file_modified TIMESTAMP, -- For change detection + created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP +); + +-- Links provider-specific item_ids to tracks +CREATE TABLE provider_track ( + id SERIAL PRIMARY KEY, + provider_id INTEGER NOT NULL REFERENCES provider(id) ON DELETE CASCADE, + track_id INTEGER NOT NULL REFERENCES track(id) ON DELETE CASCADE, + item_id TEXT NOT NULL, -- Provider's native ID + title TEXT, -- Title from this provider + artist TEXT, -- Artist from this provider + album TEXT, -- Album from this provider + last_synced TIMESTAMP DEFAULT CURRENT_TIMESTAMP, + UNIQUE(provider_id, item_id), + UNIQUE(provider_id, track_id) +); +CREATE INDEX idx_provider_track_item_id ON provider_track(item_id); +CREATE INDEX idx_provider_track_track_id ON provider_track(track_id); + +-- Application settings stored in database (for GUI configuration) +CREATE TABLE app_settings ( + key VARCHAR(255) PRIMARY KEY, + value JSONB NOT NULL, + category VARCHAR(100), -- For UI grouping + description TEXT, + updated_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP +); +``` + +#### Modified Tables + +The `score` table remains largely unchanged, but we add a foreign key to `track`: + +```sql +ALTER TABLE score ADD COLUMN track_id INTEGER REFERENCES track(id); +CREATE INDEX idx_score_track_id ON 
score(track_id); +``` + +**Critical**: `item_id` remains the PRIMARY KEY for backward compatibility. The new `track_id` column provides the link to file-based identity. + +### 4. Migration Strategy + +**Phase 1: Schema Extension (Non-breaking)** +1. Add new tables (`provider`, `track`, `provider_track`, `app_settings`) +2. Add `track_id` column to `score` table (nullable initially) +3. Existing code continues to work unchanged + +**Phase 2: Data Migration** +1. Create default provider entry for current `MEDIASERVER_TYPE` +2. For each existing `score` record: + - Look up the track in the current provider + - Extract file path if available (via provider API) + - Create `track` record + - Create `provider_track` mapping + - Update `score.track_id` + +**Phase 3: Multi-Provider Activation** +1. Enable multi-provider mode via configuration +2. New providers can be added via GUI or API +3. When scanning new providers: + - Match tracks by file path + - Reuse existing analysis data + - Create new `provider_track` mappings + +### 5. API Changes + +#### New Endpoints + +``` +POST /api/setup/provider - Add/configure a provider +GET /api/setup/providers - List configured providers +PUT /api/setup/provider/{id} - Update provider config +DELETE /api/setup/provider/{id} - Remove provider + +GET /api/setup/settings - Get all settings +PUT /api/setup/settings - Update settings +GET /api/setup/wizard/status - Get setup wizard state + +POST /api/provider/{id}/sync - Sync tracks from provider +GET /api/provider/{id}/status - Get provider sync status +``` + +#### Modified Endpoints + +Existing endpoints remain unchanged but internally: +- `/api/analyze` - Uses active providers (priority-ordered) +- `/api/similarity` - Returns tracks with provider context +- Playlist creation - Creates in preferred provider(s) + +### 6. 
Provider Interface
+
+All providers must implement:
+
+```python
+class MediaProvider:
+    """Base class for media providers"""
+
+    def get_provider_type(self) -> str:
+        """Return provider type identifier (jellyfin, navidrome, etc.)"""
+
+    def test_connection(self) -> Tuple[bool, str]:
+        """Test if provider is reachable, return (success, message)"""
+
+    def get_all_songs(self) -> List[Dict]:
+        """Return all songs with metadata including file_path if available"""
+
+    def get_tracks_from_album(self, album_id: str) -> List[Dict]:
+        """Return tracks for an album"""
+
+    def download_track(self, temp_dir: str, item: Dict) -> Optional[str]:
+        """Download track to temp directory, return local path"""
+
+    def create_playlist(self, name: str, item_ids: List[str]) -> Optional[str]:
+        """Create playlist, return playlist ID"""
+
+    def get_file_path(self, item: Dict) -> Optional[str]:
+        """Extract file path from item metadata (for track linking)"""
+```
+
+### 7. Local File Provider Specifics
+
+```python
+# Configuration for local file provider
+{
+    "provider_type": "localfiles",
+    "name": "Local Music Library",
+    "config": {
+        "music_directory": "/path/to/music",
+        "supported_formats": ["mp3", "flac", "m4a", "ogg", "wav"],
+        "scan_subdirectories": true,
+        "use_embedded_metadata": true
+    }
+}
+```
+
+Features:
+- Scans directories for audio files
+- Extracts metadata from ID3 tags (MP3), Vorbis comments (FLAC/OGG), etc.
+- Creates item_id from file path hash
+- Supports playlist creation via M3U files
+
+### 8. Docker Compose Simplification
+
+**Before**: 16+ docker-compose files for various scenarios
+**After**: 2 main files + optional components
+
+```
+deployment/
+├── docker-compose-unified.yaml          # CPU version (default)
+├── docker-compose-unified-nvidia.yaml   # GPU/NVIDIA version
+└── docker-compose-extras.yaml           # Optional: pgAdmin, monitoring, etc.
+```
+
+All provider-specific configuration moves to:
+1. `.env` file for initial setup
+2. 
Database `app_settings` table for runtime configuration +3. GUI Setup Wizard for user-friendly configuration + +### 9. Setup Wizard Flow + +``` +1. Welcome Screen + - Detect if first run or existing installation + - Show version and hardware detection (GPU available?) + +2. Hardware Selection + - CPU-only or NVIDIA GPU acceleration + - Validate GPU drivers if selected + +3. Provider Configuration + - List of available providers with descriptions + - Multi-select enabled providers + - For each provider: configuration form + - Connection test for each provider + +4. Music Library Paths + - For local file provider: select directories + - For media servers: auto-detected from provider config + +5. Advanced Settings (collapsible) + - Database settings (show defaults, allow override) + - Analysis settings (CLAP, MuLan options) + - AI provider settings (optional) + +6. Review & Apply + - Summary of all settings + - Apply configuration + - Start initial sync (optional) + +7. Complete + - Link to main dashboard + - Quick start guide +``` + +### 10. Backward Compatibility + +The system maintains full backward compatibility: + +1. **Environment variables** still work: + - `MEDIASERVER_TYPE` creates a default provider on first run + - All `JELLYFIN_*`, `NAVIDROME_*` etc. variables honored + +2. **Existing data preserved**: + - `score` table unchanged except optional `track_id` column + - `embedding`, `clap_embedding` tables unchanged + - All indexes and projections preserved + +3. **Gradual migration**: + - Single-provider mode works exactly as before + - Multi-provider can be enabled via GUI/API + - No forced migration path + +### 11. File Path Normalization + +To ensure consistent file path matching: + +```python +def normalize_file_path(path: str, base_path: str = "") -> str: + """ + Normalize a file path for cross-provider matching. 
+
+    - Convert to POSIX style (forward slashes)
+    - Make relative to music library root
+    - Lowercase (optional, for case-insensitive filesystems)
+    - Remove leading/trailing whitespace
+    """
+    from pathlib import Path
+    from pathlib import PurePosixPath
+
+    # Convert to Path object
+    p = Path(path)
+
+    # Make relative if absolute and base_path provided
+    if base_path and p.is_absolute():
+        try:
+            p = p.relative_to(base_path)
+        except ValueError:
+            pass  # Not relative to base, keep as-is
+
+    # Convert to POSIX style
+    normalized = PurePosixPath(p).as_posix()
+
+    return normalized.strip()
+
+
+def file_path_hash(normalized_path: str) -> str:
+    """Generate SHA-256 hash of normalized file path."""
+    import hashlib
+    return hashlib.sha256(normalized_path.encode('utf-8')).hexdigest()
+```
+
+## Implementation Order
+
+1. Database schema changes (migration-safe)
+2. Local file provider implementation
+3. Provider configuration storage
+4. Multi-provider dispatcher updates
+5. Setup wizard backend
+6. Setup wizard frontend
+7. Docker Compose simplification
+8. 
Documentation updates diff --git a/tasks/analysis.py b/tasks/analysis.py index 9c3901d7..df4871dd 100644 --- a/tasks/analysis.py +++ b/tasks/analysis.py @@ -911,7 +911,15 @@ def get_missing_mulan_track_ids(track_ids): logger.info(f" - Top Moods: {top_moods}") logger.info(f" - Other Features: {other_features}") - save_track_analysis_and_embedding(item['Id'], item['Name'], item.get('AlbumArtist', 'Unknown'), analysis['tempo'], analysis['key'], analysis['scale'], top_moods, embedding, energy=analysis['energy'], other_features=other_features, album=item.get('Album', None)) + save_track_analysis_and_embedding( + item['Id'], item['Name'], item.get('AlbumArtist', 'Unknown'), + analysis['tempo'], analysis['key'], analysis['scale'], + top_moods, embedding, + energy=analysis['energy'], + other_features=other_features, + album=item.get('Album', None), + file_path=item.get('Path') # For multi-provider track linking + ) track_processed = True # Increment session recycler counter after successful analysis diff --git a/tasks/mediaserver.py b/tasks/mediaserver.py index ae47dad0..ce6c3752 100644 --- a/tasks/mediaserver.py +++ b/tasks/mediaserver.py @@ -1,4 +1,24 @@ # tasks/mediaserver.py +""" +Media Server Dispatcher for AudioMuse-AI + +This module provides a unified interface to multiple media server providers. +It dispatches function calls to the appropriate provider implementation based +on the configured MEDIASERVER_TYPE. + +Supported providers: +- jellyfin: Jellyfin Media Server +- navidrome: Navidrome (Subsonic API) +- lyrion: Lyrion Music Server (formerly LMS) +- mpd: Music Player Daemon +- emby: Emby Media Server +- localfiles: Local file system scanner + +Multi-provider support: +When multi_provider_enabled is true in app_settings, multiple providers can be +configured and used simultaneously. Tracks are linked via file paths, allowing +analysis data to be shared across providers. 
+""" import logging import os @@ -73,10 +93,74 @@ get_top_played_songs as emby_get_top_played_songs, get_last_played_time as emby_get_last_played_time, ) +from tasks.mediaserver_localfiles import ( + get_all_playlists as localfiles_get_all_playlists, + delete_playlist as localfiles_delete_playlist, + get_recent_albums as localfiles_get_recent_albums, + get_tracks_from_album as localfiles_get_tracks_from_album, + download_track as localfiles_download_track, + get_all_songs as localfiles_get_all_songs, + get_playlist_by_name as localfiles_get_playlist_by_name, + create_playlist as localfiles_create_playlist, + create_instant_playlist as localfiles_create_instant_playlist, + get_top_played_songs as localfiles_get_top_played_songs, + get_last_played_time as localfiles_get_last_played_time, + test_connection as localfiles_test_connection, + get_provider_info as localfiles_get_provider_info, +) logger = logging.getLogger(__name__) +# ############################################################################## +# PROVIDER REGISTRY +# ############################################################################## + +PROVIDER_TYPES = { + 'jellyfin': { + 'name': 'Jellyfin', + 'description': 'Jellyfin Media Server - Open source media solution', + 'supports_user_auth': True, + 'supports_play_history': True, + }, + 'navidrome': { + 'name': 'Navidrome', + 'description': 'Navidrome - Modern music server (Subsonic API)', + 'supports_user_auth': True, + 'supports_play_history': True, + }, + 'lyrion': { + 'name': 'Lyrion', + 'description': 'Lyrion Music Server (formerly Logitech Media Server)', + 'supports_user_auth': False, + 'supports_play_history': True, + }, + 'mpd': { + 'name': 'MPD', + 'description': 'Music Player Daemon - Flexible music server', + 'supports_user_auth': False, + 'supports_play_history': False, + }, + 'emby': { + 'name': 'Emby', + 'description': 'Emby Media Server - Personal media server', + 'supports_user_auth': True, + 'supports_play_history': True, + }, + 
'localfiles': { + 'name': 'Local Files', + 'description': 'Scan local directories for audio files', + 'supports_user_auth': False, + 'supports_play_history': False, + }, +} + + +def get_available_provider_types(): + """Return information about all available provider types.""" + return PROVIDER_TYPES.copy() + + # ############################################################################## # PUBLIC API (Dispatcher functions) # ############################################################################## @@ -128,6 +212,7 @@ def get_recent_albums(limit): if config.MEDIASERVER_TYPE == 'lyrion': return lyrion_get_recent_albums(limit) if config.MEDIASERVER_TYPE == 'mpd': return mpd_get_recent_albums(limit) if config.MEDIASERVER_TYPE == 'emby': return emby_get_recent_albums(limit) + if config.MEDIASERVER_TYPE == 'localfiles': return localfiles_get_recent_albums(limit) return [] def get_recent_music_items(limit): @@ -156,6 +241,7 @@ def get_tracks_from_album(album_id): if config.MEDIASERVER_TYPE == 'lyrion': return lyrion_get_tracks_from_album(album_id) if config.MEDIASERVER_TYPE == 'mpd': return mpd_get_tracks_from_album(album_id) if config.MEDIASERVER_TYPE == 'emby': return emby_get_tracks_from_album(album_id) + if config.MEDIASERVER_TYPE == 'localfiles': return localfiles_get_tracks_from_album(album_id) return [] def download_track(temp_dir, item): @@ -167,6 +253,7 @@ def download_track(temp_dir, item): elif config.MEDIASERVER_TYPE == 'lyrion': downloaded_path = lyrion_download_track(temp_dir, item) elif config.MEDIASERVER_TYPE == 'mpd': downloaded_path = mpd_download_track(temp_dir, item) elif config.MEDIASERVER_TYPE == 'emby': downloaded_path = emby_download_track(temp_dir, item) + elif config.MEDIASERVER_TYPE == 'localfiles': downloaded_path = localfiles_download_track(temp_dir, item) # If download failed or returned None, return as is if not downloaded_path: @@ -244,6 +331,7 @@ def get_all_songs(): if config.MEDIASERVER_TYPE == 'lyrion': return 
lyrion_get_all_songs() if config.MEDIASERVER_TYPE == 'mpd': return mpd_get_all_songs() if config.MEDIASERVER_TYPE == 'emby': return emby_get_all_songs() + if config.MEDIASERVER_TYPE == 'localfiles': return localfiles_get_all_songs() return [] def get_playlist_by_name(playlist_name): @@ -254,6 +342,7 @@ def get_playlist_by_name(playlist_name): if config.MEDIASERVER_TYPE == 'lyrion': return lyrion_get_playlist_by_name(playlist_name) if config.MEDIASERVER_TYPE == 'mpd': return mpd_get_playlist_by_name(playlist_name) if config.MEDIASERVER_TYPE == 'emby': return emby_get_playlist_by_name(playlist_name) + if config.MEDIASERVER_TYPE == 'localfiles': return localfiles_get_playlist_by_name(playlist_name) return None def create_playlist(base_name, item_ids): @@ -265,12 +354,13 @@ def create_playlist(base_name, item_ids): elif config.MEDIASERVER_TYPE == 'lyrion': lyrion_create_playlist(base_name, item_ids) elif config.MEDIASERVER_TYPE == 'mpd': mpd_create_playlist(base_name, item_ids) elif config.MEDIASERVER_TYPE == 'emby': emby_create_playlist(base_name, item_ids) + elif config.MEDIASERVER_TYPE == 'localfiles': localfiles_create_playlist(base_name, item_ids) def create_instant_playlist(playlist_name, item_ids, user_creds=None): """Creates an instant playlist. 
Uses user_creds if provided, otherwise admin.""" if not playlist_name: raise ValueError("Playlist name is required.") if not item_ids: raise ValueError("Track IDs are required.") - + if config.MEDIASERVER_TYPE == 'jellyfin': return jellyfin_create_instant_playlist(playlist_name, item_ids, user_creds) if config.MEDIASERVER_TYPE == 'navidrome': @@ -281,6 +371,8 @@ def create_instant_playlist(playlist_name, item_ids, user_creds=None): return mpd_create_instant_playlist(playlist_name, item_ids, user_creds) if config.MEDIASERVER_TYPE == 'emby': return emby_create_instant_playlist(playlist_name, item_ids, user_creds) + if config.MEDIASERVER_TYPE == 'localfiles': + return localfiles_create_instant_playlist(playlist_name, item_ids, user_creds) return None def get_top_played_songs(limit, user_creds=None): @@ -295,6 +387,8 @@ def get_top_played_songs(limit, user_creds=None): return mpd_get_top_played_songs(limit, user_creds) if config.MEDIASERVER_TYPE == 'emby': return emby_get_top_played_songs(limit, user_creds) + if config.MEDIASERVER_TYPE == 'localfiles': + return localfiles_get_top_played_songs(limit, user_creds) return [] def get_last_played_time(item_id, user_creds=None): @@ -309,5 +403,166 @@ def get_last_played_time(item_id, user_creds=None): return mpd_get_last_played_time(item_id, user_creds) if config.MEDIASERVER_TYPE == 'emby': return emby_get_last_played_time(item_id, user_creds) + if config.MEDIASERVER_TYPE == 'localfiles': + return localfiles_get_last_played_time(item_id, user_creds) return None + +# ############################################################################## +# MULTI-PROVIDER SUPPORT FUNCTIONS +# ############################################################################## + +def test_provider_connection(provider_type: str, config_dict: dict = None): + """ + Test connection to a specific provider. + + Args: + provider_type: Type of provider (jellyfin, navidrome, localfiles, etc.) 
+ config_dict: Optional configuration dictionary for the provider + + Returns: + Tuple of (success: bool, message: str) + """ + import requests + + try: + if provider_type == 'localfiles': + return localfiles_test_connection(config_dict) + + elif provider_type == 'jellyfin': + url = config_dict.get('url') if config_dict else config.JELLYFIN_URL + token = config_dict.get('token') if config_dict else config.JELLYFIN_TOKEN + if not url or not token: + return False, "Jellyfin URL and token are required" + resp = requests.get(f"{url.rstrip('/')}/System/Info", + headers={"X-Emby-Token": token}, timeout=10) + if resp.status_code == 200: + return True, f"Connected to Jellyfin at {url}" + return False, f"Jellyfin returned status {resp.status_code}" + + elif provider_type == 'navidrome': + import hashlib + import secrets + url = config_dict.get('url') if config_dict else config.NAVIDROME_URL + user = config_dict.get('user') if config_dict else config.NAVIDROME_USER + password = config_dict.get('password') if config_dict else config.NAVIDROME_PASSWORD + if not url or not user or not password: + return False, "Navidrome URL, user, and password are required" + salt = secrets.token_hex(8) + token = hashlib.md5((password + salt).encode()).hexdigest() + params = {'u': user, 't': token, 's': salt, 'v': '1.16.1', 'c': 'audiomuse', 'f': 'json'} + resp = requests.get(f"{url.rstrip('/')}/rest/ping", params=params, timeout=10) + if resp.status_code == 200: + data = resp.json() + if data.get('subsonic-response', {}).get('status') == 'ok': + return True, f"Connected to Navidrome at {url}" + err = data.get('subsonic-response', {}).get('error', {}).get('message', 'Unknown error') + return False, f"Navidrome error: {err}" + return False, f"Navidrome returned status {resp.status_code}" + + elif provider_type == 'lyrion': + url = config_dict.get('url') if config_dict else config.LYRION_URL + if not url: + return False, "Lyrion URL is required" + resp = 
requests.get(f"{url.rstrip('/')}/status.html", timeout=10) + if resp.status_code == 200: + return True, f"Connected to Lyrion at {url}" + return False, f"Lyrion returned status {resp.status_code}" + + elif provider_type == 'emby': + url = config_dict.get('url') if config_dict else config.EMBY_URL + token = config_dict.get('token') if config_dict else config.EMBY_TOKEN + if not url or not token: + return False, "Emby URL and token are required" + resp = requests.get(f"{url.rstrip('/')}/System/Info", + headers={"X-Emby-Token": token}, timeout=10) + if resp.status_code == 200: + return True, f"Connected to Emby at {url}" + return False, f"Emby returned status {resp.status_code}" + + elif provider_type == 'mpd': + try: + from mpd import MPDClient + host = config_dict.get('host') if config_dict else config.MPD_HOST + port = config_dict.get('port') if config_dict else config.MPD_PORT + password = config_dict.get('password') if config_dict else config.MPD_PASSWORD + client = MPDClient() + client.timeout = 10 + client.connect(host, int(port)) + if password: + client.password(password) + stats = client.stats() + client.close() + client.disconnect() + return True, f"Connected to MPD at {host}:{port} ({stats.get('songs', 0)} songs)" + except Exception as e: + return False, f"MPD connection error: {str(e)}" + + else: + return False, f"Unknown provider type: {provider_type}" + + except requests.RequestException as e: + return False, f"Network error: {str(e)}" + except Exception as e: + return False, f"Connection test failed: {str(e)}" + + +def get_provider_info(provider_type: str): + """Get detailed information about a provider type including config fields.""" + if provider_type == 'localfiles': + return localfiles_get_provider_info() + + # Return basic info for other providers + if provider_type in PROVIDER_TYPES: + info = PROVIDER_TYPES[provider_type].copy() + info['type'] = provider_type + info['config_fields'] = _get_provider_config_fields(provider_type) + return info + + 
return None + + +def _get_provider_config_fields(provider_type: str): + """Get configuration fields for a provider type.""" + fields = { + 'jellyfin': [ + {'name': 'url', 'label': 'Server URL', 'type': 'url', 'required': True, + 'description': 'Jellyfin server URL (e.g., http://192.168.1.100:8096)'}, + {'name': 'user_id', 'label': 'User ID', 'type': 'text', 'required': True, + 'description': 'Jellyfin user ID (found in dashboard)'}, + {'name': 'token', 'label': 'API Token', 'type': 'password', 'required': True, + 'description': 'API key from Jellyfin settings'}, + ], + 'navidrome': [ + {'name': 'url', 'label': 'Server URL', 'type': 'url', 'required': True, + 'description': 'Navidrome server URL (e.g., http://192.168.1.100:4533)'}, + {'name': 'user', 'label': 'Username', 'type': 'text', 'required': True, + 'description': 'Navidrome username'}, + {'name': 'password', 'label': 'Password', 'type': 'password', 'required': True, + 'description': 'Navidrome password'}, + ], + 'lyrion': [ + {'name': 'url', 'label': 'Server URL', 'type': 'url', 'required': True, + 'description': 'Lyrion server URL (e.g., http://192.168.1.100:9000)'}, + ], + 'mpd': [ + {'name': 'host', 'label': 'Host', 'type': 'text', 'required': True, + 'description': 'MPD server hostname or IP', 'default': 'localhost'}, + {'name': 'port', 'label': 'Port', 'type': 'number', 'required': True, + 'description': 'MPD port number', 'default': 6600}, + {'name': 'password', 'label': 'Password', 'type': 'password', 'required': False, + 'description': 'MPD password (if configured)'}, + {'name': 'music_directory', 'label': 'Music Directory', 'type': 'path', 'required': True, + 'description': 'Path to music files on the MPD server'}, + ], + 'emby': [ + {'name': 'url', 'label': 'Server URL', 'type': 'url', 'required': True, + 'description': 'Emby server URL (e.g., http://192.168.1.100:8096)'}, + {'name': 'user_id', 'label': 'User ID', 'type': 'text', 'required': True, + 'description': 'Emby user ID'}, + {'name': 
'token', 'label': 'API Token', 'type': 'password', 'required': True, + 'description': 'API key from Emby settings'}, + ], + } + return fields.get(provider_type, []) + diff --git a/tasks/mediaserver_localfiles.py b/tasks/mediaserver_localfiles.py new file mode 100644 index 00000000..df02dca1 --- /dev/null +++ b/tasks/mediaserver_localfiles.py @@ -0,0 +1,604 @@ +# tasks/mediaserver_localfiles.py +""" +Local File Media Provider for AudioMuse-AI + +This provider scans local directories for audio files and extracts metadata +from embedded tags (ID3 for MP3, Vorbis comments for FLAC/OGG, etc.). + +The item_id for each track is a SHA-256 hash of the normalized relative file path, +ensuring stable, predictable identifiers that won't change unless files move. +""" + +import logging +import os +import hashlib +import shutil +from datetime import datetime +from pathlib import Path, PurePosixPath +from typing import List, Dict, Optional, Tuple +import json + +try: + from mutagen import File as MutagenFile + from mutagen.mp3 import MP3 + from mutagen.flac import FLAC + from mutagen.oggvorbis import OggVorbis + from mutagen.mp4 import MP4 + from mutagen.id3 import ID3 + MUTAGEN_AVAILABLE = True +except ImportError: + MUTAGEN_AVAILABLE = False + +import config + +logger = logging.getLogger(__name__) + +# Supported audio formats +SUPPORTED_FORMATS = {'.mp3', '.flac', '.ogg', '.m4a', '.mp4', '.wav', '.wma', '.aac', '.opus'} + +# ############################################################################## +# CONFIGURATION +# ############################################################################## + +def get_config() -> Dict: + """Get local file provider configuration from environment or defaults.""" + return { + 'music_directory': os.environ.get('LOCALFILES_MUSIC_DIRECTORY', '/music'), + 'supported_formats': os.environ.get('LOCALFILES_FORMATS', ','.join(SUPPORTED_FORMATS)).split(','), + 'scan_subdirectories': os.environ.get('LOCALFILES_SCAN_SUBDIRS', 'true').lower() == 
'true', + 'use_embedded_metadata': os.environ.get('LOCALFILES_USE_METADATA', 'true').lower() == 'true', + 'playlist_directory': os.environ.get('LOCALFILES_PLAYLIST_DIR', '/music/playlists'), + } + + +# ############################################################################## +# UTILITY FUNCTIONS +# ############################################################################## + +def normalize_file_path(path: str, base_path: str = "") -> str: + """ + Normalize a file path for cross-provider matching. + + - Convert to POSIX style (forward slashes) + - Make relative to music library root + - Strip leading/trailing whitespace + """ + p = Path(path) + + # Make relative if absolute and base_path provided + if base_path and p.is_absolute(): + try: + base = Path(base_path) + p = p.relative_to(base) + except ValueError: + pass # Not relative to base, keep as-is + + # Convert to POSIX style + normalized = PurePosixPath(p).as_posix() + + return normalized.strip() + + +def file_path_hash(normalized_path: str) -> str: + """Generate SHA-256 hash of normalized file path for use as item_id.""" + return hashlib.sha256(normalized_path.encode('utf-8')).hexdigest() + + +def extract_metadata(file_path: str) -> Dict: + """ + Extract metadata from an audio file using mutagen. 
+ + Returns a dict with keys: title, artist, album, album_artist, track_number, year, genre + """ + metadata = { + 'title': os.path.splitext(os.path.basename(file_path))[0], # Default to filename + 'artist': 'Unknown Artist', + 'album': 'Unknown Album', + 'album_artist': None, + 'track_number': None, + 'year': None, + 'genre': None, + 'duration': None, + } + + if not MUTAGEN_AVAILABLE: + logger.warning("Mutagen not available, using filename as title") + return metadata + + try: + audio = MutagenFile(file_path, easy=True) + if audio is None: + logger.debug(f"Mutagen couldn't read: {file_path}") + return metadata + + # Extract common tags (easy=True gives us simplified tag access) + if hasattr(audio, 'info') and audio.info: + metadata['duration'] = getattr(audio.info, 'length', None) + + # Handle different tag formats + if isinstance(audio.tags, dict) or hasattr(audio, 'tags'): + tags = audio.tags if isinstance(audio.tags, dict) else dict(audio) + + # Title + if 'title' in tags: + val = tags['title'] + metadata['title'] = val[0] if isinstance(val, list) else str(val) + + # Artist + if 'artist' in tags: + val = tags['artist'] + metadata['artist'] = val[0] if isinstance(val, list) else str(val) + elif 'performer' in tags: + val = tags['performer'] + metadata['artist'] = val[0] if isinstance(val, list) else str(val) + + # Album + if 'album' in tags: + val = tags['album'] + metadata['album'] = val[0] if isinstance(val, list) else str(val) + + # Album Artist + if 'albumartist' in tags: + val = tags['albumartist'] + metadata['album_artist'] = val[0] if isinstance(val, list) else str(val) + elif 'album artist' in tags: + val = tags['album artist'] + metadata['album_artist'] = val[0] if isinstance(val, list) else str(val) + + # Track number + if 'tracknumber' in tags: + val = tags['tracknumber'] + track_str = val[0] if isinstance(val, list) else str(val) + try: + # Handle "1/12" format + metadata['track_number'] = int(track_str.split('/')[0]) + except (ValueError, 
IndexError): + pass + + # Year/Date + if 'date' in tags: + val = tags['date'] + date_str = val[0] if isinstance(val, list) else str(val) + try: + metadata['year'] = int(date_str[:4]) + except (ValueError, IndexError): + pass + elif 'year' in tags: + val = tags['year'] + year_str = val[0] if isinstance(val, list) else str(val) + try: + metadata['year'] = int(year_str) + except ValueError: + pass + + # Genre + if 'genre' in tags: + val = tags['genre'] + metadata['genre'] = val[0] if isinstance(val, list) else str(val) + + except Exception as e: + logger.warning(f"Error extracting metadata from {file_path}: {e}") + + return metadata + + +def _format_song(file_path: str, base_path: str) -> Dict: + """Format a local file into the standard song format used by AudioMuse-AI.""" + normalized_path = normalize_file_path(file_path, base_path) + item_id = file_path_hash(normalized_path) + + metadata = extract_metadata(file_path) + + # Get file stats + try: + stat = os.stat(file_path) + file_size = stat.st_size + file_modified = datetime.fromtimestamp(stat.st_mtime) + except OSError: + file_size = None + file_modified = None + + return { + 'Id': item_id, + 'Name': metadata['title'], + 'Artist': metadata['artist'], + 'AlbumArtist': metadata['album_artist'] or metadata['artist'], + 'Album': metadata['album'], + 'Path': file_path, + 'RelativePath': normalized_path, + 'TrackNumber': metadata['track_number'], + 'Year': metadata['year'], + 'Genre': metadata['genre'], + 'Duration': metadata['duration'], + 'FileSize': file_size, + 'last-modified': file_modified.isoformat() if file_modified else None, + # For compatibility with other providers + 'ArtistId': None, # Local files don't have artist IDs + } + + +# ############################################################################## +# PUBLIC API +# ############################################################################## + +def test_connection(config_override: Dict = None) -> Tuple[bool, str]: + """Test if the local file 
provider can access the music directory. + + Args: + config_override: Optional dict with configuration to test instead of default + """ + if config_override: + cfg = { + 'music_directory': config_override.get('music_directory', '/music'), + 'supported_formats': config_override.get('supported_formats', SUPPORTED_FORMATS), + 'scan_subdirectories': config_override.get('scan_subdirectories', True), + 'playlist_directory': config_override.get('playlist_directory', '/music/playlists'), + } + else: + cfg = get_config() + music_dir = cfg['music_directory'] + + if not os.path.exists(music_dir): + return False, f"Music directory does not exist: {music_dir}" + + if not os.path.isdir(music_dir): + return False, f"Music path is not a directory: {music_dir}" + + if not os.access(music_dir, os.R_OK): + return False, f"Music directory is not readable: {music_dir}" + + # Count files to verify + try: + audio_count = 0 + for root, _, files in os.walk(music_dir): + for f in files: + if os.path.splitext(f)[1].lower() in SUPPORTED_FORMATS: + audio_count += 1 + if audio_count >= 10: # Quick check, don't scan everything + break + if audio_count >= 10: + break + + if audio_count == 0: + return False, f"No audio files found in: {music_dir}" + + return True, f"Found audio files in: {music_dir}" + except Exception as e: + return False, f"Error scanning music directory: {e}" + + +def get_all_songs() -> List[Dict]: + """Fetch all audio files from the music directory.""" + cfg = get_config() + music_dir = cfg['music_directory'] + supported = set(fmt.lower() if fmt.startswith('.') else f'.{fmt.lower()}' + for fmt in cfg['supported_formats']) + scan_subdirs = cfg['scan_subdirectories'] + + all_songs = [] + + if not os.path.isdir(music_dir): + logger.error(f"Music directory not found: {music_dir}") + return [] + + logger.info(f"Scanning local music directory: {music_dir}") + + try: + if scan_subdirs: + for root, _, files in os.walk(music_dir): + for filename in files: + ext = 
os.path.splitext(filename)[1].lower() + if ext in supported: + full_path = os.path.join(root, filename) + try: + song = _format_song(full_path, music_dir) + all_songs.append(song) + except Exception as e: + logger.warning(f"Error processing {full_path}: {e}") + else: + for filename in os.listdir(music_dir): + ext = os.path.splitext(filename)[1].lower() + if ext in supported: + full_path = os.path.join(music_dir, filename) + if os.path.isfile(full_path): + try: + song = _format_song(full_path, music_dir) + all_songs.append(song) + except Exception as e: + logger.warning(f"Error processing {full_path}: {e}") + + logger.info(f"Found {len(all_songs)} audio files in local library") + + except Exception as e: + logger.error(f"Error scanning music directory: {e}", exc_info=True) + + return all_songs + + +def get_recent_albums(limit: int) -> List[Dict]: + """ + Get recently modified albums from the local music directory. + + For local files, we group songs by album and return the most recently + modified albums based on the newest file in each album. 
+ """ + cfg = get_config() + music_dir = cfg['music_directory'] + + all_songs = get_all_songs() + if not all_songs: + return [] + + # Group by album + albums = {} + for song in all_songs: + album_name = song.get('Album', 'Unknown Album') + album_artist = song.get('AlbumArtist', 'Unknown Artist') + album_key = f"{album_artist} - {album_name}" + + if album_key not in albums: + albums[album_key] = { + 'Id': album_key, # Use album name as ID + 'Name': album_name, + 'Artist': album_artist, + 'tracks': [], + 'last_modified': None + } + + albums[album_key]['tracks'].append(song) + + # Track the most recent modification time + mod_time = song.get('last-modified') + if mod_time: + if albums[album_key]['last_modified'] is None or mod_time > albums[album_key]['last_modified']: + albums[album_key]['last_modified'] = mod_time + + # Sort by modification time (most recent first) + sorted_albums = sorted( + albums.values(), + key=lambda a: a.get('last_modified') or '', + reverse=True + ) + + # Return requested limit (0 = all) + if limit == 0: + return sorted_albums + return sorted_albums[:limit] + + +def get_tracks_from_album(album_id: str) -> List[Dict]: + """ + Get all tracks from an album. + + For local files, album_id is "Artist - Album Name" format. + """ + all_songs = get_all_songs() + + # Filter songs matching this album + tracks = [] + for song in all_songs: + album_name = song.get('Album', 'Unknown Album') + album_artist = song.get('AlbumArtist', 'Unknown Artist') + song_album_key = f"{album_artist} - {album_name}" + + if song_album_key == album_id or album_name == album_id: + tracks.append(song) + + # Sort by track number if available + tracks.sort(key=lambda t: (t.get('TrackNumber') or 999, t.get('Name', ''))) + + logger.info(f"Found {len(tracks)} tracks for album '{album_id}'") + return tracks + + +def download_track(temp_dir: str, item: Dict) -> Optional[str]: + """ + 'Download' a track - for local files, we simply copy to temp directory. 
+ + Returns the path to the temporary file. + """ + source_path = item.get('Path') + if not source_path or not os.path.exists(source_path): + logger.error(f"Source file not found: {source_path}") + return None + + try: + # Create a unique filename in temp directory + filename = os.path.basename(source_path) + dest_path = os.path.join(temp_dir, filename) + + # Handle filename collisions + if os.path.exists(dest_path): + name, ext = os.path.splitext(filename) + item_id = item.get('Id', '')[:8] + dest_path = os.path.join(temp_dir, f"{name}_{item_id}{ext}") + + # Copy file to temp directory + shutil.copy2(source_path, dest_path) + logger.info(f"Copied '{item.get('Name', filename)}' to temp directory") + + return dest_path + + except Exception as e: + logger.error(f"Error copying file {source_path}: {e}", exc_info=True) + return None + + +def get_all_playlists() -> List[Dict]: + """Get all M3U playlists from the playlist directory.""" + cfg = get_config() + playlist_dir = cfg['playlist_directory'] + + playlists = [] + + if not os.path.isdir(playlist_dir): + logger.info(f"Playlist directory not found: {playlist_dir}") + return playlists + + try: + for filename in os.listdir(playlist_dir): + if filename.lower().endswith(('.m3u', '.m3u8')): + name = os.path.splitext(filename)[0] + playlists.append({ + 'Id': filename, + 'Name': name, + 'Path': os.path.join(playlist_dir, filename) + }) + except Exception as e: + logger.error(f"Error listing playlists: {e}") + + return playlists + + +def get_playlist_by_name(playlist_name: str) -> Optional[Dict]: + """Find a playlist by name.""" + playlists = get_all_playlists() + for p in playlists: + if p['Name'] == playlist_name: + return p + return None + + +def create_playlist(base_name: str, item_ids: List[str]) -> Optional[str]: + """ + Create an M3U playlist file. + + item_ids are the file path hashes - we need to look up the actual paths. 
+ """ + cfg = get_config() + playlist_dir = cfg['playlist_directory'] + music_dir = cfg['music_directory'] + + # Ensure playlist directory exists + os.makedirs(playlist_dir, exist_ok=True) + + # Build a lookup from item_id to file path + all_songs = get_all_songs() + id_to_path = {song['Id']: song['Path'] for song in all_songs} + + # Resolve paths + paths = [] + for item_id in item_ids: + if item_id in id_to_path: + # Use relative path for portability + full_path = id_to_path[item_id] + try: + rel_path = os.path.relpath(full_path, playlist_dir) + except ValueError: + rel_path = full_path # Different drive on Windows + paths.append(rel_path) + else: + logger.warning(f"Track not found for item_id: {item_id}") + + if not paths: + logger.error("No valid tracks found for playlist") + return None + + # Write M3U file + playlist_name = f"{base_name}_automatic.m3u" + playlist_path = os.path.join(playlist_dir, playlist_name) + + try: + with open(playlist_path, 'w', encoding='utf-8') as f: + f.write("#EXTM3U\n") + for path in paths: + f.write(f"{path}\n") + + logger.info(f"Created playlist '{playlist_name}' with {len(paths)} tracks") + return playlist_name + + except Exception as e: + logger.error(f"Error creating playlist: {e}", exc_info=True) + return None + + +def delete_playlist(playlist_id: str) -> bool: + """Delete an M3U playlist file.""" + cfg = get_config() + playlist_dir = cfg['playlist_directory'] + + playlist_path = os.path.join(playlist_dir, playlist_id) + + if not os.path.exists(playlist_path): + logger.warning(f"Playlist file not found: {playlist_path}") + return False + + try: + os.remove(playlist_path) + logger.info(f"Deleted playlist: {playlist_id}") + return True + except Exception as e: + logger.error(f"Error deleting playlist: {e}") + return False + + +def create_instant_playlist(playlist_name: str, item_ids: List[str], user_creds=None) -> Optional[Dict]: + """Create an instant playlist (same as regular playlist for local files).""" + final_name = 
f"{playlist_name.strip()}_instant" + result = create_playlist(final_name, item_ids) + if result: + return {'Id': result, 'Name': final_name} + return None + + +def get_top_played_songs(limit: int, user_creds=None) -> List[Dict]: + """Not supported for local files - no play history tracking.""" + logger.warning("get_top_played_songs is not supported for local files provider") + return [] + + +def get_last_played_time(item_id: str, user_creds=None): + """Not supported for local files - no play history tracking.""" + logger.warning("get_last_played_time is not supported for local files provider") + return None + + +# ############################################################################## +# PROVIDER INFO +# ############################################################################## + +def get_provider_info() -> Dict: + """Return information about this provider.""" + cfg = get_config() + return { + 'type': 'localfiles', + 'name': 'Local Files', + 'description': 'Scan local directories for audio files', + 'supports_playlists': True, + 'supports_play_history': False, + 'supports_user_auth': False, + 'config_fields': [ + { + 'name': 'music_directory', + 'label': 'Music Directory', + 'type': 'path', + 'required': True, + 'description': 'Path to your music library folder', + 'default': '/music' + }, + { + 'name': 'supported_formats', + 'label': 'Supported Formats', + 'type': 'text', + 'required': False, + 'description': 'Comma-separated list of audio file extensions', + 'default': ','.join(SUPPORTED_FORMATS) + }, + { + 'name': 'scan_subdirectories', + 'label': 'Scan Subdirectories', + 'type': 'boolean', + 'required': False, + 'description': 'Include files in subdirectories', + 'default': True + }, + { + 'name': 'playlist_directory', + 'label': 'Playlist Directory', + 'type': 'path', + 'required': False, + 'description': 'Where to save generated M3U playlists', + 'default': '/music/playlists' + } + ] + } diff --git a/templates/setup.html b/templates/setup.html new 
file mode 100644 index 00000000..08f65f23 --- /dev/null +++ b/templates/setup.html @@ -0,0 +1,1028 @@ +{% extends "includes/layout.html" %} + +{% block headAdditions %} + +{% endblock %} + +{% block content %} +
+
+

AudioMuse-AI Setup

+

Configure your music analysis system

+
+ + +
+
+
1
+ Welcome +
+
+
2
+ Providers +
+
+
3
+ Settings +
+
+
4
+ Complete +
+
+ + +
+
+

Welcome to AudioMuse-AI

+

+ This setup wizard will help you configure AudioMuse-AI to analyze your music library + and create intelligent playlists. Let's get started! +

+ + +
+ +
+

Select Hardware Configuration

+

+ Choose your hardware setup for music analysis. GPU acceleration significantly speeds up + the ML analysis process. +

+ +
+
+
💻
+
CPU Only
+
Works on any system. Slower analysis but no special requirements.
+
+
+
+
NVIDIA GPU
+
Faster analysis with CUDA acceleration. Requires NVIDIA GPU with drivers.
+
+
+
+ +
+
+ +
+
+ + +
+
+

Configure Media Providers

+

+ Select one or more media providers. You can add multiple providers to analyze music + from different sources. Tracks are linked by file path, so the same song in different + providers will share analysis data. +

+ +
+ +
+
+ + + + + +
+ + +
+
+ + +
+
+

Analysis Settings

+

+ Configure optional analysis features. The defaults work well for most users. +

+ +
+ +
+ Allows searching your music using natural language queries like "upbeat summer songs". + Uses additional memory (~750MB). +
+
+ +
+ +
+ Accelerate clustering with NVIDIA RAPIDS cuML. Only available with NVIDIA GPU. +
+
+
+ +
+ + Advanced Settings +
+ +
+
+

Database Configuration

+

+ These settings are typically configured via environment variables in Docker. + Only change if you know what you're doing. +

+ +
+ + +
Database host (set via POSTGRES_HOST env var)
+
+ +
+ + +
Redis connection URL (set via REDIS_URL env var)
+
+
+ +
+

AI Playlist Naming

+

+ Optionally configure an AI provider for creative playlist names. +

+ +
+ + +
AI service for generating creative playlist names
+
+
+
+ +
+ + +
+
+ + +
+
+

Setup Summary

+

+ Review your configuration before completing the setup. +

+ +
+ +
+
+ +
+

What's Next?

+
    +
  • Run the analysis to scan and analyze your music library
  • +
  • Generate intelligent playlists based on audio fingerprints
  • +
  • Explore your music with similarity search and visualization tools
  • +
+
+ +
+ + +
+
+
+{% endblock %} + +{% block bodyAdditions %} + + +{% endblock %} diff --git a/templates/sidebar_navi.html b/templates/sidebar_navi.html index d8e98bb8..1f8932b9 100644 --- a/templates/sidebar_navi.html +++ b/templates/sidebar_navi.html @@ -12,4 +12,5 @@
  • Cleaning
  • Scheduled Tasks
  • +
  • Setup & Providers
  • \ No newline at end of file From 79c89708439e67fe72a542bd02a5bc08b7744b35 Mon Sep 17 00:00:00 2001 From: Claude Date: Wed, 4 Feb 2026 04:27:53 +0000 Subject: [PATCH 02/33] Add provider-aware API helpers with backward compatibility Implements provider fallback logic for API calls: - When provider_id specified: look up in that provider, fall back to score - When provider_id NOT specified (backward compatible): 1. Try primary provider first 2. Try other enabled providers by priority 3. Fall back to direct score table (legacy mode) New helper functions: - get_track_by_item_id(item_id, provider_id=None) - get_tracks_by_item_ids(item_ids, provider_id=None) - get_primary_provider_id() - get_enabled_provider_ids() - resolve_item_id_to_provider(item_id) - get_item_id_for_provider(file_path_or_track_id, provider_id) - is_multi_provider_mode() - set_primary_provider(provider_id) https://claude.ai/code/session_011AebTWAucDafK4m6uoSSNg --- app_helper.py | 248 +++++++++++++++++++++++++++++++++++++++++++++++++- 1 file changed, 246 insertions(+), 2 deletions(-) diff --git a/app_helper.py b/app_helper.py index 25a47f90..24f56f20 100644 --- a/app_helper.py +++ b/app_helper.py @@ -1076,5 +1076,249 @@ def cancel_job_and_children_recursive(job_id, task_type_from_db=None, reason="Ta if child_db_info and child_db_info.get('status') not in [TASK_STATUS_SUCCESS, TASK_STATUS_FAILURE, TASK_STATUS_REVOKED]: logger.info(f"Recursively cancelling child job: {child_job_id}") cancelled_count += cancel_job_and_children_recursive(child_job_id, reason="Cancelled due to parent task revocation.") - - return cancelled_count \ No newline at end of file + + return cancelled_count + + +# ############################################################################## +# MULTI-PROVIDER HELPER FUNCTIONS +# ############################################################################## + +def get_primary_provider_id(): + """Get the primary provider ID from app_settings.""" + db = get_db() + with db.cursor() 
as cur: + cur.execute("SELECT value FROM app_settings WHERE key = 'primary_provider_id'") + row = cur.fetchone() + if row and row[0] is not None: + try: + # Value is stored as JSONB, could be int or null + val = row[0] + if isinstance(val, int): + return val + if val is None or val == 'null': + return None + return int(val) + except (ValueError, TypeError): + return None + return None + + +def get_enabled_provider_ids(): + """Get list of enabled provider IDs ordered by priority (highest first).""" + db = get_db() + with db.cursor() as cur: + cur.execute(""" + SELECT id FROM provider + WHERE enabled = TRUE + ORDER BY priority DESC, created_at ASC + """) + return [row[0] for row in cur.fetchall()] + + +def get_track_by_item_id(item_id, provider_id=None): + """ + Look up a track by item_id with provider fallback logic. + + If provider_id is specified: + - Look up in provider_track for that provider first + - Fall back to score table if not in provider_track + + If provider_id is NOT specified (backward compatible mode): + 1. Try the primary provider first + 2. Try other enabled providers in priority order + 3. 
Fall back to direct score table lookup (legacy mode) + + Returns: + dict with track info or None if not found + """ + db = get_db() + + def lookup_in_score(item_id): + """Direct lookup in score table (legacy mode).""" + with db.cursor() as cur: + cur.execute(""" + SELECT item_id, title, author, album, tempo, key, scale, + mood_vector, energy, other_features, file_path, track_id + FROM score WHERE item_id = %s + """, (item_id,)) + row = cur.fetchone() + if row: + return { + 'item_id': row[0], + 'title': row[1], + 'author': row[2], + 'album': row[3], + 'tempo': row[4], + 'key': row[5], + 'scale': row[6], + 'mood_vector': row[7], + 'energy': row[8], + 'other_features': row[9], + 'file_path': row[10], + 'track_id': row[11], + 'provider_id': None # Unknown provider in legacy mode + } + return None + + def lookup_via_provider(item_id, prov_id): + """Look up via provider_track table.""" + with db.cursor() as cur: + # First check provider_track + cur.execute(""" + SELECT pt.item_id, pt.title, pt.artist, pt.album, pt.track_id, + s.tempo, s.key, s.scale, s.mood_vector, s.energy, + s.other_features, s.file_path + FROM provider_track pt + LEFT JOIN score s ON ( + pt.item_id = s.item_id OR + (pt.track_id IS NOT NULL AND pt.track_id = s.track_id) + ) + WHERE pt.provider_id = %s AND pt.item_id = %s + """, (prov_id, item_id)) + row = cur.fetchone() + if row: + return { + 'item_id': row[0], + 'title': row[1], + 'author': row[2], + 'album': row[3], + 'track_id': row[4], + 'tempo': row[5], + 'key': row[6], + 'scale': row[7], + 'mood_vector': row[8], + 'energy': row[9], + 'other_features': row[10], + 'file_path': row[11], + 'provider_id': prov_id + } + return None + + # If provider_id specified, try that provider first then fall back + if provider_id is not None: + result = lookup_via_provider(item_id, provider_id) + if result: + return result + # Fall back to direct score lookup + return lookup_in_score(item_id) + + # No provider specified - use fallback logic + # 1. 
Try primary provider first + primary_id = get_primary_provider_id() + if primary_id: + result = lookup_via_provider(item_id, primary_id) + if result: + return result + + # 2. Try other enabled providers in priority order + enabled_ids = get_enabled_provider_ids() + for prov_id in enabled_ids: + if prov_id == primary_id: + continue # Already tried + result = lookup_via_provider(item_id, prov_id) + if result: + return result + + # 3. Fall back to direct score table lookup (legacy/backward compatible) + return lookup_in_score(item_id) + + +def get_tracks_by_item_ids(item_ids, provider_id=None): + """ + Look up multiple tracks by item_ids with provider fallback logic. + + Args: + item_ids: List of item IDs to look up + provider_id: Optional provider ID to scope the lookup + + Returns: + dict mapping item_id to track info + """ + if not item_ids: + return {} + + results = {} + for item_id in item_ids: + track = get_track_by_item_id(item_id, provider_id) + if track: + results[item_id] = track + + return results + + +def resolve_item_id_to_provider(item_id): + """ + Resolve which provider(s) know about a given item_id. + + Returns: + List of provider_ids that have this item_id, + or empty list if only in score table (legacy) + """ + db = get_db() + with db.cursor() as cur: + cur.execute(""" + SELECT DISTINCT provider_id FROM provider_track + WHERE item_id = %s + """, (item_id,)) + return [row[0] for row in cur.fetchall()] + + +def get_item_id_for_provider(file_path_or_track_id, provider_id): + """ + Get the provider-specific item_id for a track. + + Useful when you have analysis data linked to one provider + and need to find the equivalent track in another provider. 
+ + Args: + file_path_or_track_id: Either file path (str) or track_id (int) + provider_id: The provider to look up in + + Returns: + The item_id for that provider, or None if not found + """ + db = get_db() + with db.cursor() as cur: + if isinstance(file_path_or_track_id, int): + # Lookup by track_id + cur.execute(""" + SELECT item_id FROM provider_track + WHERE provider_id = %s AND track_id = %s + """, (provider_id, file_path_or_track_id)) + else: + # Lookup by file path - need to join through track table + cur.execute(""" + SELECT pt.item_id FROM provider_track pt + JOIN track t ON pt.track_id = t.id + WHERE pt.provider_id = %s AND t.file_path = %s + """, (provider_id, file_path_or_track_id)) + + row = cur.fetchone() + return row[0] if row else None + + +def is_multi_provider_mode(): + """Check if multi-provider mode is enabled.""" + db = get_db() + with db.cursor() as cur: + cur.execute("SELECT value FROM app_settings WHERE key = 'multi_provider_enabled'") + row = cur.fetchone() + if row: + val = row[0] + return val is True or val == True or val == 'true' + return False + + +def set_primary_provider(provider_id): + """Set the primary provider ID.""" + db = get_db() + with db.cursor() as cur: + cur.execute(""" + INSERT INTO app_settings (key, value, category, description, updated_at) + VALUES ('primary_provider_id', %s, 'providers', 'ID of the primary provider', NOW()) + ON CONFLICT (key) DO UPDATE SET + value = EXCLUDED.value, + updated_at = NOW() + """, (str(provider_id) if provider_id is not None else 'null',)) + db.commit() \ No newline at end of file From 6d575fc35058f640df1d84f77f1fd9398c1f574c Mon Sep 17 00:00:00 2001 From: Claude Date: Wed, 4 Feb 2026 04:42:17 +0000 Subject: [PATCH 03/33] Add split deployment support for remote workers - Add docker-compose-worker-cpu.yaml for CPU-only remote workers - Update docker-compose-worker-nvidia.yaml with all provider configs - Update docker-compose-server.yaml for server-only deployment - Add worker connection 
settings to .env.example (WORKER_REDIS_URL, WORKER_POSTGRES_HOST) - Add deployment mode selection to setup wizard (unified/split) - Add worker configuration section in setup wizard with connection info - Add server-info API endpoint for automatic IP detection This allows running ML analysis workers on separate machines from the main Flask server, useful for utilizing dedicated GPU servers or distributing workload across multiple workers. https://claude.ai/code/session_011AebTWAucDafK4m6uoSSNg --- app_setup.py | 43 ++++ deployment/.env.example | 30 +++ deployment/docker-compose-server.yaml | 116 ++++++++--- deployment/docker-compose-worker-cpu.yaml | 113 +++++++++++ deployment/docker-compose-worker-nvidia.yaml | 118 ++++++++--- templates/setup.html | 200 ++++++++++++++++++- 6 files changed, 569 insertions(+), 51 deletions(-) create mode 100644 deployment/docker-compose-worker-cpu.yaml diff --git a/app_setup.py b/app_setup.py index db895861..507441be 100644 --- a/app_setup.py +++ b/app_setup.py @@ -680,3 +680,46 @@ def set_primary_provider(): 'message': 'Primary provider set', 'primary_provider_id': provider_id }) + + +@setup_bp.route('/api/setup/server-info', methods=['GET']) +def get_server_info(): + """ + Get server connection information for configuring remote workers. 
+ --- + tags: + - Setup + responses: + 200: + description: Server connection information + """ + import socket + import os + + # Try to get the server's IP address + try: + # Get the hostname and try to resolve it + hostname = socket.gethostname() + host_ip = socket.gethostbyname(hostname) + # If we get a loopback address, try to get a better one + if host_ip.startswith('127.'): + # Try to connect to a public DNS to get our real IP + s = socket.socket(socket.AF_INET, socket.SOCK_DGRAM) + try: + s.connect(('8.8.8.8', 80)) + host_ip = s.getsockname()[0] + except Exception: + host_ip = hostname # Fall back to hostname + finally: + s.close() + except Exception: + host_ip = 'localhost' + + return jsonify({ + 'host': host_ip, + 'hostname': socket.gethostname() if hasattr(socket, 'gethostname') else 'unknown', + 'redis_port': os.environ.get('REDIS_PORT', '6379'), + 'postgres_port': os.environ.get('POSTGRES_PORT', '5432'), + 'postgres_host': os.environ.get('POSTGRES_HOST', 'postgres'), + 'redis_url': os.environ.get('REDIS_URL', 'redis://redis:6379/0'), + }) diff --git a/deployment/.env.example b/deployment/.env.example index d7e7db62..fc8867a4 100644 --- a/deployment/.env.example +++ b/deployment/.env.example @@ -96,6 +96,36 @@ WORKER_PORT=8029 # Timezone (examples: UTC, Europe/Berlin, America/Los_Angeles) TZ=UTC +# ============================================================================= +# SPLIT DEPLOYMENT (Remote Worker Configuration) +# ============================================================================= +# Use these settings when running workers on a separate machine from the server. +# +# DEPLOYMENT OPTIONS: +# 1. UNIFIED (default) - Server and worker on same machine +# Use: docker-compose-unified.yaml or docker-compose-unified-nvidia.yaml +# Leave these settings at defaults +# +# 2. 
SPLIT - Server and worker on different machines +# Server machine: Run docker-compose-server.yaml +# Worker machine: Run docker-compose-worker-cpu.yaml or docker-compose-worker-nvidia.yaml +# Configure WORKER_* settings below on worker machine +# +# On the WORKER machine, set these to point to the SERVER machine: +# +# Redis URL on server (replace SERVER_IP with your server's IP/hostname) +# Format: redis://[password@]host:port/db +# Examples: +# WORKER_REDIS_URL=redis://192.168.1.100:6379/0 +# WORKER_REDIS_URL=redis://:mypassword@192.168.1.100:6379/0 +WORKER_REDIS_URL=redis://redis:6379/0 +# +# PostgreSQL host on server (replace with your server's IP/hostname) +# Examples: +# WORKER_POSTGRES_HOST=192.168.1.100 +# WORKER_POSTGRES_HOST=my-server.local +WORKER_POSTGRES_HOST=postgres + # ============================================================================= # NVIDIA GPU (for docker-compose-unified-nvidia.yaml) # ============================================================================= diff --git a/deployment/docker-compose-server.yaml b/deployment/docker-compose-server.yaml index 757c3e9a..8c968d5b 100644 --- a/deployment/docker-compose-server.yaml +++ b/deployment/docker-compose-server.yaml @@ -1,13 +1,38 @@ -# AudioMuse-AI Deployment Configuration -# -# SERVER TEMPLATE - Run database, Redis and Flask API -# This can be run on a lightweight server, tested on an N100 mini PC (without heavy CPU or GPU requirements). -# For remote worker setup with CPU/GPU on a separate machine, use docker-compose-worker.yaml on the remote machine -# and configure WORKER_POSTGRES_HOST and WORKER_REDIS_URL in that worker's .env file to point to this server. +# AudioMuse-AI Server-Only Docker Compose +# ============================================================================= +# SERVER TEMPLATE - Runs Flask API + Redis + PostgreSQL (NO workers) +# +# Use this for split deployments where: +# - Server runs on lightweight hardware (N100, Raspberry Pi, NAS, etc.) 
+# - Workers run on separate machines with GPU/better CPU +# +# Quick Start: +# 1. Copy .env.example to .env and configure settings +# 2. Run: docker-compose -f docker-compose-server.yaml up -d +# 3. Note this server's IP address for worker configuration +# 4. On worker machine(s), use docker-compose-worker-cpu.yaml or +# docker-compose-worker-nvidia.yaml with these .env settings: +# WORKER_REDIS_URL=redis://SERVER_IP:6379/0 +# WORKER_POSTGRES_HOST=SERVER_IP +# +# Network Requirements (ports to open for workers): +# - Port 6379: Redis (workers connect here for task queue) +# - Port 5432: PostgreSQL (workers connect here for data) +# - Port 8000: Web UI (optional, only if exposing to users) +# +# Security Note: +# For production, consider: +# - VPN or private network between server and workers +# - Redis password (uncomment command in redis service) +# - PostgreSQL with SSL and strong password +# ============================================================================= version: '3.8' + services: - # Redis service for RQ (task queue) + # --------------------------------------------------------------------------- + # Redis - Task Queue (exposed for remote workers) + # --------------------------------------------------------------------------- redis: image: redis:7-alpine container_name: audiomuse-redis @@ -16,8 +41,17 @@ services: volumes: - redis-data:/data restart: unless-stopped + # Uncomment for password protection: + # command: redis-server --requirepass ${REDIS_PASSWORD:-changeme} + healthcheck: + test: ["CMD", "redis-cli", "ping"] + interval: 30s + timeout: 10s + retries: 3 - # PostgreSQL database service + # --------------------------------------------------------------------------- + # PostgreSQL - Database (exposed for remote workers) + # --------------------------------------------------------------------------- postgres: image: postgres:15-alpine container_name: audiomuse-postgres @@ -30,42 +64,76 @@ services: volumes: - 
postgres-data:/var/lib/postgresql/data restart: unless-stopped + healthcheck: + test: ["CMD-SHELL", "pg_isready -U ${POSTGRES_USER:-audiomuse}"] + interval: 30s + timeout: 10s + retries: 3 - # AudioMuse-AI Flask application service + # --------------------------------------------------------------------------- + # AudioMuse-AI Flask Application (Web UI & API only) + # NOTE: No worker - analysis tasks are sent to remote workers via Redis + # --------------------------------------------------------------------------- audiomuse-ai-flask: - image: ghcr.io/neptunehub/audiomuse-ai:latest-nvidia + image: ghcr.io/neptunehub/audiomuse-ai:latest container_name: audiomuse-ai-flask-app ports: - "${FRONTEND_PORT:-8000}:8000" environment: SERVICE_TYPE: "flask" TZ: "${TZ:-UTC}" - MEDIASERVER_TYPE: "jellyfin" - JELLYFIN_USER_ID: "${JELLYFIN_USER_ID}" - JELLYFIN_TOKEN: "${JELLYFIN_TOKEN}" - JELLYFIN_URL: "${JELLYFIN_URL}" + # Media Server Configuration (configure via GUI or .env) + MEDIASERVER_TYPE: "${MEDIASERVER_TYPE:-localfiles}" + JELLYFIN_URL: "${JELLYFIN_URL:-}" + JELLYFIN_USER_ID: "${JELLYFIN_USER_ID:-}" + JELLYFIN_TOKEN: "${JELLYFIN_TOKEN:-}" + NAVIDROME_URL: "${NAVIDROME_URL:-}" + NAVIDROME_USER: "${NAVIDROME_USER:-}" + NAVIDROME_PASSWORD: "${NAVIDROME_PASSWORD:-}" + LYRION_URL: "${LYRION_URL:-}" + MPD_HOST: "${MPD_HOST:-}" + MPD_PORT: "${MPD_PORT:-6600}" + MPD_PASSWORD: "${MPD_PASSWORD:-}" + MPD_MUSIC_DIRECTORY: "${MPD_MUSIC_DIRECTORY:-/music}" + EMBY_URL: "${EMBY_URL:-}" + EMBY_USER_ID: "${EMBY_USER_ID:-}" + EMBY_TOKEN: "${EMBY_TOKEN:-}" + LOCALFILES_MUSIC_DIRECTORY: "${LOCALFILES_MUSIC_DIRECTORY:-/music}" + LOCALFILES_PLAYLIST_DIR: "${LOCALFILES_PLAYLIST_DIR:-/music/playlists}" + # Database Configuration POSTGRES_USER: ${POSTGRES_USER:-audiomuse} POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} POSTGRES_HOST: "postgres" POSTGRES_PORT: "${POSTGRES_PORT:-5432}" REDIS_URL: "${REDIS_URL:-redis://redis:6379/0}" - 
AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER}" - OPENAI_API_KEY: "${OPENAI_API_KEY}" - OPENAI_SERVER_URL: "${OPENAI_SERVER_URL}" - OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME}" - GEMINI_API_KEY: "${GEMINI_API_KEY}" - MISTRAL_API_KEY: "${MISTRAL_API_KEY}" - CLAP_ENABLED: "${CLAP_ENABLED:-true}" # Enable CLAP text search (set to false for slower systems) + # AI Configuration + AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER:-NONE}" + OPENAI_API_KEY: "${OPENAI_API_KEY:-}" + OPENAI_SERVER_URL: "${OPENAI_SERVER_URL:-}" + OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME:-}" + GEMINI_API_KEY: "${GEMINI_API_KEY:-}" + MISTRAL_API_KEY: "${MISTRAL_API_KEY:-}" + # Flask doesn't need CLAP models - workers handle that + CLAP_ENABLED: "false" TEMP_DIR: "/app/temp_audio" volumes: - temp-audio-flask:/app/temp_audio + - ${MUSIC_PATH:-./music}:/music:ro depends_on: - - redis - - postgres + redis: + condition: service_healthy + postgres: + condition: service_healthy restart: unless-stopped +# ============================================================================= +# Volumes +# ============================================================================= volumes: redis-data: + name: audiomuse-redis-data postgres-data: - temp-audio-flask: \ No newline at end of file + name: audiomuse-postgres-data + temp-audio-flask: + name: audiomuse-temp-flask \ No newline at end of file diff --git a/deployment/docker-compose-worker-cpu.yaml b/deployment/docker-compose-worker-cpu.yaml new file mode 100644 index 00000000..ae093b87 --- /dev/null +++ b/deployment/docker-compose-worker-cpu.yaml @@ -0,0 +1,113 @@ +# AudioMuse-AI Worker-Only Docker Compose (CPU) +# ============================================================================= +# WORKER TEMPLATE - Runs RQ workers only, connects to remote server +# +# Use this for split deployments where: +# - Server (Flask + Redis + PostgreSQL) runs on separate machine +# - This worker handles CPU-intensive ML analysis tasks +# +# Prerequisites: +# - Server running 
docker-compose-server.yaml on another machine +# - Network connectivity to server (ports 6379 Redis, 5432 PostgreSQL) +# - Access to same music files (via media server API or shared storage) +# +# Quick Start: +# 1. Copy .env.example to .env on this worker machine +# 2. Configure connection to remote server: +# WORKER_REDIS_URL=redis://SERVER_IP:6379/0 +# WORKER_POSTGRES_HOST=SERVER_IP +# 3. Copy media server credentials from server's .env +# 4. Run: docker-compose -f docker-compose-worker-cpu.yaml up -d +# +# Scaling: +# - Run multiple workers on different machines +# - All workers connect to same Redis queue +# - Tasks automatically distributed across workers +# ============================================================================= + +version: '3.8' + +services: + # --------------------------------------------------------------------------- + # AudioMuse-AI Worker (CPU-only, connects to remote server) + # --------------------------------------------------------------------------- + audiomuse-ai-worker: + image: ghcr.io/neptunehub/audiomuse-ai:latest + container_name: audiomuse-ai-worker-cpu + environment: + SERVICE_TYPE: "worker" + TZ: "${TZ:-UTC}" + # ======================================================================= + # REMOTE SERVER CONNECTION (REQUIRED) + # ======================================================================= + # Redis URL - point to server machine + # Format: redis://[password@]host:port/db + # Examples: + # redis://192.168.1.100:6379/0 + # redis://:mypassword@192.168.1.100:6379/0 + REDIS_URL: "${WORKER_REDIS_URL:-redis://redis:6379/0}" + # PostgreSQL host - IP or hostname of server machine + POSTGRES_HOST: "${WORKER_POSTGRES_HOST:-postgres}" + POSTGRES_PORT: "${POSTGRES_PORT:-5432}" + POSTGRES_USER: ${POSTGRES_USER:-audiomuse} + POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} + POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} + # ======================================================================= + # MEDIA SERVER 
CONFIGURATION (must match server) + # ======================================================================= + MEDIASERVER_TYPE: "${MEDIASERVER_TYPE:-localfiles}" + JELLYFIN_URL: "${JELLYFIN_URL:-}" + JELLYFIN_USER_ID: "${JELLYFIN_USER_ID:-}" + JELLYFIN_TOKEN: "${JELLYFIN_TOKEN:-}" + NAVIDROME_URL: "${NAVIDROME_URL:-}" + NAVIDROME_USER: "${NAVIDROME_USER:-}" + NAVIDROME_PASSWORD: "${NAVIDROME_PASSWORD:-}" + LYRION_URL: "${LYRION_URL:-}" + MPD_HOST: "${MPD_HOST:-}" + MPD_PORT: "${MPD_PORT:-6600}" + MPD_PASSWORD: "${MPD_PASSWORD:-}" + MPD_MUSIC_DIRECTORY: "${MPD_MUSIC_DIRECTORY:-/music}" + EMBY_URL: "${EMBY_URL:-}" + EMBY_USER_ID: "${EMBY_USER_ID:-}" + EMBY_TOKEN: "${EMBY_TOKEN:-}" + LOCALFILES_MUSIC_DIRECTORY: "${LOCALFILES_MUSIC_DIRECTORY:-/music}" + LOCALFILES_PLAYLIST_DIR: "${LOCALFILES_PLAYLIST_DIR:-/music/playlists}" + # ======================================================================= + # AI CONFIGURATION (optional) + # ======================================================================= + AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER:-NONE}" + OPENAI_API_KEY: "${OPENAI_API_KEY:-}" + OPENAI_SERVER_URL: "${OPENAI_SERVER_URL:-}" + OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME:-}" + GEMINI_API_KEY: "${GEMINI_API_KEY:-}" + MISTRAL_API_KEY: "${MISTRAL_API_KEY:-}" + # ======================================================================= + # WORKER FEATURES + # ======================================================================= + # CLAP text search - uses ~750MB RAM + CLAP_ENABLED: "${CLAP_ENABLED:-true}" + # GPU clustering - disabled for CPU worker + USE_GPU_CLUSTERING: "false" + # Worker tuning + RQ_MAX_JOBS: "${RQ_MAX_JOBS:-50}" + RQ_MAX_JOBS_HIGH: "${RQ_MAX_JOBS_HIGH:-100}" + RQ_LOGGING_LEVEL: "${RQ_LOGGING_LEVEL:-INFO}" + TEMP_DIR: "/app/temp_audio" + volumes: + - temp-audio-worker:/app/temp_audio + # Mount music directory if using local files provider + - ${MUSIC_PATH:-./music}:/music:ro + restart: unless-stopped + # Optional: Limit CPU usage + # deploy: + 
# resources: + # limits: + # cpus: '4' + # memory: 8G + +# ============================================================================= +# Volumes +# ============================================================================= +volumes: + temp-audio-worker: + name: audiomuse-temp-worker-cpu diff --git a/deployment/docker-compose-worker-nvidia.yaml b/deployment/docker-compose-worker-nvidia.yaml index 4b6021e0..18d7cf90 100644 --- a/deployment/docker-compose-worker-nvidia.yaml +++ b/deployment/docker-compose-worker-nvidia.yaml @@ -1,50 +1,118 @@ -# AudioMuse-AI Deployment Configuration +# AudioMuse-AI Worker-Only Docker Compose (NVIDIA GPU) +# ============================================================================= +# WORKER TEMPLATE - Runs RQ workers only with GPU acceleration # -# WORKER TEMPLATE - Run this for heavy CPU/GPU tasks like analysis and clustering, connected to a lightweight server with Jellyfin and AudioMuse-AI Flask application and databases. -# This configuration is intended for deployment on a server with NVIDIA GPU support. +# Use this for split deployments where: +# - Server (Flask + Redis + PostgreSQL) runs on separate machine +# - This worker handles GPU-accelerated ML analysis tasks # +# Prerequisites: +# - Server running docker-compose-server.yaml on another machine +# - Network connectivity to server (ports 6379 Redis, 5432 PostgreSQL) +# - Access to same music files (via media server API or shared storage) +# - NVIDIA GPU with docker nvidia-runtime installed +# +# Quick Start: +# 1. Copy .env.example to .env on this worker machine +# 2. Configure connection to remote server: +# WORKER_REDIS_URL=redis://SERVER_IP:6379/0 +# WORKER_POSTGRES_HOST=SERVER_IP +# 3. Copy media server credentials from server's .env +# 4. 
Run: docker-compose -f docker-compose-worker-nvidia.yaml up -d +# +# Scaling: +# - Run multiple workers on different machines +# - All workers connect to same Redis queue +# - Tasks automatically distributed across workers +# ============================================================================= version: '3.8' + services: - # AudioMuse-AI Worker service (GPU-dependent) + # --------------------------------------------------------------------------- + # AudioMuse-AI Worker (NVIDIA GPU, connects to remote server) + # --------------------------------------------------------------------------- audiomuse-ai-worker: image: ghcr.io/neptunehub/audiomuse-ai:latest-nvidia - container_name: audiomuse-ai-worker-instance - ports: - - "${WORKER_PORT:-8029}:8000" # Expose worker API + container_name: audiomuse-ai-worker-nvidia environment: SERVICE_TYPE: "worker" TZ: "${TZ:-UTC}" - MEDIASERVER_TYPE: "jellyfin" - JELLYFIN_USER_ID: "${JELLYFIN_USER_ID}" - JELLYFIN_TOKEN: "${JELLYFIN_TOKEN}" - JELLYFIN_URL: "${JELLYFIN_URL}" + # ======================================================================= + # REMOTE SERVER CONNECTION (REQUIRED) + # ======================================================================= + # Redis URL - point to server machine + # Format: redis://[password@]host:port/db + # Examples: + # redis://192.168.1.100:6379/0 + # redis://:mypassword@192.168.1.100:6379/0 + REDIS_URL: "${WORKER_REDIS_URL:-redis://redis:6379/0}" + # PostgreSQL host - IP or hostname of server machine + POSTGRES_HOST: "${WORKER_POSTGRES_HOST:-postgres}" + POSTGRES_PORT: "${POSTGRES_PORT:-5432}" POSTGRES_USER: ${POSTGRES_USER:-audiomuse} POSTGRES_PASSWORD: ${POSTGRES_PASSWORD:-audiomusepassword} POSTGRES_DB: ${POSTGRES_DB:-audiomusedb} - POSTGRES_HOST: "${WORKER_POSTGRES_HOST:-postgres}" # Replace via WORKER_POSTGRES_HOST in .env when running remotely - POSTGRES_PORT: "${POSTGRES_PORT:-5432}" - REDIS_URL: "${WORKER_REDIS_URL:-redis://redis:6379/0}" # Set WORKER_REDIS_URL in .env for 
remote connections - AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER}" - OPENAI_API_KEY: "${OPENAI_API_KEY}" - OPENAI_SERVER_URL: "${OPENAI_SERVER_URL}" - OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME}" - GEMINI_API_KEY: "${GEMINI_API_KEY}" - MISTRAL_API_KEY: "${MISTRAL_API_KEY}" - CLAP_ENABLED: "${CLAP_ENABLED:-true}" # Enable CLAP text search (set to false for slower systems) + # ======================================================================= + # MEDIA SERVER CONFIGURATION (must match server) + # ======================================================================= + MEDIASERVER_TYPE: "${MEDIASERVER_TYPE:-localfiles}" + JELLYFIN_URL: "${JELLYFIN_URL:-}" + JELLYFIN_USER_ID: "${JELLYFIN_USER_ID:-}" + JELLYFIN_TOKEN: "${JELLYFIN_TOKEN:-}" + NAVIDROME_URL: "${NAVIDROME_URL:-}" + NAVIDROME_USER: "${NAVIDROME_USER:-}" + NAVIDROME_PASSWORD: "${NAVIDROME_PASSWORD:-}" + LYRION_URL: "${LYRION_URL:-}" + MPD_HOST: "${MPD_HOST:-}" + MPD_PORT: "${MPD_PORT:-6600}" + MPD_PASSWORD: "${MPD_PASSWORD:-}" + MPD_MUSIC_DIRECTORY: "${MPD_MUSIC_DIRECTORY:-/music}" + EMBY_URL: "${EMBY_URL:-}" + EMBY_USER_ID: "${EMBY_USER_ID:-}" + EMBY_TOKEN: "${EMBY_TOKEN:-}" + LOCALFILES_MUSIC_DIRECTORY: "${LOCALFILES_MUSIC_DIRECTORY:-/music}" + LOCALFILES_PLAYLIST_DIR: "${LOCALFILES_PLAYLIST_DIR:-/music/playlists}" + # ======================================================================= + # AI CONFIGURATION (optional) + # ======================================================================= + AI_MODEL_PROVIDER: "${AI_MODEL_PROVIDER:-NONE}" + OPENAI_API_KEY: "${OPENAI_API_KEY:-}" + OPENAI_SERVER_URL: "${OPENAI_SERVER_URL:-}" + OPENAI_MODEL_NAME: "${OPENAI_MODEL_NAME:-}" + GEMINI_API_KEY: "${GEMINI_API_KEY:-}" + MISTRAL_API_KEY: "${MISTRAL_API_KEY:-}" + # ======================================================================= + # WORKER FEATURES (GPU-enabled) + # ======================================================================= + # CLAP text search - uses ~750MB RAM + CLAP_ENABLED: 
"${CLAP_ENABLED:-true}" + # GPU clustering - enabled for NVIDIA worker + USE_GPU_CLUSTERING: "${USE_GPU_CLUSTERING:-true}" + # Worker tuning + RQ_MAX_JOBS: "${RQ_MAX_JOBS:-50}" + RQ_MAX_JOBS_HIGH: "${RQ_MAX_JOBS_HIGH:-100}" + RQ_LOGGING_LEVEL: "${RQ_LOGGING_LEVEL:-INFO}" TEMP_DIR: "/app/temp_audio" - NVIDIA_VISIBLE_DEVICES: "0" + # NVIDIA GPU settings + NVIDIA_VISIBLE_DEVICES: "${NVIDIA_GPU_ID:-0}" NVIDIA_DRIVER_CAPABILITIES: "compute,utility" - USE_GPU_CLUSTERING: "${USE_GPU_CLUSTERING:-true}" volumes: - temp-audio-worker:/app/temp_audio + # Mount music directory if using local files provider + - ${MUSIC_PATH:-./music}:/music:ro restart: unless-stopped deploy: resources: reservations: devices: - driver: nvidia - device_ids: ["0"] + device_ids: ["${NVIDIA_GPU_ID:-0}"] capabilities: [gpu] + +# ============================================================================= +# Volumes +# ============================================================================= volumes: - temp-audio-worker: \ No newline at end of file + temp-audio-worker: + name: audiomuse-temp-worker-nvidia diff --git a/templates/setup.html b/templates/setup.html index 08f65f23..81f4189b 100644 --- a/templates/setup.html +++ b/templates/setup.html @@ -452,6 +452,47 @@ font-size: 0.85rem; cursor: pointer; } + + /* Worker Connection Info */ + .connection-info-box { + display: flex; + align-items: center; + gap: 0.5rem; + background: var(--bg-primary); + padding: 0.75rem; + border-radius: 4px; + border: 1px solid var(--border-color); + } + + .connection-info-box code { + flex: 1; + font-family: monospace; + font-size: 0.95rem; + word-break: break-all; + } + + .copy-btn { + padding: 0.25rem 0.75rem; + border: 1px solid var(--border-color); + border-radius: 4px; + background: var(--bg-secondary); + cursor: pointer; + font-size: 0.85rem; + } + + .copy-btn:hover { + background: var(--bg-primary); + } + + .copy-btn.copied { + background: rgba(40, 167, 69, 0.2); + border-color: #28a745; + color: #28a745; + } 
+ + .worker-connection-info .config-field { + margin-bottom: 1.25rem; + } {% endblock %} @@ -496,6 +537,26 @@

    Welcome to AudioMuse-AI

    +
    +

    Select Deployment Mode

    +

    + Choose how you want to deploy AudioMuse-AI. +

    + +
    +
    +
    📦
    +
    Unified
    +
    Server and worker on the same machine. Best for most users.
    +
    +
    +
    🖧
    +
    Split
    +
    Run workers on separate machines. For distributed setups or dedicated GPU servers.
    +
    +
    +
    +

    Select Hardware Configuration

    @@ -588,6 +649,53 @@

    Analysis Settings

    + +
    Advanced Settings @@ -676,17 +784,21 @@

    What's Next?

    // State let currentStep = 1; let selectedHardware = 'cpu'; + let selectedDeployment = 'unified'; let selectedProviders = []; let providerConfigs = {}; let providerTypes = []; let existingProviders = []; + let serverInfo = { host: window.location.hostname, port: window.location.port || '8000' }; // Initialize document.addEventListener('DOMContentLoaded', async function() { await loadSetupStatus(); await loadProviderTypes(); + await loadServerInfo(); renderProviderGrid(); setupHardwareOptions(); + setupDeploymentOptions(); }); async function loadSetupStatus() { @@ -882,9 +994,9 @@

    Existing Installation Detected

    } function setupHardwareOptions() { - document.querySelectorAll('.hardware-option').forEach(option => { + document.querySelectorAll('.hardware-option[data-hardware]').forEach(option => { option.onclick = function() { - document.querySelectorAll('.hardware-option').forEach(o => o.classList.remove('selected')); + document.querySelectorAll('.hardware-option[data-hardware]').forEach(o => o.classList.remove('selected')); this.classList.add('selected'); selectedHardware = this.dataset.hardware; @@ -896,10 +1008,85 @@

    Existing Installation Detected

    gpuClustering.disabled = true; gpuClustering.checked = false; } + + // Update worker compose file recommendation + updateWorkerComposeRecommendation(); }; }); } + function setupDeploymentOptions() { + document.querySelectorAll('.hardware-option[data-deployment]').forEach(option => { + option.onclick = function() { + document.querySelectorAll('.hardware-option[data-deployment]').forEach(o => o.classList.remove('selected')); + this.classList.add('selected'); + selectedDeployment = this.dataset.deployment; + + // Show/hide worker config section + updateWorkerConfigVisibility(); + }; + }); + } + + async function loadServerInfo() { + try { + const response = await fetch('/api/setup/server-info'); + if (response.ok) { + const data = await response.json(); + serverInfo = data; + } + } catch (err) { + console.log('Could not load server info, using defaults'); + } + updateWorkerConnectionInfo(); + } + + function updateWorkerConfigVisibility() { + const workerSection = document.getElementById('worker-config-section'); + if (selectedDeployment === 'split') { + workerSection.style.display = 'block'; + updateWorkerConnectionInfo(); + } else { + workerSection.style.display = 'none'; + } + } + + function updateWorkerConnectionInfo() { + const serverIp = serverInfo.host || window.location.hostname; + const redisPort = serverInfo.redis_port || '6379'; + const postgresPort = serverInfo.postgres_port || '5432'; + + document.getElementById('worker-redis-url').textContent = `redis://${serverIp}:${redisPort}/0`; + document.getElementById('worker-postgres-host').textContent = serverIp; + updateWorkerComposeRecommendation(); + } + + function updateWorkerComposeRecommendation() { + const composeFile = selectedHardware === 'nvidia' + ? 
'docker-compose-worker-nvidia.yaml' + : 'docker-compose-worker-cpu.yaml'; + document.getElementById('worker-compose-file').textContent = composeFile; + document.getElementById('worker-compose-help').innerHTML = + `Run on worker machine: docker-compose -f ${composeFile} up -d`; + } + + function copyToClipboard(elementId) { + const element = document.getElementById(elementId); + const text = element.textContent; + + navigator.clipboard.writeText(text).then(() => { + const btn = element.parentElement.querySelector('.copy-btn'); + btn.textContent = 'Copied!'; + btn.classList.add('copied'); + setTimeout(() => { + btn.textContent = 'Copy'; + btn.classList.remove('copied'); + }, 2000); + }).catch(err => { + console.error('Failed to copy:', err); + }); + } + function toggleAdvanced() { const content = document.getElementById('advanced-settings'); const arrow = document.getElementById('advanced-arrow'); @@ -958,7 +1145,15 @@

    Existing Installation Detected

    return p ? p.name : type; }).join(', '); + let deploymentInfo = selectedDeployment === 'unified' + ? 'Unified (server + worker on same machine)' + : 'Split (workers on separate machines)'; + summary.innerHTML = ` +
    + Deployment Mode + ${deploymentInfo} +
    Hardware ${selectedHardware === 'nvidia' ? 'NVIDIA GPU' : 'CPU Only'} @@ -1005,6 +1200,7 @@

    Existing Installation Detected

    method: 'PUT', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify({ + deployment_type: selectedDeployment, hardware_type: selectedHardware, clap_enabled: document.getElementById('setting-clap-enabled').checked, gpu_clustering: document.getElementById('setting-gpu-clustering').checked, From 9b2d8215bf60763f262be22360c0eb22d7968084 Mon Sep 17 00:00:00 2001 From: Claude Date: Wed, 4 Feb 2026 04:46:47 +0000 Subject: [PATCH 04/33] Clarify unified compose files for CPU and NVIDIA in setup wizard - Add Docker Compose file recommendation to setup summary - Show correct unified file based on hardware selection - Clarify CPU vs NVIDIA image usage in .env.example comments https://claude.ai/code/session_011AebTWAucDafK4m6uoSSNg --- deployment/.env.example | 10 ++++++---- templates/setup.html | 17 +++++++++++++++++ 2 files changed, 23 insertions(+), 4 deletions(-) diff --git a/deployment/.env.example b/deployment/.env.example index fc8867a4..bc5b2bc1 100644 --- a/deployment/.env.example +++ b/deployment/.env.example @@ -103,12 +103,14 @@ TZ=UTC # # DEPLOYMENT OPTIONS: # 1. UNIFIED (default) - Server and worker on same machine -# Use: docker-compose-unified.yaml or docker-compose-unified-nvidia.yaml -# Leave these settings at defaults +# CPU: docker-compose-unified.yaml (uses :latest image) +# NVIDIA: docker-compose-unified-nvidia.yaml (uses :latest-nvidia image) +# Leave WORKER_* settings at defaults # # 2. 
SPLIT - Server and worker on different machines -# Server machine: Run docker-compose-server.yaml -# Worker machine: Run docker-compose-worker-cpu.yaml or docker-compose-worker-nvidia.yaml +# Server machine: docker-compose-server.yaml +# Worker machine: docker-compose-worker-cpu.yaml (CPU) or +# docker-compose-worker-nvidia.yaml (NVIDIA GPU) # Configure WORKER_* settings below on worker machine # # On the WORKER machine, set these to point to the SERVER machine: diff --git a/templates/setup.html b/templates/setup.html index 81f4189b..451b21f4 100644 --- a/templates/setup.html +++ b/templates/setup.html @@ -1149,6 +1149,19 @@

    Existing Installation Detected

    ? 'Unified (server + worker on same machine)' : 'Split (workers on separate machines)'; + // Determine recommended compose files + let composeFiles = []; + if (selectedDeployment === 'unified') { + composeFiles.push(selectedHardware === 'nvidia' + ? 'docker-compose-unified-nvidia.yaml' + : 'docker-compose-unified.yaml'); + } else { + composeFiles.push('docker-compose-server.yaml (this machine)'); + composeFiles.push(selectedHardware === 'nvidia' + ? 'docker-compose-worker-nvidia.yaml (workers)' + : 'docker-compose-worker-cpu.yaml (workers)'); + } + summary.innerHTML = `
    Deployment Mode @@ -1158,6 +1171,10 @@

    Existing Installation Detected

    Hardware ${selectedHardware === 'nvidia' ? 'NVIDIA GPU' : 'CPU Only'}
    +
    + Docker Compose Files + ${composeFiles.join('
    ')}
    +
    Providers ${providerNames || 'None selected'} From 9287f36ee975850ed89b6fecee0d99dcfd895227 Mon Sep 17 00:00:00 2001 From: Claude Date: Wed, 4 Feb 2026 07:27:31 +0000 Subject: [PATCH 05/33] Add dedicated Settings page for configuration management - Create settings.html with collapsible sections for: - Media Providers (list, add, edit, delete, set primary) - Deployment (unified/split mode, hardware type, worker info) - Analysis (CLAP, GPU clustering) - AI Integration (playlist naming provider) - Add /settings route in app_setup.py - Update sidebar navigation with Settings link - Keep Setup Wizard as separate option for initial configuration The Settings page provides quick access to modify individual settings without going through the full setup wizard flow. https://claude.ai/code/session_011AebTWAucDafK4m6uoSSNg --- app_setup.py | 6 + templates/settings.html | 1184 +++++++++++++++++++++++++++++++++++ templates/sidebar_navi.html | 3 +- 3 files changed, 1192 insertions(+), 1 deletion(-) create mode 100644 templates/settings.html diff --git a/app_setup.py b/app_setup.py index 507441be..f857f5e8 100644 --- a/app_setup.py +++ b/app_setup.py @@ -278,6 +278,12 @@ def setup_page(): return render_template('setup.html', title='AudioMuse-AI - Setup', active='setup') +@setup_bp.route('/settings') +def settings_page(): + """Render the settings page.""" + return render_template('settings.html', title='AudioMuse-AI - Settings', active='settings') + + @setup_bp.route('/api/setup/status', methods=['GET']) def get_setup_status(): """ diff --git a/templates/settings.html b/templates/settings.html new file mode 100644 index 00000000..1116c7c1 --- /dev/null +++ b/templates/settings.html @@ -0,0 +1,1184 @@ +{% extends "includes/layout.html" %} + +{% block headAdditions %} + +{% endblock %} + +{% block content %} +
    +
    +

    Settings

    +

    Configure AudioMuse-AI settings and manage providers

    +
    + + +
    +
    +

    📦 Media Providers

    + +
    +
    +

    + Configure your music library sources. Multiple providers can share analysis data through file path linking. +

    + +
    + + +
    Used by default for API calls without provider specification
    +
    + +
    + +
    + + +
    +
    + + +
    +
    +

    Deployment

    + +
    +
    +

    + Configure how AudioMuse-AI is deployed across your infrastructure. +

    + +
    + +
    +
    +
    📦
    +
    Unified
    +
    Server and worker on same machine
    +
    +
    +
    🖧
    +
    Split
    +
    Workers on separate machines
    +
    +
    +
    + +
    + +
    +
    +
    💻
    +
    CPU Only
    +
    Standard processing
    +
    +
    +
    +
    NVIDIA GPU
    +
    CUDA acceleration
    +
    +
    +
    + + +
    +
    + + +
    +
    +

    📊 Analysis

    + +
    +
    +

    + Configure music analysis features and performance options. +

    + +
    + +
    Search music using natural language. Uses ~750MB additional memory.
    +
    + +
    + +
    Accelerate clustering with NVIDIA RAPIDS cuML. Requires NVIDIA GPU.
    +
    +
    +
    + + +
    +
    +

    🤖 AI Integration

    + +
    +
    +

    + Configure AI providers for creative playlist naming and other features. +

    + +
    + + +
    AI service for generating creative playlist names
    +
    +
    +
    + + +
    + +
    +
    + + + + + +
    +{% endblock %} + +{% block bodyAdditions %} + + +{% endblock %} diff --git a/templates/sidebar_navi.html b/templates/sidebar_navi.html index 1f8932b9..ef5ea47d 100644 --- a/templates/sidebar_navi.html +++ b/templates/sidebar_navi.html @@ -12,5 +12,6 @@
  • Cleaning
  • Scheduled Tasks
  • -
  • Setup & Providers
  • +
  • Settings
  • +
  • Setup Wizard
  • \ No newline at end of file From ab3b39ac6064c3088f2f913979d1948172967c01 Mon Sep 17 00:00:00 2001 From: Claude Date: Wed, 4 Feb 2026 07:44:00 +0000 Subject: [PATCH 06/33] Add multi-provider playlist creation with provider selector dropdown - Add provider selector dropdown to all playlist forms - Create shared provider-selector.js component for consistent UI - Add /api/providers/enabled endpoint for fetching available providers - Update create_playlist_from_ids to support provider_ids parameter - Add create_playlist_multi_provider for creating on multiple providers - Add get_all_playlists_multi_provider with deduplication - Update all templates: similarity, path, clap_search, mulan_search, sonic_fingerprint, alchemy, artist_similarity, map, chat - Support 'all' option to create playlist on all enabled providers https://claude.ai/code/session_011AebTWAucDafK4m6uoSSNg --- app_chat.py | 26 +++-- app_voyager.py | 50 +++++++-- static/provider-selector.js | 179 ++++++++++++++++++++++++++++++ tasks/mediaserver.py | 185 +++++++++++++++++++++++++++++++ tasks/voyager_manager.py | 41 ++++++- templates/alchemy.html | 8 +- templates/artist_similarity.html | 23 ++-- templates/chat.html | 6 + templates/clap_search.html | 27 +++-- templates/map.html | 8 +- templates/mulan_search.html | 18 ++- templates/path.html | 19 +++- templates/similarity.html | 21 +++- templates/sonic_fingerprint.html | 6 + 14 files changed, 563 insertions(+), 54 deletions(-) create mode 100644 static/provider-selector.js diff --git a/app_chat.py b/app_chat.py index 4f8a5242..4ee17e84 100644 --- a/app_chat.py +++ b/app_chat.py @@ -750,7 +750,7 @@ def create_media_server_playlist_api(): API endpoint to create a playlist on the configured media server. 
""" # Local import to break circular dependency at startup - from tasks.mediaserver import create_instant_playlist + from tasks.voyager_manager import create_playlist_from_ids data = request.get_json() if not data or 'playlist_name' not in data or 'item_ids' not in data: @@ -758,6 +758,7 @@ def create_media_server_playlist_api(): user_playlist_name = data.get('playlist_name') item_ids = data.get('item_ids') # This will be a list of strings + provider_ids = data.get('provider_ids') # Can be 'all', int, or list of ints if not user_playlist_name.strip(): return jsonify({"message": "Error: Playlist name cannot be empty."}), 400 @@ -765,14 +766,21 @@ def create_media_server_playlist_api(): return jsonify({"message": "Error: No songs provided to create the playlist."}), 400 try: - # MODIFIED: Call the simplified create_instant_playlist function - created_playlist_info = create_instant_playlist(user_playlist_name, item_ids) - - if not created_playlist_info: - raise Exception("Media server did not return playlist information after creation.") - - # The created_playlist_info is the full JSON response from the media server - return jsonify({"message": f"Successfully created playlist '{user_playlist_name}' on the media server with ID: {created_playlist_info.get('Id')}"}), 200 + # Use the voyager_manager function that supports multi-provider + result = create_playlist_from_ids(user_playlist_name, item_ids, provider_ids=provider_ids) + + # Handle multi-provider result (dict) vs single provider result (string) + if isinstance(result, dict): + # Multi-provider response + success_count = sum(1 for r in result.values() if r.get('success')) + total_count = len(result) + return jsonify({ + "message": f"Playlist '{user_playlist_name}' created on {success_count}/{total_count} provider(s).", + "results": result + }), 200 + else: + # Single provider response + return jsonify({"message": f"Successfully created playlist '{user_playlist_name}' on the media server with ID: {result}"}), 200 
except Exception as e: # Log detailed error on the server diff --git a/app_voyager.py b/app_voyager.py index b1837a58..9896d0c0 100644 --- a/app_voyager.py +++ b/app_voyager.py @@ -321,6 +321,8 @@ def create_media_server_playlist(): items: type: string description: A list of track Item IDs to add to the playlist. + provider_ids: + description: Provider(s) to create playlist on. Can be 'all', a single ID, or array of IDs. responses: 201: description: Playlist created successfully. @@ -341,6 +343,7 @@ def create_media_server_playlist(): playlist_name = data.get('playlist_name') track_ids_raw = data.get('track_ids', []) + provider_ids = data.get('provider_ids') # Can be 'all', int, or list of ints if not playlist_name: return jsonify({"error": "Missing 'playlist_name'"}), 400 @@ -364,15 +367,46 @@ def create_media_server_playlist(): user_creds = data.get('user_creds') if isinstance(data, dict) else None try: - new_playlist_id = create_playlist_from_ids(playlist_name, final_track_ids, user_creds=user_creds) - - logger.info(f"Successfully created playlist '{playlist_name}' with ID {new_playlist_id}.") - - return jsonify({ - "message": f"Playlist '{playlist_name}' created successfully!", - "playlist_id": new_playlist_id - }), 201 + result = create_playlist_from_ids(playlist_name, final_track_ids, user_creds=user_creds, provider_ids=provider_ids) + + # Handle multi-provider result (dict) vs single provider result (string) + if isinstance(result, dict): + # Multi-provider response + success_count = sum(1 for r in result.values() if r.get('success')) + total_count = len(result) + logger.info(f"Created playlist '{playlist_name}' on {success_count}/{total_count} providers.") + return jsonify({ + "message": f"Playlist '{playlist_name}' created on {success_count}/{total_count} provider(s).", + "results": result + }), 201 + else: + # Single provider response (backward compatible) + logger.info(f"Successfully created playlist '{playlist_name}' with ID {result}.") + return 
jsonify({ + "message": f"Playlist '{playlist_name}' created successfully!", + "playlist_id": result + }), 201 except Exception as e: logger.error(f"Failed to create media server playlist '{playlist_name}': {e}", exc_info=True) return jsonify({"error": "An error occurred while creating the playlist on the media server."}), 500 + + +@voyager_bp.route('/api/providers/enabled', methods=['GET']) +def get_enabled_providers(): + """ + Get list of enabled providers for playlist creation dropdown. + --- + tags: + - Providers + responses: + 200: + description: List of enabled providers + """ + try: + from tasks.mediaserver import get_enabled_providers_for_playlists + providers = get_enabled_providers_for_playlists() + return jsonify(providers), 200 + except Exception as e: + logger.error(f"Failed to get enabled providers: {e}", exc_info=True) + return jsonify([]), 200 diff --git a/static/provider-selector.js b/static/provider-selector.js new file mode 100644 index 00000000..754cfdb4 --- /dev/null +++ b/static/provider-selector.js @@ -0,0 +1,179 @@ +/** + * Provider Selector Component for Multi-Provider Playlist Support + * + * Usage: + * 1. Include this script in your template + * 2. Add a container div:
    + * 3. Call initProviderSelector() after DOM is loaded + * 4. Get selected value with getSelectedProviders() when creating playlist + */ + +let _providers = []; +let _selectedProviderValue = null; // null = primary/default, 'all' = all providers, number = specific provider + +/** + * Initialize the provider selector component. + * Fetches enabled providers and renders the dropdown. + * + * @param {string} containerId - ID of the container element + * @param {object} options - Configuration options + * @param {boolean} options.showAllOption - Whether to show "All Providers" option (default: true) + * @param {boolean} options.showLabel - Whether to show label (default: true) + * @param {string} options.labelText - Label text (default: "Save to:") + */ +async function initProviderSelector(containerId = 'provider-selector-container', options = {}) { + const container = document.getElementById(containerId); + if (!container) { + console.warn(`Provider selector container '${containerId}' not found`); + return; + } + + const showAllOption = options.showAllOption !== false; + const showLabel = options.showLabel !== false; + const labelText = options.labelText || 'Save to:'; + + try { + const response = await fetch('/api/providers/enabled'); + _providers = await response.json(); + } catch (err) { + console.error('Failed to load providers:', err); + _providers = []; + } + + // Only show selector if there are multiple providers or showAllOption is true + if (_providers.length <= 1 && !showAllOption) { + container.style.display = 'none'; + return; + } + + // Build the selector HTML + let html = '
    '; + + if (showLabel) { + html += ``; + } + + html += '
    '; + + container.innerHTML = html; + + // Add event listener + const select = document.getElementById('provider-select'); + if (select) { + select.addEventListener('change', function() { + const value = this.value; + if (value === '') { + _selectedProviderValue = null; + } else if (value === 'all') { + _selectedProviderValue = 'all'; + } else { + _selectedProviderValue = parseInt(value, 10); + } + }); + } +} + +/** + * Get the currently selected provider value. + * + * @returns {null|string|number} null for primary, 'all' for all, or provider ID + */ +function getSelectedProviders() { + return _selectedProviderValue; +} + +/** + * Get the list of loaded providers. + * + * @returns {Array} List of provider objects + */ +function getProviderList() { + return _providers; +} + +/** + * Check if multiple providers are available. + * + * @returns {boolean} + */ +function hasMultipleProviders() { + return _providers.length > 1; +} + +/** + * Add provider_ids to a playlist creation payload. 
+ * + * @param {object} payload - The existing payload object + * @returns {object} Payload with provider_ids added if applicable + */ +function addProviderToPayload(payload) { + const selected = getSelectedProviders(); + if (selected !== null) { + payload.provider_ids = selected; + } + return payload; +} + +// CSS styles for the provider selector +const providerSelectorStyles = ` +.provider-selector { + display: flex; + align-items: center; + gap: 0.5rem; + margin-bottom: 0.75rem; +} + +.provider-selector label { + font-weight: 500; + font-size: 0.9rem; + white-space: nowrap; +} + +.provider-select { + padding: 0.4rem 0.75rem; + border: 1px solid var(--border-color, #ccc); + border-radius: 4px; + background: var(--bg-primary, #fff); + color: var(--text-color, #333); + font-size: 0.9rem; + min-width: 150px; +} + +.provider-select:focus { + outline: none; + border-color: var(--primary-color, #007bff); +} + +/* Compact variant for inline use */ +.provider-selector.compact { + margin-bottom: 0; +} + +.provider-selector.compact label { + font-size: 0.85rem; +} + +.provider-selector.compact .provider-select { + padding: 0.3rem 0.5rem; + font-size: 0.85rem; + min-width: 120px; +} +`; + +// Inject styles when script loads +(function() { + const styleEl = document.createElement('style'); + styleEl.textContent = providerSelectorStyles; + document.head.appendChild(styleEl); +})(); diff --git a/tasks/mediaserver.py b/tasks/mediaserver.py index ce6c3752..6fd99418 100644 --- a/tasks/mediaserver.py +++ b/tasks/mediaserver.py @@ -566,3 +566,188 @@ def _get_provider_config_fields(provider_type: str): } return fields.get(provider_type, []) + +# ############################################################################## +# MULTI-PROVIDER PLAYLIST FUNCTIONS +# ############################################################################## + +def get_all_playlists_multi_provider(provider_ids=None): + """ + Get playlists from multiple providers with deduplication. 
+ + Args: + provider_ids: List of provider IDs to query, or None for all enabled providers + + Returns: + List of playlists with provider info, deduplicated by name + """ + from app_helper import get_providers, get_provider_by_id + + all_playlists = [] + seen_names = {} # Track playlist names to detect duplicates + + # Get providers to query + if provider_ids is None: + providers = get_providers(enabled_only=True) + else: + providers = [get_provider_by_id(pid) for pid in provider_ids if get_provider_by_id(pid)] + + for provider in providers: + try: + provider_type = provider['provider_type'] + playlists = _get_playlists_for_provider_type(provider_type) + + for playlist in playlists: + playlist_name = playlist.get('Name') or playlist.get('name', '') + playlist_id = playlist.get('Id') or playlist.get('id', '') + + # Add provider info to playlist + playlist['provider_id'] = provider['id'] + playlist['provider_type'] = provider_type + playlist['provider_name'] = provider.get('name', provider_type) + + # Check for duplicates by name + if playlist_name in seen_names: + # Mark as duplicate + playlist['is_duplicate'] = True + playlist['duplicate_of_provider'] = seen_names[playlist_name] + else: + playlist['is_duplicate'] = False + seen_names[playlist_name] = provider['id'] + + all_playlists.append(playlist) + + except Exception as e: + logger.warning(f"Failed to get playlists from provider {provider.get('name', 'unknown')}: {e}") + continue + + return all_playlists + + +def _get_playlists_for_provider_type(provider_type): + """Get playlists for a specific provider type using current config.""" + if provider_type == 'jellyfin': + return jellyfin_get_all_playlists() + elif provider_type == 'navidrome': + return navidrome_get_all_playlists() + elif provider_type == 'lyrion': + return lyrion_get_all_playlists() + elif provider_type == 'mpd': + return mpd_get_all_playlists() + elif provider_type == 'emby': + return emby_get_all_playlists() + elif provider_type == 'localfiles': 
+ return localfiles_get_all_playlists() + return [] + + +def create_playlist_multi_provider(playlist_name, item_ids, provider_ids=None, user_creds=None): + """ + Create a playlist on one or more providers. + + Args: + playlist_name: Name of the playlist to create + item_ids: List of track IDs to add + provider_ids: List of provider IDs to create playlist on, + 'all' for all enabled providers, + or None for the primary/default provider + user_creds: Optional user credentials for providers that support them + + Returns: + Dict with results for each provider: {provider_id: {'success': bool, 'playlist_id': str, 'error': str}} + """ + from app_helper import get_providers, get_provider_by_id, get_primary_provider_id + + if not playlist_name: + raise ValueError("Playlist name is required") + if not item_ids: + raise ValueError("Track IDs are required") + + results = {} + + # Determine which providers to use + if provider_ids == 'all': + providers = get_providers(enabled_only=True) + elif provider_ids is None: + # Use primary provider or fall back to current config + primary_id = get_primary_provider_id() + if primary_id: + provider = get_provider_by_id(primary_id) + providers = [provider] if provider else [] + else: + # Fall back to creating on current configured provider + try: + created = create_instant_playlist(playlist_name, item_ids, user_creds=user_creds) + return {'default': {'success': True, 'playlist_id': created.get('Id') if created else None}} + except Exception as e: + return {'default': {'success': False, 'error': str(e)}} + else: + # Specific provider IDs + if isinstance(provider_ids, (list, tuple)): + providers = [get_provider_by_id(pid) for pid in provider_ids if get_provider_by_id(pid)] + else: + provider = get_provider_by_id(provider_ids) + providers = [provider] if provider else [] + + # Create playlist on each provider + for provider in providers: + provider_id = provider['id'] + provider_type = provider['provider_type'] + + try: + # For now, use the 
dispatcher which uses current config + # In the future, we may want provider-specific config + created = _create_playlist_for_provider_type(provider_type, playlist_name, item_ids, user_creds) + + results[provider_id] = { + 'success': True, + 'playlist_id': created.get('Id') or created.get('id') if created else None, + 'provider_name': provider.get('name', provider_type) + } + except Exception as e: + logger.error(f"Failed to create playlist on provider {provider.get('name')}: {e}") + results[provider_id] = { + 'success': False, + 'error': str(e), + 'provider_name': provider.get('name', provider_type) + } + + return results + + +def _create_playlist_for_provider_type(provider_type, playlist_name, item_ids, user_creds=None): + """Create playlist on a specific provider type.""" + if provider_type == 'jellyfin': + return jellyfin_create_instant_playlist(playlist_name, item_ids, user_creds) + elif provider_type == 'navidrome': + return navidrome_create_instant_playlist(playlist_name, item_ids, user_creds) + elif provider_type == 'lyrion': + return lyrion_create_instant_playlist(playlist_name, item_ids) + elif provider_type == 'mpd': + return mpd_create_instant_playlist(playlist_name, item_ids, user_creds) + elif provider_type == 'emby': + return emby_create_instant_playlist(playlist_name, item_ids, user_creds) + elif provider_type == 'localfiles': + return localfiles_create_instant_playlist(playlist_name, item_ids, user_creds) + else: + raise ValueError(f"Unknown provider type: {provider_type}") + + +def get_enabled_providers_for_playlists(): + """ + Get list of enabled providers for use in playlist dropdowns. 
+ + Returns: + List of dicts with 'id', 'name', 'type' for each enabled provider + """ + from app_helper import get_providers + + providers = get_providers(enabled_only=True) + return [ + { + 'id': p['id'], + 'name': p.get('name') or p['provider_type'], + 'type': p['provider_type'] + } + for p in providers + ] diff --git a/tasks/voyager_manager.py b/tasks/voyager_manager.py index ac0f9909..30fedf14 100644 --- a/tasks/voyager_manager.py +++ b/tasks/voyager_manager.py @@ -1647,15 +1647,46 @@ def search_tracks_by_title_and_artist(title_query: str, artist_query: str, limit return results -def create_playlist_from_ids(playlist_name: str, track_ids: list, user_creds: dict = None): +def create_playlist_from_ids(playlist_name: str, track_ids: list, user_creds: dict = None, provider_ids=None): """ - Creates a new playlist on the configured media server with the provided name and track IDs. + Creates a new playlist on the configured media server(s) with the provided name and track IDs. + + Args: + playlist_name: Name of the playlist + track_ids: List of track IDs + user_creds: Optional user credentials + provider_ids: Provider(s) to create playlist on: + - None: Use primary provider or default config + - 'all': Create on all enabled providers + - int: Single provider ID + - list[int]: Multiple provider IDs + + Returns: + If single provider: playlist_id (str) + If multiple providers: dict of {provider_id: {'success': bool, 'playlist_id': str, 'error': str}} """ try: - # Use the mediaserver dispatcher (imported at module top) to create the playlist. - # This avoids importing app_external which may not export the helper. 
+ from tasks.mediaserver import create_playlist_multi_provider + + # Use multi-provider function if provider_ids is specified as 'all' or a list + if provider_ids == 'all' or isinstance(provider_ids, (list, tuple)): + return create_playlist_multi_provider(playlist_name, track_ids, provider_ids, user_creds) + + # Single provider specified + if provider_ids is not None: + results = create_playlist_multi_provider(playlist_name, track_ids, provider_ids, user_creds) + # Extract single result + if results: + result = list(results.values())[0] + if result.get('success'): + return result.get('playlist_id') + else: + raise Exception(result.get('error', 'Playlist creation failed')) + raise Exception("No provider found") + + # Default: use existing single-provider logic for backward compatibility created_playlist = create_instant_playlist(playlist_name, track_ids, user_creds=user_creds) - + if not created_playlist: raise Exception("Playlist creation failed. The media server did not return a playlist object.") diff --git a/templates/alchemy.html b/templates/alchemy.html index 0286d19a..4aca6d41 100644 --- a/templates/alchemy.html +++ b/templates/alchemy.html @@ -143,6 +143,7 @@

    Create a Playlist from Results

    +
    @@ -150,8 +151,11 @@

    Create a Playlist from Results

    {% endblock %} {% block bodyAdditions %} + + {% endblock %} From 0342a9d7d6ab8bb7efe0b1b73645f540d9f3e369 Mon Sep 17 00:00:00 2001 From: Claude Date: Thu, 5 Feb 2026 09:26:44 +0000 Subject: [PATCH 14/33] Add comprehensive testing and comparison suite for dual-instance comparison Builds a complete testing framework that connects to two AudioMuse-AI instances (e.g., main vs feature branch) via API, PostgreSQL, Docker, and compares results across all dimensions: - Database comparator: schema validation (17 tables), row counts, data quality (NULL rates, duplicates, mood_vector format), embedding integrity (dimensions, coverage, NaN checks), referential integrity, score distributions, playlist quality, index presence, task health, provider config, and app settings comparison - API comparator: tests 30+ endpoints including config, playlists, search, similarity, map, CLAP, alchemy, path finding, sonic fingerprint, artist similarity, setup/providers, cron, external API, and error handling - comparing status codes, response shapes, keys, and list lengths between instances - Docker comparator: container health/status, restart counts, resource usage (memory/CPU), log error pattern analysis (tracebacks, OOM, timeouts, DB errors), warning detection, and service connectivity tests for Redis and PostgreSQL - Performance comparator: endpoint latency benchmarks (p50/p95/p99/mean) with warmup, concurrent load testing with configurable users, database query performance benchmarks for 8 critical queries - Existing test integration: discovers and runs all 17 unit test files, 2 integration tests, and 8 E2E API tests from the existing test suite, with per-file results and instance-specific E2E execution - HTML report generator: self-contained dark-themed report with status badges, per-category expandable sections, filterable tables, side-by- side instance comparison, and visual performance bar charts - CLI with full argument support, YAML config files, environment variable 
configuration, test category selection (--only/--skip), and --discover mode listing all 27 available tests https://claude.ai/code/session_0122SF3fSXM3e2dNqaJB5NDn --- testing_suite/__init__.py | 9 + testing_suite/__main__.py | 5 + testing_suite/comparators/__init__.py | 0 testing_suite/comparators/api_comparator.py | 760 +++++++++++ testing_suite/comparators/db_comparator.py | 1142 +++++++++++++++++ .../comparators/docker_comparator.py | 541 ++++++++ .../comparators/performance_comparator.py | 447 +++++++ testing_suite/comparison_config.example.yaml | 91 ++ testing_suite/config.py | 211 +++ testing_suite/orchestrator.py | 163 +++ testing_suite/reports/__init__.py | 0 testing_suite/reports/html_report.py | 359 ++++++ testing_suite/requirements.txt | 7 + testing_suite/run_comparison.py | 325 +++++ testing_suite/test_runner/__init__.py | 0 testing_suite/test_runner/existing_tests.py | 469 +++++++ testing_suite/utils.py | 434 +++++++ 17 files changed, 4963 insertions(+) create mode 100644 testing_suite/__init__.py create mode 100644 testing_suite/__main__.py create mode 100644 testing_suite/comparators/__init__.py create mode 100644 testing_suite/comparators/api_comparator.py create mode 100644 testing_suite/comparators/db_comparator.py create mode 100644 testing_suite/comparators/docker_comparator.py create mode 100644 testing_suite/comparators/performance_comparator.py create mode 100644 testing_suite/comparison_config.example.yaml create mode 100644 testing_suite/config.py create mode 100644 testing_suite/orchestrator.py create mode 100644 testing_suite/reports/__init__.py create mode 100644 testing_suite/reports/html_report.py create mode 100644 testing_suite/requirements.txt create mode 100644 testing_suite/run_comparison.py create mode 100644 testing_suite/test_runner/__init__.py create mode 100644 testing_suite/test_runner/existing_tests.py create mode 100644 testing_suite/utils.py diff --git a/testing_suite/__init__.py b/testing_suite/__init__.py new file mode 
100644 index 00000000..9f60c65e --- /dev/null +++ b/testing_suite/__init__.py @@ -0,0 +1,9 @@ +# AudioMuse-AI Testing & Comparison Suite +# Compares two instances (e.g., main branch vs feature branch) across: +# - API endpoints (results, response shapes, status codes) +# - Database quality (schema, data integrity, embeddings, track counts) +# - Docker container health and logs +# - Performance benchmarks (latency, throughput) +# - Existing unit and integration tests + +__version__ = "1.0.0" diff --git a/testing_suite/__main__.py b/testing_suite/__main__.py new file mode 100644 index 00000000..018ad6bd --- /dev/null +++ b/testing_suite/__main__.py @@ -0,0 +1,5 @@ +"""Allow running the testing suite as a module: python -m testing_suite""" +from testing_suite.run_comparison import main +import sys + +sys.exit(main()) diff --git a/testing_suite/comparators/__init__.py b/testing_suite/comparators/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/testing_suite/comparators/api_comparator.py b/testing_suite/comparators/api_comparator.py new file mode 100644 index 00000000..fecb265d --- /dev/null +++ b/testing_suite/comparators/api_comparator.py @@ -0,0 +1,760 @@ +""" +API Comparison Module for AudioMuse-AI Testing Suite. 
+ +Tests all API endpoints on both instances and compares: + - HTTP status codes + - Response shapes (keys, types, list lengths) + - Response content (values where deterministic) + - Error handling and edge cases + - Endpoint availability + - Task lifecycle (start -> poll -> success) +""" + +import json +import logging +import time +import warnings +from typing import Any, Dict, List, Optional, Tuple + +from testing_suite.config import ComparisonConfig, InstanceConfig +from testing_suite.utils import ( + ComparisonReport, TestResult, TestStatus, + http_get, http_post, timed_request, wait_for_task_success, pct_diff +) + +logger = logging.getLogger(__name__) + + +class APIComparator: + """Tests and compares API endpoints across two AudioMuse-AI instances.""" + + def __init__(self, config: ComparisonConfig): + self.config = config + self.url_a = config.instance_a.api_url.rstrip('/') + self.url_b = config.instance_b.api_url.rstrip('/') + self.name_a = config.instance_a.name + self.name_b = config.instance_b.name + self.timeout = config.api_timeout + self.retries = config.api_retries + self.retry_delay = config.api_retry_delay + + def run_all(self, report: ComparisonReport): + """Run all API comparison tests.""" + logger.info("Starting API comparison tests...") + + # Check connectivity first + alive_a = self._check_alive(self.url_a) + alive_b = self._check_alive(self.url_b) + + report.add_result(TestResult( + category="api", + name="Instance A connectivity", + status=TestStatus.PASS if alive_a else TestStatus.ERROR, + message=f"{self.url_a}: {'reachable' if alive_a else 'unreachable'}", + instance_a_value=alive_a, + )) + report.add_result(TestResult( + category="api", + name="Instance B connectivity", + status=TestStatus.PASS if alive_b else TestStatus.ERROR, + message=f"{self.url_b}: {'reachable' if alive_b else 'unreachable'}", + instance_b_value=alive_b, + )) + + if not alive_a and not alive_b: + report.add_result(TestResult( + category="api", + name="API Tests", + 
status=TestStatus.ERROR, + message="Neither instance is reachable; skipping all API tests", + )) + return + + # Run endpoint tests + self._test_config_endpoint(report, alive_a, alive_b) + self._test_playlists_endpoint(report, alive_a, alive_b) + self._test_active_tasks_endpoint(report, alive_a, alive_b) + self._test_last_task_endpoint(report, alive_a, alive_b) + self._test_search_tracks_endpoint(report, alive_a, alive_b) + self._test_similar_tracks_endpoint(report, alive_a, alive_b) + self._test_max_distance_endpoint(report, alive_a, alive_b) + self._test_map_endpoint(report, alive_a, alive_b) + self._test_map_cache_status(report, alive_a, alive_b) + self._test_clap_stats(report, alive_a, alive_b) + self._test_clap_warmup_status(report, alive_a, alive_b) + self._test_clap_top_queries(report, alive_a, alive_b) + self._test_setup_status(report, alive_a, alive_b) + self._test_setup_providers(report, alive_a, alive_b) + self._test_setup_settings(report, alive_a, alive_b) + self._test_setup_server_info(report, alive_a, alive_b) + self._test_provider_types(report, alive_a, alive_b) + self._test_providers_enabled(report, alive_a, alive_b) + self._test_cron_entries(report, alive_a, alive_b) + self._test_waveform_endpoint(report, alive_a, alive_b) + self._test_find_path_endpoint(report, alive_a, alive_b) + self._test_sonic_fingerprint(report, alive_a, alive_b) + self._test_alchemy_endpoint(report, alive_a, alive_b) + self._test_artist_projections(report, alive_a, alive_b) + self._test_search_artists(report, alive_a, alive_b) + self._test_external_search(report, alive_a, alive_b) + self._test_chat_config_defaults(report, alive_a, alive_b) + self._test_error_handling(report, alive_a, alive_b) + self._test_collection_last_task(report, alive_a, alive_b) + + logger.info("API comparison tests complete.") + + # ------------------------------------------------------------------ + # Connectivity + # ------------------------------------------------------------------ + + def 
_check_alive(self, url: str) -> bool: + """Check if an instance is reachable.""" + try: + resp = http_get(f"{url}/api/config", timeout=15, retries=2, retry_delay=1) + return resp.status_code == 200 + except Exception: + return False + + # ------------------------------------------------------------------ + # Helper: compare GET endpoint on both instances + # ------------------------------------------------------------------ + + def _compare_get(self, report: ComparisonReport, path: str, test_name: str, + params: dict = None, alive_a: bool = True, alive_b: bool = True, + expected_status: int = 200, check_keys: list = None, + compare_list_length: bool = False): + """ + Hit a GET endpoint on both instances and compare the results. + Adds test results to the report. + """ + t0 = time.time() + resp_a = resp_b = None + data_a = data_b = None + + try: + if alive_a: + resp_a, lat_a = timed_request("GET", f"{self.url_a}{path}", + params=params, timeout=self.timeout, + retries=self.retries, retry_delay=self.retry_delay) + if alive_b: + resp_b, lat_b = timed_request("GET", f"{self.url_b}{path}", + params=params, timeout=self.timeout, + retries=self.retries, retry_delay=self.retry_delay) + except Exception as e: + report.add_result(TestResult( + category="api", + name=f"{test_name}: request", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + return None, None + + # Status code comparison + status_a = resp_a.status_code if resp_a else None + status_b = resp_b.status_code if resp_b else None + + if alive_a and alive_b: + if status_a == expected_status and status_b == expected_status: + status = TestStatus.PASS + msg = f"Both returned {expected_status}" + elif status_a == status_b: + status = TestStatus.WARN + msg = f"Both returned {status_a} (expected {expected_status})" + else: + status = TestStatus.FAIL + msg = f"Status codes differ: A={status_a}, B={status_b}" + + report.add_result(TestResult( + category="api", + name=f"{test_name}: 
status code", + status=status, + message=msg, + instance_a_value=status_a, + instance_b_value=status_b, + duration_seconds=time.time() - t0, + details={"latency_a": lat_a if alive_a else None, + "latency_b": lat_b if alive_b else None}, + )) + + # Parse JSON response + try: + if resp_a and resp_a.status_code == expected_status: + data_a = resp_a.json() + if resp_b and resp_b.status_code == expected_status: + data_b = resp_b.json() + except Exception as e: + report.add_result(TestResult( + category="api", + name=f"{test_name}: JSON parse", + status=TestStatus.ERROR, + message=f"JSON parse error: {e}", + duration_seconds=time.time() - t0, + )) + return data_a, data_b + + # Key comparison (if both have JSON data) + if data_a is not None and data_b is not None: + if isinstance(data_a, dict) and isinstance(data_b, dict): + keys_a = set(data_a.keys()) + keys_b = set(data_b.keys()) + if keys_a == keys_b: + key_status = TestStatus.PASS + key_msg = f"Same keys: {sorted(keys_a)}" + else: + key_status = TestStatus.FAIL + missing_b = keys_a - keys_b + missing_a = keys_b - keys_a + key_msg = f"Keys differ: only_A={missing_b}, only_B={missing_a}" + + report.add_result(TestResult( + category="api", + name=f"{test_name}: response shape", + status=key_status, + message=key_msg, + instance_a_value=sorted(keys_a), + instance_b_value=sorted(keys_b), + duration_seconds=time.time() - t0, + )) + + if isinstance(data_a, list) and isinstance(data_b, list): + if compare_list_length: + len_a = len(data_a) + len_b = len(data_b) + if len_a == len_b: + l_status = TestStatus.PASS + l_msg = f"Same list length: {len_a}" + else: + diff = pct_diff(len_a, len_b) + l_status = TestStatus.WARN if diff <= 20 else TestStatus.FAIL + l_msg = f"List lengths differ: A={len_a}, B={len_b} ({diff:.1f}%)" + + report.add_result(TestResult( + category="api", + name=f"{test_name}: list length", + status=l_status, + message=l_msg, + instance_a_value=len_a, + instance_b_value=len_b, + duration_seconds=time.time() - 
t0, + )) + + # Check specific keys exist + if check_keys and isinstance(data_a, dict) and isinstance(data_b, dict): + for key in check_keys: + has_a = key in data_a + has_b = key in data_b + if has_a and has_b: + kstatus = TestStatus.PASS + elif has_a or has_b: + kstatus = TestStatus.FAIL + else: + kstatus = TestStatus.WARN + + report.add_result(TestResult( + category="api", + name=f"{test_name}: key '{key}'", + status=kstatus, + message=f"A has '{key}': {has_a}, B has '{key}': {has_b}", + duration_seconds=time.time() - t0, + )) + + return data_a, data_b + + def _compare_post(self, report: ComparisonReport, path: str, test_name: str, + json_data: dict = None, alive_a: bool = True, alive_b: bool = True, + expected_status: int = 200, check_keys: list = None): + """Hit a POST endpoint on both instances and compare results.""" + t0 = time.time() + resp_a = resp_b = None + data_a = data_b = None + + try: + if alive_a: + resp_a, lat_a = timed_request("POST", f"{self.url_a}{path}", + json_data=json_data, timeout=self.timeout, + retries=self.retries, retry_delay=self.retry_delay) + if alive_b: + resp_b, lat_b = timed_request("POST", f"{self.url_b}{path}", + json_data=json_data, timeout=self.timeout, + retries=self.retries, retry_delay=self.retry_delay) + except Exception as e: + report.add_result(TestResult( + category="api", + name=f"{test_name}: request", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + return None, None + + status_a = resp_a.status_code if resp_a else None + status_b = resp_b.status_code if resp_b else None + + if alive_a and alive_b: + if status_a == expected_status and status_b == expected_status: + status = TestStatus.PASS + msg = f"Both returned {expected_status}" + elif status_a == status_b: + status = TestStatus.WARN + msg = f"Both returned {status_a} (expected {expected_status})" + else: + status = TestStatus.FAIL + msg = f"Status codes differ: A={status_a}, B={status_b}" + + report.add_result(TestResult( + 
category="api", + name=f"{test_name}: status code", + status=status, + message=msg, + instance_a_value=status_a, + instance_b_value=status_b, + duration_seconds=time.time() - t0, + details={"latency_a": lat_a if alive_a else None, + "latency_b": lat_b if alive_b else None}, + )) + + try: + if resp_a and resp_a.status_code == expected_status: + data_a = resp_a.json() + if resp_b and resp_b.status_code == expected_status: + data_b = resp_b.json() + except Exception: + pass + + if data_a is not None and data_b is not None and isinstance(data_a, dict) and isinstance(data_b, dict): + keys_a = set(data_a.keys()) + keys_b = set(data_b.keys()) + if keys_a == keys_b: + report.add_result(TestResult( + category="api", name=f"{test_name}: response shape", + status=TestStatus.PASS, message=f"Same keys: {sorted(keys_a)}", + duration_seconds=time.time() - t0, + )) + else: + report.add_result(TestResult( + category="api", name=f"{test_name}: response shape", + status=TestStatus.FAIL, + message=f"Keys differ: only_A={keys_a - keys_b}, only_B={keys_b - keys_a}", + duration_seconds=time.time() - t0, + )) + + if check_keys: + for key in check_keys: + has_a = key in data_a + has_b = key in data_b + report.add_result(TestResult( + category="api", name=f"{test_name}: key '{key}'", + status=TestStatus.PASS if (has_a and has_b) else TestStatus.FAIL, + message=f"A: {has_a}, B: {has_b}", + duration_seconds=time.time() - t0, + )) + + return data_a, data_b + + # ------------------------------------------------------------------ + # Individual endpoint tests + # ------------------------------------------------------------------ + + def _test_config_endpoint(self, report, alive_a, alive_b): + self._compare_get(report, "/api/config", "GET /api/config", + alive_a=alive_a, alive_b=alive_b) + + def _test_playlists_endpoint(self, report, alive_a, alive_b): + self._compare_get(report, "/api/playlists", "GET /api/playlists", + alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + def 
_test_active_tasks_endpoint(self, report, alive_a, alive_b): + self._compare_get(report, "/api/active_tasks", "GET /api/active_tasks", + alive_a=alive_a, alive_b=alive_b) + + def _test_last_task_endpoint(self, report, alive_a, alive_b): + self._compare_get(report, "/api/last_task", "GET /api/last_task", + alive_a=alive_a, alive_b=alive_b) + + def _test_search_tracks_endpoint(self, report, alive_a, alive_b): + params = { + "artist": self.config.test_track_artist_1, + "title": self.config.test_track_title_1, + } + data_a, data_b = self._compare_get( + report, "/api/search_tracks", "GET /api/search_tracks", + params=params, alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + # Validate response has expected track fields + t0 = time.time() + for label, data in [("A", data_a), ("B", data_b)]: + if data and isinstance(data, list) and data: + track = data[0] + expected = {"item_id", "title"} + present = expected.intersection(track.keys()) + if present == expected: + report.add_result(TestResult( + category="api", + name=f"GET /api/search_tracks: {label} track fields", + status=TestStatus.PASS, + message=f"Track has required fields: {expected}", + duration_seconds=time.time() - t0, + )) + else: + report.add_result(TestResult( + category="api", + name=f"GET /api/search_tracks: {label} track fields", + status=TestStatus.FAIL, + message=f"Missing fields: {expected - present}. 
Has: {set(track.keys())}", + duration_seconds=time.time() - t0, + )) + + def _test_similar_tracks_endpoint(self, report, alive_a, alive_b): + params = { + "title": self.config.test_track_title_1, + "artist": self.config.test_track_artist_1, + "n": 5, + } + data_a, data_b = self._compare_get( + report, "/api/similar_tracks", "GET /api/similar_tracks", + params=params, alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + # Validate result tracks have item_id + t0 = time.time() + for label, data in [("A", data_a), ("B", data_b)]: + if data and isinstance(data, list): + has_ids = all('item_id' in t for t in data) + report.add_result(TestResult( + category="api", + name=f"GET /api/similar_tracks: {label} item_ids present", + status=TestStatus.PASS if has_ids else TestStatus.FAIL, + message=f"All tracks have item_id: {has_ids} ({len(data)} tracks)", + duration_seconds=time.time() - t0, + )) + + def _test_max_distance_endpoint(self, report, alive_a, alive_b): + self._compare_get(report, "/api/max_distance", "GET /api/max_distance", + alive_a=alive_a, alive_b=alive_b) + + def _test_map_endpoint(self, report, alive_a, alive_b): + data_a, data_b = self._compare_get( + report, "/api/map", "GET /api/map", + params={"percent": 10}, alive_a=alive_a, alive_b=alive_b, + check_keys=["items"]) + + # Validate items structure + t0 = time.time() + for label, data in [("A", data_a), ("B", data_b)]: + if data and isinstance(data, dict) and "items" in data: + items = data["items"] + if isinstance(items, list) and items: + report.add_result(TestResult( + category="api", + name=f"GET /api/map: {label} items non-empty", + status=TestStatus.PASS, + message=f"{len(items)} items returned", + duration_seconds=time.time() - t0, + )) + else: + report.add_result(TestResult( + category="api", + name=f"GET /api/map: {label} items non-empty", + status=TestStatus.WARN, + message=f"Empty items list", + duration_seconds=time.time() - t0, + )) + + def _test_map_cache_status(self, report, 
alive_a, alive_b): + self._compare_get(report, "/api/map_cache_status", "GET /api/map_cache_status", + alive_a=alive_a, alive_b=alive_b) + + def _test_clap_stats(self, report, alive_a, alive_b): + self._compare_get(report, "/api/clap/stats", "GET /api/clap/stats", + alive_a=alive_a, alive_b=alive_b) + + def _test_clap_warmup_status(self, report, alive_a, alive_b): + self._compare_get(report, "/api/clap/warmup/status", "GET /api/clap/warmup/status", + alive_a=alive_a, alive_b=alive_b) + + def _test_clap_top_queries(self, report, alive_a, alive_b): + self._compare_get(report, "/api/clap/top_queries", "GET /api/clap/top_queries", + alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + def _test_setup_status(self, report, alive_a, alive_b): + self._compare_get(report, "/api/setup/status", "GET /api/setup/status", + alive_a=alive_a, alive_b=alive_b) + + def _test_setup_providers(self, report, alive_a, alive_b): + self._compare_get(report, "/api/setup/providers", "GET /api/setup/providers", + alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + def _test_setup_settings(self, report, alive_a, alive_b): + self._compare_get(report, "/api/setup/settings", "GET /api/setup/settings", + alive_a=alive_a, alive_b=alive_b) + + def _test_setup_server_info(self, report, alive_a, alive_b): + self._compare_get(report, "/api/setup/server-info", "GET /api/setup/server-info", + alive_a=alive_a, alive_b=alive_b) + + def _test_provider_types(self, report, alive_a, alive_b): + self._compare_get(report, "/api/setup/providers/types", "GET /api/setup/providers/types", + alive_a=alive_a, alive_b=alive_b) + + def _test_providers_enabled(self, report, alive_a, alive_b): + self._compare_get(report, "/api/providers/enabled", "GET /api/providers/enabled", + alive_a=alive_a, alive_b=alive_b) + + def _test_cron_entries(self, report, alive_a, alive_b): + self._compare_get(report, "/api/cron", "GET /api/cron", + alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + 
def _test_waveform_endpoint(self, report, alive_a, alive_b): + # Waveform needs a track query param - test without to verify error handling + self._compare_get(report, "/api/waveform", "GET /api/waveform (no params)", + alive_a=alive_a, alive_b=alive_b, + expected_status=400) + + def _test_find_path_endpoint(self, report, alive_a, alive_b): + """Test /api/find_path by first finding two track IDs.""" + t0 = time.time() + try: + # Find track IDs from both instances + id_a_start = self._find_track_id(self.url_a, + self.config.test_track_artist_1, + self.config.test_track_title_1) if alive_a else None + id_a_end = self._find_track_id(self.url_a, + self.config.test_track_artist_2, + self.config.test_track_title_2) if alive_a else None + id_b_start = self._find_track_id(self.url_b, + self.config.test_track_artist_1, + self.config.test_track_title_1) if alive_b else None + id_b_end = self._find_track_id(self.url_b, + self.config.test_track_artist_2, + self.config.test_track_title_2) if alive_b else None + + for label, url, start_id, end_id in [ + ("A", self.url_a, id_a_start, id_a_end), + ("B", self.url_b, id_b_start, id_b_end), + ]: + if not start_id or not end_id: + report.add_result(TestResult( + category="api", + name=f"GET /api/find_path ({label}): track lookup", + status=TestStatus.SKIP, + message="Could not find test tracks", + duration_seconds=time.time() - t0, + )) + continue + + resp, lat = timed_request("GET", f"{url}/api/find_path", + params={"start_song_id": start_id, + "end_song_id": end_id, + "max_steps": 10}, + timeout=self.timeout, retries=self.retries, + retry_delay=self.retry_delay) + + if resp.status_code == 200: + data = resp.json() + path = data.get('path', data) if isinstance(data, dict) else data + path_len = len(path) if isinstance(path, list) else 0 + report.add_result(TestResult( + category="api", + name=f"GET /api/find_path ({label})", + status=TestStatus.PASS if path_len > 0 else TestStatus.WARN, + message=f"Path length: {path_len}, latency: 
{lat:.2f}s", + instance_a_value=path_len if label == "A" else None, + instance_b_value=path_len if label == "B" else None, + duration_seconds=time.time() - t0, + details={"latency": lat}, + )) + else: + report.add_result(TestResult( + category="api", + name=f"GET /api/find_path ({label})", + status=TestStatus.FAIL, + message=f"Status {resp.status_code}: {resp.text[:200]}", + duration_seconds=time.time() - t0, + )) + except Exception as e: + report.add_result(TestResult( + category="api", + name="GET /api/find_path", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + + def _test_sonic_fingerprint(self, report, alive_a, alive_b): + """Test sonic fingerprint generation on both instances.""" + payload = {"n": 1, "jellyfin_user_identifier": "admin", "jellyfin_token": ""} + self._compare_post(report, "/api/sonic_fingerprint/generate", + "POST /api/sonic_fingerprint/generate", + json_data=payload, alive_a=alive_a, alive_b=alive_b) + + def _test_alchemy_endpoint(self, report, alive_a, alive_b): + """Test song alchemy (requires track IDs).""" + t0 = time.time() + try: + for label, url, alive in [("A", self.url_a, alive_a), ("B", self.url_b, alive_b)]: + if not alive: + continue + + add_id = self._find_track_id(url, self.config.test_track_artist_1, + self.config.test_track_title_1) + sub_id = self._find_track_id(url, self.config.test_track_artist_2, + self.config.test_track_title_2) + + if not add_id or not sub_id: + report.add_result(TestResult( + category="api", + name=f"POST /api/alchemy ({label}): track lookup", + status=TestStatus.SKIP, + message="Could not find test tracks for alchemy", + duration_seconds=time.time() - t0, + )) + continue + + payload = { + "items": [ + {"id": add_id, "op": "ADD"}, + {"id": sub_id, "op": "SUBTRACT"}, + ], + "n": 5, + "temperature": 1, + "subtract_distance": 0.2, + } + + resp, lat = timed_request("POST", f"{url}/api/alchemy", + json_data=payload, timeout=self.timeout, + retries=self.retries, 
retry_delay=self.retry_delay) + + if resp.status_code == 200: + data = resp.json() + expected_keys = {"results", "projection"} + has_keys = expected_keys.issubset(data.keys()) if isinstance(data, dict) else False + results_count = len(data.get("results", [])) if isinstance(data, dict) else 0 + + report.add_result(TestResult( + category="api", + name=f"POST /api/alchemy ({label})", + status=TestStatus.PASS if has_keys and results_count > 0 else TestStatus.WARN, + message=f"Has expected keys: {has_keys}, results: {results_count}, latency: {lat:.2f}s", + duration_seconds=time.time() - t0, + details={"latency": lat, "result_count": results_count}, + )) + else: + report.add_result(TestResult( + category="api", + name=f"POST /api/alchemy ({label})", + status=TestStatus.FAIL, + message=f"Status {resp.status_code}: {resp.text[:200]}", + duration_seconds=time.time() - t0, + )) + except Exception as e: + report.add_result(TestResult( + category="api", + name="POST /api/alchemy", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + + def _test_artist_projections(self, report, alive_a, alive_b): + self._compare_get(report, "/api/artist_projections", "GET /api/artist_projections", + alive_a=alive_a, alive_b=alive_b) + + def _test_search_artists(self, report, alive_a, alive_b): + self._compare_get(report, "/api/search_artists", "GET /api/search_artists", + params={"q": "Red Hot"}, alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + def _test_external_search(self, report, alive_a, alive_b): + self._compare_get(report, "/external/search", "GET /external/search", + params={"q": "piano"}, alive_a=alive_a, alive_b=alive_b, + compare_list_length=True) + + def _test_chat_config_defaults(self, report, alive_a, alive_b): + self._compare_get(report, "/chat/api/config_defaults", "GET /chat/api/config_defaults", + alive_a=alive_a, alive_b=alive_b) + + def _test_collection_last_task(self, report, alive_a, alive_b): + self._compare_get(report, 
"/api/collection/last_task", "GET /api/collection/last_task", + alive_a=alive_a, alive_b=alive_b) + + # ------------------------------------------------------------------ + # Error handling tests + # ------------------------------------------------------------------ + + def _test_error_handling(self, report, alive_a, alive_b): + """Test that both instances handle errors consistently.""" + error_cases = [ + ("/api/status/nonexistent_task_id_12345", "Nonexistent task status", 200), + ("/api/track", "Track without item_id", 400), + ("/api/similar_tracks", "Similar tracks without params", 400), + ] + + for path, desc, expected_status in error_cases: + t0 = time.time() + try: + resp_a = http_get(f"{self.url_a}{path}", timeout=15, retries=1) if alive_a else None + resp_b = http_get(f"{self.url_b}{path}", timeout=15, retries=1) if alive_b else None + + status_a = resp_a.status_code if resp_a else None + status_b = resp_b.status_code if resp_b else None + + if alive_a and alive_b: + if status_a == status_b: + report.add_result(TestResult( + category="api", + name=f"Error handling: {desc}", + status=TestStatus.PASS, + message=f"Consistent error codes: {status_a}", + instance_a_value=status_a, + instance_b_value=status_b, + duration_seconds=time.time() - t0, + )) + else: + report.add_result(TestResult( + category="api", + name=f"Error handling: {desc}", + status=TestStatus.WARN, + message=f"Different error codes: A={status_a}, B={status_b}", + instance_a_value=status_a, + instance_b_value=status_b, + duration_seconds=time.time() - t0, + )) + except Exception as e: + report.add_result(TestResult( + category="api", + name=f"Error handling: {desc}", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Helpers + # ------------------------------------------------------------------ + + def _find_track_id(self, base_url: str, artist: str, title: str) -> Optional[str]: + 
"""Find a track's item_id via the search API.""" + try: + resp = http_get(f"{base_url}/api/search_tracks", + params={"artist": artist, "title": title}, + timeout=30, retries=2, retry_delay=1) + if resp.status_code == 200: + results = resp.json() + if isinstance(results, list) and results: + # Try exact match first + for track in results: + track_artist = track.get("author") or track.get("artist") or "" + if track_artist.lower() == artist.lower() and \ + track.get("title", "").lower() == title.lower(): + return track["item_id"] + # Fallback to first result + return results[0].get("item_id") + except Exception as e: + logger.debug(f"Track search failed: {e}") + return None diff --git a/testing_suite/comparators/db_comparator.py b/testing_suite/comparators/db_comparator.py new file mode 100644 index 00000000..41d5e5ec --- /dev/null +++ b/testing_suite/comparators/db_comparator.py @@ -0,0 +1,1142 @@ +""" +Database Comparison Module for AudioMuse-AI Testing Suite. + +Compares two PostgreSQL instances across: + - Schema presence and structure (all expected tables and columns) + - Row counts and data volume + - Data quality (NULL rates, value distributions, outliers) + - Embedding integrity (dimensions, NaN checks, storage sizes) + - Index and constraint validation + - Cross-table referential integrity + - Score/analysis value distributions + - Playlist quality metrics +""" + +import json +import logging +import struct +import time +from typing import Any, Dict, List, Optional, Tuple + +from testing_suite.config import ComparisonConfig, InstanceConfig +from testing_suite.utils import ( + ComparisonReport, TestResult, TestStatus, + pg_query, pg_query_dict, pg_scalar, pct_diff +) + +logger = logging.getLogger(__name__) + +# --------------------------------------------------------------------------- +# Expected schema definition (ground truth) +# --------------------------------------------------------------------------- + +EXPECTED_TABLES = { + "score": [ + "item_id", 
"title", "author", "album", "album_artist", + "tempo", "key", "scale", "mood_vector", "energy", + "other_features", "year", "rating", "file_path", "track_id" + ], + "embedding": ["item_id", "embedding"], + "clap_embedding": ["item_id", "embedding"], + "playlist": ["id", "playlist_name", "item_id", "title", "author"], + "task_status": [ + "id", "task_id", "parent_task_id", "task_type", "sub_type_identifier", + "status", "progress", "details", "timestamp", "start_time", "end_time" + ], + "voyager_index_data": [ + "index_name", "index_data", "id_map_json", "embedding_dimension", "created_at" + ], + "artist_index_data": [ + "index_name", "index_data", "artist_map_json", "gmm_params_json", "created_at" + ], + "map_projection_data": [ + "index_name", "projection_data", "id_map_json", "embedding_dimension", "created_at" + ], + "artist_component_projection": [ + "index_name", "projection_data", "artist_component_map_json", "created_at" + ], + "cron": ["id", "name", "task_type", "cron_expr", "enabled", "last_run", "created_at"], + "artist_mapping": ["artist_name", "artist_id"], + "text_search_queries": ["id", "query_text", "score", "rank", "created_at"], + "provider": [ + "id", "provider_type", "name", "config", "enabled", + "priority", "created_at", "updated_at" + ], + "track": [ + "id", "file_path_hash", "file_path", "normalized_path", + "file_size", "file_modified", "created_at", "updated_at" + ], + "provider_track": [ + "id", "provider_id", "track_id", "item_id", + "title", "artist", "album", "last_synced" + ], + "app_settings": ["key", "value", "category", "description", "updated_at"], +} + +# Critical columns that should not be NULL in the score table +SCORE_CRITICAL_COLUMNS = ["item_id", "title", "author", "tempo", "key", "scale", "mood_vector"] + +# Columns to check for statistical distribution in score +SCORE_NUMERIC_COLUMNS = ["tempo", "energy"] + + +def _safe_dsn_connect(dsn: str, instance_name: str) -> bool: + """Test if we can connect to the database.""" + try: 
+ pg_scalar(dsn, "SELECT 1") + return True + except Exception as e: + logger.warning(f"Cannot connect to {instance_name} database: {e}") + return False + + +class DatabaseComparator: + """Compares two PostgreSQL database instances.""" + + def __init__(self, config: ComparisonConfig): + self.config = config + self.dsn_a = config.instance_a.pg_dsn + self.dsn_b = config.instance_b.pg_dsn + self.name_a = config.instance_a.name + self.name_b = config.instance_b.name + + def run_all(self, report: ComparisonReport): + """Run all database comparison tests and add results to report.""" + logger.info("Starting database comparison tests...") + + # Check connectivity first + can_a = _safe_dsn_connect(self.dsn_a, self.name_a) + can_b = _safe_dsn_connect(self.dsn_b, self.name_b) + + if not can_a and not can_b: + report.add_result(TestResult( + category="database", + name="DB Connectivity", + status=TestStatus.ERROR, + message="Cannot connect to either database instance" + )) + return + + if not can_a or not can_b: + report.add_result(TestResult( + category="database", + name="DB Connectivity", + status=TestStatus.WARN, + message=f"Only connected to {'A' if can_a else 'B'} instance" + )) + + # Run test suites + if can_a and can_b: + self._test_schema_comparison(report) + self._test_row_counts(report) + self._test_data_quality(report) + self._test_embedding_integrity(report) + self._test_referential_integrity(report) + self._test_score_distributions(report) + self._test_playlist_quality(report) + self._test_index_data_presence(report) + self._test_task_status_health(report) + self._test_provider_config(report) + self._test_app_settings(report) + elif can_a or can_b: + # Single-instance validation + dsn = self.dsn_a if can_a else self.dsn_b + name = self.name_a if can_a else self.name_b + self._test_single_instance_schema(report, dsn, name) + self._test_single_instance_quality(report, dsn, name) + + logger.info("Database comparison tests complete.") + + # 
    # ------------------------------------------------------------------
    # Schema comparison
    # ------------------------------------------------------------------

    def _test_schema_comparison(self, report: ComparisonReport):
        """Compare table existence and column structure between instances.

        For every table in EXPECTED_TABLES, emits one result per table:
        SKIP when the table is absent from both sides, FAIL when it exists
        on only one side or the column sets differ, WARN when the columns
        match each other but some expected columns are missing, PASS otherwise.
        """
        for table_name, expected_cols in EXPECTED_TABLES.items():
            t0 = time.time()
            try:
                # _get_table_columns is expected to return None when the
                # table does not exist (vs. [] for an empty column list).
                cols_a = self._get_table_columns(self.dsn_a, table_name)
                cols_b = self._get_table_columns(self.dsn_b, table_name)

                table_exists_a = cols_a is not None
                table_exists_b = cols_b is not None

                if not table_exists_a and not table_exists_b:
                    # Optional tables like mulan_embedding may not exist
                    report.add_result(TestResult(
                        category="database",
                        name=f"Schema: {table_name} existence",
                        status=TestStatus.SKIP,
                        message=f"Table '{table_name}' does not exist in either instance",
                        duration_seconds=time.time() - t0,
                    ))
                    continue

                if table_exists_a != table_exists_b:
                    report.add_result(TestResult(
                        category="database",
                        name=f"Schema: {table_name} existence",
                        status=TestStatus.FAIL,
                        message=f"Table '{table_name}' exists in {'A only' if table_exists_a else 'B only'}",
                        instance_a_value=table_exists_a,
                        instance_b_value=table_exists_b,
                        duration_seconds=time.time() - t0,
                    ))
                    continue

                # Compare columns (A vs B, order-insensitive)
                set_a = set(cols_a)
                set_b = set(cols_b)
                missing_in_b = set_a - set_b
                missing_in_a = set_b - set_a

                if set_a == set_b:
                    status = TestStatus.PASS
                    msg = f"Columns match ({len(set_a)} columns)"
                else:
                    status = TestStatus.FAIL
                    msg = f"Column mismatch: missing_in_B={missing_in_b}, missing_in_A={missing_in_a}"

                # Also check against expected columns; only downgrades
                # PASS to WARN, never upgrades a FAIL.
                expected_set = set(expected_cols)
                missing_expected_a = expected_set - set_a
                missing_expected_b = expected_set - set_b

                if missing_expected_a or missing_expected_b:
                    if status == TestStatus.PASS:
                        status = TestStatus.WARN
                    msg += f" | Expected cols missing: A={missing_expected_a or 'none'}, B={missing_expected_b or 'none'}"

                report.add_result(TestResult(
                    category="database",
                    name=f"Schema: {table_name} columns",
                    status=status,
                    message=msg,
                    instance_a_value=sorted(set_a),
                    instance_b_value=sorted(set_b),
                    duration_seconds=time.time() - t0,
                ))
            except Exception as e:
                report.add_result(TestResult(
                    category="database",
                    name=f"Schema: {table_name}",
                    status=TestStatus.ERROR,
                    message=str(e),
                    duration_seconds=time.time() - t0,
                ))

    # ------------------------------------------------------------------
    # Row counts
    # ------------------------------------------------------------------

    def _test_row_counts(self, report: ComparisonReport):
        """Compare row counts across all tables.

        Equal counts PASS; a relative difference within
        config.db_row_count_tolerance_pct is a WARN, beyond it a FAIL.
        """
        tables_to_count = [
            "score", "embedding", "clap_embedding", "playlist",
            "task_status", "voyager_index_data", "artist_index_data",
            "map_projection_data", "cron", "artist_mapping",
            "text_search_queries", "provider", "track", "provider_track",
            "app_settings"
        ]
        for table_name in tables_to_count:
            t0 = time.time()
            try:
                # _safe_count returns None when the table does not exist.
                count_a = self._safe_count(self.dsn_a, table_name)
                count_b = self._safe_count(self.dsn_b, table_name)

                if count_a is None and count_b is None:
                    report.add_result(TestResult(
                        category="database",
                        name=f"Row Count: {table_name}",
                        status=TestStatus.SKIP,
                        message="Table does not exist in either instance",
                        duration_seconds=time.time() - t0,
                    ))
                    continue

                # Guard against both-zero to avoid a 0/0 percentage.
                diff_pct = pct_diff(count_a or 0, count_b or 0) if (count_a or count_b) else 0

                if count_a == count_b:
                    status = TestStatus.PASS
                    msg = f"Both have {count_a} rows"
                elif diff_pct <= self.config.db_row_count_tolerance_pct:
                    status = TestStatus.WARN
                    msg = f"A={count_a}, B={count_b} (diff {diff_pct:.1f}% within tolerance)"
                else:
                    status = TestStatus.FAIL
                    msg = f"A={count_a}, B={count_b} (diff {diff_pct:.1f}% exceeds {self.config.db_row_count_tolerance_pct}%)"

                report.add_result(TestResult(
                    category="database",
                    name=f"Row Count: {table_name}",
                    status=status,
                    message=msg,
                    instance_a_value=count_a,
                    instance_b_value=count_b,
                    diff=diff_pct,
                    duration_seconds=time.time() - t0,
                ))
            except Exception as e:
                report.add_result(TestResult(
                    category="database",
                    name=f"Row Count: {table_name}",
                    status=TestStatus.ERROR,
                    message=str(e),
                    duration_seconds=time.time() - t0,
                ))

    # ------------------------------------------------------------------
    # Data quality checks
    # ------------------------------------------------------------------

    def _test_data_quality(self, report: ComparisonReport):
        """Check NULL rates and data quality in the score table.

        Covers: NULL percentage of each critical score column, duplicate
        item_ids, and mood_vector format validity ("label:value" pairs).
        """
        for col in SCORE_CRITICAL_COLUMNS:
            t0 = time.time()
            try:
                # _null_percentage is expected to return None when the
                # table/column is unavailable on that side.
                null_pct_a = self._null_percentage(self.dsn_a, "score", col)
                null_pct_b = self._null_percentage(self.dsn_b, "score", col)

                if null_pct_a is None and null_pct_b is None:
                    continue

                threshold = self.config.db_score_null_threshold_pct
                problems = []
                if null_pct_a is not None and null_pct_a > threshold:
                    problems.append(f"A has {null_pct_a:.1f}% NULLs")
                if null_pct_b is not None and null_pct_b > threshold:
                    problems.append(f"B has {null_pct_b:.1f}% NULLs")

                if problems:
                    status = TestStatus.FAIL
                    msg = f"score.{col}: " + "; ".join(problems) + f" (threshold {threshold}%)"
                else:
                    # NOTE(review): if exactly one side returned None, this
                    # f-string formats None with :.1f and raises TypeError,
                    # which the except below reports as ERROR - confirm
                    # whether that is intended.
                    status = TestStatus.PASS
                    msg = f"score.{col}: A={null_pct_a:.1f}% NULL, B={null_pct_b:.1f}% NULL (OK)"

                report.add_result(TestResult(
                    category="database",
                    name=f"Data Quality: score.{col} NULLs",
                    status=status,
                    message=msg,
                    instance_a_value=null_pct_a,
                    instance_b_value=null_pct_b,
                    duration_seconds=time.time() - t0,
                ))
            except Exception as e:
                report.add_result(TestResult(
                    category="database",
                    name=f"Data Quality: score.{col}",
                    status=TestStatus.ERROR,
                    message=str(e),
                    duration_seconds=time.time() - t0,
                ))

        # Check for duplicate item_ids in score
        t0 = time.time()
        try:
            dupes_a = pg_scalar(self.dsn_a,
                "SELECT COUNT(*) FROM (SELECT item_id FROM score GROUP BY item_id HAVING COUNT(*) > 1) sub")
            dupes_b = pg_scalar(self.dsn_b,
                "SELECT COUNT(*) FROM (SELECT item_id FROM score GROUP BY item_id HAVING COUNT(*) > 1) sub")

            if (dupes_a or 0) == 0 and (dupes_b or 0) == 0:
                status = TestStatus.PASS
                msg = "No duplicate item_ids in either instance"
            else:
                status = TestStatus.FAIL
                msg = f"Duplicate item_ids: A={dupes_a}, B={dupes_b}"

            report.add_result(TestResult(
                category="database",
                name="Data Quality: score duplicate item_ids",
                status=status,
                message=msg,
                instance_a_value=dupes_a,
                instance_b_value=dupes_b,
                duration_seconds=time.time() - t0,
            ))
        except Exception as e:
            report.add_result(TestResult(
                category="database",
                name="Data Quality: score duplicates",
                status=TestStatus.ERROR,
                message=str(e),
                duration_seconds=time.time() - t0,
            ))

        # Check mood_vector format validity: a valid vector is expected to
        # contain at least one "label:value" pair (i.e. a colon).
        t0 = time.time()
        try:
            invalid_moods_a = pg_scalar(self.dsn_a, """
                SELECT COUNT(*) FROM score
                WHERE mood_vector IS NOT NULL
                AND mood_vector NOT LIKE '%:%'
            """)
            invalid_moods_b = pg_scalar(self.dsn_b, """
                SELECT COUNT(*) FROM score
                WHERE mood_vector IS NOT NULL
                AND mood_vector NOT LIKE '%:%'
            """)

            if (invalid_moods_a or 0) == 0 and (invalid_moods_b or 0) == 0:
                status = TestStatus.PASS
                msg = "All mood_vectors have valid format"
            else:
                status = TestStatus.WARN
                msg = f"Invalid mood_vector format: A={invalid_moods_a}, B={invalid_moods_b}"

            report.add_result(TestResult(
                category="database",
                name="Data Quality: mood_vector format",
                status=status,
                message=msg,
                instance_a_value=invalid_moods_a,
                instance_b_value=invalid_moods_b,
                duration_seconds=time.time() - t0,
            ))
        except Exception as e:
            report.add_result(TestResult(
                category="database",
                name="Data Quality: mood_vector format",
                status=TestStatus.ERROR,
                message=str(e),
                duration_seconds=time.time() - t0,
            ))
    # ------------------------------------------------------------------
    # Embedding integrity
    # ------------------------------------------------------------------

    def _test_embedding_integrity(self, report: ComparisonReport):
        """Check embedding dimensions, storage, and coverage.

        For each embedding table: coverage vs the score table (>=95% PASS,
        >=80% WARN, else FAIL), absence of NULL embeddings, and approximate
        dimension inferred from average byte length (float32 = 4 bytes/dim).
        """
        # NOTE(review): expected_dim is unpacked but never compared against
        # the approximate dimension below - confirm whether the dimension
        # check was meant to use it.
        for emb_table, expected_dim in [
            ("embedding", self.config.db_embedding_dimension_expected),
            ("clap_embedding", self.config.db_clap_dimension_expected),
        ]:
            t0 = time.time()
            try:
                count_a = self._safe_count(self.dsn_a, emb_table)
                count_b = self._safe_count(self.dsn_b, emb_table)
                score_count_a = self._safe_count(self.dsn_a, "score")
                score_count_b = self._safe_count(self.dsn_b, "score")

                if count_a is None and count_b is None:
                    report.add_result(TestResult(
                        category="database",
                        name=f"Embedding: {emb_table} existence",
                        status=TestStatus.SKIP,
                        message=f"Table {emb_table} does not exist",
                        duration_seconds=time.time() - t0,
                    ))
                    continue

                # Coverage check.
                # NOTE(review): if the table exists on only one side,
                # count_a/count_b can be None here and the division raises
                # (reported as ERROR by the except) - confirm intent.
                coverage_a = (count_a / score_count_a * 100) if score_count_a else 0
                coverage_b = (count_b / score_count_b * 100) if score_count_b else 0

                if coverage_a >= 95 and coverage_b >= 95:
                    status = TestStatus.PASS
                elif coverage_a >= 80 and coverage_b >= 80:
                    status = TestStatus.WARN
                else:
                    status = TestStatus.FAIL

                report.add_result(TestResult(
                    category="database",
                    name=f"Embedding: {emb_table} coverage",
                    status=status,
                    message=f"Coverage: A={coverage_a:.1f}% ({count_a}/{score_count_a}), "
                            f"B={coverage_b:.1f}% ({count_b}/{score_count_b})",
                    instance_a_value=coverage_a,
                    instance_b_value=coverage_b,
                    duration_seconds=time.time() - t0,
                ))

                # NULL embedding check
                null_emb_a = pg_scalar(self.dsn_a,
                    f"SELECT COUNT(*) FROM {emb_table} WHERE embedding IS NULL")
                null_emb_b = pg_scalar(self.dsn_b,
                    f"SELECT COUNT(*) FROM {emb_table} WHERE embedding IS NULL")

                if (null_emb_a or 0) == 0 and (null_emb_b or 0) == 0:
                    status = TestStatus.PASS
                    msg = "No NULL embeddings"
                else:
                    status = TestStatus.FAIL
                    msg = f"NULL embeddings: A={null_emb_a}, B={null_emb_b}"

                report.add_result(TestResult(
                    category="database",
                    name=f"Embedding: {emb_table} NULL check",
                    status=status,
                    message=msg,
                    instance_a_value=null_emb_a,
                    instance_b_value=null_emb_b,
                    duration_seconds=time.time() - t0,
                ))

                # Average embedding size (proxy for dimension check)
                avg_size_a = pg_scalar(self.dsn_a,
                    f"SELECT AVG(octet_length(embedding)) FROM {emb_table} WHERE embedding IS NOT NULL")
                avg_size_b = pg_scalar(self.dsn_b,
                    f"SELECT AVG(octet_length(embedding)) FROM {emb_table} WHERE embedding IS NOT NULL")

                if avg_size_a and avg_size_b:
                    # float32 = 4 bytes per dimension
                    approx_dim_a = int(float(avg_size_a) / 4) if avg_size_a else 0
                    approx_dim_b = int(float(avg_size_b) / 4) if avg_size_b else 0

                    if approx_dim_a == approx_dim_b:
                        status = TestStatus.PASS
                    else:
                        status = TestStatus.FAIL

                    report.add_result(TestResult(
                        category="database",
                        name=f"Embedding: {emb_table} avg dimension",
                        status=status,
                        message=f"Approx dimensions: A~{approx_dim_a}, B~{approx_dim_b} "
                                f"(avg bytes: A={float(avg_size_a):.0f}, B={float(avg_size_b):.0f})",
                        instance_a_value=approx_dim_a,
                        instance_b_value=approx_dim_b,
                        duration_seconds=time.time() - t0,
                    ))

            except Exception as e:
                report.add_result(TestResult(
                    category="database",
                    name=f"Embedding: {emb_table}",
                    status=TestStatus.ERROR,
                    message=str(e),
                    duration_seconds=time.time() - t0,
                ))

    # ------------------------------------------------------------------
    # Referential integrity
    # ------------------------------------------------------------------

    def _test_referential_integrity(self, report: ComparisonReport):
        """Check foreign key relationships are intact.

        Verifies that embedding rows reference existing score rows and that
        provider_track rows reference existing provider rows; the latter is
        SKIPped when the multi-provider tables are absent.
        """
        # Embeddings should all reference valid score rows
        for emb_table in ["embedding", "clap_embedding"]:
            t0 = time.time()
            try:
                orphans_a = pg_scalar(self.dsn_a, f"""
                    SELECT COUNT(*) FROM {emb_table} e
                    LEFT JOIN score s ON e.item_id = s.item_id
                    WHERE s.item_id IS NULL
                """)
                orphans_b = pg_scalar(self.dsn_b, f"""
                    SELECT COUNT(*) FROM {emb_table} e
                    LEFT JOIN score s ON e.item_id = s.item_id
                    WHERE s.item_id IS NULL
                """)

                if orphans_a is None and orphans_b is None:
                    continue

                if (orphans_a or 0) == 0 and (orphans_b or 0) == 0:
                    status = TestStatus.PASS
                    msg = f"No orphaned rows in {emb_table}"
                else:
                    status = TestStatus.FAIL
                    msg = f"Orphaned {emb_table} rows: A={orphans_a}, B={orphans_b}"

                report.add_result(TestResult(
                    category="database",
                    name=f"Referential: {emb_table} -> score",
                    status=status,
                    message=msg,
                    instance_a_value=orphans_a,
                    instance_b_value=orphans_b,
                    duration_seconds=time.time() - t0,
                ))
            except Exception as e:
                report.add_result(TestResult(
                    category="database",
                    name=f"Referential: {emb_table} -> score",
                    status=TestStatus.ERROR,
                    message=str(e),
                    duration_seconds=time.time() - t0,
                ))

        # provider_track -> provider and track references
        t0 = time.time()
        try:
            orphan_provider_a = pg_scalar(self.dsn_a, """
                SELECT COUNT(*) FROM provider_track pt
                LEFT JOIN provider p ON pt.provider_id = p.id
                WHERE p.id IS NULL
            """)
            orphan_provider_b = pg_scalar(self.dsn_b, """
                SELECT COUNT(*) FROM provider_track pt
                LEFT JOIN provider p ON pt.provider_id = p.id
                WHERE p.id IS NULL
            """)

            if (orphan_provider_a or 0) == 0 and (orphan_provider_b or 0) == 0:
                status = TestStatus.PASS
                msg = "No orphaned provider_track -> provider rows"
            else:
                status = TestStatus.FAIL
                msg = f"Orphaned provider refs: A={orphan_provider_a}, B={orphan_provider_b}"

            report.add_result(TestResult(
                category="database",
                name="Referential: provider_track -> provider",
                status=status,
                message=msg,
                instance_a_value=orphan_provider_a,
                instance_b_value=orphan_provider_b,
                duration_seconds=time.time() - t0,
            ))
        except Exception as e:
            # Tables may not exist in some deployments; detect the Postgres
            # "relation ... does not exist" error by message text.
            if "does not exist" in str(e).lower() or "relation" in str(e).lower():
                report.add_result(TestResult(
                    category="database",
                    name="Referential: provider_track -> provider",
                    status=TestStatus.SKIP,
                    message="Multi-provider tables not present",
                    duration_seconds=time.time() - t0,
                ))
            else:
                report.add_result(TestResult(
                    category="database",
                    name="Referential: provider_track -> provider",
                    status=TestStatus.ERROR,
                    message=str(e),
                    duration_seconds=time.time() - t0,
                ))

    # ------------------------------------------------------------------
    # Score distributions
    # ------------------------------------------------------------------

    def _test_score_distributions(self, report: ComparisonReport):
        """Compare statistical distributions of score columns.

        Numeric columns: mean difference <=10% PASS, <=25% WARN, else FAIL.
        Key values: identical sets PASS, otherwise WARN with the symmetric
        difference.
        """
        for col in SCORE_NUMERIC_COLUMNS:
            t0 = time.time()
            try:
                stats_a = self._get_column_stats(self.dsn_a, "score", col)
                stats_b = self._get_column_stats(self.dsn_b, "score", col)

                if not stats_a or not stats_b:
                    continue

                # Compare means
                mean_diff = pct_diff(stats_a['avg'], stats_b['avg']) if stats_a['avg'] and stats_b['avg'] else 0

                if mean_diff <= 10:
                    status = TestStatus.PASS
                elif mean_diff <= 25:
                    status = TestStatus.WARN
                else:
                    status = TestStatus.FAIL

                report.add_result(TestResult(
                    category="database",
                    name=f"Distribution: score.{col}",
                    status=status,
                    message=(
                        f"A: min={stats_a['min']:.3f}, max={stats_a['max']:.3f}, "
                        f"avg={stats_a['avg']:.3f}, stddev={stats_a['stddev']:.3f} | "
                        f"B: min={stats_b['min']:.3f}, max={stats_b['max']:.3f}, "
                        f"avg={stats_b['avg']:.3f}, stddev={stats_b['stddev']:.3f} | "
                        f"Mean diff: {mean_diff:.1f}%"
                    ),
                    instance_a_value=stats_a,
                    instance_b_value=stats_b,
                    diff=mean_diff,
                    duration_seconds=time.time() - t0,
                ))
            except Exception as e:
                report.add_result(TestResult(
                    category="database",
                    name=f"Distribution: score.{col}",
                    status=TestStatus.ERROR,
                    message=str(e),
                    duration_seconds=time.time() - t0,
                ))

        # Key distribution comparison
        t0 = time.time()
        try:
            keys_a = pg_query_dict(self.dsn_a,
                "SELECT key, COUNT(*) as cnt FROM score WHERE key IS NOT NULL GROUP BY key ORDER BY cnt DESC")
            keys_b = pg_query_dict(self.dsn_b,
                "SELECT key, COUNT(*) as cnt FROM score WHERE key IS NOT NULL GROUP BY key ORDER BY cnt DESC")

            keys_set_a = set(r['key'] for r in keys_a)
            keys_set_b = set(r['key'] for r in keys_b)

            if keys_set_a == keys_set_b:
                status = TestStatus.PASS
                msg = f"Same key values detected ({len(keys_set_a)} keys)"
            else:
                status = TestStatus.WARN
                diff_keys = keys_set_a.symmetric_difference(keys_set_b)
                msg = f"Key distribution differs: unique to one side: {diff_keys}"

            report.add_result(TestResult(
                category="database",
                name="Distribution: score.key values",
                status=status,
                message=msg,
                # Only the 12 most frequent keys are recorded per side.
                instance_a_value=[r['key'] for r in keys_a[:12]],
                instance_b_value=[r['key'] for r in keys_b[:12]],
                duration_seconds=time.time() - t0,
            ))
        except Exception as e:
            report.add_result(TestResult(
                category="database",
                name="Distribution: score.key values",
                status=TestStatus.ERROR,
                message=str(e),
                duration_seconds=time.time() - t0,
            ))

    # ------------------------------------------------------------------
    # Playlist quality
    # ------------------------------------------------------------------

    def _test_playlist_quality(self, report: ComparisonReport):
        """Check playlist table quality.

        Covers: distinct playlist counts (<=20% diff tolerated as WARN),
        average tracks per playlist, and NULL item_id rows.
        """
        t0 = time.time()
        try:
            # Distinct playlists
            pl_count_a = pg_scalar(self.dsn_a,
                "SELECT COUNT(DISTINCT playlist_name) FROM playlist")
            pl_count_b = pg_scalar(self.dsn_b,
                "SELECT COUNT(DISTINCT playlist_name) FROM playlist")

            diff = pct_diff(pl_count_a or 0, pl_count_b or 0)

            if pl_count_a == pl_count_b:
                status = TestStatus.PASS
            elif diff <= 20:
                status = TestStatus.WARN
            else:
                status = TestStatus.FAIL

            report.add_result(TestResult(
                category="database",
                name="Playlist: distinct count",
                status=status,
                message=f"Distinct playlists: A={pl_count_a}, B={pl_count_b} (diff {diff:.1f}%)",
                instance_a_value=pl_count_a,
                instance_b_value=pl_count_b,
                diff=diff,
                duration_seconds=time.time() - t0,
            ))

            # Average tracks per playlist
            avg_tracks_a = pg_scalar(self.dsn_a, """
                SELECT AVG(cnt) FROM (
                    SELECT COUNT(*) as cnt FROM playlist GROUP BY playlist_name
                ) sub
            """)
            avg_tracks_b = pg_scalar(self.dsn_b, """
                SELECT AVG(cnt) FROM (
                    SELECT COUNT(*) as cnt FROM playlist GROUP BY playlist_name
                ) sub
            """)

            if avg_tracks_a and avg_tracks_b:
                diff = pct_diff(float(avg_tracks_a), float(avg_tracks_b))
                status = TestStatus.PASS if diff <= 20 else TestStatus.WARN

                report.add_result(TestResult(
                    category="database",
                    name="Playlist: avg tracks per playlist",
                    status=status,
                    message=f"Avg tracks/playlist: A={float(avg_tracks_a):.1f}, B={float(avg_tracks_b):.1f}",
                    instance_a_value=float(avg_tracks_a),
                    instance_b_value=float(avg_tracks_b),
                    diff=diff,
                    duration_seconds=time.time() - t0,
                ))

            # Playlists with NULL item_ids
            null_items_a = pg_scalar(self.dsn_a,
                "SELECT COUNT(*) FROM playlist WHERE item_id IS NULL")
            null_items_b = pg_scalar(self.dsn_b,
                "SELECT COUNT(*) FROM playlist WHERE item_id IS NULL")

            if (null_items_a or 0) == 0 and (null_items_b or 0) == 0:
                status = TestStatus.PASS
                msg = "No NULL item_ids in playlists"
            else:
                status = TestStatus.WARN
                msg = f"NULL item_ids in playlist: A={null_items_a}, B={null_items_b}"

            report.add_result(TestResult(
                category="database",
                name="Playlist: NULL item_ids",
                status=status,
                message=msg,
                instance_a_value=null_items_a,
                instance_b_value=null_items_b,
                duration_seconds=time.time() - t0,
            ))

        except Exception as e:
            report.add_result(TestResult(
                category="database",
                name="Playlist quality",
                status=TestStatus.ERROR,
                message=str(e),
                duration_seconds=time.time() - t0,
            ))
Index data presence + # ------------------------------------------------------------------ + + def _test_index_data_presence(self, report: ComparisonReport): + """Check that Voyager/Artist indexes and map projections are present.""" + for table, desc in [ + ("voyager_index_data", "Voyager HNSW index"), + ("artist_index_data", "Artist GMM index"), + ("map_projection_data", "Map projection"), + ("artist_component_projection", "Artist projection"), + ]: + t0 = time.time() + try: + count_a = self._safe_count(self.dsn_a, table) + count_b = self._safe_count(self.dsn_b, table) + + if count_a is None and count_b is None: + report.add_result(TestResult( + category="database", + name=f"Index: {desc}", + status=TestStatus.SKIP, + message=f"Table {table} does not exist", + duration_seconds=time.time() - t0, + )) + continue + + if (count_a or 0) > 0 and (count_b or 0) > 0: + status = TestStatus.PASS + msg = f"Present in both: A={count_a}, B={count_b}" + elif (count_a or 0) > 0 or (count_b or 0) > 0: + status = TestStatus.WARN + msg = f"Only in {'A' if count_a else 'B'}: A={count_a}, B={count_b}" + else: + status = TestStatus.WARN + msg = "Empty in both instances (may need rebuild)" + + report.add_result(TestResult( + category="database", + name=f"Index: {desc}", + status=status, + message=msg, + instance_a_value=count_a, + instance_b_value=count_b, + duration_seconds=time.time() - t0, + )) + except Exception as e: + report.add_result(TestResult( + category="database", + name=f"Index: {desc}", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Task status health + # ------------------------------------------------------------------ + + def _test_task_status_health(self, report: ComparisonReport): + """Check task_status table for stuck or failed tasks.""" + t0 = time.time() + try: + # Failed tasks + failed_a = pg_scalar(self.dsn_a, + "SELECT COUNT(*) FROM task_status 
WHERE status = 'FAILURE'") + failed_b = pg_scalar(self.dsn_b, + "SELECT COUNT(*) FROM task_status WHERE status = 'FAILURE'") + + report.add_result(TestResult( + category="database", + name="Tasks: failed count", + status=TestStatus.PASS if (failed_a or 0) == (failed_b or 0) else TestStatus.WARN, + message=f"Failed tasks: A={failed_a}, B={failed_b}", + instance_a_value=failed_a, + instance_b_value=failed_b, + duration_seconds=time.time() - t0, + )) + + # Stuck tasks (STARTED more than 2 hours ago) + stuck_a = pg_scalar(self.dsn_a, """ + SELECT COUNT(*) FROM task_status + WHERE status IN ('STARTED', 'PROGRESS') + AND start_time < EXTRACT(EPOCH FROM NOW()) - 7200 + """) + stuck_b = pg_scalar(self.dsn_b, """ + SELECT COUNT(*) FROM task_status + WHERE status IN ('STARTED', 'PROGRESS') + AND start_time < EXTRACT(EPOCH FROM NOW()) - 7200 + """) + + if (stuck_a or 0) == 0 and (stuck_b or 0) == 0: + status = TestStatus.PASS + msg = "No stuck tasks" + else: + status = TestStatus.WARN + msg = f"Stuck tasks (>2hr): A={stuck_a}, B={stuck_b}" + + report.add_result(TestResult( + category="database", + name="Tasks: stuck check", + status=status, + message=msg, + instance_a_value=stuck_a, + instance_b_value=stuck_b, + duration_seconds=time.time() - t0, + )) + + # Success rate + total_a = self._safe_count(self.dsn_a, "task_status") or 1 + total_b = self._safe_count(self.dsn_b, "task_status") or 1 + success_a = pg_scalar(self.dsn_a, + "SELECT COUNT(*) FROM task_status WHERE status = 'SUCCESS'") or 0 + success_b = pg_scalar(self.dsn_b, + "SELECT COUNT(*) FROM task_status WHERE status = 'SUCCESS'") or 0 + + rate_a = success_a / total_a * 100 + rate_b = success_b / total_b * 100 + + report.add_result(TestResult( + category="database", + name="Tasks: success rate", + status=TestStatus.PASS if abs(rate_a - rate_b) < 10 else TestStatus.WARN, + message=f"Success rate: A={rate_a:.1f}%, B={rate_b:.1f}%", + instance_a_value=rate_a, + instance_b_value=rate_b, + diff=abs(rate_a - rate_b), + 
duration_seconds=time.time() - t0, + )) + + except Exception as e: + report.add_result(TestResult( + category="database", + name="Tasks health", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Provider config + # ------------------------------------------------------------------ + + def _test_provider_config(self, report: ComparisonReport): + """Compare provider configurations.""" + t0 = time.time() + try: + providers_a = pg_query_dict(self.dsn_a, + "SELECT provider_type, name, enabled, priority FROM provider ORDER BY id") + providers_b = pg_query_dict(self.dsn_b, + "SELECT provider_type, name, enabled, priority FROM provider ORDER BY id") + + if not providers_a and not providers_b: + report.add_result(TestResult( + category="database", + name="Provider: configuration", + status=TestStatus.SKIP, + message="No providers configured in either instance", + duration_seconds=time.time() - t0, + )) + return + + types_a = set(p['provider_type'] for p in providers_a) + types_b = set(p['provider_type'] for p in providers_b) + + if types_a == types_b: + status = TestStatus.PASS + msg = f"Same provider types: {types_a}" + else: + status = TestStatus.WARN + msg = f"Provider types differ: A={types_a}, B={types_b}" + + report.add_result(TestResult( + category="database", + name="Provider: configuration match", + status=status, + message=msg, + instance_a_value=[dict(p) for p in providers_a], + instance_b_value=[dict(p) for p in providers_b], + duration_seconds=time.time() - t0, + )) + except Exception as e: + if "does not exist" in str(e).lower(): + report.add_result(TestResult( + category="database", + name="Provider: configuration", + status=TestStatus.SKIP, + message="Provider table not present", + duration_seconds=time.time() - t0, + )) + else: + report.add_result(TestResult( + category="database", + name="Provider: configuration", + status=TestStatus.ERROR, + 
message=str(e), + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # App settings + # ------------------------------------------------------------------ + + def _test_app_settings(self, report: ComparisonReport): + """Compare app_settings between instances.""" + t0 = time.time() + try: + settings_a = pg_query_dict(self.dsn_a, + "SELECT key, value, category FROM app_settings ORDER BY key") + settings_b = pg_query_dict(self.dsn_b, + "SELECT key, value, category FROM app_settings ORDER BY key") + + keys_a = set(s['key'] for s in settings_a) + keys_b = set(s['key'] for s in settings_b) + + if keys_a == keys_b: + status = TestStatus.PASS + msg = f"Same settings keys ({len(keys_a)} settings)" + else: + missing_b = keys_a - keys_b + missing_a = keys_b - keys_a + status = TestStatus.WARN + msg = f"Settings differ: missing_in_B={missing_b}, missing_in_A={missing_a}" + + report.add_result(TestResult( + category="database", + name="App Settings: key comparison", + status=status, + message=msg, + instance_a_value=sorted(keys_a), + instance_b_value=sorted(keys_b), + duration_seconds=time.time() - t0, + )) + except Exception as e: + if "does not exist" in str(e).lower(): + report.add_result(TestResult( + category="database", + name="App Settings", + status=TestStatus.SKIP, + message="app_settings table not present", + duration_seconds=time.time() - t0, + )) + else: + report.add_result(TestResult( + category="database", + name="App Settings", + status=TestStatus.ERROR, + message=str(e), + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Single-instance tests (when only one DB is available) + # ------------------------------------------------------------------ + + def _test_single_instance_schema(self, report: ComparisonReport, dsn: str, name: str): + """Validate schema for a single instance.""" + for table_name, expected_cols in 
EXPECTED_TABLES.items(): + t0 = time.time() + cols = self._get_table_columns(dsn, table_name) + if cols is None: + report.add_result(TestResult( + category="database", + name=f"Schema ({name}): {table_name}", + status=TestStatus.SKIP, + message=f"Table does not exist in {name}", + duration_seconds=time.time() - t0, + )) + else: + missing = set(expected_cols) - set(cols) + status = TestStatus.PASS if not missing else TestStatus.WARN + report.add_result(TestResult( + category="database", + name=f"Schema ({name}): {table_name}", + status=status, + message=f"Columns: {sorted(cols)}. Missing expected: {missing or 'none'}", + duration_seconds=time.time() - t0, + )) + + def _test_single_instance_quality(self, report: ComparisonReport, dsn: str, name: str): + """Validate data quality for a single instance.""" + for col in SCORE_CRITICAL_COLUMNS: + t0 = time.time() + try: + null_pct = self._null_percentage(dsn, "score", col) + if null_pct is not None: + status = TestStatus.PASS if null_pct <= self.config.db_score_null_threshold_pct else TestStatus.FAIL + report.add_result(TestResult( + category="database", + name=f"Quality ({name}): score.{col} NULLs", + status=status, + message=f"{null_pct:.1f}% NULL", + duration_seconds=time.time() - t0, + )) + except Exception: + pass + + # ------------------------------------------------------------------ + # Helper methods + # ------------------------------------------------------------------ + + def _get_table_columns(self, dsn: str, table_name: str) -> Optional[List[str]]: + """Get column names for a table, or None if table doesn't exist.""" + try: + rows = pg_query(dsn, + "SELECT column_name FROM information_schema.columns WHERE table_name = %s ORDER BY ordinal_position", + (table_name,)) + if not rows: + return None + return [r[0] for r in rows] + except Exception: + return None + + def _safe_count(self, dsn: str, table_name: str) -> Optional[int]: + """Get row count for a table, or None if table doesn't exist.""" + try: + return 
pg_scalar(dsn, f"SELECT COUNT(*) FROM {table_name}") + except Exception: + return None + + def _null_percentage(self, dsn: str, table: str, column: str) -> Optional[float]: + """Get percentage of NULL values in a column.""" + try: + total = pg_scalar(dsn, f"SELECT COUNT(*) FROM {table}") + if not total: + return None + nulls = pg_scalar(dsn, f"SELECT COUNT(*) FROM {table} WHERE {column} IS NULL") + return (nulls / total) * 100 + except Exception: + return None + + def _get_column_stats(self, dsn: str, table: str, column: str) -> Optional[dict]: + """Get min/max/avg/stddev for a numeric column.""" + try: + rows = pg_query(dsn, f""" + SELECT MIN({column}), MAX({column}), AVG({column}), STDDEV({column}) + FROM {table} + WHERE {column} IS NOT NULL + """) + if rows and rows[0][0] is not None: + return { + 'min': float(rows[0][0]), + 'max': float(rows[0][1]), + 'avg': float(rows[0][2]), + 'stddev': float(rows[0][3]) if rows[0][3] else 0.0, + } + except Exception: + pass + return None diff --git a/testing_suite/comparators/docker_comparator.py b/testing_suite/comparators/docker_comparator.py new file mode 100644 index 00000000..2ee95834 --- /dev/null +++ b/testing_suite/comparators/docker_comparator.py @@ -0,0 +1,541 @@ +""" +Docker Comparison Module for AudioMuse-AI Testing Suite. 
+ +Compares two Docker deployments across: + - Container health and status + - Resource usage (memory, CPU) + - Log analysis (error rates, warning patterns) + - Service connectivity (Redis, PostgreSQL, Flask, Worker) + - Container uptime and restart counts + - Log-based error pattern detection +""" + +import json +import logging +import re +import time +from collections import Counter +from typing import Any, Dict, List, Optional, Tuple + +from testing_suite.config import ComparisonConfig, InstanceConfig +from testing_suite.utils import ( + ComparisonReport, TestResult, TestStatus, + docker_exec, docker_logs, docker_inspect, pct_diff +) + +logger = logging.getLogger(__name__) + +# Log patterns to search for +ERROR_PATTERNS = [ + (r"(?i)traceback \(most recent call last\)", "Python Traceback"), + (r"(?i)error|exception", "Error/Exception"), + (r"(?i)out of memory|oom|killed", "OOM/Memory Kill"), + (r"(?i)connection refused|connection reset|broken pipe", "Connection Error"), + (r"(?i)timeout|timed out", "Timeout"), + (r"(?i)permission denied|access denied", "Permission Error"), + (r"(?i)disk full|no space left", "Disk Space"), + (r"(?i)segmentation fault|segfault|core dump", "Crash/Segfault"), + (r"(?i)worker .* died|worker .* killed", "Worker Death"), + (r"(?i)database .* error|psycopg2\..*error", "Database Error"), + (r"(?i)redis\..*error|redis connection", "Redis Error"), +] + +WARNING_PATTERNS = [ + (r"(?i)deprecat", "Deprecation Warning"), + (r"(?i)warning", "Warning"), + (r"(?i)retry|retrying", "Retry Attempt"), + (r"(?i)slow query|slow request", "Slow Operation"), + (r"(?i)memory usage|memory pressure", "Memory Pressure"), +] + + +def _get_ssh_params(instance: InstanceConfig) -> dict: + """Extract SSH parameters from instance config.""" + return { + "ssh_host": instance.ssh_host, + "ssh_user": instance.ssh_user, + "ssh_key": instance.ssh_key, + "ssh_port": instance.ssh_port, + } + + +class DockerComparator: + """Compares Docker deployment health across two 
AudioMuse-AI instances.""" + + def __init__(self, config: ComparisonConfig): + self.config = config + self.inst_a = config.instance_a + self.inst_b = config.instance_b + + def run_all(self, report: ComparisonReport): + """Run all Docker comparison tests.""" + logger.info("Starting Docker comparison tests...") + + # Test each container type on both instances + containers = [ + ("flask", "docker_flask_container", "Flask App Server"), + ("worker", "docker_worker_container", "RQ Worker"), + ("postgres", "docker_postgres_container", "PostgreSQL"), + ("redis", "docker_redis_container", "Redis"), + ] + + for container_key, attr_name, description in containers: + name_a = getattr(self.inst_a, attr_name) + name_b = getattr(self.inst_b, attr_name) + + self._test_container_health(report, name_a, name_b, description, + self.inst_a, self.inst_b) + self._test_container_resource_usage(report, name_a, name_b, description, + self.inst_a, self.inst_b) + + # Log analysis for flask and worker containers + for attr_name, description in [ + ("docker_flask_container", "Flask"), + ("docker_worker_container", "Worker"), + ]: + name_a = getattr(self.inst_a, attr_name) + name_b = getattr(self.inst_b, attr_name) + self._test_log_error_analysis(report, name_a, name_b, description, + self.inst_a, self.inst_b) + + # Service connectivity tests + self._test_redis_connectivity(report) + self._test_postgres_connectivity(report) + + logger.info("Docker comparison tests complete.") + + # ------------------------------------------------------------------ + # Container health + # ------------------------------------------------------------------ + + def _test_container_health(self, report: ComparisonReport, + name_a: str, name_b: str, description: str, + inst_a: InstanceConfig, inst_b: InstanceConfig): + """Check container status, uptime, and restart count.""" + t0 = time.time() + + info_a = docker_inspect(name_a, **_get_ssh_params(inst_a)) + info_b = docker_inspect(name_b, **_get_ssh_params(inst_b)) + 
+ # Container running status + running_a = self._is_running(info_a) + running_b = self._is_running(info_b) + + if running_a is None and running_b is None: + report.add_result(TestResult( + category="docker", + name=f"{description}: container status", + status=TestStatus.SKIP, + message="Cannot inspect containers (Docker not available or containers not found)", + duration_seconds=time.time() - t0, + )) + return + + if running_a and running_b: + status = TestStatus.PASS + msg = "Both containers running" + elif running_a or running_b: + status = TestStatus.FAIL + msg = f"Only {'A' if running_a else 'B'} is running" + else: + status = TestStatus.FAIL + msg = "Neither container is running" + + report.add_result(TestResult( + category="docker", + name=f"{description}: container status", + status=status, + message=msg, + instance_a_value=f"running={running_a}", + instance_b_value=f"running={running_b}", + duration_seconds=time.time() - t0, + )) + + # Restart count + restarts_a = self._get_restart_count(info_a) + restarts_b = self._get_restart_count(info_b) + + if restarts_a is not None or restarts_b is not None: + if (restarts_a or 0) == 0 and (restarts_b or 0) == 0: + r_status = TestStatus.PASS + r_msg = "No restarts on either instance" + elif (restarts_a or 0) > 5 or (restarts_b or 0) > 5: + r_status = TestStatus.FAIL + r_msg = f"High restart count: A={restarts_a}, B={restarts_b}" + else: + r_status = TestStatus.WARN + r_msg = f"Restarts: A={restarts_a}, B={restarts_b}" + + report.add_result(TestResult( + category="docker", + name=f"{description}: restart count", + status=r_status, + message=r_msg, + instance_a_value=restarts_a, + instance_b_value=restarts_b, + duration_seconds=time.time() - t0, + )) + + # Health check status + health_a = self._get_health_status(info_a) + health_b = self._get_health_status(info_b) + + if health_a or health_b: + if health_a == health_b: + h_status = TestStatus.PASS + h_msg = f"Same health status: {health_a}" + else: + h_status = 
TestStatus.WARN + h_msg = f"Health differs: A={health_a}, B={health_b}" + + report.add_result(TestResult( + category="docker", + name=f"{description}: health check", + status=h_status, + message=h_msg, + instance_a_value=health_a, + instance_b_value=health_b, + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Resource usage + # ------------------------------------------------------------------ + + def _test_container_resource_usage(self, report: ComparisonReport, + name_a: str, name_b: str, description: str, + inst_a: InstanceConfig, inst_b: InstanceConfig): + """Compare memory and CPU usage between containers.""" + t0 = time.time() + + stats_a = self._get_container_stats(name_a, inst_a) + stats_b = self._get_container_stats(name_b, inst_b) + + if not stats_a and not stats_b: + report.add_result(TestResult( + category="docker", + name=f"{description}: resource usage", + status=TestStatus.SKIP, + message="Cannot get container stats", + duration_seconds=time.time() - t0, + )) + return + + # Memory usage + mem_a = stats_a.get('memory_mb') if stats_a else None + mem_b = stats_b.get('memory_mb') if stats_b else None + + if mem_a is not None and mem_b is not None: + diff = pct_diff(mem_a, mem_b) + if diff <= 20: + status = TestStatus.PASS + elif diff <= 50: + status = TestStatus.WARN + else: + status = TestStatus.FAIL + + report.add_result(TestResult( + category="docker", + name=f"{description}: memory usage", + status=status, + message=f"A={mem_a:.1f}MB, B={mem_b:.1f}MB (diff {diff:.1f}%)", + instance_a_value=mem_a, + instance_b_value=mem_b, + diff=diff, + duration_seconds=time.time() - t0, + )) + + # CPU usage + cpu_a = stats_a.get('cpu_pct') if stats_a else None + cpu_b = stats_b.get('cpu_pct') if stats_b else None + + if cpu_a is not None and cpu_b is not None: + report.add_result(TestResult( + category="docker", + name=f"{description}: CPU usage", + status=TestStatus.PASS, + 
message=f"A={cpu_a:.1f}%, B={cpu_b:.1f}%", + instance_a_value=cpu_a, + instance_b_value=cpu_b, + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Log error analysis + # ------------------------------------------------------------------ + + def _test_log_error_analysis(self, report: ComparisonReport, + name_a: str, name_b: str, description: str, + inst_a: InstanceConfig, inst_b: InstanceConfig): + """Analyze container logs for error patterns.""" + t0 = time.time() + + # Fetch logs + logs_a_stdout, logs_a_stderr, rc_a = docker_logs( + name_a, tail=2000, **_get_ssh_params(inst_a), timeout=30) + logs_b_stdout, logs_b_stderr, rc_b = docker_logs( + name_b, tail=2000, **_get_ssh_params(inst_b), timeout=30) + + if rc_a != 0 and rc_b != 0: + report.add_result(TestResult( + category="docker", + name=f"{description}: log analysis", + status=TestStatus.SKIP, + message="Cannot fetch logs from either container", + duration_seconds=time.time() - t0, + )) + return + + # Combine stdout + stderr for analysis + logs_a = (logs_a_stdout or '') + '\n' + (logs_a_stderr or '') + logs_b = (logs_b_stdout or '') + '\n' + (logs_b_stderr or '') + + # Error pattern matching + errors_a = self._count_patterns(logs_a, ERROR_PATTERNS) + errors_b = self._count_patterns(logs_b, ERROR_PATTERNS) + + total_errors_a = sum(errors_a.values()) + total_errors_b = sum(errors_b.values()) + + if total_errors_a == 0 and total_errors_b == 0: + report.add_result(TestResult( + category="docker", + name=f"{description}: error patterns", + status=TestStatus.PASS, + message="No error patterns detected in recent logs", + duration_seconds=time.time() - t0, + )) + else: + # Compare error counts + if total_errors_a <= total_errors_b: + status = TestStatus.WARN + else: + status = TestStatus.WARN + + if total_errors_a > 50 or total_errors_b > 50: + status = TestStatus.FAIL + + report.add_result(TestResult( + category="docker", + name=f"{description}: error 
count", + status=status, + message=f"Errors in last 2000 log lines: A={total_errors_a}, B={total_errors_b}", + instance_a_value=total_errors_a, + instance_b_value=total_errors_b, + duration_seconds=time.time() - t0, + details={"errors_a": dict(errors_a), "errors_b": dict(errors_b)}, + )) + + # Detailed per-pattern breakdown + all_patterns = set(errors_a.keys()) | set(errors_b.keys()) + for pattern_name in sorted(all_patterns): + cnt_a = errors_a.get(pattern_name, 0) + cnt_b = errors_b.get(pattern_name, 0) + + if cnt_a == 0 and cnt_b == 0: + continue + + if cnt_a == cnt_b: + p_status = TestStatus.WARN + elif cnt_a > cnt_b * 2 or cnt_b > cnt_a * 2: + p_status = TestStatus.FAIL + else: + p_status = TestStatus.WARN + + report.add_result(TestResult( + category="docker", + name=f"{description}: {pattern_name}", + status=p_status, + message=f"A={cnt_a}, B={cnt_b}", + instance_a_value=cnt_a, + instance_b_value=cnt_b, + duration_seconds=time.time() - t0, + )) + + # Warning pattern matching + warnings_a = self._count_patterns(logs_a, WARNING_PATTERNS) + warnings_b = self._count_patterns(logs_b, WARNING_PATTERNS) + + total_warnings_a = sum(warnings_a.values()) + total_warnings_b = sum(warnings_b.values()) + + report.add_result(TestResult( + category="docker", + name=f"{description}: warning count", + status=TestStatus.PASS if total_warnings_a < 100 and total_warnings_b < 100 else TestStatus.WARN, + message=f"Warnings: A={total_warnings_a}, B={total_warnings_b}", + instance_a_value=total_warnings_a, + instance_b_value=total_warnings_b, + duration_seconds=time.time() - t0, + details={"warnings_a": dict(warnings_a), "warnings_b": dict(warnings_b)}, + )) + + # Check for Python tracebacks specifically (important indicator) + tb_count_a = logs_a.count("Traceback (most recent call last)") + tb_count_b = logs_b.count("Traceback (most recent call last)") + + if tb_count_a == 0 and tb_count_b == 0: + tb_status = TestStatus.PASS + tb_msg = "No Python tracebacks in recent logs" + elif 
tb_count_a > 10 or tb_count_b > 10: + tb_status = TestStatus.FAIL + tb_msg = f"Tracebacks: A={tb_count_a}, B={tb_count_b}" + else: + tb_status = TestStatus.WARN + tb_msg = f"Tracebacks: A={tb_count_a}, B={tb_count_b}" + + report.add_result(TestResult( + category="docker", + name=f"{description}: Python tracebacks", + status=tb_status, + message=tb_msg, + instance_a_value=tb_count_a, + instance_b_value=tb_count_b, + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Service connectivity + # ------------------------------------------------------------------ + + def _test_redis_connectivity(self, report: ComparisonReport): + """Test Redis connectivity from within the Flask container.""" + t0 = time.time() + for label, inst in [("A", self.inst_a), ("B", self.inst_b)]: + container = inst.docker_flask_container + stdout, stderr, rc = docker_exec( + container, "python -c \"from redis import Redis; r=Redis.from_url('" + + inst.redis_url + "'); print(r.ping())\"", + **_get_ssh_params(inst), timeout=15, + ) + if rc == 0 and "True" in stdout: + status = TestStatus.PASS + msg = "Redis ping successful" + elif rc == -2: + status = TestStatus.SKIP + msg = "Docker not available" + else: + status = TestStatus.WARN + msg = f"Redis ping failed: {stderr[:200] if stderr else stdout[:200]}" + + report.add_result(TestResult( + category="docker", + name=f"Redis connectivity ({label})", + status=status, + message=msg, + duration_seconds=time.time() - t0, + )) + + def _test_postgres_connectivity(self, report: ComparisonReport): + """Test PostgreSQL connectivity from within the Flask container.""" + t0 = time.time() + for label, inst in [("A", self.inst_a), ("B", self.inst_b)]: + container = inst.docker_flask_container + stdout, stderr, rc = docker_exec( + container, + f"python -c \"import psycopg2; c=psycopg2.connect('{inst.pg_dsn}', connect_timeout=5); " + f"cur=c.cursor(); cur.execute('SELECT 1'); print(cur.fetchone()[0]); 
c.close()\"", + **_get_ssh_params(inst), timeout=15, + ) + if rc == 0 and "1" in stdout: + status = TestStatus.PASS + msg = "PostgreSQL SELECT 1 successful" + elif rc == -2: + status = TestStatus.SKIP + msg = "Docker not available" + else: + status = TestStatus.WARN + msg = f"PostgreSQL test failed: {stderr[:200] if stderr else stdout[:200]}" + + report.add_result(TestResult( + category="docker", + name=f"PostgreSQL connectivity ({label})", + status=status, + message=msg, + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Helpers + # ------------------------------------------------------------------ + + def _is_running(self, info: Optional[dict]) -> Optional[bool]: + """Check if container is running from inspect data.""" + if not info: + return None + state = info.get("State", {}) + return state.get("Running", False) + + def _get_restart_count(self, info: Optional[dict]) -> Optional[int]: + """Get container restart count from inspect data.""" + if not info: + return None + return info.get("RestartCount", 0) + + def _get_health_status(self, info: Optional[dict]) -> Optional[str]: + """Get container health status from inspect data.""" + if not info: + return None + state = info.get("State", {}) + health = state.get("Health", {}) + return health.get("Status") if health else None + + def _get_container_stats(self, name: str, inst: InstanceConfig) -> Optional[dict]: + """Get container resource stats via docker stats --no-stream.""" + ssh_params = _get_ssh_params(inst) + cmd_parts = ["docker", "stats", "--no-stream", "--format", + "{{.MemUsage}}|||{{.CPUPerc}}", name] + + if ssh_params.get("ssh_host"): + import subprocess + ssh_cmd = ["ssh", "-o", "StrictHostKeyChecking=no", + "-p", str(ssh_params.get("ssh_port", 22))] + if ssh_params.get("ssh_key"): + ssh_cmd += ["-i", ssh_params["ssh_key"]] + host = f"{ssh_params['ssh_user']}@{ssh_params['ssh_host']}" \ + if ssh_params.get("ssh_user") else 
ssh_params["ssh_host"] + ssh_cmd.append(host) + ssh_cmd.append(" ".join(cmd_parts)) + full_cmd = ssh_cmd + else: + full_cmd = cmd_parts + + try: + import subprocess + proc = subprocess.run(full_cmd, capture_output=True, text=True, timeout=15) + if proc.returncode == 0 and proc.stdout.strip(): + parts = proc.stdout.strip().split("|||") + if len(parts) == 2: + mem_str = parts[0].strip() + cpu_str = parts[1].strip().rstrip('%') + + # Parse memory (e.g., "512MiB / 16GiB") + mem_match = re.search(r'([\d.]+)(Ki|Mi|Gi|B)', mem_str) + memory_mb = 0.0 + if mem_match: + val = float(mem_match.group(1)) + unit = mem_match.group(2) + if unit == "Gi": + memory_mb = val * 1024 + elif unit == "Mi": + memory_mb = val + elif unit == "Ki": + memory_mb = val / 1024 + else: + memory_mb = val / (1024 * 1024) + + cpu_pct = float(cpu_str) if cpu_str else 0.0 + + return {"memory_mb": memory_mb, "cpu_pct": cpu_pct} + except Exception as e: + logger.debug(f"Stats fetch failed for {name}: {e}") + return None + + def _count_patterns(self, log_text: str, patterns: list) -> Counter: + """Count occurrences of each pattern in log text.""" + counts = Counter() + for pattern, name in patterns: + matches = re.findall(pattern, log_text) + if matches: + counts[name] = len(matches) + return counts diff --git a/testing_suite/comparators/performance_comparator.py b/testing_suite/comparators/performance_comparator.py new file mode 100644 index 00000000..21a573d1 --- /dev/null +++ b/testing_suite/comparators/performance_comparator.py @@ -0,0 +1,447 @@ +""" +Performance Comparison Module for AudioMuse-AI Testing Suite. 
"""
Performance Comparison Module for AudioMuse-AI Testing Suite.

Benchmarks and compares performance between two instances:
  - API endpoint latency (p50, p95, p99, mean, max)
  - Throughput under concurrent load
  - Database query performance
  - Search/similarity response times
  - Memory-intensive operations (map, alchemy, clustering)
  - Warmup vs steady-state performance
"""

import logging
import statistics
import time
from concurrent.futures import ThreadPoolExecutor, as_completed
from typing import Any, Dict, List, Optional, Tuple

from testing_suite.config import ComparisonConfig, InstanceConfig
from testing_suite.utils import (
    ComparisonReport, TestResult, TestStatus,
    http_get, http_post, timed_request, pct_diff, format_duration,
    pg_query, pg_scalar
)

logger = logging.getLogger(__name__)


def _percentile(data: List[float], pct: float) -> float:
    """Return the *pct*-th percentile of *data* with linear interpolation."""
    if not data:
        return 0.0
    ordered = sorted(data)
    rank = (len(ordered) - 1) * (pct / 100.0)
    lo = int(rank)
    hi = lo + 1
    if hi >= len(ordered):
        return ordered[-1]
    frac = rank - lo
    return ordered[lo] + frac * (ordered[hi] - ordered[lo])


def _latency_stats(latencies: List[float]) -> dict:
    """Summarise latency samples into count/mean/median/p95/p99/min/max/stddev."""
    if not latencies:
        return {"count": 0, "mean": 0, "median": 0, "p95": 0, "p99": 0,
                "min": 0, "max": 0, "stddev": 0}
    # stdev requires at least two samples.
    spread = statistics.stdev(latencies) if len(latencies) > 1 else 0.0
    return {
        "count": len(latencies),
        "mean": statistics.mean(latencies),
        "median": statistics.median(latencies),
        "p95": _percentile(latencies, 95),
        "p99": _percentile(latencies, 99),
        "min": min(latencies),
        "max": max(latencies),
        "stddev": spread,
    }


class PerformanceComparator:
    """Benchmarks and compares performance between two instances."""

    def __init__(self, config: ComparisonConfig):
        """Cache per-instance URLs/names and benchmark sizing from config."""
        self.config = config
        self.url_a = config.instance_a.api_url.rstrip('/')
        self.url_b = config.instance_b.api_url.rstrip('/')
        self.name_a = config.instance_a.name
        self.name_b = config.instance_b.name
        self.warmup_n = config.perf_warmup_requests
        self.bench_n = config.perf_benchmark_requests
        self.concurrent = config.perf_concurrent_users

    def run_all(self, report: ComparisonReport):
        """Run all performance comparison tests against both instances."""
        logger.info("Starting performance comparison tests...")

        # Check connectivity up front; unreachable sides are skipped below.
        alive_a = self._check_alive(self.url_a)
        alive_b = self._check_alive(self.url_b)

        if not alive_a and not alive_b:
            report.add_result(TestResult(
                category="performance",
                name="Connectivity",
                status=TestStatus.ERROR,
                message="Neither instance reachable; skipping performance tests",
            ))
            return

        # Endpoint benchmark matrix:
        # (path, method, params/json, description, expected_status)
        benchmarks = [
            ("/api/config", "GET", None, "Config endpoint", 200),
            ("/api/playlists", "GET", None, "Playlists list", 200),
            ("/api/active_tasks", "GET", None, "Active tasks", 200),
            ("/api/last_task", "GET", None, "Last task", 200),
            ("/api/search_tracks?artist=Red+Hot&title=By", "GET", None, "Track search", 200),
            ("/api/similar_tracks?title=By+the+Way&artist=Red+Hot+Chili+Peppers&n=5", "GET", None, "Similar tracks", 200),
            ("/api/map?percent=10", "GET", None, "Map visualization", 200),
            ("/api/map_cache_status", "GET", None, "Map cache status", 200),
            ("/api/clap/stats", "GET", None, "CLAP stats", 200),
            ("/api/clap/top_queries", "GET", None, "CLAP top queries", 200),
            ("/api/setup/status", "GET", None, "Setup status", 200),
            ("/api/setup/providers", "GET", None, "Providers list", 200),
            ("/api/setup/settings", "GET", None, "App settings", 200),
            ("/api/cron", "GET", None, "Cron entries", 200),
            ("/api/search_artists?q=Red", "GET", None, "Artist search", 200),
            ("/external/search?q=piano", "GET", None, "External search", 200),
        ]

        # Latency benchmark per endpoint.
        for path, method, data, desc, expected_status in benchmarks:
            self._benchmark_endpoint(report, path, method, data, desc,
                                     expected_status, alive_a, alive_b)

        # Concurrent load test on a few key endpoints.
        self._concurrent_load_test(report, alive_a, alive_b)

        # Database query performance.
        self._benchmark_db_queries(report)

        logger.info("Performance comparison tests complete.")
self._benchmark_endpoint(report, path, method, data, desc, + expected_status, alive_a, alive_b) + + # Concurrent load test on a few key endpoints + self._concurrent_load_test(report, alive_a, alive_b) + + # Database query performance + self._benchmark_db_queries(report) + + logger.info("Performance comparison tests complete.") + + # ------------------------------------------------------------------ + # Endpoint latency benchmark + # ------------------------------------------------------------------ + + def _benchmark_endpoint(self, report: ComparisonReport, path: str, + method: str, data: Any, description: str, + expected_status: int, alive_a: bool, alive_b: bool): + """Benchmark a single endpoint on both instances.""" + t0 = time.time() + latencies_a = [] + latencies_b = [] + errors_a = 0 + errors_b = 0 + + # Warmup phase + for _ in range(self.warmup_n): + try: + if alive_a: + if method == "GET": + http_get(f"{self.url_a}{path}", timeout=30, retries=1) + else: + http_post(f"{self.url_a}{path}", json_data=data, timeout=30, retries=1) + except Exception: + pass + try: + if alive_b: + if method == "GET": + http_get(f"{self.url_b}{path}", timeout=30, retries=1) + else: + http_post(f"{self.url_b}{path}", json_data=data, timeout=30, retries=1) + except Exception: + pass + + # Benchmark phase + for i in range(self.bench_n): + if alive_a: + try: + start = time.perf_counter() + if method == "GET": + resp = http_get(f"{self.url_a}{path}", timeout=60, retries=1) + else: + resp = http_post(f"{self.url_a}{path}", json_data=data, timeout=60, retries=1) + elapsed = time.perf_counter() - start + if resp.status_code == expected_status: + latencies_a.append(elapsed) + else: + errors_a += 1 + except Exception: + errors_a += 1 + + if alive_b: + try: + start = time.perf_counter() + if method == "GET": + resp = http_get(f"{self.url_b}{path}", timeout=60, retries=1) + else: + resp = http_post(f"{self.url_b}{path}", json_data=data, timeout=60, retries=1) + elapsed = time.perf_counter() - 
start + if resp.status_code == expected_status: + latencies_b.append(elapsed) + else: + errors_b += 1 + except Exception: + errors_b += 1 + + stats_a = _latency_stats(latencies_a) + stats_b = _latency_stats(latencies_b) + + # Determine status based on relative performance + if stats_a['mean'] > 0 and stats_b['mean'] > 0: + ratio = stats_b['mean'] / stats_a['mean'] + if ratio <= 1.2: # B is within 20% of A + status = TestStatus.PASS + comparison = f"B is {ratio:.2f}x vs A" + elif ratio <= 2.0: + status = TestStatus.WARN + comparison = f"B is {ratio:.2f}x slower than A" + else: + status = TestStatus.FAIL + comparison = f"B is {ratio:.2f}x slower than A" + + # Also check if B is faster + if ratio < 0.8: + status = TestStatus.PASS + comparison = f"B is {1/ratio:.2f}x faster than A" + else: + status = TestStatus.WARN if (latencies_a or latencies_b) else TestStatus.SKIP + comparison = "Cannot compare (one or both had no successful requests)" + + report.add_result(TestResult( + category="performance", + name=f"Latency: {description}", + status=status, + message=( + f"{comparison} | " + f"A: mean={format_duration(stats_a['mean'])}, " + f"p95={format_duration(stats_a['p95'])}, " + f"p99={format_duration(stats_a['p99'])} " + f"({errors_a} errors) | " + f"B: mean={format_duration(stats_b['mean'])}, " + f"p95={format_duration(stats_b['p95'])}, " + f"p99={format_duration(stats_b['p99'])} " + f"({errors_b} errors)" + ), + instance_a_value=stats_a, + instance_b_value=stats_b, + diff=pct_diff(stats_a['mean'], stats_b['mean']) if stats_a['mean'] and stats_b['mean'] else None, + duration_seconds=time.time() - t0, + details={ + "path": path, + "method": method, + "warmup_requests": self.warmup_n, + "benchmark_requests": self.bench_n, + "errors_a": errors_a, + "errors_b": errors_b, + }, + )) + + # ------------------------------------------------------------------ + # Concurrent load test + # ------------------------------------------------------------------ + + def 
_concurrent_load_test(self, report: ComparisonReport, + alive_a: bool, alive_b: bool): + """Test throughput under concurrent load.""" + endpoints = [ + "/api/config", + "/api/search_tracks?artist=Red+Hot&title=By", + "/api/playlists", + ] + + for path in endpoints: + t0 = time.time() + results_a = self._run_concurrent(self.url_a, path, self.concurrent, + self.bench_n) if alive_a else None + results_b = self._run_concurrent(self.url_b, path, self.concurrent, + self.bench_n) if alive_b else None + + if results_a and results_b: + throughput_a = results_a['successful'] / results_a['total_time'] if results_a['total_time'] > 0 else 0 + throughput_b = results_b['successful'] / results_b['total_time'] if results_b['total_time'] > 0 else 0 + + if throughput_a > 0 and throughput_b > 0: + ratio = throughput_b / throughput_a + if ratio >= 0.8: + status = TestStatus.PASS + elif ratio >= 0.5: + status = TestStatus.WARN + else: + status = TestStatus.FAIL + else: + status = TestStatus.WARN + ratio = 0 + + report.add_result(TestResult( + category="performance", + name=f"Concurrent Load: {path.split('?')[0]}", + status=status, + message=( + f"{self.concurrent} concurrent users, {self.bench_n} requests each | " + f"A: {throughput_a:.1f} req/s, " + f"mean={format_duration(results_a['mean_latency'])}, " + f"{results_a['errors']} errors | " + f"B: {throughput_b:.1f} req/s, " + f"mean={format_duration(results_b['mean_latency'])}, " + f"{results_b['errors']} errors" + ), + instance_a_value={"throughput_rps": throughput_a, **results_a}, + instance_b_value={"throughput_rps": throughput_b, **results_b}, + duration_seconds=time.time() - t0, + )) + else: + report.add_result(TestResult( + category="performance", + name=f"Concurrent Load: {path.split('?')[0]}", + status=TestStatus.SKIP, + message="Cannot run concurrent test (one or both instances unavailable)", + duration_seconds=time.time() - t0, + )) + + def _run_concurrent(self, base_url: str, path: str, + concurrent: int, 
requests_per_worker: int) -> dict: + """Run concurrent requests and measure throughput.""" + latencies = [] + errors = 0 + + def worker(): + nonlocal errors + local_latencies = [] + for _ in range(requests_per_worker): + try: + start = time.perf_counter() + resp = http_get(f"{base_url}{path}", timeout=30, retries=1) + elapsed = time.perf_counter() - start + if resp.status_code == 200: + local_latencies.append(elapsed) + else: + errors += 1 + except Exception: + errors += 1 + return local_latencies + + overall_start = time.perf_counter() + with ThreadPoolExecutor(max_workers=concurrent) as executor: + futures = [executor.submit(worker) for _ in range(concurrent)] + for f in as_completed(futures): + try: + latencies.extend(f.result()) + except Exception: + errors += 1 + total_time = time.perf_counter() - overall_start + + return { + "successful": len(latencies), + "errors": errors, + "total_time": total_time, + "mean_latency": statistics.mean(latencies) if latencies else 0, + "p95_latency": _percentile(latencies, 95) if latencies else 0, + } + + # ------------------------------------------------------------------ + # Database query performance + # ------------------------------------------------------------------ + + def _benchmark_db_queries(self, report: ComparisonReport): + """Benchmark critical database queries on both instances.""" + queries = [ + ("SELECT COUNT(*) FROM score", "Score count"), + ("SELECT COUNT(*) FROM embedding", "Embedding count"), + ("SELECT COUNT(*) FROM playlist", "Playlist count"), + ("SELECT COUNT(DISTINCT playlist_name) FROM playlist", "Distinct playlists"), + ("SELECT item_id, title, author FROM score LIMIT 100", "Score fetch 100"), + ("SELECT s.item_id, s.title FROM score s JOIN embedding e ON s.item_id = e.item_id LIMIT 50", + "Score-embedding join 50"), + ("SELECT AVG(tempo), AVG(energy) FROM score WHERE tempo IS NOT NULL", "Score aggregation"), + ("SELECT key, COUNT(*) FROM score WHERE key IS NOT NULL GROUP BY key", "Key 
distribution"), + ] + + dsn_a = self.config.instance_a.pg_dsn + dsn_b = self.config.instance_b.pg_dsn + + can_a = self._test_db(dsn_a) + can_b = self._test_db(dsn_b) + + if not can_a and not can_b: + report.add_result(TestResult( + category="performance", + name="DB Query Performance", + status=TestStatus.SKIP, + message="Cannot connect to either database", + )) + return + + for sql, desc in queries: + t0 = time.time() + latencies_a = [] + latencies_b = [] + + for _ in range(max(3, self.bench_n // 2)): + if can_a: + try: + start = time.perf_counter() + pg_query(dsn_a, sql) + latencies_a.append(time.perf_counter() - start) + except Exception: + pass + + if can_b: + try: + start = time.perf_counter() + pg_query(dsn_b, sql) + latencies_b.append(time.perf_counter() - start) + except Exception: + pass + + stats_a = _latency_stats(latencies_a) + stats_b = _latency_stats(latencies_b) + + if stats_a['mean'] > 0 and stats_b['mean'] > 0: + ratio = stats_b['mean'] / stats_a['mean'] + if ratio <= 1.5: + status = TestStatus.PASS + elif ratio <= 3.0: + status = TestStatus.WARN + else: + status = TestStatus.FAIL + comparison = f"B/A ratio: {ratio:.2f}x" + else: + status = TestStatus.WARN + comparison = "Insufficient data" + + report.add_result(TestResult( + category="performance", + name=f"DB Query: {desc}", + status=status, + message=( + f"{comparison} | " + f"A: mean={format_duration(stats_a['mean'])}, " + f"p95={format_duration(stats_a['p95'])} | " + f"B: mean={format_duration(stats_b['mean'])}, " + f"p95={format_duration(stats_b['p95'])}" + ), + instance_a_value=stats_a, + instance_b_value=stats_b, + diff=pct_diff(stats_a['mean'], stats_b['mean']) if stats_a['mean'] and stats_b['mean'] else None, + duration_seconds=time.time() - t0, + )) + + # ------------------------------------------------------------------ + # Helpers + # ------------------------------------------------------------------ + + def _check_alive(self, url: str) -> bool: + try: + resp = 
http_get(f"{url}/api/config", timeout=15, retries=2, retry_delay=1) + return resp.status_code == 200 + except Exception: + return False + + def _test_db(self, dsn: str) -> bool: + try: + pg_scalar(dsn, "SELECT 1") + return True + except Exception: + return False diff --git a/testing_suite/comparison_config.example.yaml b/testing_suite/comparison_config.example.yaml new file mode 100644 index 00000000..a73217f3 --- /dev/null +++ b/testing_suite/comparison_config.example.yaml @@ -0,0 +1,91 @@ +# AudioMuse-AI Testing & Comparison Suite - Example Configuration +# +# Copy this file to comparison_config.yaml and customize for your setup. +# +# Usage: +# python -m testing_suite --config testing_suite/comparison_config.yaml +# python -m testing_suite --config testing_suite/comparison_config.yaml --only api,performance +# python -m testing_suite --config testing_suite/comparison_config.yaml --skip docker + +# Instance A - Main branch (baseline) +instance_a: + name: "main" + branch: "main" + # API connection + api_url: "http://192.168.1.100:8000" + api_timeout: 120 + # PostgreSQL connection + pg_host: "192.168.1.100" + pg_port: 5432 + pg_user: "audiomuse" + pg_password: "audiomusepassword" + pg_database: "audiomusedb" + # Redis connection + redis_url: "redis://192.168.1.100:6379/0" + # Docker container names + docker_flask_container: "audiomuse-ai-flask-app" + docker_worker_container: "audiomuse-ai-worker-instance" + docker_postgres_container: "audiomuse-postgres" + docker_redis_container: "audiomuse-redis" + # SSH for remote Docker access (leave empty for local) + ssh_host: "" + ssh_user: "" + ssh_key: "" + ssh_port: 22 + +# Instance B - Feature branch (under test) +instance_b: + name: "feature" + branch: "feature-branch" + api_url: "http://192.168.1.101:8000" + api_timeout: 120 + pg_host: "192.168.1.101" + pg_port: 5432 + pg_user: "audiomuse" + pg_password: "audiomusepassword" + pg_database: "audiomusedb" + redis_url: "redis://192.168.1.101:6379/0" + 
docker_flask_container: "audiomuse-ai-flask-app" + docker_worker_container: "audiomuse-ai-worker-instance" + docker_postgres_container: "audiomuse-postgres" + docker_redis_container: "audiomuse-redis" + ssh_host: "" + ssh_user: "" + ssh_key: "" + ssh_port: 22 + +# Test modules to run (true/false) +run_api_tests: true +run_db_tests: true +run_docker_tests: true +run_performance_tests: true +run_existing_unit_tests: true +run_existing_integration_tests: true + +# Performance test settings +perf_warmup_requests: 3 # Warmup requests per endpoint before measuring +perf_benchmark_requests: 10 # Measured requests per endpoint +perf_concurrent_users: 5 # Concurrent users for load tests + +# API test settings +api_retries: 3 # Retries on connection errors +api_retry_delay: 2.0 # Seconds between retries +api_task_timeout: 1200 # Timeout for long-running tasks (20 min) + +# Database quality thresholds +db_row_count_tolerance_pct: 5.0 # % difference allowed in row counts +db_embedding_dimension_expected: 200 +db_clap_dimension_expected: 512 +db_score_null_threshold_pct: 10.0 # Max % NULLs in critical columns + +# Reporting +output_dir: "testing_suite/reports/output" +report_format: "both" # html, json, or both +verbose: false + +# Test track references (used for functional API tests) +# These should be tracks that exist in both instances' music libraries +test_track_artist_1: "Red Hot Chili Peppers" +test_track_title_1: "By the Way" +test_track_artist_2: "System of a Down" +test_track_title_2: "Attack" diff --git a/testing_suite/config.py b/testing_suite/config.py new file mode 100644 index 00000000..1419c884 --- /dev/null +++ b/testing_suite/config.py @@ -0,0 +1,211 @@ +""" +Configuration for the AudioMuse-AI Testing & Comparison Suite. + +Defines connection parameters for two instances (Instance A / Instance B) +which typically correspond to main branch and feature branch deployments. + +Configuration can be provided via: + 1. 
Environment variables (INSTANCE_A_*, INSTANCE_B_*) + 2. A YAML config file (--config flag) + 3. CLI arguments +""" + +import os +import json +import logging +from dataclasses import dataclass, field, asdict +from typing import Optional + +logger = logging.getLogger(__name__) + + +@dataclass +class InstanceConfig: + """Connection configuration for a single AudioMuse-AI instance.""" + + # Identity + name: str = "instance" + branch: str = "unknown" + + # API connection + api_url: str = "http://localhost:8000" + api_timeout: int = 120 + + # PostgreSQL connection + pg_host: str = "localhost" + pg_port: int = 5432 + pg_user: str = "audiomuse" + pg_password: str = "audiomusepassword" + pg_database: str = "audiomusedb" + + # Redis connection + redis_url: str = "redis://localhost:6379/0" + + # Docker container names (for log collection) + docker_flask_container: str = "audiomuse-ai-flask-app" + docker_worker_container: str = "audiomuse-ai-worker-instance" + docker_postgres_container: str = "audiomuse-postgres" + docker_redis_container: str = "audiomuse-redis" + + # Docker compose file (optional, for status checks) + docker_compose_file: str = "" + + # SSH details if instances are remote + ssh_host: str = "" + ssh_user: str = "" + ssh_key: str = "" + ssh_port: int = 22 + + @property + def pg_dsn(self) -> str: + """Construct PostgreSQL DSN from components.""" + from urllib.parse import quote + user = quote(self.pg_user, safe='') + password = quote(self.pg_password, safe='') + return f"postgresql://{user}:{password}@{self.pg_host}:{self.pg_port}/{self.pg_database}" + + def to_dict(self) -> dict: + return asdict(self) + + +@dataclass +class ComparisonConfig: + """Top-level configuration for the comparison suite.""" + + # Instance configurations + instance_a: InstanceConfig = field(default_factory=lambda: InstanceConfig( + name="main", branch="main" + )) + instance_b: InstanceConfig = field(default_factory=lambda: InstanceConfig( + name="feature", branch="feature" + )) + + # 
Test control flags + run_api_tests: bool = True + run_db_tests: bool = True + run_docker_tests: bool = True + run_performance_tests: bool = True + run_existing_unit_tests: bool = True + run_existing_integration_tests: bool = True + + # Performance test settings + perf_warmup_requests: int = 3 + perf_benchmark_requests: int = 10 + perf_concurrent_users: int = 5 + + # API test settings + api_retries: int = 3 + api_retry_delay: float = 2.0 + api_task_timeout: int = 1200 # 20 minutes for long-running tasks + + # Database comparison thresholds + db_row_count_tolerance_pct: float = 5.0 # % difference allowed in row counts + db_embedding_dimension_expected: int = 200 + db_clap_dimension_expected: int = 512 + db_score_null_threshold_pct: float = 10.0 # Max % of NULL values in critical columns + + # Reporting + output_dir: str = "testing_suite/reports/output" + report_format: str = "html" # html, json, or both + verbose: bool = False + + # Test track references for functional tests + test_track_artist_1: str = "Red Hot Chili Peppers" + test_track_title_1: str = "By the Way" + test_track_artist_2: str = "System of a Down" + test_track_title_2: str = "Attack" + + def to_dict(self) -> dict: + return { + "instance_a": self.instance_a.to_dict(), + "instance_b": self.instance_b.to_dict(), + "run_api_tests": self.run_api_tests, + "run_db_tests": self.run_db_tests, + "run_docker_tests": self.run_docker_tests, + "run_performance_tests": self.run_performance_tests, + "run_existing_unit_tests": self.run_existing_unit_tests, + "run_existing_integration_tests": self.run_existing_integration_tests, + "perf_warmup_requests": self.perf_warmup_requests, + "perf_benchmark_requests": self.perf_benchmark_requests, + "perf_concurrent_users": self.perf_concurrent_users, + "output_dir": self.output_dir, + "report_format": self.report_format, + } + + +def load_config_from_yaml(path: str) -> ComparisonConfig: + """Load comparison config from a YAML file.""" + try: + import yaml + except 
ImportError: + raise ImportError("PyYAML is required for YAML config files: pip install pyyaml") + + with open(path, 'r') as f: + data = yaml.safe_load(f) + + config = ComparisonConfig() + + if 'instance_a' in data: + for k, v in data['instance_a'].items(): + if hasattr(config.instance_a, k): + setattr(config.instance_a, k, v) + + if 'instance_b' in data: + for k, v in data['instance_b'].items(): + if hasattr(config.instance_b, k): + setattr(config.instance_b, k, v) + + # Top-level settings + for k, v in data.items(): + if k not in ('instance_a', 'instance_b') and hasattr(config, k): + setattr(config, k, v) + + return config + + +def load_config_from_env() -> ComparisonConfig: + """Load comparison config from environment variables.""" + config = ComparisonConfig() + + # Instance A + a = config.instance_a + a.name = os.getenv("INSTANCE_A_NAME", a.name) + a.branch = os.getenv("INSTANCE_A_BRANCH", a.branch) + a.api_url = os.getenv("INSTANCE_A_API_URL", a.api_url) + a.pg_host = os.getenv("INSTANCE_A_PG_HOST", a.pg_host) + a.pg_port = int(os.getenv("INSTANCE_A_PG_PORT", str(a.pg_port))) + a.pg_user = os.getenv("INSTANCE_A_PG_USER", a.pg_user) + a.pg_password = os.getenv("INSTANCE_A_PG_PASSWORD", a.pg_password) + a.pg_database = os.getenv("INSTANCE_A_PG_DATABASE", a.pg_database) + a.redis_url = os.getenv("INSTANCE_A_REDIS_URL", a.redis_url) + a.docker_flask_container = os.getenv("INSTANCE_A_FLASK_CONTAINER", a.docker_flask_container) + a.docker_worker_container = os.getenv("INSTANCE_A_WORKER_CONTAINER", a.docker_worker_container) + a.docker_postgres_container = os.getenv("INSTANCE_A_PG_CONTAINER", a.docker_postgres_container) + a.ssh_host = os.getenv("INSTANCE_A_SSH_HOST", a.ssh_host) + a.ssh_user = os.getenv("INSTANCE_A_SSH_USER", a.ssh_user) + a.ssh_key = os.getenv("INSTANCE_A_SSH_KEY", a.ssh_key) + + # Instance B + b = config.instance_b + b.name = os.getenv("INSTANCE_B_NAME", b.name) + b.branch = os.getenv("INSTANCE_B_BRANCH", b.branch) + b.api_url = 
os.getenv("INSTANCE_B_API_URL", b.api_url) + b.pg_host = os.getenv("INSTANCE_B_PG_HOST", b.pg_host) + b.pg_port = int(os.getenv("INSTANCE_B_PG_PORT", str(b.pg_port))) + b.pg_user = os.getenv("INSTANCE_B_PG_USER", b.pg_user) + b.pg_password = os.getenv("INSTANCE_B_PG_PASSWORD", b.pg_password) + b.pg_database = os.getenv("INSTANCE_B_PG_DATABASE", b.pg_database) + b.redis_url = os.getenv("INSTANCE_B_REDIS_URL", b.redis_url) + b.docker_flask_container = os.getenv("INSTANCE_B_FLASK_CONTAINER", b.docker_flask_container) + b.docker_worker_container = os.getenv("INSTANCE_B_WORKER_CONTAINER", b.docker_worker_container) + b.docker_postgres_container = os.getenv("INSTANCE_B_PG_CONTAINER", b.docker_postgres_container) + b.ssh_host = os.getenv("INSTANCE_B_SSH_HOST", b.ssh_host) + b.ssh_user = os.getenv("INSTANCE_B_SSH_USER", b.ssh_user) + b.ssh_key = os.getenv("INSTANCE_B_SSH_KEY", b.ssh_key) + + # Global settings + config.verbose = os.getenv("COMPARISON_VERBOSE", "false").lower() == "true" + config.output_dir = os.getenv("COMPARISON_OUTPUT_DIR", config.output_dir) + config.report_format = os.getenv("COMPARISON_REPORT_FORMAT", config.report_format) + + return config diff --git a/testing_suite/orchestrator.py b/testing_suite/orchestrator.py new file mode 100644 index 00000000..7e6849f9 --- /dev/null +++ b/testing_suite/orchestrator.py @@ -0,0 +1,163 @@ +""" +Main Orchestrator for the AudioMuse-AI Testing & Comparison Suite. + +Coordinates all comparison modules and generates the final report. 
+""" + +import json +import logging +import os +import time +from datetime import datetime + +from testing_suite.config import ComparisonConfig +from testing_suite.utils import ComparisonReport +from testing_suite.comparators.api_comparator import APIComparator +from testing_suite.comparators.db_comparator import DatabaseComparator +from testing_suite.comparators.docker_comparator import DockerComparator +from testing_suite.comparators.performance_comparator import PerformanceComparator +from testing_suite.test_runner.existing_tests import ExistingTestRunner +from testing_suite.reports.html_report import generate_html_report + +logger = logging.getLogger(__name__) + + +class ComparisonOrchestrator: + """Orchestrates all comparison modules and produces the final report.""" + + def __init__(self, config: ComparisonConfig): + self.config = config + self.report = ComparisonReport( + instance_a_name=config.instance_a.name, + instance_b_name=config.instance_b.name, + instance_a_branch=config.instance_a.branch, + instance_b_branch=config.instance_b.branch, + config_snapshot=config.to_dict(), + ) + + def run(self) -> ComparisonReport: + """Run all configured comparison modules and return the report.""" + overall_start = time.time() + + logger.info("=" * 70) + logger.info("AudioMuse-AI Testing & Comparison Suite") + logger.info("=" * 70) + logger.info(f"Instance A: {self.config.instance_a.name} " + f"({self.config.instance_a.branch}) " + f"@ {self.config.instance_a.api_url}") + logger.info(f"Instance B: {self.config.instance_b.name} " + f"({self.config.instance_b.branch}) " + f"@ {self.config.instance_b.api_url}") + logger.info("-" * 70) + + # Run each module based on config flags + modules = [] + + if self.config.run_db_tests: + modules.append(("Database Comparison", DatabaseComparator(self.config))) + + if self.config.run_api_tests: + modules.append(("API Comparison", APIComparator(self.config))) + + if self.config.run_docker_tests: + modules.append(("Docker Comparison", 
DockerComparator(self.config))) + + if self.config.run_performance_tests: + modules.append(("Performance Benchmark", PerformanceComparator(self.config))) + + if self.config.run_existing_unit_tests or self.config.run_existing_integration_tests: + modules.append(("Existing Tests", ExistingTestRunner(self.config))) + + for name, module in modules: + logger.info(f"\n{'='*50}") + logger.info(f"Running: {name}") + logger.info(f"{'='*50}") + try: + module_start = time.time() + module.run_all(self.report) + module_duration = time.time() - module_start + logger.info(f"{name} completed in {module_duration:.1f}s") + except Exception as e: + logger.error(f"{name} failed with error: {e}", exc_info=True) + from testing_suite.utils import TestResult, TestStatus + self.report.add_result(TestResult( + category=name.lower().replace(" ", "_"), + name=f"{name}: Module Error", + status=TestStatus.ERROR, + message=f"Module failed: {str(e)}", + )) + + # Generate reports + self._generate_reports() + + overall_duration = time.time() - overall_start + logger.info(f"\n{'='*70}") + logger.info(f"Testing complete in {overall_duration:.1f}s") + logger.info(f"Overall status: {self.report.overall_status.value}") + logger.info(f"Total: {self.report.total_tests} tests, " + f"{self.report.total_passed} passed, " + f"{self.report.total_failed} failed, " + f"{self.report.total_errors} errors") + logger.info(f"{'='*70}") + + return self.report + + def _generate_reports(self): + """Generate output reports in configured formats.""" + os.makedirs(self.config.output_dir, exist_ok=True) + timestamp = datetime.utcnow().strftime("%Y%m%d_%H%M%S") + + # JSON report (always generated) + json_path = os.path.join(self.config.output_dir, f"comparison_{timestamp}.json") + with open(json_path, 'w') as f: + json.dump(self.report.to_dict(), f, indent=2, default=str) + logger.info(f"JSON report saved: {json_path}") + + # HTML report + if self.config.report_format in ("html", "both"): + html_path = 
os.path.join(self.config.output_dir, f"comparison_{timestamp}.html") + generate_html_report(self.report, html_path) + logger.info(f"HTML report saved: {html_path}") + + # Also save a latest symlink/copy + for ext in ["json", "html"]: + src = os.path.join(self.config.output_dir, f"comparison_{timestamp}.{ext}") + dst = os.path.join(self.config.output_dir, f"comparison_latest.{ext}") + if os.path.exists(src): + try: + if os.path.exists(dst) or os.path.islink(dst): + os.unlink(dst) + os.symlink(os.path.basename(src), dst) + except OSError: + # Symlinks may not work on all systems; copy instead + import shutil + shutil.copy2(src, dst) + + def print_summary(self): + """Print a concise summary to stdout.""" + print(f"\n{'='*60}") + print(f" COMPARISON REPORT SUMMARY") + print(f"{'='*60}") + print(f" Instance A: {self.report.instance_a_name} ({self.report.instance_a_branch})") + print(f" Instance B: {self.report.instance_b_name} ({self.report.instance_b_branch})") + print(f" Overall: {self.report.overall_status.value}") + print(f" Total: {self.report.total_tests} | " + f"Pass: {self.report.total_passed} | " + f"Fail: {self.report.total_failed} | " + f"Error: {self.report.total_errors}") + print(f"{'='*60}") + + for cat_name, cat in self.report.categories.items(): + indicator = "PASS" if cat.failed == 0 and cat.errors == 0 else "FAIL" + print(f" [{indicator:4s}] {cat_name:25s} " + f"P:{cat.passed:3d} F:{cat.failed:3d} " + f"W:{cat.warned:3d} S:{cat.skipped:3d} E:{cat.errors:3d}") + + # Show failed tests + for r in cat.results: + if r.status.value in ("FAIL", "ERROR"): + print(f" X {r.name}: {r.message[:80]}") + + print(f"{'='*60}") + print(f" Reports: {self.config.output_dir}/comparison_latest.*") + print(f"{'='*60}\n") diff --git a/testing_suite/reports/__init__.py b/testing_suite/reports/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/testing_suite/reports/html_report.py b/testing_suite/reports/html_report.py new file mode 100644 index 
00000000..527268df --- /dev/null +++ b/testing_suite/reports/html_report.py @@ -0,0 +1,359 @@ +""" +HTML Report Generator for AudioMuse-AI Testing Suite. + +Generates a comprehensive, self-contained HTML report with: + - Overall pass/fail summary with status badges + - Per-category breakdowns with expandable details + - Color-coded results (green/red/yellow/gray) + - Performance charts (latency comparisons) + - Filterable and sortable tables + - Instance A vs B side-by-side comparisons +""" + +import json +import os +from datetime import datetime +from typing import Dict + +from testing_suite.utils import ComparisonReport, TestStatus + + +def generate_html_report(report: ComparisonReport, output_path: str) -> str: + """Generate a self-contained HTML report and write it to output_path.""" + os.makedirs(os.path.dirname(output_path) or ".", exist_ok=True) + + report_dict = report.to_dict() + categories = report_dict.get("categories", {}) + + # Build category HTML sections + category_sections = "" + for cat_name, cat_data in categories.items(): + category_sections += _build_category_section(cat_name, cat_data) + + # Build performance chart data (if performance category exists) + perf_chart_data = _build_performance_chart_data(categories.get("performance", {})) + + html = f""" + + + + +AudioMuse-AI Comparison Report + + + +
    +
    +

    AudioMuse-AI Comparison Report

    +
    + Generated: {report.timestamp} UTC
    + Instance A: {report.instance_a_name} (branch: {report.instance_a_branch})
    + Instance B: {report.instance_b_name} (branch: {report.instance_b_branch}) +
    +
    + +
    +
    +
    {report.overall_status.value}
    +
    Overall Status
    +
    +
    +
    {report.total_tests}
    +
    Total Tests
    +
    +
    +
    {report.total_passed}
    +
    Passed
    +
    +
    +
    {report.total_failed}
    +
    Failed
    +
    +
    +
    {report.total_errors}
    +
    Errors
    +
    +
    +
    {sum(c.warned for c in report.categories.values())}
    +
    Warnings
    +
    +
    + + {category_sections} + + {_build_perf_visual(perf_chart_data) if perf_chart_data else ""} + +
    + +
    + AudioMuse-AI Testing & Comparison Suite v1.0.0 +
    + + + +""" + + with open(output_path, 'w') as f: + f.write(html) + + return output_path + + +def _status_class(status) -> str: + """Get CSS class for a status value.""" + if isinstance(status, TestStatus): + status = status.value + return f"status-{status.lower()}" + + +def _badge_html(status) -> str: + """Generate a badge HTML element for a status.""" + if isinstance(status, TestStatus): + status = status.value + return f'{status}' + + +def _build_category_section(cat_name: str, cat_data: dict) -> str: + """Build HTML section for a test category.""" + total = cat_data.get("total", 0) + passed = cat_data.get("passed", 0) + failed = cat_data.get("failed", 0) + warned = cat_data.get("warned", 0) + skipped = cat_data.get("skipped", 0) + errors = cat_data.get("errors", 0) + results = cat_data.get("results", []) + + # Category display name + display_names = { + "api": "API Endpoints", + "database": "Database Quality", + "docker": "Docker & Infrastructure", + "performance": "Performance Benchmarks", + "existing_tests": "Existing Test Suite", + } + display_name = display_names.get(cat_name, cat_name.replace("_", " ").title()) + + # Build table rows + rows = "" + for r in results: + status = r.get("status", "SKIP") + duration = r.get("duration_seconds", 0) + duration_str = f"{duration:.2f}s" if duration else "-" + + # Format values for display + val_a = r.get("instance_a_value", "") + val_b = r.get("instance_b_value", "") + if isinstance(val_a, (dict, list)): + val_a = json.dumps(val_a, indent=1, default=str)[:200] + if isinstance(val_b, (dict, list)): + val_b = json.dumps(val_b, indent=1, default=str)[:200] + + rows += f""" + + {_badge_html(status)} + {r.get('name', '')} + {_escape_html(r.get('message', ''))} + {_escape_html(str(val_a)[:150])} + {_escape_html(str(val_b)[:150])} + {duration_str} + """ + + return f""" +
    +
    +
    + + {display_name} +
    +
    + {passed} passed + {failed} failed + {warned} warn + {skipped} skip + {errors} err + ({total} total) +
    +
    +
    +
    + Filter: + + + + + + +
    + + + + + + + + + + + + + {rows} + +
    StatusTest NameMessageInstance AInstance BDuration
    +
    +
    """ + + +def _build_performance_chart_data(perf_category: dict) -> list: + """Extract performance comparison data for visualization.""" + if not perf_category: + return [] + + chart_data = [] + for result in perf_category.get("results", []): + name = result.get("name", "") + if not name.startswith("Latency:"): + continue + + val_a = result.get("instance_a_value", {}) + val_b = result.get("instance_b_value", {}) + + if isinstance(val_a, dict) and isinstance(val_b, dict): + mean_a = val_a.get("mean", 0) + mean_b = val_b.get("mean", 0) + if mean_a > 0 or mean_b > 0: + chart_data.append({ + "name": name.replace("Latency: ", ""), + "mean_a": mean_a, + "mean_b": mean_b, + "p95_a": val_a.get("p95", 0), + "p95_b": val_b.get("p95", 0), + }) + + return chart_data + + +def _build_perf_visual(chart_data: list) -> str: + """Build a visual performance comparison section.""" + if not chart_data: + return "" + + max_val = max( + max(d["mean_a"], d["mean_b"], d["p95_a"], d["p95_b"]) + for d in chart_data + ) or 1 + + bars = "" + for d in chart_data: + width_a = max(2, int(d["mean_a"] / max_val * 400)) + width_b = max(2, int(d["mean_b"] / max_val * 400)) + + bars += f""" +
    +
    {d['name']}
    +
    +
    A
    +
    + {d['mean_a']*1000:.1f}ms +
    +
    +
    B
    +
    + {d['mean_b']*1000:.1f}ms +
    +
    """ + + return f""" +

    Performance Visual Comparison (Mean Latency)

    +
    + Instance A + Instance B +
    +
    + {bars} +
    """ + + +def _escape_html(text: str) -> str: + """Escape HTML special characters.""" + return (str(text) + .replace("&", "&") + .replace("<", "<") + .replace(">", ">") + .replace('"', """) + .replace("'", "'")) diff --git a/testing_suite/requirements.txt b/testing_suite/requirements.txt new file mode 100644 index 00000000..ecec1016 --- /dev/null +++ b/testing_suite/requirements.txt @@ -0,0 +1,7 @@ +# Requirements for the AudioMuse-AI Testing & Comparison Suite +requests>=2.28.0 +psycopg2-binary>=2.9.0 +pyyaml>=6.0 +pytest>=7.0.0 +pytest-json-report>=1.5.0 +pytest-timeout>=2.1.0 diff --git a/testing_suite/run_comparison.py b/testing_suite/run_comparison.py new file mode 100644 index 00000000..b07ea7ce --- /dev/null +++ b/testing_suite/run_comparison.py @@ -0,0 +1,325 @@ +#!/usr/bin/env python3 +""" +AudioMuse-AI Testing & Comparison Suite - CLI Entry Point + +Comprehensive tool to test all features, database quality, API results, +and performance between two AudioMuse-AI instances (e.g., main branch vs feature branch). 
+ +Usage: + # Quick comparison with two API URLs (minimal config): + python -m testing_suite.run_comparison \ + --url-a http://main-instance:8000 \ + --url-b http://feature-instance:8000 + + # Full comparison with database and Docker access: + python -m testing_suite.run_comparison \ + --url-a http://main:8000 --url-b http://feature:8000 \ + --pg-host-a main-db-host --pg-host-b feature-db-host \ + --flask-container-a audiomuse-main-flask --flask-container-b audiomuse-feature-flask + + # From YAML config file: + python -m testing_suite.run_comparison --config comparison_config.yaml + + # Only run specific test categories: + python -m testing_suite.run_comparison \ + --url-a http://main:8000 --url-b http://feature:8000 \ + --only api,performance + + # Skip slow tests: + python -m testing_suite.run_comparison \ + --url-a http://main:8000 --url-b http://feature:8000 \ + --skip docker,existing_tests + + # Discover available tests: + python -m testing_suite.run_comparison --discover + + # Verbose output: + python -m testing_suite.run_comparison \ + --url-a http://main:8000 --url-b http://feature:8000 -v +""" + +import argparse +import logging +import sys +import os + +# Add project root to path +sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__)))) + +from testing_suite.config import ( + ComparisonConfig, InstanceConfig, + load_config_from_yaml, load_config_from_env, +) +from testing_suite.orchestrator import ComparisonOrchestrator +from testing_suite.test_runner.existing_tests import ExistingTestRunner + + +def build_parser() -> argparse.ArgumentParser: + parser = argparse.ArgumentParser( + description="AudioMuse-AI Testing & Comparison Suite", + formatter_class=argparse.RawDescriptionHelpFormatter, + epilog=__doc__, + ) + + # Config source + parser.add_argument("--config", "-c", type=str, default="", + help="Path to YAML config file") + + # Discovery mode + parser.add_argument("--discover", action="store_true", + help="Discover and list all 
available tests, then exit") + + # Instance A + grp_a = parser.add_argument_group("Instance A (main/baseline)") + grp_a.add_argument("--url-a", type=str, default="", + help="API URL for instance A (e.g., http://localhost:8000)") + grp_a.add_argument("--name-a", type=str, default="main", + help="Name for instance A (default: main)") + grp_a.add_argument("--branch-a", type=str, default="main", + help="Branch name for instance A") + grp_a.add_argument("--pg-host-a", type=str, default="", + help="PostgreSQL host for instance A") + grp_a.add_argument("--pg-port-a", type=int, default=5432, + help="PostgreSQL port for instance A") + grp_a.add_argument("--pg-user-a", type=str, default="audiomuse", + help="PostgreSQL user for instance A") + grp_a.add_argument("--pg-pass-a", type=str, default="audiomusepassword", + help="PostgreSQL password for instance A") + grp_a.add_argument("--pg-db-a", type=str, default="audiomusedb", + help="PostgreSQL database for instance A") + grp_a.add_argument("--redis-a", type=str, default="", + help="Redis URL for instance A") + grp_a.add_argument("--flask-container-a", type=str, default="audiomuse-ai-flask-app", + help="Docker flask container name for A") + grp_a.add_argument("--worker-container-a", type=str, default="audiomuse-ai-worker-instance", + help="Docker worker container name for A") + grp_a.add_argument("--ssh-host-a", type=str, default="", + help="SSH host for remote Docker access (instance A)") + grp_a.add_argument("--ssh-user-a", type=str, default="", + help="SSH user for remote Docker access (instance A)") + grp_a.add_argument("--ssh-key-a", type=str, default="", + help="SSH key file for remote Docker access (instance A)") + + # Instance B + grp_b = parser.add_argument_group("Instance B (feature/test)") + grp_b.add_argument("--url-b", type=str, default="", + help="API URL for instance B (e.g., http://localhost:8001)") + grp_b.add_argument("--name-b", type=str, default="feature", + help="Name for instance B (default: feature)") + 
grp_b.add_argument("--branch-b", type=str, default="feature", + help="Branch name for instance B") + grp_b.add_argument("--pg-host-b", type=str, default="", + help="PostgreSQL host for instance B") + grp_b.add_argument("--pg-port-b", type=int, default=5432, + help="PostgreSQL port for instance B") + grp_b.add_argument("--pg-user-b", type=str, default="audiomuse", + help="PostgreSQL user for instance B") + grp_b.add_argument("--pg-pass-b", type=str, default="audiomusepassword", + help="PostgreSQL password for instance B") + grp_b.add_argument("--pg-db-b", type=str, default="audiomusedb", + help="PostgreSQL database for instance B") + grp_b.add_argument("--redis-b", type=str, default="", + help="Redis URL for instance B") + grp_b.add_argument("--flask-container-b", type=str, default="audiomuse-ai-flask-app", + help="Docker flask container name for B") + grp_b.add_argument("--worker-container-b", type=str, default="audiomuse-ai-worker-instance", + help="Docker worker container name for B") + grp_b.add_argument("--ssh-host-b", type=str, default="", + help="SSH host for remote Docker access (instance B)") + grp_b.add_argument("--ssh-user-b", type=str, default="", + help="SSH user for remote Docker access (instance B)") + grp_b.add_argument("--ssh-key-b", type=str, default="", + help="SSH key file for remote Docker access (instance B)") + + # Test selection + grp_t = parser.add_argument_group("Test Selection") + grp_t.add_argument("--only", type=str, default="", + help="Only run these categories (comma-separated: api,db,docker,performance,existing_tests)") + grp_t.add_argument("--skip", type=str, default="", + help="Skip these categories (comma-separated)") + + # Performance settings + grp_p = parser.add_argument_group("Performance Settings") + grp_p.add_argument("--warmup", type=int, default=3, + help="Warmup requests before benchmarking (default: 3)") + grp_p.add_argument("--bench-requests", type=int, default=10, + help="Benchmark requests per endpoint (default: 10)") 
+ grp_p.add_argument("--concurrent", type=int, default=5, + help="Concurrent users for load test (default: 5)") + + # Output + grp_o = parser.add_argument_group("Output") + grp_o.add_argument("--output-dir", "-o", type=str, default="testing_suite/reports/output", + help="Output directory for reports") + grp_o.add_argument("--format", type=str, default="both", choices=["html", "json", "both"], + help="Report format (default: both)") + grp_o.add_argument("-v", "--verbose", action="store_true", + help="Verbose output") + + return parser + + +def build_config(args) -> ComparisonConfig: + """Build ComparisonConfig from CLI arguments.""" + # Start with YAML file or env if specified + if args.config: + config = load_config_from_yaml(args.config) + else: + config = load_config_from_env() + + # CLI overrides + a = config.instance_a + b = config.instance_b + + if args.url_a: + a.api_url = args.url_a + if args.name_a: + a.name = args.name_a + if args.branch_a: + a.branch = args.branch_a + if args.pg_host_a: + a.pg_host = args.pg_host_a + a.pg_port = args.pg_port_a + if args.pg_user_a: + a.pg_user = args.pg_user_a + if args.pg_pass_a: + a.pg_password = args.pg_pass_a + if args.pg_db_a: + a.pg_database = args.pg_db_a + if args.redis_a: + a.redis_url = args.redis_a + if args.flask_container_a: + a.docker_flask_container = args.flask_container_a + if args.worker_container_a: + a.docker_worker_container = args.worker_container_a + if args.ssh_host_a: + a.ssh_host = args.ssh_host_a + if args.ssh_user_a: + a.ssh_user = args.ssh_user_a + if args.ssh_key_a: + a.ssh_key = args.ssh_key_a + + if args.url_b: + b.api_url = args.url_b + if args.name_b: + b.name = args.name_b + if args.branch_b: + b.branch = args.branch_b + if args.pg_host_b: + b.pg_host = args.pg_host_b + b.pg_port = args.pg_port_b + if args.pg_user_b: + b.pg_user = args.pg_user_b + if args.pg_pass_b: + b.pg_password = args.pg_pass_b + if args.pg_db_b: + b.pg_database = args.pg_db_b + if args.redis_b: + b.redis_url = 
args.redis_b + if args.flask_container_b: + b.docker_flask_container = args.flask_container_b + if args.worker_container_b: + b.docker_worker_container = args.worker_container_b + if args.ssh_host_b: + b.ssh_host = args.ssh_host_b + if args.ssh_user_b: + b.ssh_user = args.ssh_user_b + if args.ssh_key_b: + b.ssh_key = args.ssh_key_b + + # Performance settings + config.perf_warmup_requests = args.warmup + config.perf_benchmark_requests = args.bench_requests + config.perf_concurrent_users = args.concurrent + + # Output settings + config.output_dir = args.output_dir + config.report_format = args.format + config.verbose = args.verbose + + # Test selection + if args.only: + categories = set(args.only.split(",")) + config.run_api_tests = "api" in categories + config.run_db_tests = "db" in categories or "database" in categories + config.run_docker_tests = "docker" in categories + config.run_performance_tests = "performance" in categories or "perf" in categories + config.run_existing_unit_tests = "existing_tests" in categories or "unit" in categories + config.run_existing_integration_tests = "existing_tests" in categories or "integration" in categories + + if args.skip: + skip = set(args.skip.split(",")) + if "api" in skip: + config.run_api_tests = False + if "db" in skip or "database" in skip: + config.run_db_tests = False + if "docker" in skip: + config.run_docker_tests = False + if "performance" in skip or "perf" in skip: + config.run_performance_tests = False + if "existing_tests" in skip or "unit" in skip: + config.run_existing_unit_tests = False + if "existing_tests" in skip or "integration" in skip: + config.run_existing_integration_tests = False + + return config + + +def main(): + parser = build_parser() + args = parser.parse_args() + + # Setup logging + level = logging.DEBUG if args.verbose else logging.INFO + logging.basicConfig( + level=level, + format="%(asctime)s [%(levelname)s] %(name)s: %(message)s", + datefmt="%H:%M:%S", + ) + + # Discovery mode + if 
args.discover: + discovery = ExistingTestRunner.discover_tests() + print("\n=== AudioMuse-AI Test Discovery ===\n") + + print(f"Unit Tests ({len(discovery['unit_tests'])} files):") + for t in discovery["unit_tests"]: + status = "OK" if t["exists"] else "MISSING" + print(f" [{status}] {t['file']}") + + print(f"\nIntegration Tests ({len(discovery['integration_tests'])} files):") + for t in discovery["integration_tests"]: + status = "OK" if t["exists"] else "MISSING" + print(f" [{status}] {t['file']}") + + print(f"\nE2E API Tests ({len(discovery['e2e_tests'])} tests):") + for t in discovery["e2e_tests"]: + print(f" [OK] {t['name']} ({t['file']})") + + total = (len(discovery["unit_tests"]) + + len(discovery["integration_tests"]) + + len(discovery["e2e_tests"])) + print(f"\nTotal: {total} test files/entries discovered.\n") + return 0 + + # Validate minimum config + config = build_config(args) + + if not config.instance_a.api_url or not config.instance_b.api_url: + if not args.config: + parser.error("At least --url-a and --url-b are required " + "(or use --config for YAML config)") + + # Run comparison + orchestrator = ComparisonOrchestrator(config) + report = orchestrator.run() + orchestrator.print_summary() + + # Exit code based on results + if report.total_failed > 0 or report.total_errors > 0: + return 1 + return 0 + + +if __name__ == "__main__": + sys.exit(main()) diff --git a/testing_suite/test_runner/__init__.py b/testing_suite/test_runner/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/testing_suite/test_runner/existing_tests.py b/testing_suite/test_runner/existing_tests.py new file mode 100644 index 00000000..c8a388fd --- /dev/null +++ b/testing_suite/test_runner/existing_tests.py @@ -0,0 +1,469 @@ +""" +Existing Test Integration Module for AudioMuse-AI Testing Suite. + +Discovers and runs existing unit and integration tests from the codebase +against both instances, collecting and comparing results. 
+ +Integrates: + - tests/unit/ (17 unit test modules via pytest) + - test/test.py (E2E API integration tests) + - test/test_analysis_integration.py (ONNX model integration) + - test/test_clap_analysis_integration.py (CLAP model integration) +""" + +import json +import logging +import os +import subprocess +import time +from pathlib import Path +from typing import Any, Dict, List, Optional, Tuple + +from testing_suite.config import ComparisonConfig, InstanceConfig +from testing_suite.utils import ( + ComparisonReport, TestResult, TestStatus, pct_diff +) + +logger = logging.getLogger(__name__) + +PROJECT_ROOT = Path(__file__).resolve().parents[2] + +# Known unit test files +UNIT_TEST_DIR = PROJECT_ROOT / "tests" / "unit" +UNIT_TEST_FILES = [ + "test_ai.py", + "test_analysis.py", + "test_app_analysis.py", + "test_artist_gmm_manager.py", + "test_clap_text_search.py", + "test_clustering.py", + "test_clustering_helper.py", + "test_clustering_postprocessing.py", + "test_commons.py", + "test_mediaserver.py", + "test_memory_cleanup.py", + "test_memory_utils.py", + "test_path_manager.py", + "test_song_alchemy.py", + "test_sonic_fingerprint_manager.py", + "test_string_sanitization.py", + "test_voyager_manager.py", +] + +# Integration test files +INTEGRATION_TEST_DIR = PROJECT_ROOT / "test" +INTEGRATION_TEST_FILES = [ + "test_analysis_integration.py", + "test_clap_analysis_integration.py", +] + +# E2E API test (requires a running instance) +E2E_TEST_FILE = PROJECT_ROOT / "test" / "test.py" + +# Individual E2E test names (from test/test.py) +E2E_TEST_NAMES = [ + "test_analysis_smoke_flow", + "test_instant_playlist_functionality", + "test_sonic_fingerprint_and_playlist", + "test_song_alchemy_and_playlist", + "test_map_visualization", + "test_annoy_similarity_and_playlist", + "test_song_path_and_playlist", + "test_clustering_smoke_flow", +] + + +def _parse_pytest_json(json_path: str) -> dict: + """Parse pytest JSON report.""" + try: + with open(json_path, 'r') as f: + return 
json.load(f) + except Exception as e: + logger.warning(f"Could not parse pytest JSON report: {e}") + return {} + + +def _run_pytest(test_path: str, extra_args: list = None, + env_override: dict = None, timeout: int = 600, + json_report: bool = True) -> Tuple[dict, str, int]: + """ + Run pytest and capture results. + Returns (parsed_json_result, stdout, returncode). + """ + cmd = ["python", "-m", "pytest", "-v", "--tb=short"] + + json_path = None + if json_report: + json_path = f"/tmp/pytest_report_{int(time.time() * 1000)}.json" + cmd += [f"--json-report", f"--json-report-file={json_path}"] + + cmd.append(str(test_path)) + + if extra_args: + cmd.extend(extra_args) + + env = os.environ.copy() + if env_override: + env.update(env_override) + + # Ensure project root is in PYTHONPATH + python_path = env.get("PYTHONPATH", "") + env["PYTHONPATH"] = f"{PROJECT_ROOT}:{python_path}" if python_path else str(PROJECT_ROOT) + + try: + proc = subprocess.run( + cmd, capture_output=True, text=True, timeout=timeout, + cwd=str(PROJECT_ROOT), env=env, + ) + stdout = proc.stdout + proc.stderr + returncode = proc.returncode + + # Parse JSON report if available + result = {} + if json_path and os.path.exists(json_path): + result = _parse_pytest_json(json_path) + os.unlink(json_path) + + return result, stdout, returncode + + except subprocess.TimeoutExpired: + return {}, f"pytest timed out after {timeout}s", -1 + except Exception as e: + return {}, str(e), -2 + + +def _parse_stdout_results(stdout: str) -> dict: + """ + Parse pytest stdout for test results when JSON report is not available. + Returns dict with passed, failed, error, skipped counts and test names. 
+ """ + import re + + results = { + "passed": 0, + "failed": 0, + "errors": 0, + "skipped": 0, + "tests": [], + } + + # Parse individual test results: PASSED, FAILED, ERROR, SKIPPED + for line in stdout.split('\n'): + line = line.strip() + if " PASSED" in line: + results["passed"] += 1 + results["tests"].append({"name": line.split(" PASSED")[0].strip(), "status": "passed"}) + elif " FAILED" in line: + results["failed"] += 1 + results["tests"].append({"name": line.split(" FAILED")[0].strip(), "status": "failed"}) + elif " ERROR" in line: + results["errors"] += 1 + results["tests"].append({"name": line.split(" ERROR")[0].strip(), "status": "error"}) + elif " SKIPPED" in line: + results["skipped"] += 1 + results["tests"].append({"name": line.split(" SKIPPED")[0].strip(), "status": "skipped"}) + + # Try to parse summary line like "5 passed, 1 failed, 2 skipped" + summary_match = re.search( + r'(\d+)\s+passed.*?(?:(\d+)\s+failed)?.*?(?:(\d+)\s+skipped)?.*?(?:(\d+)\s+error)?', + stdout + ) + if summary_match: + if summary_match.group(1): + results["passed"] = max(results["passed"], int(summary_match.group(1))) + if summary_match.group(2): + results["failed"] = max(results["failed"], int(summary_match.group(2))) + if summary_match.group(3): + results["skipped"] = max(results["skipped"], int(summary_match.group(3))) + if summary_match.group(4): + results["errors"] = max(results["errors"], int(summary_match.group(4))) + + return results + + +class ExistingTestRunner: + """Runs existing tests and integrates results into the comparison report.""" + + def __init__(self, config: ComparisonConfig): + self.config = config + + def run_all(self, report: ComparisonReport): + """Run all existing test suites.""" + logger.info("Starting existing test integration...") + + if self.config.run_existing_unit_tests: + self._run_unit_tests(report) + + if self.config.run_existing_integration_tests: + self._run_integration_tests(report) + self._run_e2e_tests(report) + + logger.info("Existing 
test integration complete.") + + # ------------------------------------------------------------------ + # Unit tests + # ------------------------------------------------------------------ + + def _run_unit_tests(self, report: ComparisonReport): + """Run unit tests from tests/unit/ directory.""" + t0 = time.time() + + if not UNIT_TEST_DIR.exists(): + report.add_result(TestResult( + category="existing_tests", + name="Unit Tests: directory check", + status=TestStatus.ERROR, + message=f"Unit test directory not found: {UNIT_TEST_DIR}", + duration_seconds=time.time() - t0, + )) + return + + # Run entire unit test suite + logger.info("Running unit test suite...") + result, stdout, rc = _run_pytest( + str(UNIT_TEST_DIR), + extra_args=["-x", "--timeout=120"], + timeout=600, + json_report=True, + ) + + # Parse results + if result and "summary" in result: + summary = result["summary"] + passed = summary.get("passed", 0) + failed = summary.get("failed", 0) + errors = summary.get("error", 0) + skipped = summary.get("skipped", 0) + total = summary.get("total", passed + failed + errors + skipped) + else: + # Fallback to stdout parsing + parsed = _parse_stdout_results(stdout) + passed = parsed["passed"] + failed = parsed["failed"] + errors = parsed["errors"] + skipped = parsed["skipped"] + total = passed + failed + errors + skipped + + if failed == 0 and errors == 0: + status = TestStatus.PASS + elif errors > 0: + status = TestStatus.ERROR + else: + status = TestStatus.FAIL + + report.add_result(TestResult( + category="existing_tests", + name="Unit Tests: overall", + status=status, + message=( + f"Total={total}, Passed={passed}, Failed={failed}, " + f"Errors={errors}, Skipped={skipped} | " + f"Return code: {rc}" + ), + instance_a_value={ + "total": total, "passed": passed, "failed": failed, + "errors": errors, "skipped": skipped, + }, + duration_seconds=time.time() - t0, + details={"returncode": rc, "stdout_tail": stdout[-2000:] if stdout else ""}, + )) + + # Report individual 
test file results + for test_file in UNIT_TEST_FILES: + test_path = UNIT_TEST_DIR / test_file + if not test_path.exists(): + report.add_result(TestResult( + category="existing_tests", + name=f"Unit: {test_file}", + status=TestStatus.SKIP, + message=f"File not found: {test_path}", + )) + continue + + tf0 = time.time() + file_result, file_stdout, file_rc = _run_pytest( + str(test_path), + extra_args=["--timeout=60"], + timeout=120, + json_report=False, + ) + + parsed = _parse_stdout_results(file_stdout) + + if file_rc == 0: + file_status = TestStatus.PASS + elif file_rc == 1: + file_status = TestStatus.FAIL + elif file_rc == 5: + file_status = TestStatus.SKIP # No tests collected + else: + file_status = TestStatus.ERROR + + report.add_result(TestResult( + category="existing_tests", + name=f"Unit: {test_file}", + status=file_status, + message=( + f"Passed={parsed['passed']}, Failed={parsed['failed']}, " + f"Errors={parsed['errors']}, Skipped={parsed['skipped']}" + ), + instance_a_value=parsed, + duration_seconds=time.time() - tf0, + details={"returncode": file_rc}, + )) + + # ------------------------------------------------------------------ + # Integration tests + # ------------------------------------------------------------------ + + def _run_integration_tests(self, report: ComparisonReport): + """Run integration tests from test/ directory.""" + for test_file in INTEGRATION_TEST_FILES: + test_path = INTEGRATION_TEST_DIR / test_file + if not test_path.exists(): + report.add_result(TestResult( + category="existing_tests", + name=f"Integration: {test_file}", + status=TestStatus.SKIP, + message=f"File not found: {test_path}", + )) + continue + + t0 = time.time() + result, stdout, rc = _run_pytest( + str(test_path), + extra_args=["-m", "integration", "--timeout=300"], + timeout=600, + json_report=False, + ) + + parsed = _parse_stdout_results(stdout) + + if rc == 0: + status = TestStatus.PASS + elif rc == 5: + status = TestStatus.SKIP + elif rc == 1: + status = 
TestStatus.FAIL + else: + status = TestStatus.ERROR + + report.add_result(TestResult( + category="existing_tests", + name=f"Integration: {test_file}", + status=status, + message=( + f"Passed={parsed['passed']}, Failed={parsed['failed']}, " + f"Errors={parsed['errors']}, Skipped={parsed['skipped']}" + ), + instance_a_value=parsed, + duration_seconds=time.time() - t0, + details={"returncode": rc, "stdout_tail": stdout[-1000:] if stdout else ""}, + )) + + # ------------------------------------------------------------------ + # E2E API tests (against both instances) + # ------------------------------------------------------------------ + + def _run_e2e_tests(self, report: ComparisonReport): + """Run E2E API tests from test/test.py against both instances.""" + if not E2E_TEST_FILE.exists(): + report.add_result(TestResult( + category="existing_tests", + name="E2E Tests: file check", + status=TestStatus.SKIP, + message=f"E2E test file not found: {E2E_TEST_FILE}", + )) + return + + instances = [] + if self.config.instance_a.api_url: + instances.append(("A", self.config.instance_a)) + if self.config.instance_b.api_url: + instances.append(("B", self.config.instance_b)) + + for label, instance in instances: + # Run non-destructive E2E tests (skip analysis and clustering which modify state) + safe_tests = [ + "test_map_visualization", + "test_annoy_similarity_and_playlist", + ] + + for test_name in safe_tests: + t0 = time.time() + result, stdout, rc = _run_pytest( + str(E2E_TEST_FILE), + extra_args=["-k", test_name, "--timeout=300"], + env_override={"BASE_URL": instance.api_url}, + timeout=600, + json_report=False, + ) + + parsed = _parse_stdout_results(stdout) + + if rc == 0: + status = TestStatus.PASS + elif rc == 5: + status = TestStatus.SKIP + elif rc == 1: + status = TestStatus.FAIL + else: + status = TestStatus.ERROR + + report.add_result(TestResult( + category="existing_tests", + name=f"E2E ({label}): {test_name}", + status=status, + message=( + f"Instance {label} 
({instance.api_url}): " + f"Passed={parsed['passed']}, Failed={parsed['failed']}" + ), + instance_a_value=parsed if label == "A" else None, + instance_b_value=parsed if label == "B" else None, + duration_seconds=time.time() - t0, + details={"returncode": rc, "instance": label, + "api_url": instance.api_url, + "stdout_tail": stdout[-500:] if stdout else ""}, + )) + + # ------------------------------------------------------------------ + # Discovery: list all available tests + # ------------------------------------------------------------------ + + @staticmethod + def discover_tests() -> dict: + """Discover all available tests and return a structured summary.""" + discovery = { + "unit_tests": [], + "integration_tests": [], + "e2e_tests": [], + } + + # Unit tests + if UNIT_TEST_DIR.exists(): + for f in sorted(UNIT_TEST_DIR.glob("test_*.py")): + discovery["unit_tests"].append({ + "file": str(f.relative_to(PROJECT_ROOT)), + "name": f.stem, + "exists": True, + }) + + # Integration tests + for f in INTEGRATION_TEST_FILES: + path = INTEGRATION_TEST_DIR / f + discovery["integration_tests"].append({ + "file": str(path.relative_to(PROJECT_ROOT)), + "name": Path(f).stem, + "exists": path.exists(), + }) + + # E2E tests + if E2E_TEST_FILE.exists(): + for name in E2E_TEST_NAMES: + discovery["e2e_tests"].append({ + "file": str(E2E_TEST_FILE.relative_to(PROJECT_ROOT)), + "name": name, + "exists": True, + }) + + return discovery diff --git a/testing_suite/utils.py b/testing_suite/utils.py new file mode 100644 index 00000000..e296f471 --- /dev/null +++ b/testing_suite/utils.py @@ -0,0 +1,434 @@ +""" +Shared utilities for the AudioMuse-AI Testing & Comparison Suite. + +Provides HTTP helpers, database connectors, Docker log fetchers, +timing utilities, and result aggregation primitives. 
+""" + +import json +import logging +import subprocess +import time +from dataclasses import dataclass, field, asdict +from datetime import datetime +from enum import Enum +from typing import Any, Dict, List, Optional, Tuple + +import requests + +logger = logging.getLogger(__name__) + + +# --------------------------------------------------------------------------- +# Result types +# --------------------------------------------------------------------------- + +class TestStatus(str, Enum): + PASS = "PASS" + FAIL = "FAIL" + WARN = "WARN" + SKIP = "SKIP" + ERROR = "ERROR" + + +@dataclass +class TestResult: + """A single test result entry.""" + category: str # e.g. "api", "database", "docker", "performance" + name: str # descriptive test name + status: TestStatus + message: str = "" + instance_a_value: Any = None + instance_b_value: Any = None + diff: Any = None # computed difference + duration_seconds: float = 0.0 + details: Dict[str, Any] = field(default_factory=dict) + + def to_dict(self) -> dict: + d = asdict(self) + d['status'] = self.status.value + # Ensure JSON-serializable + for k in ('instance_a_value', 'instance_b_value', 'diff', 'details'): + try: + json.dumps(d[k]) + except (TypeError, ValueError): + d[k] = str(d[k]) + return d + + +@dataclass +class CategorySummary: + """Summary for a test category.""" + category: str + total: int = 0 + passed: int = 0 + failed: int = 0 + warned: int = 0 + skipped: int = 0 + errors: int = 0 + results: List[TestResult] = field(default_factory=list) + + def add(self, result: TestResult): + self.results.append(result) + self.total += 1 + if result.status == TestStatus.PASS: + self.passed += 1 + elif result.status == TestStatus.FAIL: + self.failed += 1 + elif result.status == TestStatus.WARN: + self.warned += 1 + elif result.status == TestStatus.SKIP: + self.skipped += 1 + elif result.status == TestStatus.ERROR: + self.errors += 1 + + +@dataclass +class ComparisonReport: + """Full comparison report across all categories.""" + 
timestamp: str = field(default_factory=lambda: datetime.utcnow().isoformat()) + instance_a_name: str = "" + instance_b_name: str = "" + instance_a_branch: str = "" + instance_b_branch: str = "" + categories: Dict[str, CategorySummary] = field(default_factory=dict) + config_snapshot: Dict[str, Any] = field(default_factory=dict) + + def add_result(self, result: TestResult): + cat = result.category + if cat not in self.categories: + self.categories[cat] = CategorySummary(category=cat) + self.categories[cat].add(result) + + @property + def total_tests(self) -> int: + return sum(c.total for c in self.categories.values()) + + @property + def total_passed(self) -> int: + return sum(c.passed for c in self.categories.values()) + + @property + def total_failed(self) -> int: + return sum(c.failed for c in self.categories.values()) + + @property + def total_errors(self) -> int: + return sum(c.errors for c in self.categories.values()) + + @property + def overall_status(self) -> TestStatus: + if self.total_failed > 0 or self.total_errors > 0: + return TestStatus.FAIL + return TestStatus.PASS + + def to_dict(self) -> dict: + return { + "timestamp": self.timestamp, + "instance_a": {"name": self.instance_a_name, "branch": self.instance_a_branch}, + "instance_b": {"name": self.instance_b_name, "branch": self.instance_b_branch}, + "overall_status": self.overall_status.value, + "summary": { + "total": self.total_tests, + "passed": self.total_passed, + "failed": self.total_failed, + "errors": self.total_errors, + }, + "categories": { + name: { + "total": cat.total, + "passed": cat.passed, + "failed": cat.failed, + "warned": cat.warned, + "skipped": cat.skipped, + "errors": cat.errors, + "results": [r.to_dict() for r in cat.results], + } + for name, cat in self.categories.items() + }, + "config": self.config_snapshot, + } + + +# --------------------------------------------------------------------------- +# HTTP Helpers +# 
# ---------------------------------------------------------------------------

def _http_request(method: str, url: str, retries: int, retry_delay: float,
                  **kwargs) -> requests.Response:
    """Issue one HTTP request with retry-on-error semantics.

    Shared engine behind http_get/http_post: attempts the request up to
    `retries` times, sleeping `retry_delay` seconds between attempts, and
    re-raises the last requests-level exception when every attempt fails.
    """
    last_exc = None
    for attempt in range(1, retries + 1):
        try:
            return requests.request(method, url, **kwargs)
        except requests.RequestException as e:
            last_exc = e
            if attempt < retries:
                logger.debug(f"Retry {attempt}/{retries} for {method} {url}: {e}")
                time.sleep(retry_delay)
    raise last_exc


def http_get(url: str, params: dict = None, timeout: int = 120,
             retries: int = 3, retry_delay: float = 2.0) -> requests.Response:
    """HTTP GET with retries on connection errors."""
    return _http_request("GET", url, retries, retry_delay,
                         params=params, timeout=timeout)


def http_post(url: str, json_data: dict = None, timeout: int = 120,
              retries: int = 3, retry_delay: float = 2.0) -> requests.Response:
    """HTTP POST (JSON body) with retries on connection errors."""
    return _http_request("POST", url, retries, retry_delay,
                         json=json_data, timeout=timeout)


def timed_request(method: str, url: str, **kwargs) -> Tuple[requests.Response, float]:
    """Execute an HTTP request and return (response, elapsed_seconds)."""
    start = time.perf_counter()
    if method.upper() == "GET":
        resp = http_get(url, **kwargs)
    else:
        resp = http_post(url, **kwargs)
    elapsed = time.perf_counter() - start
    return resp, elapsed


def wait_for_task_success(base_url: str, task_id: str, timeout: int = 1200,
                          retries: int = 3, retry_delay: float = 2.0) -> dict:
    """Poll active_tasks until the task completes, then return its final record.

    Polls `/api/active_tasks` until `task_id` is no longer the active task,
    then fetches `/api/last_task`.  Returns the last_task JSON dict (the
    caller inspects its status/state field to decide success), or a synthetic
    {"status": "TIMEOUT", ...} dict if the task does not finish within
    `timeout` seconds.
    """
    start = time.time()
    while time.time() - start < timeout:
        act_resp = http_get(f'{base_url}/api/active_tasks', retries=retries,
                            retry_delay=retry_delay)
        act_resp.raise_for_status()
        active = act_resp.json()

        # Our task is still the active one: keep waiting.
        if active and active.get('task_id') == task_id:
            time.sleep(2)
            continue

        last_resp = http_get(f'{base_url}/api/last_task', retries=retries,
                             retry_delay=retry_delay)
        last_resp.raise_for_status()
        final = last_resp.json()

        if final.get('task_id') == task_id:
            # Surface the terminal state for debugging; the caller decides
            # whether it counts as success.
            final_state = (final.get('status') or final.get('state') or '').upper()
            logger.debug(f"Task {task_id} finished with state {final_state}")
            return final
        # Task might have been superseded; keep polling briefly
        time.sleep(2)

    return {"status": "TIMEOUT", "task_id": task_id}


# ---------------------------------------------------------------------------
# Database Helpers
# ---------------------------------------------------------------------------

def get_pg_connection(dsn: str):
    """Create a psycopg2 connection from a DSN.

    Uses a 30s connect timeout and a 120s server-side statement timeout.
    """
    import psycopg2
    return psycopg2.connect(dsn, connect_timeout=30,
                            options='-c statement_timeout=120000')


def pg_query(dsn: str, sql: str, params: tuple = None) -> List[tuple]:
    """Execute a read-only query and return all rows as tuples."""
    conn = get_pg_connection(dsn)
    try:
        with conn.cursor() as cur:
            cur.execute(sql, params)
            return cur.fetchall()
    finally:
        conn.close()


def pg_query_dict(dsn: str, sql: str, params: tuple = None) -> List[dict]:
    """Execute a query and return rows as dicts keyed by column name."""
    from psycopg2.extras import RealDictCursor
    conn = get_pg_connection(dsn)
    try:
        with conn.cursor(cursor_factory=RealDictCursor) as cur:
            cur.execute(sql, params)
            return [dict(row) for row in cur.fetchall()]
    finally:
        conn.close()


def pg_scalar(dsn: str, sql: str, params: tuple = None):
    """Execute a query and return the first column of the first row (or None)."""
    rows = pg_query(dsn, sql, params)
    if rows and rows[0]:
        return rows[0][0]
    return None


# ---------------------------------------------------------------------------
# Docker Helpers
# ---------------------------------------------------------------------------
+def docker_exec(container: str, command: str, ssh_host: str = "", + ssh_user: str = "", ssh_key: str = "", + ssh_port: int = 22, timeout: int = 30) -> Tuple[str, str, int]: + """ + Run a command inside a Docker container (locally or via SSH). + Returns (stdout, stderr, returncode). + """ + if ssh_host: + ssh_cmd = ["ssh", "-o", "StrictHostKeyChecking=no", + "-p", str(ssh_port)] + if ssh_key: + ssh_cmd += ["-i", ssh_key] + ssh_cmd.append(f"{ssh_user}@{ssh_host}" if ssh_user else ssh_host) + ssh_cmd.append(f"docker exec {container} {command}") + full_cmd = ssh_cmd + else: + full_cmd = ["docker", "exec", container] + command.split() + + try: + proc = subprocess.run(full_cmd, capture_output=True, text=True, timeout=timeout) + return proc.stdout, proc.stderr, proc.returncode + except subprocess.TimeoutExpired: + return "", "Command timed out", -1 + except FileNotFoundError: + return "", "docker or ssh command not found", -2 + + +def docker_logs(container: str, tail: int = 500, since: str = "", + ssh_host: str = "", ssh_user: str = "", ssh_key: str = "", + ssh_port: int = 22, timeout: int = 30) -> Tuple[str, str, int]: + """ + Fetch Docker container logs (locally or via SSH). + Returns (stdout, stderr, returncode). 
+ """ + cmd_parts = ["docker", "logs", f"--tail={tail}"] + if since: + cmd_parts += [f"--since={since}"] + cmd_parts.append(container) + + if ssh_host: + ssh_cmd = ["ssh", "-o", "StrictHostKeyChecking=no", + "-p", str(ssh_port)] + if ssh_key: + ssh_cmd += ["-i", ssh_key] + ssh_cmd.append(f"{ssh_user}@{ssh_host}" if ssh_user else ssh_host) + ssh_cmd.append(" ".join(cmd_parts)) + full_cmd = ssh_cmd + else: + full_cmd = cmd_parts + + try: + proc = subprocess.run(full_cmd, capture_output=True, text=True, timeout=timeout) + return proc.stdout, proc.stderr, proc.returncode + except subprocess.TimeoutExpired: + return "", "Logs fetch timed out", -1 + except FileNotFoundError: + return "", "docker or ssh command not found", -2 + + +def docker_inspect(container: str, ssh_host: str = "", ssh_user: str = "", + ssh_key: str = "", ssh_port: int = 22, + timeout: int = 15) -> Optional[dict]: + """ + Run docker inspect on a container and return the parsed JSON. + Returns None on failure. + """ + cmd_parts = ["docker", "inspect", container] + + if ssh_host: + ssh_cmd = ["ssh", "-o", "StrictHostKeyChecking=no", + "-p", str(ssh_port)] + if ssh_key: + ssh_cmd += ["-i", ssh_key] + ssh_cmd.append(f"{ssh_user}@{ssh_host}" if ssh_user else ssh_host) + ssh_cmd.append(" ".join(cmd_parts)) + full_cmd = ssh_cmd + else: + full_cmd = cmd_parts + + try: + proc = subprocess.run(full_cmd, capture_output=True, text=True, timeout=timeout) + if proc.returncode == 0: + data = json.loads(proc.stdout) + return data[0] if isinstance(data, list) and data else data + except Exception as e: + logger.debug(f"docker inspect failed for {container}: {e}") + return None + + +# --------------------------------------------------------------------------- +# Comparison Helpers +# --------------------------------------------------------------------------- + +def compare_values(a, b, tolerance_pct: float = 0.0) -> Tuple[bool, str]: + """ + Compare two values. For numeric types, allow a percentage tolerance. 
+ Returns (is_equal, description). + """ + if a is None and b is None: + return True, "Both None" + if a is None or b is None: + return False, f"One is None: A={a}, B={b}" + + if isinstance(a, (int, float)) and isinstance(b, (int, float)): + if a == 0 and b == 0: + return True, "Both zero" + if a == 0 or b == 0: + return False, f"A={a}, B={b}" + pct_diff = abs(a - b) / max(abs(a), abs(b)) * 100 + if pct_diff <= tolerance_pct: + return True, f"Within tolerance ({pct_diff:.2f}% <= {tolerance_pct}%)" + return False, f"Difference {pct_diff:.2f}% exceeds tolerance {tolerance_pct}%" + + if isinstance(a, str) and isinstance(b, str): + if a == b: + return True, "Strings match" + return False, f"Strings differ: '{a[:100]}' vs '{b[:100]}'" + + if isinstance(a, dict) and isinstance(b, dict): + keys_a = set(a.keys()) + keys_b = set(b.keys()) + if keys_a != keys_b: + missing_in_b = keys_a - keys_b + missing_in_a = keys_b - keys_a + return False, f"Key mismatch: missing_in_B={missing_in_b}, missing_in_A={missing_in_a}" + return True, "Dict keys match" + + if isinstance(a, list) and isinstance(b, list): + if len(a) == len(b): + return True, f"Lists same length ({len(a)})" + return False, f"List length differs: {len(a)} vs {len(b)}" + + # Fallback + if a == b: + return True, "Values equal" + return False, f"Values differ: {a} vs {b}" + + +def pct_diff(a: float, b: float) -> float: + """Calculate percentage difference between two values.""" + if a == 0 and b == 0: + return 0.0 + if a == 0 or b == 0: + return 100.0 + return abs(a - b) / max(abs(a), abs(b)) * 100 + + +def format_duration(seconds: float) -> str: + """Format seconds into a human-readable string.""" + if seconds < 1: + return f"{seconds*1000:.1f}ms" + if seconds < 60: + return f"{seconds:.2f}s" + minutes = int(seconds // 60) + secs = seconds % 60 + return f"{minutes}m {secs:.1f}s" From f42fe8f0614473f78b32b79b3fba0b00b2d90871 Mon Sep 17 00:00:00 2001 From: Claude Date: Thu, 5 Feb 2026 09:27:30 +0000 Subject: [PATCH 
15/33] Add .gitignore for testing suite report output directory https://claude.ai/code/session_0122SF3fSXM3e2dNqaJB5NDn --- testing_suite/reports/output/.gitignore | 3 +++ 1 file changed, 3 insertions(+) create mode 100644 testing_suite/reports/output/.gitignore diff --git a/testing_suite/reports/output/.gitignore b/testing_suite/reports/output/.gitignore new file mode 100644 index 00000000..58f3ef52 --- /dev/null +++ b/testing_suite/reports/output/.gitignore @@ -0,0 +1,3 @@ +# Report output files are generated at runtime - do not commit +* +!.gitignore From bfaa3f0907d57cc0fd61a2385fa5febb84adb060 Mon Sep 17 00:00:00 2001 From: Claude Date: Thu, 5 Feb 2026 11:01:02 +0000 Subject: [PATCH 16/33] Add comprehensive README guide for the testing and comparison suite Covers architecture, prerequisites, quick start, all three config methods (CLI, YAML, env vars), detailed descriptions of all 5 test categories, deployment scenarios (local, remote SSH, API-only), report formats, selective testing, test discovery, result interpretation, and troubleshooting. https://claude.ai/code/session_0122SF3fSXM3e2dNqaJB5NDn --- testing_suite/README.md | 526 ++++++++++++++++++++++++++++++++++++++++ 1 file changed, 526 insertions(+) create mode 100644 testing_suite/README.md diff --git a/testing_suite/README.md b/testing_suite/README.md new file mode 100644 index 00000000..97296e9c --- /dev/null +++ b/testing_suite/README.md @@ -0,0 +1,526 @@ +# AudioMuse-AI Testing & Comparison Suite + +A comprehensive tool for testing all features, database quality, API results, and performance of AudioMuse-AI — comparing two live instances side-by-side (e.g., **main branch** vs **feature branch**). 
+ +## Table of Contents + +- [Overview](#overview) +- [Architecture](#architecture) +- [Prerequisites](#prerequisites) +- [Quick Start](#quick-start) +- [Configuration](#configuration) + - [CLI Arguments](#cli-arguments) + - [YAML Config File](#yaml-config-file) + - [Environment Variables](#environment-variables) +- [Test Categories](#test-categories) + - [API Comparison](#1-api-comparison-30-endpoints) + - [Database Comparison](#2-database-comparison-17-tables) + - [Docker & Infrastructure](#3-docker--infrastructure) + - [Performance Benchmarks](#4-performance-benchmarks) + - [Existing Test Suite](#5-existing-test-suite-27-tests) +- [Deployment Scenarios](#deployment-scenarios) + - [Same Machine (Different Ports)](#scenario-1-same-machine-different-ports) + - [Two Remote Machines](#scenario-2-two-remote-machines-via-ssh) + - [API-Only Comparison](#scenario-3-api-only-no-db-or-docker) +- [Reports](#reports) +- [Selective Testing](#selective-testing) +- [Test Discovery](#test-discovery) +- [Interpreting Results](#interpreting-results) +- [Troubleshooting](#troubleshooting) + +--- + +## Overview + +The testing suite connects to **two AudioMuse-AI instances** simultaneously via: + +| Connection | What it tests | +|----------------|-----------------------------------------------------------------| +| **API (HTTP)** | All 30+ REST endpoints — response codes, shapes, values, errors | +| **PostgreSQL** | Schema integrity, data quality, embedding health, distributions | +| **Docker** | Container health, resource usage, log error analysis | +| **Performance**| Latency benchmarks (p50/p95/p99), concurrent load, DB queries | + +It also discovers and runs the **27 existing tests** (unit, integration, E2E) already in the codebase. + +The final output is a **self-contained HTML report** (dark theme, filterable, with visual performance charts) plus a **JSON report** for programmatic consumption. 
+ +--- + +## Architecture + +``` +testing_suite/ +├── run_comparison.py # CLI entry point +├── __main__.py # python -m testing_suite +├── config.py # Configuration (CLI / YAML / env vars) +├── utils.py # HTTP helpers, DB connectors, Docker log fetchers +├── orchestrator.py # Coordinates all modules, generates reports +├── comparators/ +│ ├── api_comparator.py # 30+ API endpoint tests +│ ├── db_comparator.py # Schema, data quality, embeddings, integrity +│ ├── docker_comparator.py # Container health, logs, resource usage +│ └── performance_comparator.py # Latency, throughput, DB query benchmarks +├── test_runner/ +│ └── existing_tests.py # Discovers & runs 27 existing test files +├── reports/ +│ ├── html_report.py # Self-contained HTML report generator +│ └── output/ # Generated reports (gitignored) +├── comparison_config.example.yaml +└── requirements.txt +``` + +--- + +## Prerequisites + +1. **Python 3.10+** on the machine running the suite +2. **Both AudioMuse-AI instances running** (Flask app + Worker + PostgreSQL + Redis) +3. **Network access** from the test runner to both instances (API ports, DB ports) + +Install dependencies: + +```bash +pip install -r testing_suite/requirements.txt +``` + +The suite requires: `requests`, `psycopg2-binary`, `pyyaml`, `pytest`, `pytest-json-report`, `pytest-timeout`. + +> **Note:** Docker comparison features require the `docker` CLI accessible from the test runner (either locally or via SSH to the remote hosts). + +--- + +## Quick Start + +### Minimal (API-only comparison) + +```bash +python -m testing_suite \ + --url-a http://192.168.1.100:8000 \ + --url-b http://192.168.1.101:8000 +``` + +This tests all API endpoints and runs existing unit tests. Database and Docker tests will be skipped if hosts aren't specified. 
+ +### Full comparison + +```bash +python -m testing_suite \ + --url-a http://192.168.1.100:8000 \ + --url-b http://192.168.1.101:8000 \ + --pg-host-a 192.168.1.100 \ + --pg-host-b 192.168.1.101 \ + --flask-container-a audiomuse-main-flask \ + --flask-container-b audiomuse-feature-flask \ + --name-a main --branch-a main \ + --name-b feature --branch-b fix/my-feature +``` + +### From config file + +```bash +cp testing_suite/comparison_config.example.yaml my_config.yaml +# Edit my_config.yaml with your instance details +python -m testing_suite --config my_config.yaml +``` + +--- + +## Configuration + +There are three ways to configure the suite (in order of precedence): + +### CLI Arguments + +All settings can be passed as command-line flags. Each instance has a matching set of flags suffixed with `-a` or `-b`: + +``` +Instance Connection: + --url-a / --url-b API base URL (e.g., http://host:8000) + --name-a / --name-b Display name (default: main / feature) + --branch-a / --branch-b Git branch name for reporting + +PostgreSQL: + --pg-host-a / --pg-host-b Database host + --pg-port-a / --pg-port-b Database port (default: 5432) + --pg-user-a / --pg-user-b Database user (default: audiomuse) + --pg-pass-a / --pg-pass-b Database password (default: audiomusepassword) + --pg-db-a / --pg-db-b Database name (default: audiomusedb) + +Redis: + --redis-a / --redis-b Redis URL (default: redis://localhost:6379/0) + +Docker: + --flask-container-a / -b Flask app container name + --worker-container-a / -b RQ worker container name + --ssh-host-a / -b SSH host for remote Docker access + --ssh-user-a / -b SSH username + --ssh-key-a / -b SSH private key path + +Test Control: + --only CATEGORIES Only run listed categories (comma-separated) + --skip CATEGORIES Skip listed categories + --warmup N Warmup requests before benchmarking (default: 3) + --bench-requests N Benchmark iterations per endpoint (default: 10) + --concurrent N Concurrent users for load test (default: 5) + +Output: + 
--output-dir PATH Report output directory + --format {html,json,both} Report format (default: both) + -v / --verbose Debug-level logging +``` + +### YAML Config File + +Copy and edit the example: + +```bash +cp testing_suite/comparison_config.example.yaml comparison_config.yaml +``` + +The YAML file supports all the same settings. See `comparison_config.example.yaml` for the full annotated template with all available options including quality thresholds, test track references, and performance parameters. + +### Environment Variables + +Every setting can be set via environment variables with the `INSTANCE_A_` / `INSTANCE_B_` prefix: + +```bash +export INSTANCE_A_API_URL=http://192.168.1.100:8000 +export INSTANCE_A_PG_HOST=192.168.1.100 +export INSTANCE_B_API_URL=http://192.168.1.101:8000 +export INSTANCE_B_PG_HOST=192.168.1.101 +export COMPARISON_VERBOSE=true +export COMPARISON_OUTPUT_DIR=./reports + +python -m testing_suite +``` + +--- + +## Test Categories + +### 1. API Comparison (30+ endpoints) + +Tests every AudioMuse-AI API endpoint on both instances and compares: + +| What's tested | Details | +|---------------|---------| +| **Status codes** | Both instances return the same HTTP status | +| **Response shape** | Same JSON keys, same structure | +| **List lengths** | Playlists, search results, etc. have comparable sizes | +| **Required fields** | Track objects have `item_id`, `title`, etc. 
| +| **Error handling** | Both handle invalid inputs the same way | +| **Functional tests** | Track search, similarity, alchemy, path finding with real data | + +**Endpoints covered:** +- `/api/config`, `/api/playlists`, `/api/active_tasks`, `/api/last_task` +- `/api/search_tracks`, `/api/similar_tracks`, `/api/max_distance` +- `/api/map`, `/api/map_cache_status` +- `/api/clap/stats`, `/api/clap/warmup/status`, `/api/clap/top_queries` +- `/api/alchemy`, `/api/find_path`, `/api/sonic_fingerprint/generate` +- `/api/artist_projections`, `/api/search_artists` +- `/api/setup/status`, `/api/setup/providers`, `/api/setup/settings`, `/api/setup/server-info` +- `/api/setup/providers/types`, `/api/providers/enabled` +- `/api/cron`, `/api/waveform`, `/api/collection/last_task` +- `/external/search`, `/chat/api/config_defaults` +- Error cases: nonexistent tasks, missing parameters + +### 2. Database Comparison (17 tables) + +Connects directly to both PostgreSQL instances and validates: + +| Category | Tests | +|----------|-------| +| **Schema** | All 17 expected tables exist with correct columns | +| **Row counts** | Compared with configurable tolerance (default 5%) | +| **Data quality** | NULL rates in critical score columns (item_id, title, author, tempo, key, scale, mood_vector) | +| **Duplicates** | No duplicate item_ids in score table | +| **Mood vector format** | Validates mood_vector string format | +| **Embedding integrity** | Coverage (% of scores with embeddings), NULL checks, dimension consistency | +| **Referential integrity** | No orphaned rows in embedding→score, provider_track→provider | +| **Score distributions** | Statistical comparison of tempo, energy (min/max/avg/stddev) | +| **Key distribution** | Musical key value comparison between instances | +| **Playlist quality** | Distinct count, avg tracks per playlist, NULL item_ids | +| **Index data** | Voyager HNSW, Artist GMM, Map projection, Artist projection presence | +| **Task health** | Failed task count, 
stuck tasks (>2hr), success rate comparison | +| **Provider config** | Same provider types and settings | +| **App settings** | Same configuration keys | + +### 3. Docker & Infrastructure + +Analyzes container health and logs via the Docker CLI (local or SSH): + +| Category | Tests | +|----------|-------| +| **Container status** | Running/stopped for Flask, Worker, PostgreSQL, Redis | +| **Restart counts** | Flags high restart counts (>5 = FAIL) | +| **Health checks** | Docker health check status comparison | +| **Memory usage** | MB comparison with % difference threshold | +| **CPU usage** | Percentage comparison | +| **Error patterns** | 11 patterns: tracebacks, OOM, connection errors, timeouts, permission, disk, crashes, worker deaths, DB errors, Redis errors | +| **Warning patterns** | 5 patterns: deprecation, warnings, retries, slow ops, memory pressure | +| **Python tracebacks** | Exact count comparison (>10 = FAIL) | +| **Redis connectivity** | Ping test from inside Flask container | +| **PostgreSQL connectivity** | SELECT 1 test from inside Flask container | + +### 4. Performance Benchmarks + +Measures and compares response times with statistical rigor: + +| Category | Details | +|----------|---------| +| **Endpoint latency** | 16 endpoints benchmarked with warmup phase, measuring p50/p95/p99/mean/max/stddev | +| **Concurrent load** | Configurable concurrent users hitting key endpoints simultaneously, measuring throughput (req/s) | +| **DB query performance** | 8 critical queries benchmarked: counts, joins, aggregations, group-bys | + +**Thresholds:** +- **PASS**: Instance B within 20% of A (or faster) +- **WARN**: Instance B 20-100% slower +- **FAIL**: Instance B >2x slower + +### 5. 
Existing Test Suite (27 tests) + +Discovers and runs all tests already in the codebase: + +| Category | Files | Tests | +|----------|-------|-------| +| **Unit tests** | 17 files in `tests/unit/` | test_ai, test_analysis, test_app_analysis, test_artist_gmm_manager, test_clap_text_search, test_clustering, test_clustering_helper, test_clustering_postprocessing, test_commons, test_mediaserver, test_memory_cleanup, test_memory_utils, test_path_manager, test_song_alchemy, test_sonic_fingerprint_manager, test_string_sanitization, test_voyager_manager | +| **Integration tests** | 2 files in `test/` | test_analysis_integration, test_clap_analysis_integration | +| **E2E API tests** | 8 tests in `test/test.py` | analysis smoke, instant playlist, sonic fingerprint, song alchemy, map visualization, similarity, song path, clustering smoke | + +Unit tests run once (they mock dependencies). E2E tests run against both instances with the `BASE_URL` pointed at each. + +--- + +## Deployment Scenarios + +### Scenario 1: Same Machine, Different Ports + +Two Docker Compose stacks running on ports 8000 and 8001: + +```bash +python -m testing_suite \ + --url-a http://localhost:8000 --url-b http://localhost:8001 \ + --pg-host-a localhost --pg-port-a 5432 \ + --pg-host-b localhost --pg-port-b 5433 \ + --flask-container-a audiomuse-main-flask \ + --flask-container-b audiomuse-feature-flask \ + --worker-container-a audiomuse-main-worker \ + --worker-container-b audiomuse-feature-worker +``` + +### Scenario 2: Two Remote Machines (via SSH) + +Instance A on server1, Instance B on server2: + +```bash +python -m testing_suite \ + --url-a http://server1:8000 --url-b http://server2:8000 \ + --pg-host-a server1 --pg-host-b server2 \ + --ssh-host-a server1 --ssh-user-a deploy --ssh-key-a ~/.ssh/id_rsa \ + --ssh-host-b server2 --ssh-user-b deploy --ssh-key-b ~/.ssh/id_rsa +``` + +The suite will SSH into each server to run `docker inspect`, `docker logs`, and `docker stats`. 
+ +### Scenario 3: API-Only (No DB or Docker) + +If you only have HTTP access to both instances: + +```bash +python -m testing_suite \ + --url-a http://main.example.com --url-b http://feature.example.com \ + --only api,performance +``` + +--- + +## Reports + +Every run produces two reports in the output directory (`testing_suite/reports/output/` by default): + +### HTML Report + +A self-contained, dark-themed HTML file with: +- Overall pass/fail status badge +- Summary cards (total, passed, failed, errors, warnings) +- Per-category expandable sections +- Filterable result tables (filter by Pass/Fail/Warn/Error/Skip) +- Side-by-side Instance A vs Instance B values +- Visual performance bar charts comparing latency + +Open in any browser: `testing_suite/reports/output/comparison_latest.html` + +### JSON Report + +Machine-readable format with full test details: + +```json +{ + "timestamp": "2025-01-15T10:30:00.000000", + "instance_a": {"name": "main", "branch": "main"}, + "instance_b": {"name": "feature", "branch": "feature"}, + "overall_status": "PASS", + "summary": {"total": 150, "passed": 142, "failed": 3, "errors": 0}, + "categories": { + "api": {"total": 50, "passed": 48, "failed": 2, ...}, + "database": {"total": 40, "passed": 38, ...}, + ... + } +} +``` + +--- + +## Selective Testing + +### Run only specific categories + +```bash +# API and database only +python -m testing_suite --url-a ... --url-b ... --only api,db + +# Performance only +python -m testing_suite --url-a ... --url-b ... --only performance + +# Existing unit tests only +python -m testing_suite --url-a ... --url-b ... --only unit +``` + +**Category names:** `api`, `db` (or `database`), `docker`, `performance` (or `perf`), `existing_tests`, `unit`, `integration` + +### Skip specific categories + +```bash +# Skip Docker and existing tests (faster) +python -m testing_suite --url-a ... --url-b ... --skip docker,existing_tests + +# Skip performance benchmarks +python -m testing_suite --url-a ... 
--url-b ... --skip perf +``` + +### Tune performance test parameters + +```bash +# Light benchmarking (fast) +python -m testing_suite --url-a ... --url-b ... --warmup 1 --bench-requests 3 --concurrent 2 + +# Heavy benchmarking (thorough) +python -m testing_suite --url-a ... --url-b ... --warmup 10 --bench-requests 50 --concurrent 20 +``` + +--- + +## Test Discovery + +List all available tests without running anything: + +```bash +python -m testing_suite --discover +``` + +Output: + +``` +=== AudioMuse-AI Test Discovery === + +Unit Tests (17 files): + [OK] tests/unit/test_ai.py + [OK] tests/unit/test_analysis.py + ... + +Integration Tests (2 files): + [OK] test/test_analysis_integration.py + [OK] test/test_clap_analysis_integration.py + +E2E API Tests (8 tests): + [OK] test_analysis_smoke_flow (test/test.py) + ... + +Total: 27 test files/entries discovered. +``` + +--- + +## Interpreting Results + +### Status Codes + +| Status | Meaning | +|--------|---------| +| **PASS** | Both instances match or values are within acceptable thresholds | +| **FAIL** | Significant difference detected, or a quality check failed | +| **WARN** | Minor difference or non-critical issue detected | +| **SKIP** | Test could not run (missing table, unreachable endpoint, etc.) | +| **ERROR** | Test itself errored (connection failure, timeout, exception) | + +### Exit Codes + +The CLI returns: +- `0` — All tests passed (or only warnings/skips) +- `1` — One or more tests failed or errored + +This makes it suitable for CI/CD pipelines: + +```bash +python -m testing_suite --config config.yaml || echo "Comparison found regressions!" 
+```
+
+### Performance Comparison Logic
+
+- **B/A ratio ≤ 1.2** → PASS (B is within 20% of A)
+- **B/A ratio ≤ 2.0** → WARN (B is up to 2x slower)
+- **B/A ratio > 2.0** → FAIL (B is more than 2x slower)
+- If B is faster than A, that's always a PASS
+
+---
+
+## Troubleshooting
+
+### "Cannot connect to either database instance"
+
+- Verify PostgreSQL is accessible from the test runner machine
+- Check `--pg-host-a/b`, `--pg-port-a/b`, `--pg-user-a/b`, `--pg-pass-a/b`
+- Ensure `pg_hba.conf` allows connections from the test runner IP
+- Try: `psql -h <host> -p <port> -U <user> -d <dbname> -c "SELECT 1"`
+
+### "Neither instance is reachable"
+
+- Verify the API URLs are correct and the Flask servers are running
+- Check firewall rules allow traffic on port 8000
+- Try: `curl http://<host>:8000/api/config`
+
+### "Cannot inspect containers (Docker not available)"
+
+- Docker CLI must be installed on the test runner (or accessible via SSH)
+- Container names must match what's running (`docker ps --format '{{.Names}}'`)
+- For remote Docker access, SSH must be configured: `--ssh-host-a/b`, `--ssh-user-a/b`
+
+### "pytest-json-report not found"
+
+```bash
+pip install pytest-json-report
+```
+
+Or install all dependencies:
+
+```bash
+pip install -r testing_suite/requirements.txt
+```
+
+### Customizing test tracks
+
+The API functional tests (search, similarity, alchemy, path) use reference tracks.
Set them to tracks that exist in your library: + +```bash +python -m testing_suite --config my_config.yaml +``` + +In your YAML config: + +```yaml +test_track_artist_1: "Artist In Your Library" +test_track_title_1: "Song Title" +test_track_artist_2: "Another Artist" +test_track_title_2: "Another Song" +``` From 1446375a40a86c6bfb967bc61d9336a4f3b87f1a Mon Sep 17 00:00:00 2001 From: Rendy Date: Thu, 5 Feb 2026 19:47:09 +0100 Subject: [PATCH 17/33] bug fixes and hardware selection on setup --- app_setup.py | 40 ++++++++ tasks/analysis.py | 34 +++++++ tasks/mediaserver.py | 2 +- templates/setup.html | 220 +++++++++++++++++++++++++++++++++++++------ 4 files changed, 267 insertions(+), 29 deletions(-) diff --git a/app_setup.py b/app_setup.py index 813ed3a0..263cd5e6 100644 --- a/app_setup.py +++ b/app_setup.py @@ -71,6 +71,8 @@ def get_all_settings(): settings = {} for row in rows: key, value, category, description = row + # Handle None category - use 'general' as default + category = category or 'general' if category not in settings: settings[category] = {} settings[category][key] = { @@ -483,6 +485,16 @@ def create_provider(): return jsonify({'error': 'Validation failed', 'details': validation_errors}), 400 try: + # Check if provider of this type already exists - upsert to prevent duplicates + existing_providers = get_all_providers() + existing = next((p for p in existing_providers if p['provider_type'] == provider_type), None) + + if existing: + # Update existing provider instead of creating duplicate + update_provider(existing['id'], name=name, config_data=config_data, enabled=enabled, priority=priority) + logger.info(f"Updated existing provider {existing['id']} ({provider_type}) instead of creating duplicate") + return jsonify({'id': existing['id'], 'message': 'Provider updated', 'was_update': True}), 200 + provider_id = add_provider(provider_type, name, config_data, enabled, priority) return jsonify({'id': provider_id, 'message': 'Provider created'}), 201 except 
Exception as e: @@ -836,6 +848,7 @@ def get_server_info(): """ import socket import os + import subprocess # Try to get the server's IP address try: @@ -856,6 +869,31 @@ def get_server_info(): except Exception: host_ip = 'localhost' + # Detect GPU availability + gpu_available = False + gpu_name = None + + # Method 1: Check if onnxruntime-gpu CUDA provider is available + try: + import onnxruntime as ort + providers = ort.get_available_providers() + if 'CUDAExecutionProvider' in providers: + gpu_available = True + except Exception: + pass + + # Method 2: Try nvidia-smi for GPU name (if available) + if gpu_available: + try: + result = subprocess.run( + ['nvidia-smi', '--query-gpu=name', '--format=csv,noheader,nounits'], + capture_output=True, text=True, timeout=5 + ) + if result.returncode == 0 and result.stdout.strip(): + gpu_name = result.stdout.strip().split('\n')[0] # First GPU + except Exception: + pass + return jsonify({ 'host': host_ip, 'hostname': socket.gethostname() if hasattr(socket, 'gethostname') else 'unknown', @@ -863,6 +901,8 @@ def get_server_info(): 'postgres_port': os.environ.get('POSTGRES_PORT', '5432'), 'postgres_host': os.environ.get('POSTGRES_HOST', 'postgres'), 'redis_url': os.environ.get('REDIS_URL', 'redis://redis:6379/0'), + 'gpu_available': gpu_available, + 'gpu_name': gpu_name, }) diff --git a/tasks/analysis.py b/tasks/analysis.py index dfe4a737..5cfc7b93 100644 --- a/tasks/analysis.py +++ b/tasks/analysis.py @@ -1343,6 +1343,40 @@ def monitor_and_clear_jobs(): log_and_update_main(status_message, progress, checked_album_ids=list(checked_album_ids)) time.sleep(5) + # Wait for any album analysis jobs still running on the queue from a previous run. + # This handles the case where the main task resumes, finds all albums already checked, + # but their album tasks are still executing from the previous run. 
+ from rq import Queue + default_queue = Queue('default', connection=redis_conn) + wait_count = 0 + while True: + # Count album analysis jobs still running or queued + pending_album_jobs = 0 + for job in default_queue.jobs: + if hasattr(job, 'func_name') and 'analyze_album_task' in str(job.func_name): + pending_album_jobs += 1 + + # Also check started job registry for running jobs + started_registry = default_queue.started_job_registry + for job_id in started_registry.get_job_ids(): + try: + from rq.job import Job + job = Job.fetch(job_id, connection=redis_conn) + if hasattr(job, 'func_name') and 'analyze_album_task' in str(job.func_name): + pending_album_jobs += 1 + except Exception: + pass + + if pending_album_jobs == 0: + break + + wait_count += 1 + if wait_count == 1: + log_and_update_main(f"Waiting for {pending_album_jobs} album analysis job(s) from previous run to complete...", 90) + elif wait_count % 6 == 0: # Log every 30 seconds + log_and_update_main(f"Still waiting for {pending_album_jobs} album analysis job(s)...", 90) + time.sleep(5) + log_and_update_main("Performing final index rebuild...", 95) # Build Voyager index (song embeddings) build_and_store_voyager_index(get_db()) diff --git a/tasks/mediaserver.py b/tasks/mediaserver.py index 1c8e06a7..2ada2e63 100644 --- a/tasks/mediaserver.py +++ b/tasks/mediaserver.py @@ -1108,7 +1108,7 @@ def get_enabled_providers_for_playlists(): Returns: List of dicts with 'id', 'name', 'type' for each enabled provider """ - from app_helper import get_providers + from app_setup import get_providers providers = get_providers(enabled_only=True) return [ diff --git a/templates/setup.html b/templates/setup.html index 624b2711..99f07972 100644 --- a/templates/setup.html +++ b/templates/setup.html @@ -687,6 +687,71 @@ .worker-connection-info .config-field { margin-bottom: 1.25rem; } + + /* Hardware Info Display */ + .hardware-info-box { + display: flex; + align-items: flex-start; + gap: 1rem; + padding: 1.25rem; + background: 
var(--bg-card); + border-radius: 8px; + border: 2px solid var(--border-color); + } + + .hardware-info-box.gpu-detected { + border-color: #28a745; + background: rgba(40, 167, 69, 0.1); + } + + .hardware-info-box .hw-icon { + font-size: 2.5rem; + line-height: 1; + } + + .hardware-info-box .hw-details { + flex: 1; + } + + .hardware-info-box .hw-title { + font-weight: bold; + font-size: 1.1rem; + margin-bottom: 0.25rem; + } + + .hardware-info-box .hw-subtitle { + color: var(--text-muted); + font-size: 0.9rem; + margin-bottom: 0.75rem; + } + + .hardware-info-box .hw-description { + font-size: 0.9rem; + line-height: 1.5; + } + + .hardware-benefits { + margin-top: 1rem; + padding: 1rem; + background: rgba(37, 99, 235, 0.1); + border-radius: 8px; + border-left: 3px solid var(--color-primary); + } + + .hardware-benefits h4 { + margin: 0 0 0.5rem 0; + font-size: 0.95rem; + } + + .hardware-benefits ul { + margin: 0; + padding-left: 1.25rem; + font-size: 0.9rem; + } + + .hardware-benefits li { + margin-bottom: 0.25rem; + } {% endblock %} @@ -751,11 +816,21 @@

    Select Deployment Mode

    -
    -

    Select Hardware Configuration

    + +
    +

    Current Hardware Configuration

    +
    + +

    Detecting hardware...

    +
    +
    + + + @@ -727,6 +793,7 @@ {% block bodyAdditions %} + +