"""
Music Generation Studio - HuggingFace Spaces Deployment
Main application file for Gradio interface

Version: 1.0.2
"""
import os
import sys
import gradio as gr
import logging
from pathlib import Path
from datetime import datetime
import shutil
import subprocess
import json
import time

# Import version info
from version import __version__

# Import spaces for ZeroGPU support
try:
    import spaces
    # Check if we're actually on ZeroGPU (has device-api)
    import requests
    try:
        requests.head("http://device-api.zero/", timeout=0.5)
        HAS_ZEROGPU = True
    except:
        HAS_ZEROGPU = False
except ImportError:
    HAS_ZEROGPU = False

# Create appropriate decorator
if HAS_ZEROGPU:
    # Use ZeroGPU decorator - make it callable with duration parameter
    def GPU_DECORATOR(duration=120):
        return spaces.GPU(duration=duration)
else:
    # No-op decorator for regular GPU/CPU
    def GPU_DECORATOR(duration=120):
        def decorator(func):
            return func
        return decorator

# Run DiffRhythm2 source setup if needed
setup_script = Path(__file__).parent / "setup_diffrhythm2_src.sh"
if setup_script.exists():
    try:
        subprocess.run(["bash", str(setup_script)], check=True)
    except Exception as e:
        print(f"Warning: Failed to run setup script: {e}")

# Configure environment for HuggingFace Spaces (espeak-ng paths, etc.)
import hf_config

# Setup paths for HuggingFace Spaces
SPACE_DIR = Path(__file__).parent
sys.path.insert(0, str(SPACE_DIR / 'backend'))

# Configure logging
logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s'
)
logger = logging.getLogger(__name__)

# Log GPU mode
if HAS_ZEROGPU:
    logger.info("🚀 ZeroGPU detected - using dynamic GPU allocation")
else:
    logger.info("💻 Running on regular GPU/CPU - using static device allocation")

# Import services
try:
    from services.diffrhythm_service import DiffRhythmService
    from services.lyricmind_service import LyricMindService
    from services.timeline_service import TimelineService
    from services.export_service import ExportService
    from services.hf_storage_service import HFStorageService
    from config.settings import Config
    from utils.prompt_analyzer import PromptAnalyzer
except ImportError as e:
    logger.error(f"Import error: {e}")
    raise

# Initialize configuration
config = Config()

# Create necessary directories
os.makedirs("outputs", exist_ok=True)
os.makedirs("outputs/music", exist_ok=True)
os.makedirs("outputs/mixed", exist_ok=True)
os.makedirs("models", exist_ok=True)
os.makedirs("logs", exist_ok=True)

# Initialize services - these persist at module level
timeline_service = TimelineService()
export_service = ExportService()

# Initialize MSD services (lazy loading to avoid startup issues)
msd_db_service = None
genre_profiler = None
msd_importer = None
lakh_midi_service = None
theory_constraint_service = None

def initialize_msd_services():
    """Lazy initialization of MSD services"""
    global msd_db_service, genre_profiler, msd_importer
    
    if msd_db_service is not None:
        return  # Already initialized
    
    try:
        from services.msd_database_service import MSDDatabaseService
        from services.genre_profiler import GenreProfiler
        from services.msd_importer import MSDSubsetImporter
        
        msd_db_service = MSDDatabaseService()
        genre_profiler = GenreProfiler()
        msd_importer = MSDSubsetImporter()
        
        logger.info("✅ MSD services initialized successfully")
    except Exception as e:
        logger.warning(f"⚠️ MSD services not available: {e}")
        msd_db_service = None
        genre_profiler = None
        msd_importer = None

def initialize_theory_services():
    """Lazy initialization of music theory services"""
    global lakh_midi_service, theory_constraint_service
    
    if theory_constraint_service is not None:
        return  # Already initialized
    
    try:
        from services.lakh_midi_service import LakhMIDIService
        from services.theory_constraint_service import TheoryConstraintService
        
        lakh_midi_service = LakhMIDIService()
        theory_constraint_service = TheoryConstraintService()
        
        logger.info("✅ Music theory services initialized successfully")
    except Exception as e:
        logger.warning(f"⚠️ Music theory services not available: {e}")
        lakh_midi_service = None
        theory_constraint_service = None

# Initialize HF storage for LoRA uploads to dataset repo
hf_storage = HFStorageService(username="Gamahea", dataset_repo="lemmdata")
logger.info("🔍 Checking HuggingFace dataset repo for LoRAs...")
sync_result = hf_storage.sync_on_startup(loras_dir=Path("models/loras"), datasets_dir=Path("training_data"))
if sync_result.get('loras'):
    logger.info(f"✅ Found {len(sync_result['loras'])} LoRA(s) in dataset repo")
else:
    logger.info("ℹ️ No LoRAs in dataset repo yet - train your first one!")

# Lazy-load AI services (heavy models)
diffrhythm_service = None
lyricmind_service = None

def get_diffrhythm_service():
    """Lazy load DiffRhythm service"""
    global diffrhythm_service
    if diffrhythm_service is None:
        logger.info("Loading DiffRhythm2 model...")
        diffrhythm_service = DiffRhythmService(model_path=config.DIFFRHYTHM_MODEL_PATH)
        logger.info("DiffRhythm2 model loaded")
    return diffrhythm_service

def get_lyricmind_service():
    """Lazy load LyricMind service"""
    global lyricmind_service
    if lyricmind_service is None:
        logger.info("Loading LyricMind model...")
        lyricmind_service = LyricMindService(model_path=config.LYRICMIND_MODEL_PATH)
        logger.info("LyricMind model loaded")
    return lyricmind_service

@GPU_DECORATOR(duration=60)
def generate_lyrics(prompt: str, progress=gr.Progress()):
    """Generate lyrics from prompt using analysis"""
    try:
        if not prompt or not prompt.strip():
            return "❌ Please enter a prompt"
        
        # Fixed duration for all clips
        duration = 32
        
        progress(0, desc="🔍 Analyzing prompt...")
        logger.info(f"Generating lyrics for: {prompt}")
        
        # Analyze prompt
        analysis = PromptAnalyzer.analyze(prompt)
        genre = analysis.get('genres', ['general'])[0] if analysis.get('genres') else 'general'
        mood = analysis.get('mood', 'unknown')
        
        logger.info(f"Analysis - Genre: {genre}, Mood: {mood}")
        
        progress(0.3, desc=f"✍️ Generating {genre} lyrics...")
        
        service = get_lyricmind_service()
        lyrics = service.generate(
            prompt=prompt,
            duration=duration,
            prompt_analysis=analysis
        )
        
        progress(1.0, desc="✅ Lyrics generated!")
        return lyrics
        
    except Exception as e:
        logger.error(f"Error generating lyrics: {e}", exc_info=True)
        return f"❌ Error: {str(e)}"

# Helper functions for JSON string State management
def parse_timeline_state(state_str: str):
    """Parse JSON string State to dict"""
    try:
        if not state_str or state_str.strip() == '':
            return {'clips': []}
        return json.loads(state_str)
    except Exception as e:
        logger.error(f"Error parsing timeline state: {e}")
        return {'clips': []}

def serialize_timeline_state(state_dict):
    """Convert dict to JSON string State"""
    try:
        return json.dumps(state_dict)
    except Exception as e:
        logger.error(f"Error serializing timeline state: {e}")
        return '{"clips": []}'

def restore_timeline_from_state(state_dict):
    """Restore timeline service from dict"""
    try:
        if state_dict and 'clips' in state_dict:
            timeline_service.clips = []
            for clip_data in state_dict['clips']:
                from models.schemas import TimelineClip
                clip = TimelineClip(**clip_data)
                timeline_service.clips.append(clip)
            logger.info(f"[STATE] Restored {len(timeline_service.clips)} clips from state")
        else:
            logger.warning(f"[STATE] No clips in state to restore")
    except Exception as e:
        logger.error(f"Error restoring timeline from state: {e}", exc_info=True)

def save_timeline_to_state():
    """Save timeline to dict"""
    return {
        'clips': [{
            'clip_id': c.clip_id,
            'file_path': c.file_path,
            'duration': c.duration,
            'timeline_position': c.timeline_position,
            'start_time': c.start_time,
            'music_path': c.music_path
        } for c in timeline_service.clips]
    }

@GPU_DECORATOR(duration=180)
def generate_music(prompt: str, lyrics: str, lyrics_mode: str, position: str, context_length: int, use_lora: bool, selected_lora: str, timeline_state: str, progress=gr.Progress()):
    """Generate music clip and add to timeline"""
    try:
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        
        if not prompt or not prompt.strip():
            return "❌ Please enter a music prompt", get_timeline_display(), None, timeline_state
        
        # Handle LoRA if selected
        lora_path = None
        lora_name = None
        if use_lora and selected_lora:
            try:
                # Parse LoRA source and name
                if selected_lora.startswith('[Local] '):
                    lora_name = selected_lora.replace('[Local] ', '')
                    lora_dir = Path('models/diffrhythm2/loras') / lora_name
                    if lora_dir.exists():
                        lora_path = str(lora_dir)
                        logger.info(f"Using local LoRA: {lora_path}")
                    else:
                        logger.warning(f"Local LoRA not found: {lora_name}")
                        lora_name = None
                        
                elif selected_lora.startswith('[HF] '):
                    lora_name = selected_lora.replace('[HF] ', '')
                    # Download from HuggingFace
                    from backend.services.hf_storage_service import HFStorageService
                    hf_storage = HFStorageService()
                    
                    target_dir = Path('models/diffrhythm2/loras') / lora_name
                    target_dir.mkdir(parents=True, exist_ok=True)
                    
                    if hf_storage.download_lora(f"loras/{lora_name}", target_dir):
                        lora_path = str(target_dir)
                        logger.info(f"Downloaded and using HF LoRA: {lora_path}")
                    else:
                        logger.warning(f"Failed to download HF LoRA: {lora_name}")
                        lora_name = None
                
                if lora_name:
                    progress(0.05, desc=f"✅ LoRA loaded: {lora_name}")
            except Exception as e:
                logger.error(f"Error loading LoRA: {e}")
                # Continue without LoRA
        
        # Fixed duration for all clips
        duration = 32
        
        # Estimate time (CPU on HF Spaces)
        est_time = int(duration * 4)  # Conservative estimate for CPU
        
        progress(0, desc=f"🔍 Analyzing prompt... (Est. {est_time}s)")
        logger.info(f"Generating music: {prompt}, mode={lyrics_mode}, duration={duration}s")
        
        # Analyze prompt
        analysis = PromptAnalyzer.analyze(prompt)
        genre = analysis.get('genres', ['general'])[0] if analysis.get('genres') else 'general'
        bpm = analysis.get('bpm', 120)
        mood = analysis.get('mood', 'neutral')
        
        logger.info(f"Analysis - Genre: {genre}, BPM: {bpm}, Mood: {mood}")
        
        # Apply style consistency from previous clips within context window
        # Auto-disable context if this is the first clip
        clips = timeline_service.get_all_clips()
        effective_context_length = 0 if len(clips) == 0 else context_length
        
        if effective_context_length > 0 and clips:
            # Calculate which clips fall within the context window
            total_duration = timeline_service.get_total_duration()
            context_start = max(0, total_duration - effective_context_length)
            
            context_clips = [c for c in clips if c['start_time'] >= context_start]
            
            if context_clips:
                logger.info(f"Using {len(context_clips)} clips for style consistency (context: {effective_context_length}s)")
                # Enhance prompt with style consistency guidance
                prompt = f"{prompt} (maintaining consistent {genre} style at {bpm} BPM with {mood} mood)"
            else:
                logger.info("No clips in context window")
        else:
            if len(clips) == 0:
                logger.info("First clip - style consistency disabled")
            else:
                logger.info("Style consistency disabled (context length: 0)")
        
        # Determine lyrics based on mode
        lyrics_to_use = None
        
        if lyrics_mode == "Instrumental":
            logger.info("Generating instrumental (no vocals)")
            progress(0.1, desc=f"🎹 Preparing instrumental generation... ({est_time}s)")
            
        elif lyrics_mode == "User Lyrics":
            if not lyrics or not lyrics.strip():
                return "❌ Please enter lyrics or switch mode", get_timeline_display(), None
            lyrics_to_use = lyrics.strip()
            logger.info(f"Using user-provided lyrics (length: {len(lyrics_to_use)} chars)")
            logger.info(f"First 100 chars: {lyrics_to_use[:100]}")
            progress(0.1, desc=f"🎤 Preparing vocal generation... ({est_time}s)")
            
        elif lyrics_mode == "Auto Lyrics":
            if lyrics and lyrics.strip():
                lyrics_to_use = lyrics.strip()
                logger.info("Using existing lyrics from textbox")
                progress(0.1, desc=f"🎤 Using provided lyrics... ({est_time}s)")
            else:
                progress(0.1, desc="✍️ Generating lyrics...")
                logger.info("Auto-generating lyrics...")
                lyric_service = get_lyricmind_service()
                lyrics_to_use = lyric_service.generate(
                    prompt=prompt,
                    duration=duration,
                    prompt_analysis=analysis
                )
                logger.info(f"Generated {len(lyrics_to_use)} characters of lyrics")
                progress(0.25, desc=f"🎵 Lyrics ready, generating music... ({est_time}s)")
        
        # Generate music
        progress(0.3, desc=f"🎼 Generating {genre} at {bpm} BPM... ({est_time}s)")
        service = get_diffrhythm_service()
        
        # Add LoRA info to generation if available
        generation_kwargs = {
            'prompt': prompt,
            'duration': duration,
            'lyrics': lyrics_to_use
        }
        
        if lora_path:
            generation_kwargs['lora_path'] = lora_path
            logger.info(f"Generating with LoRA: {lora_path}")
        
        final_path = service.generate(**generation_kwargs)
        
        # Add to timeline
        progress(0.9, desc="📊 Adding to timeline...")
        clip_id = os.path.basename(final_path).split('.')[0]
        
        logger.info(f"[GENERATE] About to add clip: {clip_id}, position: {position}")
        logger.info(f"[GENERATE] Timeline service ID: {id(timeline_service)}")
        logger.info(f"[GENERATE] Clips before add: {len(timeline_service.clips)}")
        
        from models.schemas import ClipPosition
        clip_info = timeline_service.add_clip(
            clip_id=clip_id,
            file_path=final_path,
            duration=float(duration),
            position=ClipPosition(position)
        )
        
        logger.info(f"Music added to timeline at position {clip_info['timeline_position']}")
        logger.info(f"[GENERATE] Clips after add: {len(timeline_service.clips)}")
        
        # Build status message
        progress(1.0, desc="✅ Complete!")
        status_msg = f"✅ Music generated successfully!\n"
        status_msg += f"🎸 Genre: {genre} | 🥁 BPM: {bpm} | 🎭 Mood: {mood}\n"
        status_msg += f"🎤 Mode: {lyrics_mode} | 📍 Position: {position}\n"
        
        if lyrics_mode == "Auto Lyrics" and lyrics_to_use and not lyrics:
            status_msg += "✍️ (Lyrics auto-generated)"
        
        # Save timeline to state
        new_state = {
            'clips': [{
                'clip_id': c.clip_id,
                'file_path': c.file_path,
                'duration': c.duration,
                'timeline_position': c.timeline_position,
                'start_time': c.start_time,
                'music_path': c.music_path
            } for c in timeline_service.clips]
        }
        logger.info(f"[STATE] Saved {len(new_state['clips'])} clips to state")
        
        return status_msg, get_timeline_display(), final_path, serialize_timeline_state(new_state)
        
    except Exception as e:
        logger.error(f"Error generating music: {e}", exc_info=True)
        
        # Check if it's a ZeroGPU quota error
        error_str = str(e)
        if "ZeroGPU quota" in error_str or "running out of daily" in error_str:
            error_msg = (
                "❌ ZeroGPU Quota Issue\n\n"
                "🔑 This Space requires authentication to access GPU resources.\n\n"
                "💡 Solutions:\n"
                "1. Make sure you're logged into HuggingFace\n"
                "2. If you're logged in but still see this, try duplicating this Space to your account\n"
                "3. Free tier users: Check your daily GPU quota at https://huggingface.co/settings/billing\n\n"
                f"Technical details: {error_str}"
            )
        else:
            error_msg = f"❌ Error: {str(e)}"
        
        return error_msg, get_timeline_display(), None, timeline_state

def get_timeline_display():
    """Get timeline clips as HTML visualization with waveform-style display"""
    clips = timeline_service.get_all_clips()
    
    if not clips:
        return "<div style='text-align:center; padding:40px; color:#888;'>📭 Timeline is empty. Generate clips to get started!</div>"
    
    total_duration = timeline_service.get_total_duration()
    
    # Build HTML timeline
    html = f"""
    <div style="font-family: Arial, sans-serif; background: #1a1a1a; padding: 20px; border-radius: 8px; color: white;">
        <div style="margin-bottom: 15px; font-size: 14px; color: #aaa;">
            <strong>📊 Timeline:</strong> {len(clips)} clips | Total: {format_duration(total_duration)}
        </div>
        <div style="background: #2a2a2a; border-radius: 6px; padding: 15px; position: relative; min-height: 80px;">
            <div style="position: absolute; top: 10px; left: 15px; right: 15px; height: 60px; background: #333; border-radius: 4px; overflow: hidden;">
    """
    
    # Calculate pixel width (scale to fit)
    if total_duration > 0:
        pixels_per_second = 800 / total_duration  # 800px total width
    else:
        pixels_per_second = 10
    
    # Add clip blocks
    colors = ['#8b5cf6', '#ec4899', '#06b6d4', '#10b981', '#f59e0b', '#ef4444']
    for i, clip in enumerate(clips):
        start_px = clip['start_time'] * pixels_per_second
        width_px = clip['duration'] * pixels_per_second
        color = colors[i % len(colors)]
        
        # Create waveform-style bars
        bars = ''.join([
            f'<div style="display:inline-block; width:2px; height:{20 + (i*7 % 30)}px; background:rgba(255,255,255,0.3); margin:0 1px; vertical-align:bottom;"></div>'
            for i in range(min(int(width_px / 4), 50))
        ])
        
        html += f"""
                <div style="position: absolute; left: {start_px}px; width: {width_px}px; height: 60px; 
                     background: linear-gradient(135deg, {color} 0%, {color}dd 100%); 
                     border-radius: 4px; border: 1px solid rgba(255,255,255,0.2);
                     display: flex; align-items: center; justify-content: center;
                     overflow: hidden; box-shadow: 0 2px 4px rgba(0,0,0,0.3);">
                    <div style="position: absolute; bottom: 5px; left: 0; right: 0; height: 40px; display: flex; align-items: flex-end; justify-content: space-evenly; padding: 0 5px;">
                        {bars}
                    </div>
                    <div style="position: relative; z-index: 1; font-size: 11px; font-weight: bold; 
                         text-shadow: 0 1px 2px rgba(0,0,0,0.5); text-align: center; padding: 0 5px;">
                        Clip {i+1}<br>{format_duration(clip['duration'])}
                    </div>
                </div>
        """
    
    html += """
            </div>
            <div style="margin-top: 75px; font-size: 11px; color: #888;">
                <div style="display: flex; justify-content: space-between;">
                    <span>0:00</span>
                    <span>{}</span>
                </div>
            </div>
        </div>
    </div>
    """.format(format_duration(total_duration))
    
    return html

def remove_clip(clip_number: int, timeline_state: str):
    """Remove a clip from timeline"""
    try:
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        
        clips = timeline_service.get_all_clips()
        
        if not clips:
            return "📭 Timeline is empty", get_timeline_display(), timeline_state
        
        if clip_number < 1 or clip_number > len(clips):
            return f"❌ Invalid clip number. Choose 1-{len(clips)}", get_timeline_display(), timeline_state
        
        clip_id = clips[clip_number - 1]['clip_id']
        timeline_service.remove_clip(clip_id)
        
        # Save updated state
        new_state = save_timeline_to_state()
        
        return f"✅ Clip {clip_number} removed", get_timeline_display(), serialize_timeline_state(new_state)
        
    except Exception as e:
        logger.error(f"Error removing clip: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", get_timeline_display(), timeline_state

def clear_timeline(timeline_state: str):
    """Clear all clips from timeline"""
    try:
        timeline_service.clear()
        new_state = {'clips': []}
        return "✅ Timeline cleared", get_timeline_display(), serialize_timeline_state(new_state)
    except Exception as e:
        logger.error(f"Error clearing timeline: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", get_timeline_display(), timeline_state

def export_timeline(filename: str, export_format: str, timeline_state: str, progress=gr.Progress()):
    """Export timeline to audio file"""
    try:
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        logger.info(f"[STATE] Restored {len(timeline_service.clips)} clips for export")
        
        clips = timeline_service.get_all_clips()
        
        if not clips:
            return "❌ No clips to export", None, timeline_state
        
        if not filename or not filename.strip():
            filename = "output"
        
        progress(0, desc="🔄 Merging clips...")
        logger.info(f"Exporting timeline: {filename}.{export_format}")
        
        export_service.timeline_service = timeline_service
        
        progress(0.5, desc="💾 Encoding audio...")
        output_path = export_service.merge_clips(
            filename=filename,
            export_format=export_format
        )
        
        if output_path:
            progress(1.0, desc="✅ Export complete!")
            return f"✅ Exported: {os.path.basename(output_path)}", output_path, timeline_state
        else:
            return "❌ Export failed", None, timeline_state
            
    except Exception as e:
        logger.error(f"Error exporting: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", None, timeline_state

def get_timeline_playback(timeline_state: str):
    """Get merged timeline audio for playback"""
    try:
        logger.info(f"[PLAYBACK] get_timeline_playback called")
        
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        logger.info(f"[PLAYBACK] Restored {len(timeline_service.clips)} clips from state")
        
        clips = timeline_service.get_all_clips()
        logger.info(f"[PLAYBACK] Total clips in timeline: {len(clips)}")
        
        if not clips:
            logger.warning("[PLAYBACK] No clips available for playback")
            return None
        
        # Use export service to merge clips
        export_service.timeline_service = timeline_service
        output_path = export_service.merge_clips(
            filename="timeline_preview",
            export_format="wav"
        )
        
        logger.info(f"[PLAYBACK] Timeline playback ready: {output_path}")
        return output_path
        
    except Exception as e:
        logger.error(f"Error creating playback: {e}", exc_info=True)
        return None

def update_preset_description(preset_select_value: str):
    """
    Update preset description when preset is selected
    
    Args:
        preset_select_value: Full preset string like "Clean Master - Transparent mastering"
        
    Returns:
        Description text for the selected preset
    """
    try:
        # Extract preset key from the dropdown value (format: "Key - Description")
        preset_key = preset_select_value.split(" - ")[0]
        
        # Map display names to actual preset keys
        preset_map = {
            "Clean Master": "clean_master",
            "Subtle Warmth": "subtle_warmth",
            "Modern Pop": "modern_pop",
            "Radio Ready": "radio_ready",
            "Punchy Commercial": "punchy_commercial",
            "Rock Master": "rock_master",
            "Metal Aggressive": "metal_aggressive",
            "Indie Rock": "indie_rock",
            "EDM Club": "edm_club",
            "House Groovy": "house_groovy",
            "Techno Dark": "techno_dark",
            "Dubstep Heavy": "dubstep_heavy",
            "HipHop Modern": "hiphop_modern",
            "Trap 808": "trap_808",
            "RnB Smooth": "rnb_smooth",
            "Acoustic Natural": "acoustic_natural",
            "Folk Warm": "folk_warm",
            "Jazz Vintage": "jazz_vintage",
            "Orchestral Wide": "orchestral_wide",
            "Classical Concert": "classical_concert",
            "Ambient Spacious": "ambient_spacious",
            "Harmonic Enhance": "harmonic_enhance"
        }
        
        if preset_key in preset_map:
            from services.mastering_service import MasteringService
            mastering = MasteringService()
            actual_key = preset_map[preset_key]
            
            if actual_key in mastering.PRESETS:
                preset = mastering.PRESETS[actual_key]
                return preset.description
        
        # Fallback - extract description from dropdown value
        parts = preset_select_value.split(" - ", 1)
        if len(parts) == 2:
            return parts[1]
        
        return "Select a preset to see its description"
        
    except Exception as e:
        logger.error(f"Error updating preset description: {e}")
        return "Error loading preset description"

def preview_mastering_preset(preset_name: str, timeline_state: str):
    """Preview mastering preset on the most recent clip"""
    try:
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        
        clips = timeline_service.get_all_clips()
        if not clips:
            return None, "❌ No clips in timeline to preview"
        
        # Use the most recent clip for preview
        latest_clip = clips[-1]
        clip_path = latest_clip['file_path']
        
        if not os.path.exists(clip_path):
            return None, f"❌ Clip file not found: {clip_path}"
        
        # Extract preset name
        preset_key = preset_name.split(" - ")[0].lower().replace(" ", "_")
        
        # Create temporary preview file
        import tempfile
        preview_path = os.path.join(tempfile.gettempdir(), f"preview_{latest_clip['clip_id']}.wav")
        
        from services.mastering_service import MasteringService
        mastering_service = MasteringService()
        
        # Apply preset to preview file
        mastering_service.apply_preset(
            audio_path=clip_path,
            preset_name=preset_key,
            output_path=preview_path
        )
        
        logger.info(f"Created mastering preview: {preview_path}")
        return preview_path, f"✅ Preview ready: {preset_name.split(' - ')[0]} applied to latest clip"
        
    except Exception as e:
        logger.error(f"Error creating preview: {e}", exc_info=True)
        return None, f"❌ Preview error: {str(e)}"

def apply_mastering_preset(preset_name: str, timeline_state: str):
    """Apply mastering preset to all clips in timeline"""
    try:
        logger.info(f"[STATE DEBUG] apply_mastering_preset called")
        
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        logger.info(f"[STATE] Restored {len(timeline_service.clips)} clips for mastering")
        
        clips = timeline_service.get_all_clips()
        logger.info(f"[MASTERING DEBUG] Retrieved {len(clips)} clips from timeline")
        
        if not clips:
            logger.warning("[MASTERING DEBUG] No clips found in timeline")
            return "❌ No clips in timeline", timeline_state
        
        # Log clip details for debugging
        for i, clip in enumerate(clips):
            logger.info(f"[MASTERING DEBUG] Clip {i+1}: {clip}")
        
        # Extract preset name from dropdown value
        preset_key = preset_name.split(" - ")[0].lower().replace(" ", "_")
        
        logger.info(f"Applying preset '{preset_key}' to {len(clips)} clip(s)")
        
        # Import mastering service
        from services.mastering_service import MasteringService
        mastering_service = MasteringService()
        
        # Apply preset to all clips
        for clip in clips:
            clip_path = clip['file_path']
            
            if not os.path.exists(clip_path):
                logger.warning(f"Audio file not found: {clip_path}")
                continue
            
            # Apply preset
            mastering_service.apply_preset(
                audio_path=clip_path,
                preset_name=preset_key,
                output_path=clip_path  # Overwrite original
            )
            logger.info(f"Applied preset to: {clip['clip_id']}")
        
        return f"✅ Applied '{preset_name.split(' - ')[0]}' to {len(clips)} clip(s)", timeline_state
        
    except Exception as e:
        logger.error(f"Error applying preset: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", timeline_state

def preview_custom_eq(low_shelf, low_mid, mid, high_mid, high_shelf, timeline_state: str):
    """Preview custom EQ on the most recent clip"""
    try:
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        
        clips = timeline_service.get_all_clips()
        if not clips:
            return None, "❌ No clips in timeline to preview"
        
        # Use the most recent clip for preview
        latest_clip = clips[-1]
        clip_path = latest_clip['file_path']
        
        if not os.path.exists(clip_path):
            return None, f"❌ Clip file not found: {clip_path}"
        
        # Create temporary preview file
        import tempfile
        preview_path = os.path.join(tempfile.gettempdir(), f"eq_preview_{latest_clip['clip_id']}.wav")
        
        from services.mastering_service import MasteringService
        mastering_service = MasteringService()
        
        # Format EQ bands
        eq_bands = [
            {'type': 'lowshelf', 'frequency': 100, 'gain': low_shelf, 'q': 0.7},
            {'type': 'peak', 'frequency': 500, 'gain': low_mid, 'q': 1.0},
            {'type': 'peak', 'frequency': 2000, 'gain': mid, 'q': 1.0},
            {'type': 'peak', 'frequency': 5000, 'gain': high_mid, 'q': 1.0},
            {'type': 'highshelf', 'frequency': 10000, 'gain': high_shelf, 'q': 0.7}
        ]
        
        # Apply EQ to preview file
        mastering_service.apply_custom_eq(
            audio_path=clip_path,
            eq_bands=eq_bands,
            output_path=preview_path
        )
        
        logger.info(f"Created EQ preview: {preview_path}")
        return preview_path, f"✅ Preview ready: Custom EQ applied to latest clip"
        
    except Exception as e:
        logger.error(f"Error creating EQ preview: {e}", exc_info=True)
        return None, f"❌ Preview error: {str(e)}"

def apply_custom_eq(low_shelf, low_mid, mid, high_mid, high_shelf, timeline_state: str):
    """Apply custom EQ to all clips in timeline"""
    try:
        logger.info(f"[STATE DEBUG] apply_custom_eq called")
        
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        logger.info(f"[STATE] Restored {len(timeline_service.clips)} clips for EQ")
        
        clips = timeline_service.get_all_clips()
        logger.info(f"[EQ DEBUG] Retrieved {len(clips)} clips from timeline")
        
        if not clips:
            logger.warning("[EQ DEBUG] No clips found in timeline")
            return "❌ No clips in timeline", timeline_state
        
        # Log clip details for debugging
        for i, clip in enumerate(clips):
            logger.info(f"[EQ DEBUG] Clip {i+1}: {clip}")
        
        logger.info(f"Applying custom EQ to {len(clips)} clip(s)")
        
        # Import mastering service
        from services.mastering_service import MasteringService
        mastering_service = MasteringService()
        
        # Apply custom EQ - format eq_bands as expected by the service
        eq_bands = [
            {'type': 'lowshelf', 'frequency': 100, 'gain': low_shelf, 'q': 0.7},
            {'type': 'peak', 'frequency': 500, 'gain': low_mid, 'q': 1.0},
            {'type': 'peak', 'frequency': 2000, 'gain': mid, 'q': 1.0},
            {'type': 'peak', 'frequency': 5000, 'gain': high_mid, 'q': 1.0},
            {'type': 'highshelf', 'frequency': 10000, 'gain': high_shelf, 'q': 0.7}
        ]
        
        # Apply to all clips
        for clip in clips:
            clip_path = clip['file_path']
            
            if not os.path.exists(clip_path):
                logger.warning(f"Audio file not found: {clip_path}")
                continue
            
            mastering_service.apply_custom_eq(
                audio_path=clip_path,
                eq_bands=eq_bands,
                output_path=clip_path  # Overwrite original
            )
            logger.info(f"Applied EQ to: {clip['clip_id']}")
        
        return f"✅ Applied custom EQ to {len(clips)} clip(s)", timeline_state
        
    except Exception as e:
        logger.error(f"Error applying EQ: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", timeline_state

def enhance_timeline_clips(enhancement_level: str, timeline_state: str):
    """Enhance all clips in timeline using stem separation"""
    try:
        logger.info(f"[ENHANCEMENT] Starting enhancement: level={enhancement_level}")
        
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        logger.info(f"[STATE] Restored {len(timeline_service.clips)} clips for enhancement")
        
        clips = timeline_service.get_all_clips()
        
        if not clips:
            return "❌ No clips in timeline", timeline_state
        
        # Import stem enhancement service
        from services.stem_enhancement_service import StemEnhancementService
        enhancer = StemEnhancementService()
        
        # Convert enhancement level to service format
        level_map = {
            "Fast": "fast",
            "Balanced": "balanced",
            "Maximum": "maximum"
        }
        service_level = level_map.get(enhancement_level, "balanced")
        
        # Enhance each clip
        enhanced_count = 0
        for clip in clips:
            clip_path = clip['file_path']
            
            if not os.path.exists(clip_path):
                logger.warning(f"Clip file not found: {clip_path}")
                continue
            
            logger.info(f"Enhancing clip: {clip['clip_id']} ({service_level})")
            
            # Enhance in-place (overwrites original)
            enhancer.enhance_clip(
                audio_path=clip_path,
                output_path=clip_path,
                enhancement_level=service_level
            )
            
            enhanced_count += 1
            logger.info(f"Enhanced {enhanced_count}/{len(clips)} clips")
        
        return f"✅ Enhanced {enhanced_count} clip(s) ({enhancement_level} quality)", timeline_state
        
    except Exception as e:
        logger.error(f"Enhancement failed: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", timeline_state

def upscale_timeline_clips(upscale_mode: str, timeline_state: str):
    """Upscale all clips in timeline to 48kHz"""
    try:
        logger.info(f"[UPSCALE] Starting upscale: mode={upscale_mode}")
        
        # Parse and restore state
        state_dict = parse_timeline_state(timeline_state)
        restore_timeline_from_state(state_dict)
        logger.info(f"[STATE] Restored {len(timeline_service.clips)} clips for upscale")
        
        clips = timeline_service.get_all_clips()
        
        if not clips:
            return "❌ No clips in timeline", timeline_state
        
        # Import upscale service
        from services.audio_upscale_service import AudioUpscaleService
        upscaler = AudioUpscaleService()
        
        # Upscale each clip
        upscaled_count = 0
        for clip in clips:
            clip_path = clip['file_path']
            
            if not os.path.exists(clip_path):
                logger.warning(f"Clip file not found: {clip_path}")
                continue
            
            logger.info(f"Upscaling clip: {clip['clip_id']} ({upscale_mode})")
            
            # Choose upscale method
            if upscale_mode == "Quick (Resample)":
                upscaler.quick_upscale(
                    audio_path=clip_path,
                    output_path=clip_path
                )
            else:  # Neural (AudioSR)
                upscaler.upscale_audio(
                    audio_path=clip_path,
                    output_path=clip_path,
                    target_sr=48000
                )
            
            upscaled_count += 1
            logger.info(f"Upscaled {upscaled_count}/{len(clips)} clips")
        
        return f"✅ Upscaled {upscaled_count} clip(s) to 48kHz ({upscale_mode})", timeline_state
        
    except Exception as e:
        logger.error(f"Upscale failed: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", timeline_state

def format_duration(seconds: float) -> str:
    """Format duration as MM:SS"""
    mins = int(seconds // 60)
    secs = int(seconds % 60)
    return f"{mins}:{secs:02d}"

# LoRA Training Functions
def analyze_user_audio(audio_files, split_clips, separate_stems):
    """Analyze uploaded audio files and generate metadata"""
    try:
        if not audio_files:
            return "❌ No audio files uploaded", None
        
        from backend.services.audio_analysis_service import AudioAnalysisService
        analyzer = AudioAnalysisService()
        
        results = []
        for audio_file in audio_files:
            # Analyze audio (will use embedded metadata when available)
            metadata = analyzer.analyze_audio(audio_file.name)
            
            # Use description from embedded metadata if available
            description = metadata.get('description', '')
            if not description and 'title' in metadata and 'artist' in metadata:
                description = f"{metadata['title']} by {metadata['artist']}"
            elif not description and 'title' in metadata:
                description = metadata['title']
            
            # Add to results
            results.append([
                Path(audio_file.name).name,
                metadata.get('genre', 'unknown'),
                metadata.get('bpm', 120),
                metadata.get('key', 'C major'),
                metadata.get('energy', 'medium'),
                '',  # Instruments (user fills in)
                description  # Use embedded description if available
            ])
        
        status = f"✅ Analyzed {len(results)} file(s)"
        return status, results
        
    except Exception as e:
        logger.error(f"Audio analysis failed: {e}")
        return f"❌ Error: {str(e)}", None

def ai_generate_all_metadata(metadata_table):
    """AI generate metadata for all files in table"""
    try:
        if metadata_table is None or len(metadata_table) == 0:
            return "❌ No files in metadata table"
        
        import pandas as pd
        
        # This is a placeholder - would use actual AI model
        # For now, return sample metadata
        updated_table = []
        for idx in range(len(metadata_table)):
            row = metadata_table.iloc[idx]
            if row['File']:  # If filename exists
                updated_table.append([
                    row['File'],  # Filename
                    row['Genre'] if row['Genre'] else "pop",  # Genre
                    row['BPM'] if row['BPM'] else 120,     # BPM
                    row['Key'] if row['Key'] else "C major",  # Key
                    row['Mood'] if row['Mood'] else "energetic",  # Mood
                    "synth, drums, bass",  # Instruments
                    f"AI-generated music in {row['Genre'] if row['Genre'] else 'unknown'} style"  # Description
                ])
        
        return f"✅ Generated metadata for {len(updated_table)} file(s)"
        
    except Exception as e:
        logger.error(f"Metadata generation failed: {e}", exc_info=True)
        return f"❌ Error: {str(e)}"

def check_downloaded_datasets():
    """Check and display status of already downloaded datasets"""
    try:
        from backend.services.dataset_service import DatasetService
        
        dataset_service = DatasetService()
        downloaded = dataset_service.get_downloaded_datasets()
        
        if not downloaded:
            return "📁 No datasets downloaded yet.\n\nSelect datasets above and click 'Download Datasets' to get started."
        
        status_messages = []
        status_messages.append(f"📊 Downloaded Datasets Status\n")
        status_messages.append(f"{'='*60}\n")
        
        for dataset_key, info in downloaded.items():
            status_messages.append(f"✅ {info.get('name', dataset_key)}")
            status_messages.append(f"   Type: {info.get('type', 'unknown')}")
            status_messages.append(f"   Size: ~{info.get('size_gb', 0):.1f} GB")
            
            if info.get('prepared'):
                status_messages.append(f"   Status: ✅ Prepared for training")
                status_messages.append(f"   Train samples: {info.get('num_train_samples', 0)}")
                status_messages.append(f"   Val samples: {info.get('num_val_samples', 0)}")
            else:
                status_messages.append(f"   Status: ⏳ Downloaded, needs preparation")
                
            status_messages.append("")
        
        status_messages.append(f"{'='*60}")
        status_messages.append(f"Total downloaded: {len(downloaded)} dataset(s)")
        
        return "\n".join(status_messages)
        
    except Exception as e:
        logger.error(f"Error checking datasets: {e}", exc_info=True)
        return f"❌ Error checking datasets: {str(e)}"

def get_dataset_choices_with_status():
    """Get dataset choices with download/preparation status indicators"""
    try:
        from backend.services.dataset_service import DatasetService
        
        dataset_service = DatasetService()
        downloaded = dataset_service.get_downloaded_datasets()
        user_datasets = dataset_service.get_user_datasets()
        
        # Dataset display mappings
        dataset_display_map = {
            "gtzan": "GTZAN Music Genre (1000 tracks, 10 genres)",
            "fsd50k": "FSD50K Sound Events (51K clips, 200 classes)",
            "librispeech": "LibriSpeech ASR (speech recognition)",
            "libritts": "LibriTTS (audiobooks for TTS)",
            "audioset_strong": "AudioSet Strong (labeled audio events)",
            "esc50": "ESC-50 Environmental Sounds",
            "urbansound8k": "UrbanSound8K (urban sounds)"
        }
        
        music_choices = []
        vocal_choices = []
        prepare_choices = []
        
        music_keys = ["gtzan"]
        vocal_keys = ["librispeech", "libritts", "audioset_strong", "esc50", "urbansound8k", "fsd50k"]
        
        # Add HuggingFace datasets
        for key in music_keys:
            display_name = dataset_display_map.get(key, key)
            if key in downloaded:
                info = downloaded[key]
                if info.get('prepared'):
                    music_choices.append(f"✅ {display_name} [Downloaded & Prepared]")
                    prepare_choices.append(f"✅ {key} [Already Prepared]")
                else:
                    music_choices.append(f"📥 {display_name} [Downloaded]")
                    prepare_choices.append(key)
            else:
                music_choices.append(display_name)
        
        for key in vocal_keys:
            display_name = dataset_display_map.get(key, key)
            if key in downloaded:
                info = downloaded[key]
                if info.get('prepared'):
                    vocal_choices.append(f"✅ {display_name} [Downloaded & Prepared]")
                else:
                    vocal_choices.append(f"📥 {display_name} [Downloaded]")
            else:
                vocal_choices.append(display_name)
        
        # Add user-uploaded datasets
        for key, info in user_datasets.items():
            dataset_name = info.get('dataset_name', key)
            num_samples = info.get('num_train_samples', 0) + info.get('num_val_samples', 0)
            display_name = f"👤 {dataset_name} ({num_samples} samples)"
            
            if info.get('prepared'):
                vocal_choices.append(f"✅ {display_name} [User Dataset - Prepared]")
            else:
                vocal_choices.append(f"📥 {display_name} [User Dataset]")
        
        return music_choices, vocal_choices, prepare_choices
        
    except Exception as e:
        logger.error(f"Error getting dataset status: {e}", exc_info=True)
        # Return default choices on error
        return [], [], []

def download_prepare_datasets(vocal_datasets, symbolic_datasets):
    """Download and prepare curated datasets for training"""
    try:
        from backend.services.dataset_service import DatasetService
        
        selected_datasets = []
        if vocal_datasets:
            selected_datasets.extend(vocal_datasets)
        if symbolic_datasets:
            selected_datasets.extend(symbolic_datasets)
        
        if not selected_datasets:
            return "❌ No datasets selected. Please check at least one dataset."
        
        dataset_service = DatasetService()
        
        # Map display names to dataset keys (handle status indicators)
        dataset_map = {
            # Music datasets
            "GTZAN Music Genre (1000 tracks, 10 genres)": "gtzan",
            # Vocal & Sound datasets
            "FSD50K Sound Events (51K clips, 200 classes)": "fsd50k",
            "Common Voice English (crowdsourced speech)": "common_voice",
            # Vocal & Sound datasets
            "FLEURS English Speech (multi-speaker)": "fleurs",
            "LibriSpeech ASR (speech recognition)": "librispeech",
            "LibriTTS (audiobooks for TTS)": "libritts",
            "AudioSet Strong (labeled audio events)": "audioset_strong",
            "ESC-50 Environmental Sounds": "esc50",
            "UrbanSound8K (urban sounds)": "urbansound8k"
        }
        
        # Extract dataset keys from selected items (strip status indicators)
        dataset_keys = []
        for item in selected_datasets:
            # Remove status prefixes and suffixes
            clean_item = item.replace("✅ ", "").replace("📥 ", "")
            clean_item = clean_item.split(" [")[0]  # Remove [Downloaded] or [Prepared] suffix
            
            if clean_item in dataset_map:
                dataset_keys.append(dataset_map[clean_item])
            else:
                # Direct key match
                if clean_item in ["gtzan", "fsd50k",
                                   "librispeech", "libritts", "audioset_strong", "esc50", "urbansound8k"]:
                    dataset_keys.append(clean_item)
        
        if not dataset_keys:
            return "❌ No valid datasets selected."
        
        status_messages = []
        status_messages.append(f"📥 Starting download for {len(dataset_keys)} dataset(s)...\n")
        
        success_count = 0
        already_downloaded_count = 0
        manual_count = 0
        error_count = 0
        
        for dataset_key in dataset_keys:
            # Get display name for this key
            dataset_config = dataset_service.DATASETS.get(dataset_key, {})
            dataset_display_name = dataset_config.get('name', dataset_key)
            
            status_messages.append(f"\n{'='*60}")
            status_messages.append(f"📦 Processing: {dataset_display_name}")
            status_messages.append(f"{'='*60}\n")
            
            # Progress callback
            progress_msgs = []
            def progress_callback(msg):
                progress_msgs.append(msg)
            
            # Download dataset
            result = dataset_service.download_dataset(dataset_key, progress_callback)
            
            # Add progress messages
            for msg in progress_msgs:
                status_messages.append(f"   {msg}")
            
            if result.get('success'):
                if result.get('already_downloaded'):
                    already_downloaded_count += 1
                else:
                    success_count += 1
                    info = result.get('info', {})
                    status_messages.append(f"\n   ✅ Successfully downloaded!")
                    status_messages.append(f"   📊 Examples: {info.get('num_examples', 'N/A')}")
                    status_messages.append(f"   💾 Path: {info.get('path', 'N/A')}\n")
            elif result.get('manual_download_required'):
                manual_count += 1
                status_messages.append(f"\n   ℹ️ Manual download required")
                status_messages.append(f"   🔗 URL: {result.get('url', 'N/A')}\n")
            else:
                error_count += 1
                status_messages.append(f"\n   ❌ Error: {result.get('error', 'Unknown error')}\n")
        
        # Summary
        status_messages.append(f"\n{'='*60}")
        status_messages.append("📊 DOWNLOAD SUMMARY")
        status_messages.append(f"{'='*60}")
        status_messages.append(f"✅ Newly downloaded: {success_count}")
        status_messages.append(f"♻️  Already downloaded: {already_downloaded_count}")
        status_messages.append(f"ℹ️  Manual required: {manual_count}")
        status_messages.append(f"❌ Errors: {error_count}")
        status_messages.append(f"📁 Total processed: {len(selected_datasets)}")
        
        if success_count > 0 or already_downloaded_count > 0:
            status_messages.append(f"\n✅ Datasets are ready!")
            status_messages.append(f"💡 Use the 'Training Configuration' tab to start training")
        
        return "\n".join(status_messages)
        
    except Exception as e:
        logger.error(f"Dataset download failed: {e}", exc_info=True)
        return f"❌ Error: {str(e)}\n\nStacktrace logged to console."

def prepare_datasets_for_training(selected_datasets, max_samples_per_dataset):
    """Prepare downloaded datasets for LoRA training by extracting audio files"""
    try:
        from backend.services.dataset_service import DatasetService
        
        if not selected_datasets:
            return "❌ No datasets selected. Please check at least one downloaded dataset."
        
        dataset_service = DatasetService()
        
        # Extract dataset keys (remove status indicators)
        dataset_keys = []
        for item in selected_datasets:
            # Remove status prefix if present
            clean_item = item.replace("✅ ", "").replace("📥 ", "").split(" [")[0]
            dataset_keys.append(clean_item)
        
        status_messages = []
        status_messages.append(f"🔧 Preparing {len(dataset_keys)} dataset(s) for training...\n")
        
        success_count = 0
        already_prepared_count = 0
        error_count = 0
        
        max_samples = int(max_samples_per_dataset) if max_samples_per_dataset > 0 else None
        
        for dataset_key in dataset_keys:
            status_messages.append(f"\n{'='*60}")
            status_messages.append(f"🔧 Preparing: {dataset_key}")
            status_messages.append(f"{'='*60}\n")
            
            # Progress callback
            progress_msgs = []
            def progress_callback(msg):
                progress_msgs.append(msg)
            
            # Prepare dataset
            result = dataset_service.prepare_dataset_for_training(
                dataset_key,
                train_val_split=0.8,
                max_samples=max_samples,
                progress_callback=progress_callback
            )
            
            # Add progress messages
            for msg in progress_msgs:
                status_messages.append(f"   {msg}")
            
            if result.get('success'):
                if result.get('already_prepared'):
                    already_prepared_count += 1
                    status_messages.append(f"\n   ℹ️ Dataset was already prepared")
                else:
                    success_count += 1
                    status_messages.append(f"\n   ✅ Preparation complete!")
                    status_messages.append(f"   📊 Training samples: {result.get('num_train', 0)}")
                    status_messages.append(f"   📊 Validation samples: {result.get('num_val', 0)}")
            else:
                error_count += 1
                status_messages.append(f"\n   ❌ Error: {result.get('error', 'Unknown error')}\n")
        
        # Summary
        status_messages.append(f"\n{'='*60}")
        status_messages.append(f"Summary:")
        status_messages.append(f"  ✅ Successfully prepared: {success_count}")
        status_messages.append(f"  ℹ️ Already prepared: {already_prepared_count}")
        status_messages.append(f"  ❌ Errors: {error_count}")
        status_messages.append(f"{'='*60}")
        
        if success_count > 0:
            status_messages.append(f"\n✅ Datasets are now ready for LoRA training!")
            status_messages.append(f"💡 Go to 'Training Configuration' tab to start training")
        
        return "\n".join(status_messages)
        
    except Exception as e:
        logger.error(f"Dataset preparation failed: {e}", exc_info=True)
        return f"❌ Error: {str(e)}"

def refresh_dataset_status():
    """Refresh dataset status and return updated choices"""
    music_choices, vocal_choices, prepare_choices = get_dataset_choices_with_status()
    return (
        gr.update(choices=music_choices if music_choices else [
            "GTZAN Music Genre (1000 tracks, 10 genres)"
        ]),
        gr.update(choices=vocal_choices if vocal_choices else [
            "FSD50K Sound Events (51K clips, 200 classes)",
            "LibriSpeech ASR (speech recognition)",
            "LibriTTS (audiobooks for TTS)",
            "AudioSet Strong (labeled audio events)",
            "ESC-50 Environmental Sounds",
            "UrbanSound8K (urban sounds)"
        ]),
        gr.update(choices=prepare_choices if prepare_choices else [
            "gtzan", "fsd50k",
            "librispeech", "libritts", "audioset_strong", "esc50", "urbansound8k"
        ])
    )

def prepare_user_training_dataset(audio_files, metadata_table, split_clips, separate_stems, append_to_existing=False, existing_dataset=None, continue_training=False, base_lora_name=None):
    """Prepare user audio dataset for training or append to existing dataset"""
    try:
        logger.info(f"prepare_user_training_dataset called with: audio_files type={type(audio_files)}, value={audio_files if not isinstance(audio_files, list) else f'list of {len(audio_files)} items'}, metadata_table type={type(metadata_table)}")
        
        if not audio_files:
            return "❌ No audio files uploaded"
        
        from backend.services.audio_analysis_service import AudioAnalysisService
        from backend.services.dataset_service import DatasetService
        from pathlib import Path
        import shutil
        import json
        
        analyzer = AudioAnalysisService()
        dataset_service = DatasetService()
        
        # Validate append mode
        if append_to_existing:
            if not existing_dataset or existing_dataset.startswith("⚠️") or existing_dataset.startswith("❌"):
                return "❌ Cannot append: No valid dataset selected\n\n💡 To append files:\n1. First create a dataset by preparing audio without 'Add to existing dataset' checked\n2. Then upload new files and select that dataset to append to"
        
        # Determine dataset name and directory
        if append_to_existing and existing_dataset:
            # Append to existing dataset
            dataset_name = existing_dataset.split(" (")[0].strip()
            dataset_dir = Path("training_data") / dataset_name
            if not dataset_dir.exists():
                return f"❌ Dataset not found: {dataset_name}\n💡 The dataset may have been deleted or moved."
            is_appending = True
        else:
            # Create new dataset directory
            timestamp = int(time.time())
            if continue_training and base_lora_name:
                # Name dataset to indicate continuation
                clean_lora_name = base_lora_name.replace("[Local] ", "").replace("[HF] ", "")
                dataset_name = f"{clean_lora_name}_continue_{timestamp}"
            else:
                dataset_name = f"user_dataset_{timestamp}"
            dataset_dir = Path("training_data") / dataset_name
            is_appending = False
        
        audio_dir = dataset_dir / "audio"
        audio_dir.mkdir(parents=True, exist_ok=True)
        
        logger.info(f"Processing {len(audio_files)} audio files with metadata_table={metadata_table}")
        
        # Process audio files
        processed_files = []
        processed_metadata = []
        
        for i, audio_file in enumerate(audio_files):
            logger.info(f"Processing file {i+1}/{len(audio_files)}: {audio_file.name if hasattr(audio_file, 'name') else audio_file}")
            
            # Get metadata from table
            has_metadata = metadata_table is not None and len(metadata_table) > 0 and i < len(metadata_table)
            
            # Additional check: verify row has actual data (not just empty cells)
            row_data = None
            if has_metadata:
                row_data = metadata_table.iloc[i]
                # Check if the row has a filename (first non-empty indicator)
                has_metadata = bool(row_data['File'])
            
            logger.info(f"has_metadata={has_metadata}, metadata_table length={len(metadata_table) if metadata_table is not None else 'None'}")
            
            if has_metadata and row_data is not None:
                # Access DataFrame using the row we already retrieved
                file_metadata = {
                    'genre': row_data['Genre'] if row_data['Genre'] else 'unknown',
                    'bpm': int(row_data['BPM']) if row_data['BPM'] and row_data['BPM'] != '' else 120,
                    'key': row_data['Key'] if row_data['Key'] else 'C major',
                    'mood': row_data['Mood'] if row_data['Mood'] else 'medium',
                    'instrumentation': row_data['Instruments'] if row_data['Instruments'] else '',
                    'description': row_data['Description'] if row_data['Description'] else ''
                }
            else:
                # Analyze if no metadata
                file_metadata = analyzer.analyze_audio(audio_file.name)
            
            # Copy file to persistent storage
            dest_filename = f"sample_{i:06d}.wav"
            dest_path = audio_dir / dest_filename
            shutil.copy2(audio_file.name, dest_path)
            
            processed_files.append(str(dest_path))
            processed_metadata.append(file_metadata)
        
        # Load existing dataset info if appending
        metadata_path = dataset_dir / 'dataset_info.json'
        existing_dataset_info = None
        if is_appending and metadata_path.exists():
            with open(metadata_path, 'r') as f:
                existing_dataset_info = json.load(f)
            # Append to existing files
            existing_files = existing_dataset_info.get('train_files', []) + existing_dataset_info.get('val_files', [])
            existing_metadata = existing_dataset_info.get('train_metadata', []) + existing_dataset_info.get('val_metadata', [])
            all_files = existing_files + processed_files
            all_metadata = existing_metadata + processed_metadata
        else:
            all_files = processed_files
            all_metadata = processed_metadata
        
        # Split into train/val
        num_train = int(len(all_files) * 0.9)
        train_files = all_files[:num_train]
        val_files = all_files[num_train:]
        train_metadata = all_metadata[:num_train]
        val_metadata = all_metadata[num_train:]
        
        # Save dataset metadata
        dataset_info = {
            'dataset_name': dataset_name,
            'dataset_key': dataset_name,
            'is_user_dataset': True,
            'continue_training': continue_training,
            'base_lora': base_lora_name if continue_training else None,
            'created_date': existing_dataset_info.get('created_date', datetime.now().isoformat()) if existing_dataset_info else datetime.now().isoformat(),
            'last_updated': datetime.now().isoformat(),
            'prepared': True,
            'num_train_samples': len(train_files),
            'num_val_samples': len(val_files),
            'train_files': train_files,
            'val_files': val_files,
            'train_metadata': train_metadata,
            'val_metadata': val_metadata,
            'train_val_split': 0.9
        }
        
        with open(metadata_path, 'w') as f:
            json.dump(dataset_info, f, indent=2)
        
        if is_appending:
            result_msg = f"✅ Added {len(processed_files)} samples to dataset '{dataset_name}'\n📊 Total: {len(all_files)} samples ({len(train_files)} train, {len(val_files)} val)\n📁 Location: {dataset_dir}"
        else:
            result_msg = f"✅ Prepared user dataset '{dataset_name}' with {len(processed_files)} samples ({len(train_files)} train, {len(val_files)} val)\n📁 Saved to: {dataset_dir}"
        
        if continue_training and base_lora_name:
            result_msg += f"\n\n🔄 This dataset is set to continue training from: {base_lora_name}\n💡 Use the 'Training Configuration' tab and select this dataset to start training."
        
        return result_msg
        
    except Exception as e:
        logger.error(f"Dataset preparation failed: {e}", exc_info=True)
        return f"❌ Error: {str(e)}\n\n🔍 Check the logs for detailed error information"

def refresh_dataset_list():
    """Refresh list of available datasets for training"""
    try:
        from backend.services.dataset_service import DatasetService
        
        dataset_service = DatasetService()
        all_datasets = dataset_service.get_all_available_datasets()
        
        # Filter to only prepared datasets
        prepared_datasets = []
        for key, info in all_datasets.items():
            if info.get('prepared'):
                # Format: dataset_key (num_train + num_val samples)
                num_samples = info.get('num_train_samples', 0) + info.get('num_val_samples', 0)
                display_name = f"{key} ({num_samples} samples)"
                prepared_datasets.append(display_name)
        
        if not prepared_datasets:
            prepared_datasets = ["No prepared datasets available"]
        
        # Return two dropdowns with same choices
        # First for training, second for appending
        default_value = prepared_datasets[0] if prepared_datasets and prepared_datasets[0] != "No prepared datasets available" else None
        return gr.Dropdown(choices=prepared_datasets, value=default_value), gr.Dropdown(choices=prepared_datasets, value=None, visible=False)
        
    except Exception as e:
        logger.error(f"Failed to refresh datasets: {e}")
        return gr.Dropdown(choices=["Error loading datasets"])

def auto_populate_lora_name(dataset):
    """Auto-populate LoRA name based on selected dataset, and auto-configure continue training if applicable"""
    try:
        if not dataset or dataset == "No prepared datasets available" or dataset == "Error loading datasets":
            return "", gr.update(), gr.update()
        
        # Extract dataset key from display name
        dataset_key = dataset.split(" (")[0].strip()
        
        # Check if this dataset is set for continue training
        from pathlib import Path
        import json
        
        dataset_dir = Path("training_data") / dataset_key
        metadata_path = dataset_dir / 'dataset_info.json'
        
        use_base_lora = False
        base_lora_value = None
        
        if metadata_path.exists():
            with open(metadata_path, 'r') as f:
                dataset_info = json.load(f)
            
            # Check if this dataset is for continue training
            if dataset_info.get('continue_training') and dataset_info.get('base_lora'):
                use_base_lora = True
                base_lora_value = dataset_info['base_lora']
        
        # Generate versioned name
        import time
        timestamp = int(time.time()) % 10000  # Last 4 digits of timestamp
        lora_name = f"{dataset_key}_v1_{timestamp}"
        
        # Return: lora_name, use_existing_lora checkbox, base_lora_adapter dropdown
        return lora_name, gr.update(value=use_base_lora), gr.update(value=base_lora_value)
        
    except Exception as e:
        logger.error(f"Failed to auto-populate LoRA name: {e}")
        return "", gr.update(), gr.update()

def load_lora_for_training(lora_name):
    """Load a LoRA adapter's configuration for continued training"""
    try:
        if not lora_name:
            return "", "❌ No LoRA selected"
        
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        # Check if LoRA exists
        lora_path = Path("models/loras") / lora_name
        if not lora_path.exists():
            return "", f"❌ LoRA not found: {lora_name}"
        
        # Load metadata to get original dataset
        import json
        metadata_path = lora_path / "metadata.json"
        dataset_name = ""
        
        if metadata_path.exists():
            with open(metadata_path, 'r') as f:
                metadata = json.load(f)
                dataset_name = metadata.get('dataset', '')
        
        # Generate new LoRA name for continued training
        import time
        timestamp = int(time.time()) % 10000
        new_lora_name = f"{lora_name}_continued_{timestamp}"
        
        status = f"✅ Loaded LoRA: {lora_name}\n"
        status += f"💡 Suggested name for continued training: {new_lora_name}\n"
        if dataset_name:
            status += f"📊 Original dataset: {dataset_name}\n"
        status += "\n⚠️ Remember to select a dataset before starting training!"
        
        return new_lora_name, status
        
    except Exception as e:
        logger.error(f"Failed to load LoRA for training: {e}")
        return "", f"❌ Error: {str(e)}"

def download_lora_from_hf(lora_path_or_id):
    """Download a LoRA from HuggingFace dataset repo"""
    try:
        if not lora_path_or_id or not lora_path_or_id.strip():
            return "❌ Please enter a LoRA path or ID"
        
        # Clean input
        lora_input = lora_path_or_id.strip()
        
        # Extract LoRA name from various input formats
        # Format 1: "loras/jazz-v1" (path in dataset repo)
        # Format 2: "jazz-v1" (just the name)
        # Format 3: Full URL
        
        if lora_input.startswith("http"):
            # Extract from URL
            if "/loras/" in lora_input:
                lora_name = lora_input.split("/loras/")[-1].split(".")[0]
            else:
                return "❌ Invalid URL format. Expected format: .../loras/name.zip"
        elif lora_input.startswith("loras/"):
            # Remove loras/ prefix
            lora_name = lora_input[6:]
        else:
            # Assume it's just the name
            lora_name = lora_input
        
        # Download from dataset repo
        target_dir = Path("models/loras") / lora_name
        lora_path = f"loras/{lora_name}"
        
        logger.info(f"Downloading LoRA: {lora_name} from dataset repo...")
        
        success = hf_storage.download_lora(lora_path, target_dir)
        
        if success:
            return f"✅ Downloaded LoRA: {lora_name}\n💾 Saved to: models/loras/{lora_name}\n\n🎵 LoRA is now available for generation and training!"
        else:
            return f"❌ Failed to download LoRA: {lora_name}\n💡 Check that the LoRA exists in the dataset repo"
        
    except Exception as e:
        logger.error(f"Failed to download LoRA from HF: {e}", exc_info=True)
        return f"❌ Error: {str(e)}"

def start_lora_training(lora_name, dataset, batch_size, learning_rate, num_epochs, lora_rank, lora_alpha, use_base_lora, base_lora):
    """Start LoRA training"""
    try:
        if not lora_name:
            return "❌ Please enter LoRA adapter name", ""
        
        if not dataset or dataset == "No prepared datasets available" or dataset == "Error loading datasets":
            return "❌ Please select a valid dataset", ""
        
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        # Extract dataset key from display name (format: "dataset_key (N samples)")
        dataset_key = dataset.split(" (")[0].strip()
        
        # Handle base LoRA if continuing training
        base_lora_path = None
        if use_base_lora and base_lora:
            # Extract LoRA name from dropdown selection (format: "[Local] name" or "[HF] name")
            if base_lora.startswith('[Local] '):
                base_lora_name = base_lora.replace('[Local] ', '')
                base_lora_path = str(Path('models/loras') / base_lora_name)
                logger.info(f"Continuing training from local LoRA: {base_lora_path}")
            elif base_lora.startswith('[HF] '):
                base_lora_name = base_lora.replace('[HF] ', '')
                # Download from HuggingFace if needed
                target_dir = Path('models/loras') / base_lora_name
                if not target_dir.exists():
                    logger.info(f"Downloading base LoRA from HF: {base_lora_name}")
                    if hf_storage.download_lora(f"loras/{base_lora_name}", target_dir):
                        base_lora_path = str(target_dir)
                    else:
                        return f"❌ Failed to download base LoRA: {base_lora_name}", ""
                else:
                    base_lora_path = str(target_dir)
                    logger.info(f"Using downloaded HF LoRA: {base_lora_path}")
        
        # Training config
        config = {
            'batch_size': int(batch_size),
            'learning_rate': float(learning_rate),
            'num_epochs': int(num_epochs),
            'lora_rank': int(lora_rank),
            'lora_alpha': int(lora_alpha),
            'base_lora_path': base_lora_path  # Add base LoRA path to config
        }
        
        # Progress callback
        progress_log = []
        def progress_callback(status):
            progress_log.append(
                f"Epoch {status['epoch']} | Step {status['step']} | Loss: {status['loss']:.4f} | Progress: {status['progress']:.1f}%"
            )
            return "\n".join(progress_log[-20:])  # Last 20 lines
        
        # Start training
        progress = f"🚀 Starting training: {lora_name}\nDataset: {dataset_key}\n"
        if base_lora_path:
            progress += f"📂 Base LoRA: {base_lora}\n"
        progress += f"Config: {config}\n\n"
        log = "Training started...\n"
        if base_lora_path:
            log += f"Continuing from base LoRA: {base_lora_path}\n"
        
        # Note: In production, this should run in a background thread
        # For now, this is a simplified synchronous version
        results = lora_service.train_lora(
            dataset_key,
            lora_name,
            training_type="vocal",
            config=config,
            progress_callback=progress_callback
        )
        
        progress += f"\n✅ Training complete!\nFinal validation loss: {results['final_val_loss']:.4f}"
        log += f"\n\nTraining Results:\n{json.dumps(results, indent=2)}"
        
        # Upload trained LoRA to HF dataset repo
        progress += "\n\n📤 Uploading LoRA to HuggingFace dataset repo..."
        lora_dir = Path("models/loras") / lora_name
        if lora_dir.exists():
            try:
                # Upload with training config for proper metadata
                upload_result = hf_storage.upload_lora(lora_dir, training_config=config)
                if upload_result and 'repo_id' in upload_result:
                    progress += f"\n✅ LoRA uploaded successfully!"
                    progress += f"\n🔗 Path: {upload_result['repo_id']}"
                    progress += f"\n👁️ View: {upload_result['url']}"
                    progress += f"\n📚 Dataset Repo: {upload_result['dataset_repo']}"
                elif upload_result is None:
                    # Check if it failed due to auth
                    if not hf_storage.token:
                        progress += "\n⚠️ Upload skipped - not logged in to HuggingFace"
                        progress += "\n💡 To enable uploads: Duplicate this Space and log in"
                    else:
                        progress += "\n⚠️ LoRA trained but upload failed (saved locally)"
                    progress += f"\n💾 LoRA saved locally: models/loras/{lora_name}"
                else:
                    progress += "\n⚠️ LoRA trained but upload failed (saved locally)"
                    progress += f"\n💾 LoRA saved locally: models/loras/{lora_name}"
            except Exception as upload_err:
                logger.error(f"LoRA upload error: {upload_err}", exc_info=True)
                progress += f"\n⚠️ Upload error: {str(upload_err)}"
                progress += f"\n💾 LoRA saved locally: models/loras/{lora_name}"
        else:
            progress += "\n⚠️ LoRA directory not found after training"
        
        return progress, log
        
    except Exception as e:
        logger.error(f"Training failed: {e}", exc_info=True)
        return f"❌ Error: {str(e)}", str(e)

def stop_lora_training():
    """Stop current training"""
    try:
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        lora_service.stop_training()
        return "⏹️ Training stopped"
        
    except Exception as e:
        logger.error(f"Failed to stop training: {e}")
        return f"❌ Error: {str(e)}"

def refresh_lora_list():
    """Refresh list of LoRA adapters"""
    try:
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        adapters = lora_service.list_lora_adapters()
        
        # Format as table
        table_data = []
        lora_names = []
        
        for adapter in adapters:
            table_data.append([
                adapter.get('name', ''),
                adapter.get('saved_at', ''),
                adapter.get('training_steps', 0),
                adapter.get('training_type', 'unknown')
            ])
            lora_names.append(adapter.get('name', ''))
        
        # Return table data and update dropdowns (action dropdown, base_lora dropdown, and user_base_lora dropdown)
        return table_data, gr.Dropdown(choices=lora_names), gr.Dropdown(choices=lora_names), gr.Dropdown(choices=lora_names)
        
    except Exception as e:
        logger.error(f"Failed to refresh LoRA list: {e}")
        return [], gr.Dropdown(choices=[]), gr.Dropdown(choices=[]), gr.Dropdown(choices=[])

def get_available_loras():
    """Get list of available LoRA adapter names"""
    try:
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        adapters = lora_service.list_lora_adapters()
        lora_names = [adapter.get('name', '') for adapter in adapters if adapter.get('name')]
        
        return lora_names
    except Exception as e:
        logger.error(f"Failed to get available LoRAs: {e}")
        return []

def delete_lora(lora_name):
    """Delete selected LoRA adapter"""
    try:
        if not lora_name:
            return "❌ No LoRA selected"
        
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        success = lora_service.delete_lora_adapter(lora_name)
        
        if success:
            return f"✅ Deleted LoRA adapter: {lora_name}"
        else:
            return f"❌ Failed to delete: {lora_name}"
        
    except Exception as e:
        logger.error(f"Failed to delete LoRA: {e}")
        return f"❌ Error: {str(e)}"

def download_lora(lora_name):
    """Export LoRA adapter as zip file for download"""
    try:
        if not lora_name:
            return None, "❌ No LoRA selected"
        
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        zip_path = lora_service.export_lora_adapter(lora_name)
        
        if zip_path:
            # Return the file path for Gradio to handle the download
            return zip_path, f"✅ Ready to download: {lora_name}.zip (click the file above to download)"
        else:
            return None, f"❌ Failed to export: {lora_name}"
        
    except Exception as e:
        logger.error(f"Failed to export LoRA: {e}")
        return None, f"❌ Error: {str(e)}"

def upload_lora(zip_file):
    """Import LoRA adapter from zip file"""
    try:
        if not zip_file:
            return "❌ No file selected"
        
        from backend.services.lora_training_service import LoRATrainingService
        lora_service = LoRATrainingService()
        
        lora_name = lora_service.import_lora_adapter(zip_file)
        
        if lora_name:
            return f"✅ Imported LoRA adapter: {lora_name}"
        else:
            return "❌ Failed to import LoRA"
        
    except Exception as e:
        logger.error(f"Failed to import LoRA: {e}")
        return f"❌ Error: {str(e)}"

def toggle_base_lora(use_existing):
    """Toggle visibility of base LoRA dropdown and populate choices"""
    if not use_existing:
        return gr.update(visible=False)
    
    # Get available LoRAs when showing dropdown
    try:
        lora_choices = get_available_loras()
        
        if not lora_choices:
            return gr.update(
                visible=True,
                choices=["⚠️ No LoRAs available"],
                value="⚠️ No LoRAs available",
                interactive=False
            )
        
        return gr.update(
            visible=True,
            choices=lora_choices,
            value=lora_choices[0] if lora_choices else None,
            interactive=True
        )
    except Exception as e:
        logger.error(f"Failed to load LoRAs: {e}")
        return gr.update(
            visible=True,
            choices=["❌ Error loading LoRAs"],
            value="❌ Error loading LoRAs",
            interactive=False
        )

def toggle_append_dataset(should_append):
    """Toggle visibility of existing dataset dropdown with validation"""
    if not should_append:
        return gr.update(visible=False)
    
    # Get available datasets when showing dropdown
    try:
        from backend.services.dataset_service import DatasetService
        dataset_service = DatasetService()
        all_datasets = dataset_service.get_all_available_datasets()
        
        prepared_datasets = []
        for key, info in all_datasets.items():
            if info.get('prepared'):
                num_samples = info.get('num_train_samples', 0) + info.get('num_val_samples', 0)
                display_name = f"{key} ({num_samples} samples)"
                prepared_datasets.append(display_name)
        
        if not prepared_datasets:
            # No datasets available
            return gr.update(
                visible=True, 
                choices=["⚠️ No datasets available - create one first"],
                value="⚠️ No datasets available - create one first",
                interactive=False
            )
        
        return gr.update(
            visible=True, 
            choices=prepared_datasets,
            value=None,
            interactive=True
        )
    except Exception as e:
        return gr.update(
            visible=True,
            choices=[f"❌ Error loading datasets: {str(e)}"],
            value=None,
            interactive=False
        )

def export_dataset(dataset_key):
    """Export prepared dataset as zip file"""
    try:
        if not dataset_key:
            return None, "❌ No dataset selected"
        
        from backend.services.dataset_service import DatasetService
        dataset_service = DatasetService()
        
        zip_path = dataset_service.export_prepared_dataset(dataset_key)
        
        if zip_path:
            return zip_path, f"✅ Dataset exported: {dataset_key}.zip"
        else:
            return None, f"❌ Failed to export: {dataset_key}"
        
    except Exception as e:
        logger.error(f"Failed to export dataset: {e}")
        return None, f"❌ Error: {str(e)}"

def import_dataset(zip_file):
    """Import prepared dataset from zip file"""
    try:
        if not zip_file:
            return "❌ No file selected"
        
        from backend.services.dataset_service import DatasetService
        dataset_service = DatasetService()
        
        dataset_key = dataset_service.import_prepared_dataset(zip_file)
        
        if dataset_key:
            return f"✅ Imported dataset: {dataset_key}"
        else:
            return "❌ Failed to import dataset"
        
    except Exception as e:
        logger.error(f"Failed to import dataset: {e}")
        return f"❌ Error: {str(e)}"

def refresh_export_dataset_list():
    """Refresh list of datasets available for export"""
    try:
        from backend.services.dataset_service import DatasetService
        dataset_service = DatasetService()
        
        # Get all available datasets (both HF and user)
        all_datasets = dataset_service.get_all_available_datasets()
        
        # Filter to only prepared datasets
        prepared = []
        for key, info in all_datasets.items():
            if info.get('prepared', False):
                prepared.append(key)
        
        return gr.Dropdown(choices=prepared)
        
    except Exception as e:
        logger.error(f"Failed to refresh export list: {e}")
        return gr.Dropdown(choices=[])

# MSD Genre Suggestion Functions
def get_available_genres():
    """Get list of available genres from MSD database"""
    # Default genres (available even before importing sample data)
    default_genres = [
        "rock", "pop", "electronic", "jazz", "classical",
        "metal", "hip-hop", "country", "blues", "folk"
    ]
    
    try:
        initialize_msd_services()
        
        if not genre_profiler:
            return default_genres
        
        genres = genre_profiler.get_all_genre_names()
        # Return database genres if available, otherwise use defaults
        return genres if genres else default_genres
    except Exception as e:
        logger.error(f"Failed to get genres: {e}")
        return default_genres

def suggest_parameters_for_genre(genre: str):
    """Get parameter suggestions based on genre profile"""
    initialize_msd_services()
    
    if not genre_profiler or not genre:
        return "Select a genre to see parameter suggestions", "", ""
    
    try:
        suggestions = genre_profiler.suggest_parameters_for_genre(genre)
        
        if not suggestions:
            return f"No profile data available for genre: {genre}", "", ""
        
        # Format suggestions
        info_text = f"""
### 🎵 Genre Profile: {genre.title()}

**Tempo (BPM):** {suggestions.get('tempo_bpm', 'N/A')} BPM
**Recommended Range:** {suggestions['tempo_range']['min']:.0f} - {suggestions['tempo_range']['max']:.0f} BPM

**Common Keys:** {', '.join(suggestions.get('recommended_keys', ['N/A']))}
**Preferred Mode:** {suggestions.get('recommended_mode', 'N/A')}

**Energy Level:** {suggestions.get('energy_level', 'N/A')}
**Danceability:** {suggestions.get('danceability', 'N/A')}

💡 *These suggestions are based on analysis of existing {genre} tracks*
"""
        
        # Generate prompt suggestion
        tempo = suggestions.get('tempo_bpm', 120)
        mode = 'major' if 'major' in str(suggestions.get('recommended_mode', '')).lower() else 'minor'
        
        prompt_suggestion = f"{genre} song at {tempo:.0f} BPM, {mode} key"
        
        # BPM value for slider
        bpm_value = int(tempo)
        
        return info_text, prompt_suggestion, bpm_value
        
    except Exception as e:
        logger.error(f"Error getting genre suggestions: {e}")
        return f"Error: {str(e)}", "", ""

def import_msd_sample_data(count: int = 1000):
    """Import sample MSD data for testing"""
    initialize_msd_services()
    
    if not msd_importer:
        return "❌ MSD services not available"
    
    try:
        logger.info(f"Importing {count} sample songs...")
        result = msd_importer.import_sample_data(count)
        
        status = f"""
✅ Import Complete!

**Songs Imported:** {result['imported']} / {result['total']}
**Failed:** {result['failed']}
**Genres Analyzed:** {result['genres_analyzed']}
**Key-Tempo Patterns:** {result['patterns_saved']}

Database is ready for genre-based parameter suggestions!
"""
        
        return status
        
    except Exception as e:
        logger.error(f"Error importing sample data: {e}")
        return f"❌ Error: {str(e)}"

def get_msd_database_stats():
    """Get current MSD database statistics"""
    initialize_msd_services()
    
    if not msd_db_service:
        return "MSD services not available"
    
    try:
        stats = msd_db_service.get_database_stats()
        
        if stats.get('total_songs', 0) == 0:
            return "Database is empty. Click 'Import Sample Data' to get started."
        
        top_genres = stats.get('top_genres', {})
        genre_list = '\n'.join([f"- {genre}: {count} songs" for genre, count in list(top_genres.items())[:5]])
        
        stats_text = f"""
### 📊 Database Statistics

**Total Songs:** {stats.get('total_songs', 0):,}
**Unique Genres:** {stats.get('genres_count', 0)}

**Top Genres:**
{genre_list}

**Tempo Range:** {stats.get('tempo_min', 0):.0f} - {stats.get('tempo_max', 0):.0f} BPM
**Average Tempo:** {stats.get('tempo_avg', 0):.0f} BPM
"""
        
        return stats_text
        
    except Exception as e:
        logger.error(f"Error getting database stats: {e}")
        return f"Error: {str(e)}"

# Music Theory Functions
def get_theory_suggestions(genre: str, tempo: float, key_index: int, mode_index: int):
    """Get comprehensive music theory suggestions"""
    initialize_theory_services()
    
    if not theory_constraint_service:
        return "Music theory services not available"
    
    try:
        # Convert indices to values
        key_names = ['C', 'C#', 'D', 'D#', 'E', 'F', 'F#', 'G', 'G#', 'A', 'A#', 'B']
        mode_names = ['minor', 'major']
        
        key = key_index
        mode = mode_index
        
        suggestions = theory_constraint_service.suggest_generation_constraints(
            genre, tempo, key, mode
        )
        
        # Format output
        prog_str = '\n'.join([
            f"- {i+1}. {' → '.join(p['progression'])}: {p['description']}"
            for i, p in enumerate(suggestions.get('recommended_progressions', []))
        ])
        
        compat_keys = '\n'.join([
            f"- {k['key_name']} {k['mode_name']}: {k['relationship']} ({k['strength']})"
            for k in suggestions.get('compatible_keys', [])
        ])
        
        output = f"""
### 🎼 Music Theory Suggestions

**Key:** {suggestions['key']} {suggestions['mode']}  
**Scale Notes:** {', '.join(suggestions.get('scale_notes', []))}  
**Tempo:** {tempo} BPM  
**Genre:** {genre}

---

### 🎵 Recommended Chord Progressions
{prog_str}

---

### 🔄 Compatible Keys for Transitions
{compat_keys}

---

### ⚙️ Generation Constraints
- **Allowed Notes:** {', '.join([suggestions['scale_notes'][i] for i in range(min(7, len(suggestions['scale_notes'])))])}
- **Tempo Range:** {suggestions['constraints']['tempo_range'][0]:.0f} - {suggestions['constraints']['tempo_range'][1]:.0f} BPM
- **Time Signature:** {suggestions['constraints'].get('time_signature', '4/4')}

💡 *These suggestions are based on music theory principles and common practices*
"""
        
        return output
        
    except Exception as e:
        logger.error(f"Error getting theory suggestions: {e}")
        return f"Error: {str(e)}"

def import_midi_sample_data(count: int = 100):
    """Import sample MIDI data for testing"""
    initialize_theory_services()
    
    if not lakh_midi_service:
        return "❌ MIDI services not available"
    
    try:
        logger.info(f"Importing {count} sample MIDI files...")
        result = lakh_midi_service.import_sample_data(count)
        
        status = f"""
✅ MIDI Import Complete!

**MIDI Files Imported:** {result['imported']} / {result['total']}
**Failed:** {result['failed']}

MIDI database is ready for chord progression analysis!
"""
        
        return status
        
    except Exception as e:
        logger.error(f"Error importing MIDI data: {e}")
        return f"❌ Error: {str(e)}"

def get_midi_stats():
    """Get MIDI database statistics"""
    initialize_theory_services()
    
    if not lakh_midi_service:
        return "MIDI services not available"
    
    try:
        stats = lakh_midi_service.get_midi_stats()
        
        if stats.get('total_midi_files', 0) == 0:
            return "MIDI database is empty. Click 'Import MIDI Data' to get started."
        
        stats_text = f"""
### 📊 MIDI Database Statistics

**Total MIDI Files:** {stats.get('total_midi_files', 0):,}
**Chord Progressions:** {stats.get('total_progressions', 0):,}
**Average Tempo:** {stats.get('avg_tempo', 0):.0f} BPM

Database contains analyzed chord progressions and melodic patterns for music theory-aware generation!
"""
        
        return stats_text
        
    except Exception as e:
        logger.error(f"Error getting MIDI stats: {e}")
        return f"Error: {str(e)}"

# Create Gradio interface
with gr.Blocks(
    title="LEMM - Let Everyone Make Music v1.0.0 (beta)",
    theme=gr.themes.Soft(primary_hue="purple", secondary_hue="pink")
) as app:
    
    gr.Markdown(
        """
        # 🎵 LEMM - Let Everyone Make Music
        **Version 1.0.0 (beta)**
        
        Advanced AI music generator with built-in training, EQ, Mastering, and Super Resolution. Training data is stored safely on a separate repo for download / reuse.
        """
    )
    
    # Timeline state - stored as JSON string to avoid Gradio schema validation errors
    # Functions will parse/stringify as needed
    timeline_state = gr.State(value='{"clips": []}')
    
    # Generation Section
    gr.Markdown("### 🎼 Music Generation")
    
    prompt_input = gr.Textbox(
        label="🎯 Music Prompt",
        placeholder="energetic rock song with electric guitar at 140 BPM",
        lines=3,
        info="Describe the music style, instruments, tempo, and mood"
    )
    
    # Genre-based Parameter Suggestions (MSD Integration)
    with gr.Accordion("🎸 Genre-Based Parameter Suggestions (Beta)", open=False):
        gr.Markdown("""
            Get AI-powered parameter suggestions based on analysis of real music!
            Select a genre to see recommended BPM, keys, and musical characteristics.
        """)
        
        with gr.Row():
            genre_selector = gr.Dropdown(
                label="Select Genre",
                choices=get_available_genres(),
                value=None,
                interactive=True
            )
            refresh_genres_btn = gr.Button("🔄 Refresh Genres", size="sm")
        
        genre_suggestions_output = gr.Markdown(
            value="Select a genre to see parameter suggestions"
        )
        
        with gr.Row():
            apply_prompt_btn = gr.Button("Apply to Prompt", size="sm")
            apply_bpm_btn = gr.Button("Apply BPM", size="sm", visible=False)
        
        # Hidden state for BPM value
        suggested_bpm = gr.Number(value=120, visible=False)
        
        with gr.Accordion("📊 Database Management", open=False):
            with gr.Row():
                import_sample_btn = gr.Button("Import Sample Data (1000 songs)", size="sm")
                show_stats_btn = gr.Button("Show Database Stats", size="sm")
            
            import_count_slider = gr.Slider(
                minimum=100,
                maximum=5000,
                value=1000,
                step=100,
                label="Number of sample songs to import",
                visible=False
            )
            
            msd_status_output = gr.Markdown(value="")
    
    # Music Theory Suggestions (Phase 2)
    with gr.Accordion("🎼 Music Theory & Chord Progressions (Beta)", open=False):
        gr.Markdown("""
            Get AI-powered music theory suggestions including chord progressions,
            compatible keys, and theory-based constraints for your generation!
        """)
        
        with gr.Row():
            theory_genre = gr.Dropdown(
                label="Genre",
                choices=["pop", "rock", "jazz", "blues", "electronic", "metal", "hip-hop", "classical"],
                value="pop"
            )
            theory_tempo = gr.Slider(
                minimum=60,
                maximum=200,
                value=120,
                step=5,
                label="Tempo (BPM)"
            )
        
        with gr.Row():
            theory_key = gr.Dropdown(
                label="Key",
                choices=["C", "C#", "D", "D#", "E", "F", "F#", "G", "G#", "A", "A#", "B"],
                value="C"
            )
            theory_mode = gr.Dropdown(
                label="Mode",
                choices=["minor", "major"],
                value="major"
            )
        
        get_theory_btn = gr.Button("🔍 Get Theory Suggestions", variant="primary")
        
        theory_output = gr.Markdown(value="Click 'Get Theory Suggestions' to see recommendations")
        
        with gr.Accordion("📊 MIDI Database Management", open=False):
            with gr.Row():
                import_midi_btn = gr.Button("Import MIDI Data (100 files)", size="sm")
                show_midi_stats_btn = gr.Button("Show MIDI Stats", size="sm")
            
            midi_status_output = gr.Markdown(value="")
    
    lyrics_mode = gr.Radio(
        choices=["Instrumental", "User Lyrics", "Auto Lyrics"],
        value="Instrumental",
        label="🎤 Vocal Mode",
        info="Instrumental: no vocals | User: provide lyrics | Auto: AI-generated"
    )
    
    with gr.Row():
        auto_gen_btn = gr.Button("✍️ Generate Lyrics", size="sm")
    
    lyrics_input = gr.Textbox(
        label="📝 Lyrics",
        placeholder="Enter lyrics or click 'Generate Lyrics'...",
        lines=6
    )
    
    with gr.Row():
        context_length_input = gr.Slider(
            minimum=0,
            maximum=240,
            value=0,
            step=10,
            label="🎨 Style Context (seconds)",
            info="How far back to analyze for style consistency (0 = disabled, auto-disabled for first clip)",
            interactive=True
        )
        position_input = gr.Radio(
            choices=["intro", "previous", "next", "outro"],
            value="next",
            label="📍 Position",
            info="Where to add clip on timeline"
        )
    
    with gr.Row():
        use_lora_for_gen = gr.Checkbox(
            label="🎛️ Use LoRA Adapter",
            value=False,
            info="Apply a custom LoRA adapter to generation"
        )
        selected_lora_for_gen = gr.Dropdown(
            label="Select LoRA",
            choices=[],
            visible=False,
            interactive=True
        )
    
    gr.Markdown("*All clips are generated at 32 seconds*")
    
    with gr.Row():
        generate_btn = gr.Button(
            "✨ Generate Music Clip",
            variant="primary",
            size="lg"
        )
    
    gen_status = gr.Textbox(label="📊 Status", lines=2, interactive=False)
    audio_output = gr.Audio(
        label="🎧 Preview", 
        type="filepath",
        waveform_options=gr.WaveformOptions(
            waveform_color="#9333ea",
            waveform_progress_color="#c084fc"
        )
    )
    
    # Timeline Section
    gr.Markdown("---")
    gr.Markdown("### 📊 Timeline")
    
    timeline_display = gr.HTML(
        value=get_timeline_display()
    )
    
    # Playback controls
    timeline_playback = gr.Audio(
        label="🎵 Timeline Playback",
        type="filepath",
        interactive=False,
        autoplay=False,
        waveform_options=gr.WaveformOptions(
            waveform_color="#06b6d4",
            waveform_progress_color="#22d3ee",
            show_controls=True
        )
    )
    
    with gr.Row():
        play_timeline_btn = gr.Button("▶️ Load Timeline for Playback", variant="secondary", scale=2)
        clip_number_input = gr.Number(
            label="Clip #",
            precision=0,
            minimum=1,
            scale=1
        )
        remove_btn = gr.Button("🗑️ Remove Clip", size="sm", scale=1)
        clear_btn = gr.Button("🗑️ Clear All", variant="stop", scale=1)
    
    timeline_status = gr.Textbox(label="Timeline Status", lines=1, interactive=False)
    
    # Advanced Controls
    with gr.Accordion("⚙️ Advanced Audio Mastering", open=False):
        gr.Markdown("### Professional Mastering & EQ")
        
        with gr.Row():
            with gr.Column(scale=1):
                gr.Markdown("**Mastering Presets**")
                preset_select = gr.Dropdown(
                    choices=[
                        "Clean Master - Transparent mastering",
                        "Subtle Warmth - Gentle low-end enhancement",
                        "Modern Pop - Radio-ready pop sound",
                        "Radio Ready - Maximum loudness",
                        "Punchy Commercial - Aggressive punch",
                        "Rock Master - Guitar-focused mastering",
                        "Metal Aggressive - Heavy metal mastering",
                        "Indie Rock - Lo-fi indie character",
                        "EDM Club - Electronic dance music",
                        "House Groovy - House music vibe",
                        "Techno Dark - Dark techno atmosphere",
                        "Dubstep Heavy - Heavy bass dubstep",
                        "HipHop Modern - Modern hip-hop mix",
                        "Trap 808 - Trap with 808 bass",
                        "RnB Smooth - Smooth R&B sound",
                        "Acoustic Natural - Natural acoustic tone",
                        "Folk Warm - Warm folk sound",
                        "Jazz Vintage - Vintage jazz character",
                        "Orchestral Wide - Wide orchestral space",
                        "Classical Concert - Concert hall sound",
                        "Ambient Spacious - Spacious atmospheric",
                        "Harmonic Enhance - Adds brightness and warmth"
                    ],
                    value="Clean Master - Transparent mastering",
                    label="Select Preset"
                )
                
                preset_description = gr.Textbox(
                    label="Description",
                    value="Transparent mastering with gentle compression",
                    lines=2,
                    interactive=False
                )
                
                with gr.Row():
                    preview_preset_btn = gr.Button("🔊 Preview Preset", variant="secondary")
                    apply_preset_btn = gr.Button("✨ Apply to Timeline", variant="primary")
                
                preset_preview_audio = gr.Audio(
                    label="🎵 Preset Preview (Latest Clip)",
                    type="filepath",
                    interactive=False,
                    waveform_options=gr.WaveformOptions(
                        waveform_color="#9333ea",
                        waveform_progress_color="#c084fc"
                    )
                )
                preset_status = gr.Textbox(label="Status", lines=1, interactive=False)
            
            with gr.Column(scale=1):
                gr.Markdown("**Custom EQ**")
                gr.Markdown("*5-band parametric EQ. Adjust gain for each frequency band (-12 to +12 dB).*")
                
                # DAW-style vertical sliders in columns
                with gr.Row():
                    with gr.Column(scale=1):
                        gr.Markdown("<center>**Low**<br>100 Hz</center>")
                        low_shelf_gain = gr.Slider(
                            -12, 12, 0, step=0.5,
                            label="Low (100 Hz)"
                        )
                    
                    with gr.Column(scale=1):
                        gr.Markdown("<center>**Low-Mid**<br>500 Hz</center>")
                        low_mid_gain = gr.Slider(
                            -12, 12, 0, step=0.5,
                            label="Low-Mid (500 Hz)"
                        )
                    
                    with gr.Column(scale=1):
                        gr.Markdown("<center>**Mid**<br>2000 Hz</center>")
                        mid_gain = gr.Slider(
                            -12, 12, 0, step=0.5,
                            label="Mid (2000 Hz)"
                        )
                    
                    with gr.Column(scale=1):
                        gr.Markdown("<center>**High-Mid**<br>5000 Hz</center>")
                        high_mid_gain = gr.Slider(
                            -12, 12, 0, step=0.5,
                            label="High-Mid (5000 Hz)"
                        )
                    
                    with gr.Column(scale=1):
                        gr.Markdown("<center>**High**<br>10k Hz</center>")
                        high_shelf_gain = gr.Slider(
                            -12, 12, 0, step=0.5,
                            label="High (10k Hz)"
                        )
                
                with gr.Row():
                    preview_eq_btn = gr.Button("🔊 Preview EQ", variant="secondary")
                    apply_custom_eq_btn = gr.Button("🎹 Apply to Timeline", variant="primary")
                
                eq_preview_audio = gr.Audio(
                    label="🎵 EQ Preview (Latest Clip)",
                    type="filepath",
                    interactive=False,
                    waveform_options=gr.WaveformOptions(
                        waveform_color="#ec4899",
                        waveform_progress_color="#f9a8d4"
                    )
                )
                eq_status = gr.Textbox(label="Status", lines=1, interactive=False)
        
        # Audio Enhancement Section
        gr.Markdown("---")
        with gr.Row():
            with gr.Column(scale=1):
                gr.Markdown("**🎛️ Stem Enhancement**")
                gr.Markdown("*Separate and enhance vocals, drums, bass independently (improves AI audio quality)*")
                
                enhancement_level = gr.Radio(
                    choices=["Fast", "Balanced", "Maximum"],
                    value="Balanced",
                    label="Enhancement Level",
                    info="Fast: Quick denoise | Balanced: Best quality/speed | Maximum: Full processing"
                )
                
                enhance_timeline_btn = gr.Button("✨ Enhance All Clips", variant="primary")
                enhancement_status = gr.Textbox(label="Status", lines=2, interactive=False)
            
            with gr.Column(scale=1):
                gr.Markdown("**🔊 Audio Upscaling**")
                gr.Markdown("*Neural upsampling to 48kHz for enhanced high-frequency detail*")
                
                upscale_mode = gr.Radio(
                    choices=["Quick (Resample)", "Neural (AudioSR)"],
                    value="Quick (Resample)",
                    label="Upscale Method",
                    info="Quick: Fast resampling | Neural: AI-powered super resolution"
                )
                
                upscale_timeline_btn = gr.Button("⬆️ Upscale All Clips", variant="primary")
                upscale_status = gr.Textbox(label="Status", lines=2, interactive=False)
    
    # Export Section
    gr.Markdown("---")
    gr.Markdown("### 💾 Export")
    
    with gr.Row():
        export_filename = gr.Textbox(
            label="Filename",
            value="my_song",
            scale=2
        )
        export_format = gr.Dropdown(
            choices=["wav", "mp3"],
            value="wav",
            label="Format",
            scale=1
        )
        export_btn = gr.Button("💾 Export", variant="primary", scale=1)
    
    export_status = gr.Textbox(label="Status", lines=1, interactive=False)
    export_audio = gr.Audio(
        label="📥 Download", 
        type="filepath",
        waveform_options=gr.WaveformOptions(
            waveform_color="#10b981",
            waveform_progress_color="#34d399"
        )
    )
    
    # Event handlers
    # Genre Suggestions Event Handlers
    refresh_genres_btn.click(
        fn=lambda: gr.Dropdown(choices=get_available_genres()),
        inputs=[],
        outputs=[genre_selector]
    )
    
    genre_selector.change(
        fn=suggest_parameters_for_genre,
        inputs=[genre_selector],
        outputs=[genre_suggestions_output, prompt_input, suggested_bpm]
    )
    
    apply_prompt_btn.click(
        fn=lambda genre_info, current_prompt: current_prompt if not genre_info else genre_info,
        inputs=[prompt_input, prompt_input],
        outputs=[prompt_input]
    )
    
    import_sample_btn.click(
        fn=lambda count: import_msd_sample_data(count),
        inputs=[import_count_slider],
        outputs=[msd_status_output]
    ).then(
        fn=lambda: gr.Dropdown(choices=get_available_genres()),
        inputs=[],
        outputs=[genre_selector]
    )
    
    show_stats_btn.click(
        fn=get_msd_database_stats,
        inputs=[],
        outputs=[msd_status_output]
    )
    
    # Music Theory Event Handlers
    get_theory_btn.click(
        fn=lambda g, t, k, m: get_theory_suggestions(
            g, t, 
            ["C", "C#", "D", "D#", "E", "F", "F#", "G", "G#", "A", "A#", "B"].index(k),
            ["minor", "major"].index(m)
        ),
        inputs=[theory_genre, theory_tempo, theory_key, theory_mode],
        outputs=[theory_output]
    )
    
    import_midi_btn.click(
        fn=lambda: import_midi_sample_data(100),
        inputs=[],
        outputs=[midi_status_output]
    )
    
    show_midi_stats_btn.click(
        fn=get_midi_stats,
        inputs=[],
        outputs=[midi_status_output]
    )
    
    auto_gen_btn.click(
        fn=generate_lyrics,
        inputs=[prompt_input],
        outputs=lyrics_input
    )
    
    # LoRA selector for generation - reuse toggle_base_lora logic
    use_lora_for_gen.change(
        fn=toggle_base_lora,
        inputs=[use_lora_for_gen],
        outputs=[selected_lora_for_gen]
    )
    
    generate_btn.click(
        fn=generate_music,
        inputs=[prompt_input, lyrics_input, lyrics_mode, position_input, context_length_input, use_lora_for_gen, selected_lora_for_gen, timeline_state],
        outputs=[gen_status, timeline_display, audio_output, timeline_state]
    ).then(
        fn=get_timeline_playback,
        inputs=[timeline_state],
        outputs=[timeline_playback]
    )
    
    remove_btn.click(
        fn=remove_clip,
        inputs=[clip_number_input, timeline_state],
        outputs=[timeline_status, timeline_display, timeline_state]
    )
    
    clear_btn.click(
        fn=clear_timeline,
        inputs=[timeline_state],
        outputs=[timeline_status, timeline_display, timeline_state]
    )
    
    play_timeline_btn.click(
        fn=get_timeline_playback,
        inputs=[timeline_state],
        outputs=[timeline_playback]
    )
    
    export_btn.click(
        fn=export_timeline,
        inputs=[export_filename, export_format, timeline_state],
        outputs=[export_status, export_audio, timeline_state]
    )
    
    # Mastering event handlers
    preset_select.change(
        fn=update_preset_description,
        inputs=[preset_select],
        outputs=[preset_description]
    )
    
    preview_preset_btn.click(
        fn=preview_mastering_preset,
        inputs=[preset_select, timeline_state],
        outputs=[preset_preview_audio, preset_status]
    )
    
    apply_preset_btn.click(
        fn=apply_mastering_preset,
        inputs=[preset_select, timeline_state],
        outputs=[preset_status, timeline_state]
    ).then(
        fn=get_timeline_playback,
        inputs=[timeline_state],
        outputs=[timeline_playback]
    )
    
    preview_eq_btn.click(
        fn=preview_custom_eq,
        inputs=[low_shelf_gain, low_mid_gain, mid_gain, high_mid_gain, high_shelf_gain, timeline_state],
        outputs=[eq_preview_audio, eq_status]
    )
    
    apply_custom_eq_btn.click(
        fn=apply_custom_eq,
        inputs=[low_shelf_gain, low_mid_gain, mid_gain, high_mid_gain, high_shelf_gain, timeline_state],
        outputs=[eq_status, timeline_state]
    ).then(
        fn=get_timeline_playback,
        inputs=[timeline_state],
        outputs=[timeline_playback]
    )
    
    # Enhancement event handlers
    enhance_timeline_btn.click(
        fn=enhance_timeline_clips,
        inputs=[enhancement_level, timeline_state],
        outputs=[enhancement_status, timeline_state]
    ).then(
        fn=get_timeline_playback,
        inputs=[timeline_state],
        outputs=[timeline_playback]
    )
    
    upscale_timeline_btn.click(
        fn=upscale_timeline_clips,
        inputs=[upscale_mode, timeline_state],
        outputs=[upscale_status, timeline_state]
    ).then(
        fn=get_timeline_playback,
        inputs=[timeline_state],
        outputs=[timeline_playback]
    )
    
    # LoRA Training Section
    gr.Markdown("---")
    with gr.Accordion("🎓 LoRA Training (Advanced)", open=False):
        gr.Markdown(
            """
            # 🧠 Train Custom LoRA Adapters
            
            Fine-tune DiffRhythm2 with your own audio or curated datasets to create specialized music generation models.
            
            **Training is permanent** - LoRA adapters are saved to disk and persist across sessions.
            """
        )
        
        with gr.Tabs():
            # Tab 1: Dataset Training
            with gr.Tab("📚 Dataset Training"):
                gr.Markdown("### Pre-curated Dataset Training")
                gr.Markdown("Select datasets from the categories below. All datasets can be used for music generation training.")
                gr.Markdown("**Datasets persist across sessions** - once downloaded/prepared, they remain available.")
                
                refresh_datasets_status_btn = gr.Button("🔄 Refresh Dataset Status", size="sm", variant="secondary")
                
                with gr.Row():
                    with gr.Column():
                        gr.Markdown("**Music Datasets**")
                        vocal_datasets = gr.CheckboxGroup(
                            choices=[
                                "GTZAN Music Genre (1000 tracks, 10 genres)"
                            ],
                            label="Select Music Datasets",
                            info="Verified working music datasets (11TB storage available)"
                        )
                    
                    with gr.Column():
                        gr.Markdown("**Vocal & Sound Datasets**")
                        symbolic_datasets = gr.CheckboxGroup(
                            choices=[
                                "FSD50K Sound Events (51K clips, 200 classes)",
                                "LibriSpeech ASR (speech recognition)",
                                "LibriTTS (audiobooks for TTS)",
                                "AudioSet Strong (labeled audio events)",
                                "ESC-50 Environmental Sounds",
                                "UrbanSound8K (urban sounds)"
                            ],
                            label="Select Vocal/Sound Datasets",
                            info="Verified working vocal and sound datasets"
                        )
                
                with gr.Row():
                    dataset_download_btn = gr.Button("📥 Download Datasets", variant="secondary")
                    check_status_btn = gr.Button("📊 Check Downloaded Datasets", variant="secondary")
                
                dataset_status = gr.Textbox(
                    label="Download Status", 
                    lines=15, 
                    max_lines=25,
                    interactive=False,
                    show_copy_button=True
                )
                
                gr.Markdown("---")
                gr.Markdown("### 🔧 Prepare Downloaded Datasets for Training")
                gr.Markdown("After downloading, prepare datasets by extracting audio files and creating train/val splits.")
                
                prepare_datasets_selector = gr.CheckboxGroup(
                    choices=["gtzan", "fsd50k",
                             "librispeech", "libritts", "audioset_strong", "esc50", "urbansound8k"],
                    label="Select Downloaded Datasets to Prepare",
                    info="Only select datasets you've already downloaded above"
                )
                
                max_samples_slider = gr.Slider(
                    minimum=0,
                    maximum=10000,
                    value=1000,
                    step=100,
                    label="Max Samples per Dataset (0 = all)",
                    info="Limit samples to speed up preparation. 0 means process all samples."
                )
                
                prepare_btn = gr.Button("🔧 Prepare Datasets for Training", variant="primary")
                hf_prepare_status = gr.Textbox(
                    label="Preparation Status",
                    lines=15,
                    max_lines=25,
                    interactive=False,
                    show_copy_button=True
                )
            
            # Tab 2: User Audio Training
            with gr.Tab("🎵 User Audio Training"):
                gr.Markdown("### Train on Your Own Audio")
                
                user_audio_upload = gr.File(
                    label="Upload Audio Files (.wav)",
                    file_count="multiple",
                    file_types=[".wav"]
                )
                
                gr.Markdown("#### Audio Processing Options")
                
                with gr.Row():
                    split_to_clips = gr.Checkbox(
                        label="Auto-split into clips",
                        value=True,
                        info="Split long audio into 10-30s training clips"
                    )
                    separate_stems = gr.Checkbox(
                        label="Separate vocal stems",
                        value=False,
                        info="Extract vocals for vocal-only training (slower)"
                    )
                
                analyze_audio_btn = gr.Button("🔍 Analyze & Generate Metadata", variant="secondary")
                analysis_status = gr.Textbox(label="Analysis Status", lines=2, interactive=False)
                
                gr.Markdown("---")
                gr.Markdown("#### Metadata Editor")
                
                metadata_table = gr.Dataframe(
                    headers=["File", "Genre", "BPM", "Key", "Mood", "Instruments", "Description"],
                    datatype=["str", "str", "number", "str", "str", "str", "str"],
                    row_count=5,
                    col_count=(7, "fixed"),
                    label="Audio Metadata",
                    interactive=True
                )
                
                with gr.Row():
                    ai_generate_metadata_btn = gr.Button("✨ AI Generate All Metadata", size="sm")
                    save_metadata_btn = gr.Button("💾 Save Metadata", variant="primary", size="sm")
                
                metadata_status = gr.Textbox(label="Metadata Status", lines=1, interactive=False)
                
                gr.Markdown("---")
                gr.Markdown("#### Continue Training Options")
                
                with gr.Row():
                    append_to_dataset = gr.Checkbox(
                        label="Add to existing dataset",
                        value=False,
                        info="Append these files to an existing dataset"
                    )
                    existing_dataset_selector = gr.Dropdown(
                        choices=[],
                        label="Select Dataset to Append To",
                        info="Choose which dataset to add files to",
                        visible=False
                    )
                
                with gr.Row():
                    user_continue_lora = gr.Checkbox(
                        label="Continue training from existing LoRA",
                        value=False,
                        info="Start from a pre-trained LoRA adapter"
                    )
                    user_base_lora = gr.Dropdown(
                        choices=[],
                        label="Select LoRA to Continue",
                        info="Choose which LoRA to start from",
                        visible=False
                    )
                
                prepare_user_dataset_btn = gr.Button("📦 Prepare Training Dataset", variant="primary")
                user_prepare_status = gr.Textbox(label="Preparation Status", lines=2, interactive=False)
                
                gr.Markdown("---")
                gr.Markdown("### 📤 Dataset Import/Export")
                
                with gr.Row():
                    dataset_to_export = gr.Dropdown(
                        choices=[],
                        label="Select Dataset to Export",
                        info="Download prepared datasets"
                    )
                    export_dataset_btn = gr.Button("⬇️ Export Dataset", variant="primary", size="sm")
                
                with gr.Row():
                    import_dataset_file = gr.File(
                        label="Import Dataset (.zip)",
                        file_types=[".zip"],
                        type="filepath"
                    )
                
                dataset_download_file = gr.File(label="Downloaded Dataset", visible=True, interactive=False)
                dataset_export_status = gr.Textbox(label="Export/Import Status", lines=2, interactive=False)
            
            # Tab 3: Training Configuration
            with gr.Tab("⚙️ Training Configuration"):
                gr.Markdown("### LoRA Training Settings")
                
                lora_name_input = gr.Textbox(
                    label="LoRA Adapter Name",
                    placeholder="my_custom_lora_v1",
                    info="Unique name for this LoRA adapter"
                )
                
                selected_dataset = gr.Dropdown(
                    choices=[],
                    label="Training Dataset",
                    info="Select prepared dataset to train on"
                )
                
                refresh_datasets_btn = gr.Button("🔄 Refresh Datasets", size="sm")
                
                gr.Markdown("#### Fine-tune Existing LoRA (Optional)")
                
                use_existing_lora = gr.Checkbox(
                    label="Continue training from existing LoRA",
                    value=False,
                    info="Start from a pre-trained LoRA adapter instead of from scratch"
                )
                
                base_lora_adapter = gr.Dropdown(
                    choices=[],
                    label="Base LoRA Adapter",
                    info="Select LoRA to continue training from",
                    visible=False
                )
                
                gr.Markdown("#### Hyperparameters")
                
                with gr.Row():
                    with gr.Column():
                        batch_size = gr.Slider(
                            minimum=1,
                            maximum=16,
                            value=4,
                            step=1,
                            label="Batch Size",
                            info="Larger = faster but more GPU memory"
                        )
                        
                        learning_rate = gr.Slider(
                            minimum=1e-5,
                            maximum=1e-3,
                            value=3e-4,
                            step=1e-5,
                            label="Learning Rate",
                            info="Lower = more stable, higher = faster convergence"
                        )
                        
                        num_epochs = gr.Slider(
                            minimum=1,
                            maximum=50,
                            value=10,
                            step=1,
                            label="Number of Epochs",
                            info="How many times to iterate over dataset"
                        )
                    
                    with gr.Column():
                        lora_rank = gr.Slider(
                            minimum=4,
                            maximum=64,
                            value=16,
                            step=4,
                            label="LoRA Rank",
                            info="Higher = more capacity but slower"
                        )
                        
                        lora_alpha = gr.Slider(
                            minimum=8,
                            maximum=128,
                            value=32,
                            step=8,
                            label="LoRA Alpha",
                            info="Scaling factor for LoRA weights"
                        )
                
                gr.Markdown("---")
                
                start_training_btn = gr.Button("🚀 Start Training", variant="primary", size="lg")
                stop_training_btn = gr.Button("⏹️ Stop Training", variant="stop", size="sm")
                
                training_progress = gr.Textbox(
                    label="Training Progress",
                    lines=5,
                    interactive=False
                )
                
                training_log = gr.Textbox(
                    label="Training Log",
                    lines=10,
                    interactive=False
                )
            
            # Tab 4: Manage LoRA Adapters
            with gr.Tab("📂 Manage LoRA Adapters"):
                gr.Markdown("### Download from HuggingFace")
                gr.Markdown("Download LoRAs from the centralized dataset repository")
                
                with gr.Row():
                    lora_path_input = gr.Textbox(
                        label="LoRA Name or Path",
                        placeholder="jazz-v1 or loras/jazz-v1",
                        info="Enter LoRA name from dataset repo",
                        scale=3
                    )
                    download_from_hf_btn = gr.Button("⬇️ Download from HF", variant="primary", size="sm")
                
                download_from_hf_status = gr.Textbox(label="Download Status", lines=3, interactive=False)
                
                gr.Markdown("---")
                gr.Markdown("### Upload New LoRA Adapter")
                
                with gr.Row():
                    upload_lora_file = gr.File(
                        label="📤 Upload LoRA (.zip)",
                        file_types=[".zip"],
                        type="filepath",
                        scale=3
                    )
                    upload_lora_btn = gr.Button("Upload", variant="primary", size="sm")
                
                upload_lora_status = gr.Textbox(label="Upload Status", lines=1, interactive=False)
                
                gr.Markdown("---")
                gr.Markdown("### Installed LoRA Adapters")
                
                lora_list = gr.Dataframe(
                    headers=["Name", "Created", "Training Steps", "Type"],
                    datatype=["str", "str", "number", "str"],
                    row_count=10,
                    label="Available LoRA Adapters",
                    interactive=False
                )
                
                with gr.Row():
                    refresh_lora_btn = gr.Button("🔄 Refresh List", size="sm")
                
                gr.Markdown("### Actions on Selected LoRA")
                
                selected_lora_for_action = gr.Dropdown(
                    choices=[],
                    label="Select LoRA Adapter",
                    info="Choose a LoRA to download or delete"
                )
                
                with gr.Row():
                    download_lora_btn = gr.Button("⬇️ Download LoRA", variant="primary", size="lg", scale=1)
                    delete_lora_btn = gr.Button("🗑️ Delete LoRA", variant="stop", size="lg", scale=1)
                
                lora_download_file = gr.File(label="Downloaded LoRA", interactive=False)
                lora_action_status = gr.Textbox(label="Action Status", lines=1, interactive=False)
                
                gr.Markdown("---")
                gr.Markdown(
                    """
                    ### 💡 Training Tips
                    
                    **Dataset Size:**
                    - Vocal: 20-50 hours minimum for good results
                    - Symbolic: 1000+ MIDI files recommended
                    - User audio: 30+ minutes minimum (more is better)
                    
                    **Training Time Estimates:**
                    - Small dataset (< 1 hour): 2-4 hours training
                    - Medium dataset (1-10 hours): 4-12 hours training
                    - Large dataset (> 10 hours): 12-48 hours training
                    
                    **GPU Requirements:**
                    - Minimum: 16GB VRAM (LoRA training)
                    - Recommended: 24GB+ VRAM
                    - CPU training: 10-50x slower (not recommended)
                    
                    **Best Practices:**
                    1. Start with small learning rate (3e-4)
                    2. Use batch size 4-8 for best results
                    3. Monitor validation loss to prevent overfitting
                    4. Save checkpoints every 500 steps
                    5. Test generated samples during training
                    
                    **Audio Preprocessing:**
                    - Split long files into 10-30s clips for diversity
                    - Separate vocal stems for vocal-specific training
                    - Use AI metadata generation for consistent labels
                    - Ensure audio quality (44.1kHz, no compression artifacts)
                    """
                )
    
    # LoRA Training Event Handlers
    refresh_datasets_status_btn.click(
        fn=refresh_dataset_status,
        inputs=[],
        outputs=[vocal_datasets, symbolic_datasets, prepare_datasets_selector]
    )
    
    dataset_download_btn.click(
        fn=download_prepare_datasets,
        inputs=[vocal_datasets, symbolic_datasets],
        outputs=[dataset_status]
    ).then(
        fn=refresh_dataset_status,
        inputs=[],
        outputs=[vocal_datasets, symbolic_datasets, prepare_datasets_selector]
    )
    
    check_status_btn.click(
        fn=check_downloaded_datasets,
        inputs=[],
        outputs=[dataset_status]
    )
    
    prepare_btn.click(
        fn=prepare_datasets_for_training,
        inputs=[prepare_datasets_selector, max_samples_slider],
        outputs=[hf_prepare_status]
    ).then(
        fn=refresh_dataset_status,
        inputs=[],
        outputs=[vocal_datasets, symbolic_datasets, prepare_datasets_selector]
    )
    
    analyze_audio_btn.click(
        fn=analyze_user_audio,
        inputs=[user_audio_upload, split_to_clips, separate_stems],
        outputs=[analysis_status, metadata_table]
    )
    
    ai_generate_metadata_btn.click(
        fn=ai_generate_all_metadata,
        inputs=[metadata_table],
        outputs=[metadata_status]
    )
    
    append_to_dataset.change(
        fn=toggle_append_dataset,
        inputs=[append_to_dataset],
        outputs=[existing_dataset_selector]
    )
    
    user_continue_lora.change(
        fn=toggle_base_lora,
        inputs=[user_continue_lora],
        outputs=[user_base_lora]
    )
    
    prepare_user_dataset_btn.click(
        fn=prepare_user_training_dataset,
        inputs=[user_audio_upload, metadata_table, split_to_clips, separate_stems, append_to_dataset, existing_dataset_selector, user_continue_lora, user_base_lora],
        outputs=[user_prepare_status]
    ).then(
        fn=refresh_dataset_status,
        inputs=[],
        outputs=[vocal_datasets, symbolic_datasets, prepare_datasets_selector]
    ).then(
        fn=refresh_dataset_list,
        inputs=[],
        outputs=[selected_dataset, existing_dataset_selector]
    ).success(
        fn=lambda: gr.update(value=False),
        inputs=[],
        outputs=[append_to_dataset]
    )
    
    refresh_datasets_btn.click(
        fn=refresh_dataset_list,
        inputs=[],
        outputs=[selected_dataset, existing_dataset_selector]
    )
    
    start_training_btn.click(
        fn=start_lora_training,
        inputs=[lora_name_input, selected_dataset, batch_size, learning_rate, num_epochs, lora_rank, lora_alpha, use_existing_lora, base_lora_adapter],
        outputs=[training_progress, training_log]
    )
    
    stop_training_btn.click(
        fn=stop_lora_training,
        inputs=[],
        outputs=[training_progress]
    )
    
    refresh_lora_btn.click(
        fn=refresh_lora_list,
        inputs=[],
        outputs=[lora_list, selected_lora_for_action, base_lora_adapter, user_base_lora]
    )
    
    delete_lora_btn.click(
        fn=delete_lora,
        inputs=[selected_lora_for_action],
        outputs=[lora_action_status]
    ).then(
        fn=refresh_lora_list,
        inputs=[],
        outputs=[lora_list, selected_lora_for_action, base_lora_adapter, user_base_lora]
    )
    
    download_lora_btn.click(
        fn=download_lora,
        inputs=[selected_lora_for_action],
        outputs=[lora_download_file, lora_action_status]
    )
    
    upload_lora_btn.click(
        fn=upload_lora,
        inputs=[upload_lora_file],
        outputs=[upload_lora_status]
    ).then(
        fn=refresh_lora_list,
        inputs=[],
        outputs=[lora_list, selected_lora_for_action, base_lora_adapter, user_base_lora]
    )
    
    use_existing_lora.change(
        fn=toggle_base_lora,
        inputs=[use_existing_lora],
        outputs=[base_lora_adapter]
    )
    
    # Auto-populate LoRA name when dataset is selected
    selected_dataset.change(
        fn=auto_populate_lora_name,
        inputs=[selected_dataset],
        outputs=[lora_name_input, use_existing_lora, base_lora_adapter]
    )
    
    # Load LoRA config when existing LoRA is selected for continued training
    base_lora_adapter.change(
        fn=load_lora_for_training,
        inputs=[base_lora_adapter],
        outputs=[lora_name_input, training_log]
    )
    
    # Download LoRA from HuggingFace
    download_from_hf_btn.click(
        fn=download_lora_from_hf,
        inputs=[lora_path_input],
        outputs=[download_from_hf_status]
    ).then(
        fn=refresh_lora_list,
        inputs=[],
        outputs=[lora_list, selected_lora_for_action, base_lora_adapter]
    )
    
    export_dataset_btn.click(
        fn=export_dataset,
        inputs=[dataset_to_export],
        outputs=[dataset_download_file, dataset_export_status]
    )
    
    import_dataset_file.change(
        fn=import_dataset,
        inputs=[import_dataset_file],
        outputs=[dataset_export_status]
    ).then(
        fn=refresh_dataset_status,
        inputs=[],
        outputs=[vocal_datasets, symbolic_datasets, prepare_datasets_selector]
    ).then(
        fn=refresh_dataset_list,
        inputs=[],
        outputs=[selected_dataset]
    ).then(
        fn=refresh_export_dataset_list,
        inputs=[],
        outputs=[dataset_to_export]
    )
    
    # Help section
    with gr.Accordion("ℹ️ Help & Tips", open=False):
        gr.Markdown(
            """
            ## 🚀 Quick Start
            
            1. **Enter a prompt**: "upbeat pop song with synth at 128 BPM"
            2. **Choose mode**: Instrumental (fastest) or with vocals
            3. **Set duration**: Start with 10-20s for quick results
            4. **Generate**: Click the button and wait ~2-4 minutes
            5. **Export**: Download your complete song
            
            ## ⚡ Performance Tips
            
            - **Shorter clips = faster**: 10-20s clips generate in ~1-2 minutes
            - **Instrumental mode**: ~30% faster than with vocals
            - **HF Spaces uses CPU**: Expect 2-4 minutes per 30s clip
            - **Build incrementally**: Generate short clips, then combine
            
            ## 🎯 Prompt Tips
            
            - **Be specific**: "energetic rock with distorted guitar" > "rock song"
            - **Include BPM**: "at 140 BPM" helps set tempo
            - **Mention instruments**: "with piano and drums"
            - **Describe mood**: "melancholic", "upbeat", "aggressive"
            
            ## 🎤 Vocal Modes
            
            - **Instrumental**: Pure music, no vocals (fastest)
            - **User Lyrics**: Provide your own lyrics
            - **Auto Lyrics**: AI generates lyrics based on prompt
            
            ## 📊 Timeline
            
            - Clips are arranged sequentially
            - Remove or clear clips as needed
            - Export combines all clips into one file
            
            ## 🎛️ Audio Enhancement (Advanced)
            
            - **Stem Enhancement**: Separates vocals, drums, bass for individual processing
              - *Fast*: Quick denoise (~2-3s per clip)
              - *Balanced*: Best quality/speed (~5-7s per clip)
              - *Maximum*: Full processing (~10-15s per clip)
            - **Audio Upscaling**: Increase sample rate to 48kHz
              - *Quick*: Fast resampling (~1s per clip)
              - *Neural*: AI super-resolution (~10-20s per clip, better quality)
            
            **Note**: Apply enhancements AFTER all clips are generated and BEFORE export
            
            ---
            
            ⏱️ **Average Generation Time**: 2-4 minutes per 30-second clip on CPU
            
            🎵 **Models**: DiffRhythm2 + MuQ-MuLan + LyricMind AI
            """
        )

# Configure and launch
if __name__ == "__main__":
    logger.info("🎵 Starting Music Generation Studio on HuggingFace Spaces...")
    
    app.queue(
        default_concurrency_limit=1,
        max_size=5
    )
    
    app.launch()