diff --git "a/acestep/gradio_ui/event.py" "b/acestep/gradio_ui/event.py" deleted file mode 100644--- "a/acestep/gradio_ui/event.py" +++ /dev/null @@ -1,3003 +0,0 @@ -""" -Gradio UI Event Handlers Module -Contains all event handler definitions and connections -""" -import os -import json -import random -import glob -import time as time_module -import tempfile -import gradio as gr -import math -from loguru import logger -from typing import Optional -from acestep.constants import ( - TASK_TYPES_TURBO, - TASK_TYPES_BASE, -) -from acestep.gradio_ui.i18n import t - - -def setup_event_handlers(demo, dit_handler, llm_handler, dataset_handler, dataset_section, generation_section, results_section): - """Setup event handlers connecting UI components and business logic""" - - # Helper functions for batch queue management - def store_batch_in_queue( - batch_queue, - batch_index, - audio_paths, - generation_info, - seeds, - codes=None, - scores=None, - allow_lm_batch=False, - batch_size=2, - generation_params=None, - lm_generated_metadata=None, - status="completed" - ): - """Store batch results in queue with ALL generation parameters - - Args: - codes: Audio codes used for generation (list for batch mode, string for single mode) - scores: List of score displays for each audio (optional) - allow_lm_batch: Whether batch LM mode was used for this batch - batch_size: Batch size used for this batch - generation_params: Complete dictionary of ALL generation parameters used - lm_generated_metadata: LM-generated metadata for scoring (optional) - """ - import datetime - batch_queue[batch_index] = { - "status": status, - "audio_paths": audio_paths, - "generation_info": generation_info, - "seeds": seeds, - "codes": codes, # Store codes used for this batch - "scores": scores if scores else [""] * 8, # Store scores, default to empty - "allow_lm_batch": allow_lm_batch, # Store batch mode setting - "batch_size": batch_size, # Store batch size - "generation_params": generation_params if generation_params else {}, # Store ALL parameters - "lm_generated_metadata": lm_generated_metadata, # Store LM metadata for scoring - "timestamp": datetime.datetime.now().isoformat() - } - return batch_queue - - def update_batch_indicator(current_batch, total_batches): - """Update batch indicator text""" - return t("results.batch_indicator", current=current_batch + 1, total=total_batches) - - def update_navigation_buttons(current_batch, total_batches): - """Determine navigation button states""" - can_go_previous = current_batch > 0 - can_go_next = current_batch < total_batches - 1 - return can_go_previous, can_go_next - - def save_audio_and_metadata( - audio_path, task_type, captions, lyrics, vocal_language, bpm, key_scale, time_signature, audio_duration, - batch_size_input, inference_steps, guidance_scale, seed, random_seed_checkbox, - use_adg, cfg_interval_start, cfg_interval_end, audio_format, - lm_temperature, lm_cfg_scale, lm_top_k, lm_top_p, lm_negative_prompt, - use_cot_caption, use_cot_language, audio_cover_strength, - think_checkbox, text2music_audio_code_string, repainting_start, repainting_end, - track_name, complete_track_classes, lm_metadata - ): - """Save audio file and its metadata as a zip package""" - import datetime - import shutil - import zipfile - - if audio_path is None: - gr.Warning(t("messages.no_audio_to_save")) - return None - - try: - # Create metadata dictionary - metadata = { - "saved_at": datetime.datetime.now().isoformat(), - "task_type": task_type, - "caption": captions or "", - "lyrics": lyrics or "", - 
"vocal_language": vocal_language, - "bpm": bpm if bpm is not None else None, - "keyscale": key_scale or "", - "timesignature": time_signature or "", - "duration": audio_duration if audio_duration is not None else -1, - "batch_size": batch_size_input, - "inference_steps": inference_steps, - "guidance_scale": guidance_scale, - "seed": seed, - "random_seed": False, # Disable random seed for reproducibility - "use_adg": use_adg, - "cfg_interval_start": cfg_interval_start, - "cfg_interval_end": cfg_interval_end, - "audio_format": audio_format, - "lm_temperature": lm_temperature, - "lm_cfg_scale": lm_cfg_scale, - "lm_top_k": lm_top_k, - "lm_top_p": lm_top_p, - "lm_negative_prompt": lm_negative_prompt, - "use_cot_caption": use_cot_caption, - "use_cot_language": use_cot_language, - "audio_cover_strength": audio_cover_strength, - "think": think_checkbox, - "audio_codes": text2music_audio_code_string or "", - "repainting_start": repainting_start, - "repainting_end": repainting_end, - "track_name": track_name, - "complete_track_classes": complete_track_classes or [], - } - - # Add LM-generated metadata if available - if lm_metadata: - metadata["lm_generated_metadata"] = lm_metadata - - # Generate timestamp and base name - timestamp = datetime.datetime.now().strftime("%Y%m%d_%H%M%S") - - # Extract audio filename extension - audio_ext = os.path.splitext(audio_path)[1] - - # Create temporary directory for packaging - temp_dir = tempfile.mkdtemp() - - # Save JSON metadata - json_path = os.path.join(temp_dir, f"metadata_{timestamp}.json") - with open(json_path, 'w', encoding='utf-8') as f: - json.dump(metadata, f, indent=2, ensure_ascii=False) - - # Copy audio file - audio_copy_path = os.path.join(temp_dir, f"audio_{timestamp}{audio_ext}") - shutil.copy2(audio_path, audio_copy_path) - - # Create zip file - zip_path = os.path.join(tempfile.gettempdir(), f"music_package_{timestamp}.zip") - with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zipf: - zipf.write(audio_copy_path, os.path.basename(audio_copy_path)) - zipf.write(json_path, os.path.basename(json_path)) - - # Clean up temp directory - shutil.rmtree(temp_dir) - - gr.Info(t("messages.save_success", filename=os.path.basename(zip_path))) - return zip_path - - except Exception as e: - gr.Warning(t("messages.save_failed", error=str(e))) - import traceback - traceback.print_exc() - return None - - def load_metadata(file_obj): - """Load generation parameters from a JSON file""" - if file_obj is None: - gr.Warning(t("messages.no_file_selected")) - return [None] * 31 + [False] # Return None for all fields, False for is_format_caption - - try: - # Read the uploaded file - if hasattr(file_obj, 'name'): - filepath = file_obj.name - else: - filepath = file_obj - - with open(filepath, 'r', encoding='utf-8') as f: - metadata = json.load(f) - - # Extract all fields - task_type = metadata.get('task_type', 'text2music') - captions = metadata.get('caption', '') - lyrics = metadata.get('lyrics', '') - vocal_language = metadata.get('vocal_language', 'unknown') - - # Convert bpm - bpm_value = metadata.get('bpm') - if bpm_value is not None and bpm_value != "N/A": - try: - bpm = int(bpm_value) if bpm_value else None - except: - bpm = None - else: - bpm = None - - key_scale = metadata.get('keyscale', '') - time_signature = metadata.get('timesignature', '') - - # Convert duration - duration_value = metadata.get('duration', -1) - if duration_value is not None and duration_value != "N/A": - try: - audio_duration = float(duration_value) - except: - audio_duration = -1 
- else: - audio_duration = -1 - - batch_size = metadata.get('batch_size', 2) - inference_steps = metadata.get('inference_steps', 8) - guidance_scale = metadata.get('guidance_scale', 7.0) - seed = metadata.get('seed', '-1') - random_seed = metadata.get('random_seed', True) - use_adg = metadata.get('use_adg', False) - cfg_interval_start = metadata.get('cfg_interval_start', 0.0) - cfg_interval_end = metadata.get('cfg_interval_end', 1.0) - audio_format = metadata.get('audio_format', 'mp3') - lm_temperature = metadata.get('lm_temperature', 0.85) - lm_cfg_scale = metadata.get('lm_cfg_scale', 2.0) - lm_top_k = metadata.get('lm_top_k', 0) - lm_top_p = metadata.get('lm_top_p', 0.9) - lm_negative_prompt = metadata.get('lm_negative_prompt', 'NO USER INPUT') - use_cot_caption = metadata.get('use_cot_caption', True) - use_cot_language = metadata.get('use_cot_language', True) - audio_cover_strength = metadata.get('audio_cover_strength', 1.0) - think = metadata.get('think', True) - audio_codes = metadata.get('audio_codes', '') - repainting_start = metadata.get('repainting_start', 0.0) - repainting_end = metadata.get('repainting_end', -1) - track_name = metadata.get('track_name') - complete_track_classes = metadata.get('complete_track_classes', []) - - gr.Info(t("messages.params_loaded", filename=os.path.basename(filepath))) - - return ( - task_type, captions, lyrics, vocal_language, bpm, key_scale, time_signature, - audio_duration, batch_size, inference_steps, guidance_scale, seed, random_seed, - use_adg, cfg_interval_start, cfg_interval_end, audio_format, - lm_temperature, lm_cfg_scale, lm_top_k, lm_top_p, lm_negative_prompt, - use_cot_caption, use_cot_language, audio_cover_strength, - think, audio_codes, repainting_start, repainting_end, - track_name, complete_track_classes, - True # Set is_format_caption to True when loading from file - ) - - except json.JSONDecodeError as e: - gr.Warning(t("messages.invalid_json", error=str(e))) - return [None] * 31 + [False] - except Exception as e: - gr.Warning(t("messages.load_error", error=str(e))) - return [None] * 31 + [False] - - def load_random_example(task_type: str): - """Load a random example from the task-specific examples directory - - Args: - task_type: The task type (e.g., "text2music") - - Returns: - Tuple of (caption, lyrics, think, bpm, duration, keyscale, language, timesignature) for updating UI components - """ - try: - # Get the project root directory - current_file = os.path.abspath(__file__) - # event.py is in acestep/gradio_ui/, need 3 levels up to reach project root - project_root = os.path.dirname(os.path.dirname(os.path.dirname(current_file))) - - # Construct the examples directory path - examples_dir = os.path.join(project_root, "examples", task_type) - - # Check if directory exists - if not os.path.exists(examples_dir): - gr.Warning(f"Examples directory not found: examples/{task_type}/") - return "", "", True, None, None, "", "", "" - - # Find all JSON files in the directory - json_files = glob.glob(os.path.join(examples_dir, "*.json")) - - if not json_files: - gr.Warning(f"No JSON files found in examples/{task_type}/") - return "", "", True, None, None, "", "", "" - - # Randomly select one file - selected_file = random.choice(json_files) - - # Read and parse JSON - try: - with open(selected_file, 'r', encoding='utf-8') as f: - data = json.load(f) - - # Extract caption (prefer 'caption', fallback to 'prompt') - caption_value = data.get('caption', data.get('prompt', '')) - if not isinstance(caption_value, str): - caption_value = 
str(caption_value) if caption_value else '' - - # Extract lyrics - lyrics_value = data.get('lyrics', '') - if not isinstance(lyrics_value, str): - lyrics_value = str(lyrics_value) if lyrics_value else '' - - # Extract think (default to True if not present) - think_value = data.get('think', True) - if not isinstance(think_value, bool): - think_value = True - - # Extract optional metadata fields - bpm_value = None - if 'bpm' in data and data['bpm'] not in [None, "N/A", ""]: - try: - bpm_value = int(data['bpm']) - except (ValueError, TypeError): - pass - - duration_value = None - if 'duration' in data and data['duration'] not in [None, "N/A", ""]: - try: - duration_value = float(data['duration']) - except (ValueError, TypeError): - pass - - keyscale_value = data.get('keyscale', '') - if keyscale_value in [None, "N/A"]: - keyscale_value = '' - - language_value = data.get('language', '') - if language_value in [None, "N/A"]: - language_value = '' - - timesignature_value = data.get('timesignature', '') - if timesignature_value in [None, "N/A"]: - timesignature_value = '' - - gr.Info(t("messages.example_loaded", filename=os.path.basename(selected_file))) - return caption_value, lyrics_value, think_value, bpm_value, duration_value, keyscale_value, language_value, timesignature_value - - except json.JSONDecodeError as e: - gr.Warning(t("messages.example_failed", filename=os.path.basename(selected_file), error=str(e))) - return "", "", True, None, None, "", "", "" - except Exception as e: - gr.Warning(t("messages.example_error", error=str(e))) - return "", "", True, None, None, "", "", "" - - except Exception as e: - gr.Warning(t("messages.example_error", error=str(e))) - return "", "", True, None, None, "", "", "" - - def sample_example_smart(task_type: str, constrained_decoding_debug: bool = False): - """Smart sample function that uses LM if initialized, otherwise falls back to examples - - Args: - task_type: The task type (e.g., "text2music") - constrained_decoding_debug: Whether to enable debug logging for constrained decoding - - Returns: - Tuple of (caption, lyrics, think, bpm, duration, keyscale, language, timesignature) for updating UI components - """ - # Check if LM is initialized - if llm_handler.llm_initialized: - # Use LM to generate example - try: - # Generate example using LM with empty input (NO USER INPUT) - metadata, status = llm_handler.understand_audio_from_codes( - audio_codes="NO USER INPUT", - use_constrained_decoding=True, - temperature=0.85, - constrained_decoding_debug=constrained_decoding_debug, - ) - - if metadata: - caption_value = metadata.get('caption', '') - lyrics_value = metadata.get('lyrics', '') - think_value = True # Always enable think when using LM-generated examples - - # Extract optional metadata fields - bpm_value = None - if 'bpm' in metadata and metadata['bpm'] not in [None, "N/A", ""]: - try: - bpm_value = int(metadata['bpm']) - except (ValueError, TypeError): - pass - - duration_value = None - if 'duration' in metadata and metadata['duration'] not in [None, "N/A", ""]: - try: - duration_value = float(metadata['duration']) - except (ValueError, TypeError): - pass - - keyscale_value = metadata.get('keyscale', '') - if keyscale_value in [None, "N/A"]: - keyscale_value = '' - - language_value = metadata.get('language', '') - if language_value in [None, "N/A"]: - language_value = '' - - timesignature_value = metadata.get('timesignature', '') - if timesignature_value in [None, "N/A"]: - timesignature_value = '' - - gr.Info(t("messages.lm_generated")) - return 
caption_value, lyrics_value, think_value, bpm_value, duration_value, keyscale_value, language_value, timesignature_value - else: - gr.Warning(t("messages.lm_fallback")) - return load_random_example(task_type) - - except Exception as e: - gr.Warning(t("messages.lm_fallback")) - return load_random_example(task_type) - else: - # LM not initialized, use examples directory - return load_random_example(task_type) - - def update_init_status(status_msg, enable_btn): - """Update initialization status and enable/disable generate button""" - return status_msg, gr.update(interactive=enable_btn) - - # Dataset handlers - dataset_section["import_dataset_btn"].click( - fn=dataset_handler.import_dataset, - inputs=[dataset_section["dataset_type"]], - outputs=[dataset_section["data_status"]] - ) - - # Service initialization - refresh checkpoints - def refresh_checkpoints(): - choices = dit_handler.get_available_checkpoints() - return gr.update(choices=choices) - - generation_section["refresh_btn"].click( - fn=refresh_checkpoints, - outputs=[generation_section["checkpoint_dropdown"]] - ) - - # Update UI based on model type (turbo vs base) - def update_model_type_settings(config_path): - """Update UI settings based on model type""" - if config_path is None: - config_path = "" - config_path_lower = config_path.lower() - - if "turbo" in config_path_lower: - # Turbo model: max 8 steps, hide CFG/ADG, only show text2music/repaint/cover - return ( - gr.update(value=8, maximum=8, minimum=1), # inference_steps - gr.update(visible=False), # guidance_scale - gr.update(visible=False), # use_adg - gr.update(visible=False), # cfg_interval_start - gr.update(visible=False), # cfg_interval_end - gr.update(choices=TASK_TYPES_TURBO), # task_type - ) - elif "base" in config_path_lower: - # Base model: max 100 steps, show CFG/ADG, show all task types - return ( - gr.update(value=32, maximum=100, minimum=1), # inference_steps - gr.update(visible=True), # guidance_scale - gr.update(visible=True), # use_adg - gr.update(visible=True), # cfg_interval_start - gr.update(visible=True), # cfg_interval_end - gr.update(choices=TASK_TYPES_BASE), # task_type - ) - else: - # Default to turbo settings - return ( - gr.update(value=8, maximum=8, minimum=1), - gr.update(visible=False), - gr.update(visible=False), - gr.update(visible=False), - gr.update(visible=False), - gr.update(choices=TASK_TYPES_TURBO), # task_type - ) - - generation_section["config_path"].change( - fn=update_model_type_settings, - inputs=[generation_section["config_path"]], - outputs=[ - generation_section["inference_steps"], - generation_section["guidance_scale"], - generation_section["use_adg"], - generation_section["cfg_interval_start"], - generation_section["cfg_interval_end"], - generation_section["task_type"], - ] - ) - - # Service initialization - def init_service_wrapper(checkpoint, config_path, device, init_llm, lm_model_path, backend, use_flash_attention, offload_to_cpu, offload_dit_to_cpu): - """Wrapper for service initialization, returns status, button state, and accordion state""" - # Initialize DiT handler - status, enable = dit_handler.initialize_service( - checkpoint, config_path, device, - use_flash_attention=use_flash_attention, compile_model=False, - offload_to_cpu=offload_to_cpu, offload_dit_to_cpu=offload_dit_to_cpu - ) - - # Initialize LM handler if requested - if init_llm: - # Get checkpoint directory - current_file = os.path.abspath(__file__) - # event.py is in acestep/gradio_ui/, need 3 levels up to reach project root - project_root = 
os.path.dirname(os.path.dirname(os.path.dirname(current_file))) - checkpoint_dir = os.path.join(project_root, "checkpoints") - - lm_status, lm_success = llm_handler.initialize( - checkpoint_dir=checkpoint_dir, - lm_model_path=lm_model_path, - backend=backend, - device=device, - offload_to_cpu=offload_to_cpu, - dtype=dit_handler.dtype - ) - - if lm_success: - status += f"\n{lm_status}" - else: - status += f"\n{lm_status}" - # Don't fail the entire initialization if LM fails, but log it - # Keep enable as is (DiT initialization result) even if LM fails - - # Check if model is initialized - if so, collapse the accordion - is_model_initialized = dit_handler.model is not None - accordion_state = gr.update(open=not is_model_initialized) - - return status, gr.update(interactive=enable), accordion_state - - # Update negative prompt visibility based on "Initialize 5Hz LM" checkbox - def update_negative_prompt_visibility(init_llm_checked): - """Update negative prompt visibility: show if Initialize 5Hz LM checkbox is checked""" - return gr.update(visible=init_llm_checked) - - # Update audio_cover_strength visibility and label based on task type and LM initialization - def update_audio_cover_strength_visibility(task_type_value, init_llm_checked): - """Update audio_cover_strength visibility and label""" - # Show if task is cover OR if LM is initialized - is_visible = (task_type_value == "cover") or init_llm_checked - # Change label based on context - if init_llm_checked and task_type_value != "cover": - label = "LM codes strength" - info = "Control how many denoising steps use LM-generated codes" - else: - label = "Audio Cover Strength" - info = "Control how many denoising steps use cover mode" - - return gr.update(visible=is_visible, label=label, info=info) - - # Update visibility when init_llm_checkbox changes - generation_section["init_llm_checkbox"].change( - fn=update_negative_prompt_visibility, - inputs=[generation_section["init_llm_checkbox"]], - outputs=[generation_section["lm_negative_prompt"]] - ) - - # Update audio_cover_strength visibility and label when init_llm_checkbox changes - generation_section["init_llm_checkbox"].change( - fn=update_audio_cover_strength_visibility, - inputs=[generation_section["task_type"], generation_section["init_llm_checkbox"]], - outputs=[generation_section["audio_cover_strength"]] - ) - - # Also update audio_cover_strength when task_type changes (to handle label changes) - generation_section["task_type"].change( - fn=update_audio_cover_strength_visibility, - inputs=[generation_section["task_type"], generation_section["init_llm_checkbox"]], - outputs=[generation_section["audio_cover_strength"]] - ) - - generation_section["init_btn"].click( - fn=init_service_wrapper, - inputs=[ - generation_section["checkpoint_dropdown"], - generation_section["config_path"], - generation_section["device"], - generation_section["init_llm_checkbox"], - generation_section["lm_model_path"], - generation_section["backend_dropdown"], - generation_section["use_flash_attention_checkbox"], - generation_section["offload_to_cpu_checkbox"], - generation_section["offload_dit_to_cpu_checkbox"], - ], - outputs=[generation_section["init_status"], generation_section["generate_btn"], generation_section["service_config_accordion"]] - ) - - # Generation with progress bar - def generate_with_progress( - captions, lyrics, bpm, key_scale, time_signature, vocal_language, - inference_steps, guidance_scale, random_seed_checkbox, seed, - reference_audio, audio_duration, batch_size_input, src_audio, - 
text2music_audio_code_string, repainting_start, repainting_end, - instruction_display_gen, audio_cover_strength, task_type, - use_adg, cfg_interval_start, cfg_interval_end, audio_format, lm_temperature, - think_checkbox, lm_cfg_scale, lm_top_k, lm_top_p, lm_negative_prompt, - use_cot_metas, use_cot_caption, use_cot_language, is_format_caption, - constrained_decoding_debug, - allow_lm_batch, - auto_score, - score_scale, - lm_batch_chunk_size, - progress=gr.Progress(track_tqdm=True) - ): - # If think is enabled (llm_dit mode) and use_cot_metas is True, generate audio codes using LM first - audio_code_string_to_use = text2music_audio_code_string - lm_generated_metadata = None # Store LM-generated metadata for display - lm_generated_audio_codes = None # Store LM-generated audio codes for display - lm_generated_audio_codes_list = [] # Store list of audio codes for batch processing - - # Determine if we should use batch LM generation - should_use_lm_batch = ( - think_checkbox and - llm_handler.llm_initialized and - use_cot_metas and - allow_lm_batch and - batch_size_input >= 2 - ) - - if think_checkbox and llm_handler.llm_initialized and use_cot_metas: - # Convert top_k: 0 means None (disabled) - top_k_value = None if lm_top_k == 0 else int(lm_top_k) - # Convert top_p: 1.0 means None (disabled) - top_p_value = None if lm_top_p >= 1.0 else lm_top_p - - # Build user_metadata from user-provided values (only include non-empty values) - user_metadata = {} - # Handle bpm: gr.Number can be None, int, float, or string - if bpm is not None: - try: - bpm_value = float(bpm) - if bpm_value > 0: - user_metadata['bpm'] = str(int(bpm_value)) - except (ValueError, TypeError): - # If bpm is not a valid number, skip it - pass - if key_scale and key_scale.strip(): - key_scale_clean = key_scale.strip() - if key_scale_clean.lower() not in ["n/a", ""]: - user_metadata['keyscale'] = key_scale_clean - if time_signature and time_signature.strip(): - time_sig_clean = time_signature.strip() - if time_sig_clean.lower() not in ["n/a", ""]: - user_metadata['timesignature'] = time_sig_clean - if audio_duration is not None: - try: - duration_value = float(audio_duration) - if duration_value > 0: - user_metadata['duration'] = str(int(duration_value)) - except (ValueError, TypeError): - # If audio_duration is not a valid number, skip it - pass - - # Only pass user_metadata if user provided any values, otherwise let LM generate - user_metadata_to_pass = user_metadata if user_metadata else None - - if should_use_lm_batch: - # BATCH LM GENERATION - logger.info(f"Using LM batch generation for {batch_size_input} items...") - - # Prepare seeds for batch items - actual_seed_list, _ = dit_handler.prepare_seeds(batch_size_input, seed, random_seed_checkbox) - - # Split batch into chunks (GPU memory constraint) - max_inference_batch_size = int(lm_batch_chunk_size) - num_chunks = math.ceil(batch_size_input / max_inference_batch_size) - - all_metadata_list = [] - all_audio_codes_list = [] - - for chunk_idx in range(num_chunks): - chunk_start = chunk_idx * max_inference_batch_size - chunk_end = min(chunk_start + max_inference_batch_size, batch_size_input) - chunk_size = chunk_end - chunk_start - chunk_seeds = actual_seed_list[chunk_start:chunk_end] - - logger.info(f"Generating LM batch chunk {chunk_idx+1}/{num_chunks} (size: {chunk_size}, seeds: {chunk_seeds})...") - - # Generate batch - metadata_list, audio_codes_list, status = llm_handler.generate_with_stop_condition_batch( - caption=captions or "", - lyrics=lyrics or "", - 
batch_size=chunk_size, - infer_type="llm_dit", - temperature=lm_temperature, - cfg_scale=lm_cfg_scale, - negative_prompt=lm_negative_prompt, - top_k=top_k_value, - top_p=top_p_value, - user_metadata=user_metadata_to_pass, - use_cot_caption=use_cot_caption, - use_cot_language=use_cot_language, - is_format_caption=is_format_caption, - constrained_decoding_debug=constrained_decoding_debug, - seeds=chunk_seeds, - ) - - all_metadata_list.extend(metadata_list) - all_audio_codes_list.extend(audio_codes_list) - - # Use first metadata as representative (all are same) - lm_generated_metadata = all_metadata_list[0] if all_metadata_list else None - - # Store audio codes list for later use - lm_generated_audio_codes_list = all_audio_codes_list - - # Prepare audio codes for DiT (list of codes, one per batch item) - audio_code_string_to_use = all_audio_codes_list - - # Update metadata fields from LM if not provided by user - if lm_generated_metadata: - if bpm is None and lm_generated_metadata.get('bpm'): - bpm_value = lm_generated_metadata.get('bpm') - if bpm_value != "N/A" and bpm_value != "": - try: - bpm = int(bpm_value) - except: - pass - if not key_scale and lm_generated_metadata.get('keyscale'): - key_scale_value = lm_generated_metadata.get('keyscale', lm_generated_metadata.get('key_scale', "")) - if key_scale_value != "N/A": - key_scale = key_scale_value - if not time_signature and lm_generated_metadata.get('timesignature'): - time_signature_value = lm_generated_metadata.get('timesignature', lm_generated_metadata.get('time_signature', "")) - if time_signature_value != "N/A": - time_signature = time_signature_value - if audio_duration is None or audio_duration <= 0: - audio_duration_value = lm_generated_metadata.get('duration', -1) - if audio_duration_value != "N/A" and audio_duration_value != "": - try: - audio_duration = float(audio_duration_value) - except: - pass - else: - # SEQUENTIAL LM GENERATION (current behavior, when allow_lm_batch is False) - # Phase 1: Generate CoT metadata - phase1_start = time_module.time() - metadata, _, status = llm_handler.generate_with_stop_condition( - caption=captions or "", - lyrics=lyrics or "", - infer_type="dit", # Only generate metadata in Phase 1 - temperature=lm_temperature, - cfg_scale=lm_cfg_scale, - negative_prompt=lm_negative_prompt, - top_k=top_k_value, - top_p=top_p_value, - user_metadata=user_metadata_to_pass, - use_cot_caption=use_cot_caption, - use_cot_language=use_cot_language, - is_format_caption=is_format_caption, - constrained_decoding_debug=constrained_decoding_debug, - ) - lm_phase1_time = time_module.time() - phase1_start - logger.info(f"LM Phase 1 (CoT) completed in {lm_phase1_time:.2f}s") - - # Phase 2: Generate audio codes - phase2_start = time_module.time() - metadata, audio_codes, status = llm_handler.generate_with_stop_condition( - caption=captions or "", - lyrics=lyrics or "", - infer_type="llm_dit", # Generate both metadata and codes - temperature=lm_temperature, - cfg_scale=lm_cfg_scale, - negative_prompt=lm_negative_prompt, - top_k=top_k_value, - top_p=top_p_value, - user_metadata=user_metadata_to_pass, - use_cot_caption=use_cot_caption, - use_cot_language=use_cot_language, - is_format_caption=is_format_caption, - constrained_decoding_debug=constrained_decoding_debug, - ) - lm_phase2_time = time_module.time() - phase2_start - logger.info(f"LM Phase 2 (Codes) completed in {lm_phase2_time:.2f}s") - - # Store LM-generated metadata and audio codes for display - lm_generated_metadata = metadata - if audio_codes: - 
audio_code_string_to_use = audio_codes - lm_generated_audio_codes = audio_codes - # Update metadata fields only if they are empty/None (user didn't provide them) - if bpm is None and metadata.get('bpm'): - bpm_value = metadata.get('bpm') - if bpm_value != "N/A" and bpm_value != "": - try: - bpm = int(bpm_value) - except: - pass - if not key_scale and metadata.get('keyscale'): - key_scale_value = metadata.get('keyscale', metadata.get('key_scale', "")) - if key_scale_value != "N/A": - key_scale = key_scale_value - if not time_signature and metadata.get('timesignature'): - time_signature_value = metadata.get('timesignature', metadata.get('time_signature', "")) - if time_signature_value != "N/A": - time_signature = time_signature_value - if audio_duration is None or audio_duration <= 0: - audio_duration_value = metadata.get('duration', -1) - if audio_duration_value != "N/A" and audio_duration_value != "": - try: - audio_duration = float(audio_duration_value) - except: - pass - - # Pass LM timing to dit_handler.generate_music via generation_info - # We'll add it to the result after getting it back - - # Call generate_music and get results - result = dit_handler.generate_music( - captions=captions, lyrics=lyrics, bpm=bpm, key_scale=key_scale, - time_signature=time_signature, vocal_language=vocal_language, - inference_steps=inference_steps, guidance_scale=guidance_scale, - use_random_seed=random_seed_checkbox, seed=seed, - reference_audio=reference_audio, audio_duration=audio_duration, - batch_size=batch_size_input, src_audio=src_audio, - audio_code_string=audio_code_string_to_use, - repainting_start=repainting_start, repainting_end=repainting_end, - instruction=instruction_display_gen, audio_cover_strength=audio_cover_strength, - task_type=task_type, use_adg=use_adg, - cfg_interval_start=cfg_interval_start, cfg_interval_end=cfg_interval_end, - audio_format=audio_format, lm_temperature=lm_temperature, - progress=progress - ) - - # Extract results - first_audio, second_audio, all_audio_paths, generation_info, status_message, seed_value_for_ui, \ - align_score_1, align_text_1, align_plot_1, align_score_2, align_text_2, align_plot_2 = result - - # Extract LM timing from status if available and prepend to generation_info - if status: - import re - # Try to extract timing info from status using regex - # Expected format: "Phase1: X.XXs" and "Phase2: X.XXs" - phase1_match = re.search(r'Phase1:\s*([\d.]+)s', status) - phase2_match = re.search(r'Phase2:\s*([\d.]+)s', status) - - if phase1_match or phase2_match: - lm_timing_section = "\n\n**🤖 LM Timing:**\n" - lm_total = 0.0 - if phase1_match: - phase1_time = float(phase1_match.group(1)) - lm_timing_section += f" - Phase 1 (CoT Metadata): {phase1_time:.2f}s\n" - lm_total += phase1_time - if phase2_match: - phase2_time = float(phase2_match.group(1)) - lm_timing_section += f" - Phase 2 (Audio Codes): {phase2_time:.2f}s\n" - lm_total += phase2_time - if lm_total > 0: - lm_timing_section += f" - Total LM Time: {lm_total:.2f}s\n" - generation_info = lm_timing_section + "\n" + generation_info - - # Append LM-generated metadata to generation_info if available - if lm_generated_metadata: - metadata_lines = [] - if lm_generated_metadata.get('bpm'): - metadata_lines.append(f"- **BPM:** {lm_generated_metadata['bpm']}") - if lm_generated_metadata.get('caption'): - metadata_lines.append(f"- **User Query Rewritten Caption:** {lm_generated_metadata['caption']}") - if lm_generated_metadata.get('duration'): - metadata_lines.append(f"- **Duration:** 
{lm_generated_metadata['duration']} seconds") - if lm_generated_metadata.get('keyscale'): - metadata_lines.append(f"- **KeyScale:** {lm_generated_metadata['keyscale']}") - if lm_generated_metadata.get('language'): - metadata_lines.append(f"- **Language:** {lm_generated_metadata['language']}") - if lm_generated_metadata.get('timesignature'): - metadata_lines.append(f"- **Time Signature:** {lm_generated_metadata['timesignature']}") - - if metadata_lines: - metadata_section = "\n\n**🤖 LM-Generated Metadata:**\n" + "\n\n".join(metadata_lines) - generation_info = metadata_section + "\n\n" + generation_info - - # Update audio codes in UI if LM generated them - codes_outputs = [""] * 8 # Codes for 8 components - if should_use_lm_batch and lm_generated_audio_codes_list: - # Batch mode: update individual codes inputs - for idx in range(min(len(lm_generated_audio_codes_list), 8)): - codes_outputs[idx] = lm_generated_audio_codes_list[idx] - # For single codes input, show first one - updated_audio_codes = lm_generated_audio_codes_list[0] if lm_generated_audio_codes_list else text2music_audio_code_string - else: - # Single mode: update main codes input - updated_audio_codes = lm_generated_audio_codes if lm_generated_audio_codes else text2music_audio_code_string - - # AUTO-SCORING - score_displays = [""] * 8 # Scores for 8 components - if auto_score and all_audio_paths: - from loguru import logger - logger.info(f"Auto-scoring enabled, calculating quality scores for {batch_size_input} generated audios...") - - # Determine which audio codes to use for scoring - if should_use_lm_batch and lm_generated_audio_codes_list: - codes_list = lm_generated_audio_codes_list - elif audio_code_string_to_use and isinstance(audio_code_string_to_use, list): - codes_list = audio_code_string_to_use - else: - # Single code string, replicate for all audios - codes_list = [audio_code_string_to_use] * len(all_audio_paths) - - # Calculate scores only for actually generated audios (up to batch_size_input) - # Don't score beyond the actual batch size to avoid duplicates - actual_audios_to_score = min(len(all_audio_paths), int(batch_size_input)) - for idx in range(actual_audios_to_score): - if idx < len(codes_list) and codes_list[idx]: - try: - score_display = calculate_score_handler( - codes_list[idx], - captions, - lyrics, - lm_generated_metadata, - bpm, key_scale, time_signature, audio_duration, vocal_language, - score_scale - ) - score_displays[idx] = score_display - logger.info(f"Auto-scored audio {idx+1}") - except Exception as e: - logger.error(f"Auto-scoring failed for audio {idx+1}: {e}") - score_displays[idx] = f"❌ Auto-scoring failed: {str(e)}" - - # Prepare audio outputs (up to 8) - audio_outputs = [None] * 8 - for idx in range(min(len(all_audio_paths), 8)): - audio_outputs[idx] = all_audio_paths[idx] - - return ( - audio_outputs[0], # generated_audio_1 - audio_outputs[1], # generated_audio_2 - audio_outputs[2], # generated_audio_3 - audio_outputs[3], # generated_audio_4 - audio_outputs[4], # generated_audio_5 - audio_outputs[5], # generated_audio_6 - audio_outputs[6], # generated_audio_7 - audio_outputs[7], # generated_audio_8 - all_audio_paths, # generated_audio_batch - generation_info, - status_message, - seed_value_for_ui, - align_score_1, - align_text_1, - align_plot_1, - align_score_2, - align_text_2, - align_plot_2, - score_displays[0], # score_display_1 - score_displays[1], # score_display_2 - score_displays[2], # score_display_3 - score_displays[3], # score_display_4 - score_displays[4], # score_display_5 - 
score_displays[5], # score_display_6 - score_displays[6], # score_display_7 - score_displays[7], # score_display_8 - updated_audio_codes, # Update main audio codes in UI - codes_outputs[0], # text2music_audio_code_string_1 - codes_outputs[1], # text2music_audio_code_string_2 - codes_outputs[2], # text2music_audio_code_string_3 - codes_outputs[3], # text2music_audio_code_string_4 - codes_outputs[4], # text2music_audio_code_string_5 - codes_outputs[5], # text2music_audio_code_string_6 - codes_outputs[6], # text2music_audio_code_string_7 - codes_outputs[7], # text2music_audio_code_string_8 - lm_generated_metadata, # Store metadata for "Send to src audio" buttons - is_format_caption, # Keep is_format_caption unchanged - ) - - # Helper function to capture current UI parameters - NOT NEEDED ANYMORE - # Parameters are already captured during generate_with_batch_management - def capture_current_params( - captions, lyrics, bpm, key_scale, time_signature, vocal_language, - inference_steps, guidance_scale, random_seed_checkbox, seed, - reference_audio, audio_duration, batch_size_input, src_audio, - text2music_audio_code_string, repainting_start, repainting_end, - instruction_display_gen, audio_cover_strength, task_type, - use_adg, cfg_interval_start, cfg_interval_end, audio_format, lm_temperature, - think_checkbox, lm_cfg_scale, lm_top_k, lm_top_p, lm_negative_prompt, - use_cot_metas, use_cot_caption, use_cot_language, - constrained_decoding_debug, allow_lm_batch, auto_score, score_scale, lm_batch_chunk_size, - track_name, complete_track_classes # ADDED: missing parameters - ): - """Capture current UI parameters for next batch generation - - IMPORTANT: For AutoGen batches, we clear audio codes to ensure: - - Thinking mode: LM generates NEW codes for each batch - - Non-thinking mode: DiT generates with different random seeds - """ - return { - "captions": captions, - "lyrics": lyrics, - "bpm": bpm, - "key_scale": key_scale, - "time_signature": time_signature, - "vocal_language": vocal_language, - "inference_steps": inference_steps, - "guidance_scale": guidance_scale, - "random_seed_checkbox": True, # Always use random for AutoGen batches - "seed": seed, - "reference_audio": reference_audio, - "audio_duration": audio_duration, - "batch_size_input": batch_size_input, - "src_audio": src_audio, - "text2music_audio_code_string": "", # CLEAR codes for next batch! 
Let LM regenerate or DiT use new seeds - "repainting_start": repainting_start, - "repainting_end": repainting_end, - "instruction_display_gen": instruction_display_gen, - "audio_cover_strength": audio_cover_strength, - "task_type": task_type, - "use_adg": use_adg, - "cfg_interval_start": cfg_interval_start, - "cfg_interval_end": cfg_interval_end, - "audio_format": audio_format, - "lm_temperature": lm_temperature, - "think_checkbox": think_checkbox, - "lm_cfg_scale": lm_cfg_scale, - "lm_top_k": lm_top_k, - "lm_top_p": lm_top_p, - "lm_negative_prompt": lm_negative_prompt, - "use_cot_metas": use_cot_metas, - "use_cot_caption": use_cot_caption, - "use_cot_language": use_cot_language, - "constrained_decoding_debug": constrained_decoding_debug, - "allow_lm_batch": allow_lm_batch, - "auto_score": auto_score, - "score_scale": score_scale, - "lm_batch_chunk_size": lm_batch_chunk_size, - "track_name": track_name, # ADDED - "complete_track_classes": complete_track_classes, # ADDED - } - - # Wrapper function with batch queue management - def generate_with_batch_management( - captions, lyrics, bpm, key_scale, time_signature, vocal_language, - inference_steps, guidance_scale, random_seed_checkbox, seed, - reference_audio, audio_duration, batch_size_input, src_audio, - text2music_audio_code_string, repainting_start, repainting_end, - instruction_display_gen, audio_cover_strength, task_type, - use_adg, cfg_interval_start, cfg_interval_end, audio_format, lm_temperature, - think_checkbox, lm_cfg_scale, lm_top_k, lm_top_p, lm_negative_prompt, - use_cot_metas, use_cot_caption, use_cot_language, is_format_caption, - constrained_decoding_debug, - allow_lm_batch, - auto_score, - score_scale, - lm_batch_chunk_size, - track_name, # ADDED: track name for lego/extract tasks - complete_track_classes, # ADDED: complete track classes - autogen_checkbox, # NEW: AutoGen checkbox state - current_batch_index, # NEW: Current batch index - total_batches, # NEW: Total batches - batch_queue, # NEW: Batch queue - generation_params_state, # NEW: Generation parameters state - progress=gr.Progress(track_tqdm=True) - ): - """ - Wrapper for generate_with_progress that adds batch queue management - """ - # Call the original generation function - result = generate_with_progress( - captions, lyrics, bpm, key_scale, time_signature, vocal_language, - inference_steps, guidance_scale, random_seed_checkbox, seed, - reference_audio, audio_duration, batch_size_input, src_audio, - text2music_audio_code_string, repainting_start, repainting_end, - instruction_display_gen, audio_cover_strength, task_type, - use_adg, cfg_interval_start, cfg_interval_end, audio_format, lm_temperature, - think_checkbox, lm_cfg_scale, lm_top_k, lm_top_p, lm_negative_prompt, - use_cot_metas, use_cot_caption, use_cot_language, is_format_caption, - constrained_decoding_debug, - allow_lm_batch, - auto_score, - score_scale, - lm_batch_chunk_size, - progress - ) - - # Extract results from generation - all_audio_paths = result[8] # generated_audio_batch - generation_info = result[9] - seed_value_for_ui = result[11] - lm_generated_metadata = result[34] # Index 34 is lm_metadata_state - - # --- FIXED: Corrected index offsets for codes extraction --- - # Index 25 is score_display_8 - # Index 26 is updated_audio_codes (Single) - # Index 27-34 are codes_outputs[0] through codes_outputs[7] (Batch 1-8) - generated_codes_single = result[26] - generated_codes_batch = [result[27], result[28], result[29], result[30], result[31], result[32], result[33], result[34]] - - # Determine 
which codes to store based on mode - if allow_lm_batch and batch_size_input >= 2: - # Batch mode: store list of codes - codes_to_store = generated_codes_batch[:int(batch_size_input)] - else: - # Single mode: store single code string - codes_to_store = generated_codes_single - - # --- OPTIMIZATION: Separate "saved params" (for history) and "next params" (for AutoGen) --- - - # 1. Real historical parameters (for storage in Queue, for accurate restoration) - # These record the actual parameter state used for this generation - saved_params = { - "captions": captions, - "lyrics": lyrics, - "bpm": bpm, - "key_scale": key_scale, - "time_signature": time_signature, - "vocal_language": vocal_language, - "inference_steps": inference_steps, - "guidance_scale": guidance_scale, - "random_seed_checkbox": random_seed_checkbox, # Save real checkbox state - "seed": seed, - "reference_audio": reference_audio, - "audio_duration": audio_duration, - "batch_size_input": batch_size_input, - "src_audio": src_audio, - "text2music_audio_code_string": text2music_audio_code_string, # Save real input - "repainting_start": repainting_start, - "repainting_end": repainting_end, - "instruction_display_gen": instruction_display_gen, - "audio_cover_strength": audio_cover_strength, - "task_type": task_type, - "use_adg": use_adg, - "cfg_interval_start": cfg_interval_start, - "cfg_interval_end": cfg_interval_end, - "audio_format": audio_format, - "lm_temperature": lm_temperature, - "think_checkbox": think_checkbox, - "lm_cfg_scale": lm_cfg_scale, - "lm_top_k": lm_top_k, - "lm_top_p": lm_top_p, - "lm_negative_prompt": lm_negative_prompt, - "use_cot_metas": use_cot_metas, - "use_cot_caption": use_cot_caption, - "use_cot_language": use_cot_language, - "constrained_decoding_debug": constrained_decoding_debug, - "allow_lm_batch": allow_lm_batch, - "auto_score": auto_score, - "score_scale": score_scale, - "lm_batch_chunk_size": lm_batch_chunk_size, - "track_name": track_name, - "complete_track_classes": complete_track_classes, - } - - # 2. Next batch parameters (for background AutoGen) - # Based on current params, but clear codes and force random seeds to generate new content - next_params = saved_params.copy() - next_params["text2music_audio_code_string"] = "" # CLEAR! 
Let LM regenerate or DiT use new seeds - next_params["random_seed_checkbox"] = True # Always use random for next batch - - # Store current batch in queue using saved_params (real historical snapshot) - batch_queue = store_batch_in_queue( - batch_queue, - current_batch_index, - all_audio_paths, - generation_info, - seed_value_for_ui, - codes=codes_to_store, # Store the codes used for this batch - allow_lm_batch=allow_lm_batch, # Store batch mode setting - batch_size=int(batch_size_input), # Store batch size - generation_params=saved_params, # <-- Use saved_params for accurate history - lm_generated_metadata=lm_generated_metadata, # Store LM metadata for scoring - status="completed" - ) - - # Update batch counters (start with 1 batch) - # Don't increment total_batches yet - will do that when next batch starts generating - total_batches = max(total_batches, current_batch_index + 1) - - # Update batch indicator - batch_indicator_text = update_batch_indicator(current_batch_index, total_batches) - - # Update navigation button states - can_go_previous, can_go_next = update_navigation_buttons(current_batch_index, total_batches) - - # Prepare next batch status message - next_batch_status_text = "" - if autogen_checkbox: - next_batch_status_text = t("messages.autogen_enabled") - - # Return original results plus batch management state updates - return result + ( - current_batch_index, # Keep current batch index unchanged (still on batch 0) - total_batches, # Updated total batches - batch_queue, # Updated batch queue - next_params, # Pass next_params for background generation (with cleared codes & random seed) - batch_indicator_text, # Update batch indicator - gr.update(interactive=can_go_previous), # prev_batch_btn - gr.update(interactive=can_go_next), # next_batch_btn - next_batch_status_text, # next_batch_status - gr.update(interactive=True), # restore_params_btn - Enable after generation - ) - - # Background generation function - def generate_next_batch_background( - autogen_enabled, - generation_params, - current_batch_index, - total_batches, - batch_queue, - is_format_caption, - progress=gr.Progress(track_tqdm=True) - ): - """ - Generate next batch in background if AutoGen is enabled - """ - from loguru import logger - - # Early return if AutoGen not enabled - if not autogen_enabled: - return ( - batch_queue, - total_batches, - "", # next_batch_status - gr.update(interactive=False), # keep next_batch_btn disabled - ) - - # Calculate next batch index - next_batch_idx = current_batch_index + 1 - - # Check if next batch already exists - if next_batch_idx in batch_queue and batch_queue[next_batch_idx].get("status") == "completed": - # Next batch already generated, enable button - return ( - batch_queue, - total_batches, - t("messages.batch_ready", n=next_batch_idx + 1), - gr.update(interactive=True), - ) - - # Update total batches count - total_batches = next_batch_idx + 1 - - # Update status to show generation starting - gr.Info(t("messages.batch_generating", n=next_batch_idx + 1)) - - # Generate next batch using stored parameters - params = generation_params.copy() - - # DEBUG LOGGING: Log all parameters used for background generation - logger.info(f"========== BACKGROUND GENERATION BATCH {next_batch_idx + 1} ==========") - logger.info(f"Parameters used for background generation:") - logger.info(f" - captions: {params.get('captions', 'N/A')}") - logger.info(f" - lyrics: {params.get('lyrics', 'N/A')[:50]}..." 
if params.get('lyrics') else " - lyrics: N/A") - logger.info(f" - bpm: {params.get('bpm')}") - logger.info(f" - batch_size_input: {params.get('batch_size_input')}") - logger.info(f" - allow_lm_batch: {params.get('allow_lm_batch')}") - logger.info(f" - think_checkbox: {params.get('think_checkbox')}") - logger.info(f" - lm_temperature: {params.get('lm_temperature')}") - logger.info(f" - track_name: {params.get('track_name')}") - logger.info(f" - complete_track_classes: {params.get('complete_track_classes')}") - logger.info(f" - text2music_audio_code_string: {'' if params.get('text2music_audio_code_string') == '' else 'HAS_VALUE'}") - logger.info(f"=========================================================") - - # Add error handling for background generation - try: - # Ensure all parameters have default values to prevent None errors - params.setdefault("captions", "") - params.setdefault("lyrics", "") - params.setdefault("bpm", None) - params.setdefault("key_scale", "") - params.setdefault("time_signature", "") - params.setdefault("vocal_language", "unknown") - params.setdefault("inference_steps", 8) - params.setdefault("guidance_scale", 7.0) - params.setdefault("random_seed_checkbox", True) - params.setdefault("seed", "-1") - params.setdefault("reference_audio", None) - params.setdefault("audio_duration", -1) - params.setdefault("batch_size_input", 2) - params.setdefault("src_audio", None) - params.setdefault("text2music_audio_code_string", "") - params.setdefault("repainting_start", 0.0) - params.setdefault("repainting_end", -1) - params.setdefault("instruction_display_gen", "") - params.setdefault("audio_cover_strength", 1.0) - params.setdefault("task_type", "text2music") - params.setdefault("use_adg", False) - params.setdefault("cfg_interval_start", 0.0) - params.setdefault("cfg_interval_end", 1.0) - params.setdefault("audio_format", "mp3") - params.setdefault("lm_temperature", 0.85) - params.setdefault("think_checkbox", True) - params.setdefault("lm_cfg_scale", 2.0) - params.setdefault("lm_top_k", 0) - params.setdefault("lm_top_p", 0.9) - params.setdefault("lm_negative_prompt", "NO USER INPUT") - params.setdefault("use_cot_metas", True) - params.setdefault("use_cot_caption", True) - params.setdefault("use_cot_language", True) - params.setdefault("constrained_decoding_debug", False) - params.setdefault("allow_lm_batch", True) - params.setdefault("auto_score", False) - params.setdefault("score_scale", 0.5) - params.setdefault("lm_batch_chunk_size", 8) - params.setdefault("track_name", None) - params.setdefault("complete_track_classes", []) - - # Call generate_with_progress with the saved parameters - result = generate_with_progress( - captions=params.get("captions"), - lyrics=params.get("lyrics"), - bpm=params.get("bpm"), - key_scale=params.get("key_scale"), - time_signature=params.get("time_signature"), - vocal_language=params.get("vocal_language"), - inference_steps=params.get("inference_steps"), - guidance_scale=params.get("guidance_scale"), - random_seed_checkbox=params.get("random_seed_checkbox"), - seed=params.get("seed"), - reference_audio=params.get("reference_audio"), - audio_duration=params.get("audio_duration"), - batch_size_input=params.get("batch_size_input"), - src_audio=params.get("src_audio"), - text2music_audio_code_string=params.get("text2music_audio_code_string"), - repainting_start=params.get("repainting_start"), - repainting_end=params.get("repainting_end"), - instruction_display_gen=params.get("instruction_display_gen"), - 
audio_cover_strength=params.get("audio_cover_strength"), - task_type=params.get("task_type"), - use_adg=params.get("use_adg"), - cfg_interval_start=params.get("cfg_interval_start"), - cfg_interval_end=params.get("cfg_interval_end"), - audio_format=params.get("audio_format"), - lm_temperature=params.get("lm_temperature"), - think_checkbox=params.get("think_checkbox"), - lm_cfg_scale=params.get("lm_cfg_scale"), - lm_top_k=params.get("lm_top_k"), - lm_top_p=params.get("lm_top_p"), - lm_negative_prompt=params.get("lm_negative_prompt"), - use_cot_metas=params.get("use_cot_metas"), - use_cot_caption=params.get("use_cot_caption"), - use_cot_language=params.get("use_cot_language"), - is_format_caption=is_format_caption, - constrained_decoding_debug=params.get("constrained_decoding_debug"), - allow_lm_batch=params.get("allow_lm_batch"), - auto_score=params.get("auto_score"), - score_scale=params.get("score_scale"), - lm_batch_chunk_size=params.get("lm_batch_chunk_size"), - progress=progress - ) - - # Extract results - all_audio_paths = result[8] # generated_audio_batch - generation_info = result[9] - seed_value_for_ui = result[11] - lm_generated_metadata = result[34] # Index 34 is lm_metadata_state - - # --- FIXED: Corrected index offsets for codes extraction --- - # Index 25 is score_display_8 - # Index 26 is updated_audio_codes (Single) - # Index 27-34 are codes_outputs[0] through codes_outputs[7] (Batch 1-8) - generated_codes_single = result[26] - generated_codes_batch = [result[27], result[28], result[29], result[30], result[31], result[32], result[33], result[34]] - - # Determine which codes to store - batch_size = params.get("batch_size_input", 2) - allow_lm_batch = params.get("allow_lm_batch", False) - if allow_lm_batch and batch_size >= 2: - codes_to_store = generated_codes_batch[:int(batch_size)] - else: - codes_to_store = generated_codes_single - - # DEBUG LOGGING: Log codes extraction and storage - logger.info(f"Codes extraction for Batch {next_batch_idx + 1}:") - logger.info(f" - allow_lm_batch: {allow_lm_batch}") - logger.info(f" - batch_size: {batch_size}") - logger.info(f" - generated_codes_single exists: {bool(generated_codes_single)}") - if isinstance(codes_to_store, list): - logger.info(f" - codes_to_store: LIST with {len(codes_to_store)} items") - for idx, code in enumerate(codes_to_store): - logger.info(f" * Sample {idx + 1}: {len(code) if code else 0} chars") - else: - logger.info(f" - codes_to_store: STRING with {len(codes_to_store) if codes_to_store else 0} chars") - - # Store next batch in queue with codes, batch settings, and ALL generation params - batch_queue = store_batch_in_queue( - batch_queue, - next_batch_idx, - all_audio_paths, - generation_info, - seed_value_for_ui, - codes=codes_to_store, # Store codes - allow_lm_batch=allow_lm_batch, # Store batch mode setting - batch_size=int(batch_size), # Store batch size - generation_params=params, # Store ALL generation parameters used - lm_generated_metadata=lm_generated_metadata, # Store LM metadata for scoring - status="completed" - ) - - logger.info(f"Batch {next_batch_idx + 1} stored in queue successfully") - - # Success message - next_batch_status = t("messages.batch_ready", n=next_batch_idx + 1) - - # Enable next button now that batch is ready - return ( - batch_queue, - total_batches, - next_batch_status, - gr.update(interactive=True), # Enable next_batch_btn - ) - except Exception as e: - # Handle generation errors - import traceback - error_msg = t("messages.batch_failed", error=str(e)) - gr.Warning(error_msg) - - 
# Mark batch as failed in queue - batch_queue[next_batch_idx] = { - "status": "error", - "error": str(e), - "traceback": traceback.format_exc() - } - - return ( - batch_queue, - total_batches, - error_msg, - gr.update(interactive=False), # Keep next_batch_btn disabled on error - ) - - # Wire up generation button with background generation chaining - generation_section["generate_btn"].click( - fn=generate_with_batch_management, - inputs=[ - generation_section["captions"], - generation_section["lyrics"], - generation_section["bpm"], - generation_section["key_scale"], - generation_section["time_signature"], - generation_section["vocal_language"], - generation_section["inference_steps"], - generation_section["guidance_scale"], - generation_section["random_seed_checkbox"], - generation_section["seed"], - generation_section["reference_audio"], - generation_section["audio_duration"], - generation_section["batch_size_input"], - generation_section["src_audio"], - generation_section["text2music_audio_code_string"], - generation_section["repainting_start"], - generation_section["repainting_end"], - generation_section["instruction_display_gen"], - generation_section["audio_cover_strength"], - generation_section["task_type"], - generation_section["use_adg"], - generation_section["cfg_interval_start"], - generation_section["cfg_interval_end"], - generation_section["audio_format"], - generation_section["lm_temperature"], - generation_section["think_checkbox"], - generation_section["lm_cfg_scale"], - generation_section["lm_top_k"], - generation_section["lm_top_p"], - generation_section["lm_negative_prompt"], - generation_section["use_cot_metas"], - generation_section["use_cot_caption"], - generation_section["use_cot_language"], - results_section["is_format_caption_state"], - generation_section["constrained_decoding_debug"], - generation_section["allow_lm_batch"], - generation_section["auto_score"], - generation_section["score_scale"], - generation_section["lm_batch_chunk_size"], - generation_section["track_name"], # ADDED: For lego/extract tasks - generation_section["complete_track_classes"], # ADDED: For complete task - generation_section["autogen_checkbox"], # NEW: AutoGen checkbox - results_section["current_batch_index"], #NEW: Current batch index - results_section["total_batches"], # NEW: Total batches - results_section["batch_queue"], # NEW: Batch queue - results_section["generation_params_state"], # NEW: Generation parameters - ], - outputs=[ - results_section["generated_audio_1"], - results_section["generated_audio_2"], - results_section["generated_audio_3"], - results_section["generated_audio_4"], - results_section["generated_audio_5"], - results_section["generated_audio_6"], - results_section["generated_audio_7"], - results_section["generated_audio_8"], - results_section["generated_audio_batch"], - results_section["generation_info"], - results_section["status_output"], - generation_section["seed"], - results_section["align_score_1"], - results_section["align_text_1"], - results_section["align_plot_1"], - results_section["align_score_2"], - results_section["align_text_2"], - results_section["align_plot_2"], - results_section["score_display_1"], - results_section["score_display_2"], - results_section["score_display_3"], - results_section["score_display_4"], - results_section["score_display_5"], - results_section["score_display_6"], - results_section["score_display_7"], - results_section["score_display_8"], - generation_section["text2music_audio_code_string"], # Update main audio codes display - 
generation_section["text2music_audio_code_string_1"], # Update codes for sample 1 - generation_section["text2music_audio_code_string_2"], # Update codes for sample 2 - generation_section["text2music_audio_code_string_3"], # Update codes for sample 3 - generation_section["text2music_audio_code_string_4"], # Update codes for sample 4 - generation_section["text2music_audio_code_string_5"], # Update codes for sample 5 - generation_section["text2music_audio_code_string_6"], # Update codes for sample 6 - generation_section["text2music_audio_code_string_7"], # Update codes for sample 7 - generation_section["text2music_audio_code_string_8"], # Update codes for sample 8 - results_section["lm_metadata_state"], # Store metadata - results_section["is_format_caption_state"], # Update is_format_caption state - results_section["current_batch_index"], # NEW: Update current batch index - results_section["total_batches"], # NEW: Update total batches - results_section["batch_queue"], # NEW: Update batch queue - results_section["generation_params_state"], # NEW: Update generation params - results_section["batch_indicator"], # NEW: Update batch indicator - results_section["prev_batch_btn"], # NEW: Update prev button state - results_section["next_batch_btn"], # NEW: Update next button state - results_section["next_batch_status"], # NEW: Update next batch status - results_section["restore_params_btn"], # NEW: Enable restore button after generation - ] - ).then( - # Chain background generation with parameters already stored by generate_with_batch_management - # NOTE: No need to capture_current_params again - already stored at generation time - fn=generate_next_batch_background, - inputs=[ - generation_section["autogen_checkbox"], - results_section["generation_params_state"], # Use params from generate_with_batch_management - results_section["current_batch_index"], - results_section["total_batches"], - results_section["batch_queue"], - results_section["is_format_caption_state"], - ], - outputs=[ - results_section["batch_queue"], - results_section["total_batches"], - results_section["next_batch_status"], - results_section["next_batch_btn"], - ] - ) - - # Update audio components visibility based on batch size - def update_audio_components_visibility(batch_size): - """Show/hide individual audio components based on batch size (1-8) - - Row 1: Components 1-4 (batch_size 1-4) - Row 2: Components 5-8 (batch_size 5-8) - """ - # Clamp batch size to 1-8 range for UI - batch_size = min(max(int(batch_size), 1), 8) - - # Row 1 columns (1-4) - updates_row1 = ( - gr.update(visible=True), # audio_col_1: always visible - gr.update(visible=batch_size >= 2), # audio_col_2 - gr.update(visible=batch_size >= 3), # audio_col_3 - gr.update(visible=batch_size >= 4), # audio_col_4 - ) - - # Row 2 container and columns (5-8) - show_row_5_8 = batch_size >= 5 - updates_row2 = ( - gr.update(visible=show_row_5_8), # audio_row_5_8 (container) - gr.update(visible=batch_size >= 5), # audio_col_5 - gr.update(visible=batch_size >= 6), # audio_col_6 - gr.update(visible=batch_size >= 7), # audio_col_7 - gr.update(visible=batch_size >= 8), # audio_col_8 - ) - - return updates_row1 + updates_row2 - - generation_section["batch_size_input"].change( - fn=update_audio_components_visibility, - inputs=[generation_section["batch_size_input"]], - outputs=[ - # Row 1 (1-4) - results_section["audio_col_1"], - results_section["audio_col_2"], - results_section["audio_col_3"], - results_section["audio_col_4"], - # Row 2 container and columns (5-8) - 
results_section["audio_row_5_8"], - results_section["audio_col_5"], - results_section["audio_col_6"], - results_section["audio_col_7"], - results_section["audio_col_8"], - ] - ) - - # Update LM codes hints display based on src_audio, allow_lm_batch and batch_size - def update_codes_hints_visibility(src_audio, allow_lm_batch, batch_size): - """Switch between single/batch codes input based on src_audio presence - - When src_audio is present: - - Show single mode with transcribe button - - Clear codes (will be filled by transcription) - - When src_audio is absent: - - Hide transcribe button - - Show batch mode if allow_lm_batch=True and batch_size>=2 - - Show single mode otherwise - - Row 1: Codes 1-4 - Row 2: Codes 5-8 (batch_size >= 5) - """ - batch_size = min(max(int(batch_size), 1), 8) - has_src_audio = src_audio is not None - - if has_src_audio: - # Has src_audio: show single mode with transcribe button - return ( - gr.update(visible=True), # codes_single_row - gr.update(visible=False), # codes_batch_row - gr.update(visible=False), # codes_batch_row_2 - *[gr.update(visible=False)] * 8, # Hide all batch columns - gr.update(visible=True), # transcribe_btn: show when src_audio present - ) - else: - # No src_audio: decide between single/batch mode based on settings - if allow_lm_batch and batch_size >= 2: - # Batch mode: hide single, show batch codes with dynamic columns - show_row_2 = batch_size >= 5 - return ( - gr.update(visible=False), # codes_single_row - gr.update(visible=True), # codes_batch_row (row 1) - gr.update(visible=show_row_2), # codes_batch_row_2 (row 2) - # Row 1 columns (1-4) - gr.update(visible=True), # codes_col_1: always visible in batch mode - gr.update(visible=batch_size >= 2), # codes_col_2 - gr.update(visible=batch_size >= 3), # codes_col_3 - gr.update(visible=batch_size >= 4), # codes_col_4 - # Row 2 columns (5-8) - gr.update(visible=batch_size >= 5), # codes_col_5 - gr.update(visible=batch_size >= 6), # codes_col_6 - gr.update(visible=batch_size >= 7), # codes_col_7 - gr.update(visible=batch_size >= 8), # codes_col_8 - gr.update(visible=False), # transcribe_btn: hide when no src_audio - ) - else: - # Single mode: show single, hide batch - return ( - gr.update(visible=True), # codes_single_row - gr.update(visible=False), # codes_batch_row - gr.update(visible=False), # codes_batch_row_2 - *[gr.update(visible=False)] * 8, # Hide all batch columns - gr.update(visible=False), # transcribe_btn: hide when no src_audio - ) - - # Update codes hints when src_audio, allow_lm_batch, or batch_size changes - generation_section["src_audio"].change( - fn=update_codes_hints_visibility, - inputs=[ - generation_section["src_audio"], - generation_section["allow_lm_batch"], - generation_section["batch_size_input"] - ], - outputs=[ - generation_section["codes_single_row"], - generation_section["codes_batch_row"], - generation_section["codes_batch_row_2"], - # Row 1 - generation_section["codes_col_1"], - generation_section["codes_col_2"], - generation_section["codes_col_3"], - generation_section["codes_col_4"], - # Row 2 - generation_section["codes_col_5"], - generation_section["codes_col_6"], - generation_section["codes_col_7"], - generation_section["codes_col_8"], - generation_section["transcribe_btn"], - ] - ) - - generation_section["allow_lm_batch"].change( - fn=update_codes_hints_visibility, - inputs=[ - generation_section["src_audio"], - generation_section["allow_lm_batch"], - generation_section["batch_size_input"] - ], - outputs=[ - generation_section["codes_single_row"], - 
generation_section["codes_batch_row"], - generation_section["codes_batch_row_2"], - # Row 1 - generation_section["codes_col_1"], - generation_section["codes_col_2"], - generation_section["codes_col_3"], - generation_section["codes_col_4"], - # Row 2 - generation_section["codes_col_5"], - generation_section["codes_col_6"], - generation_section["codes_col_7"], - generation_section["codes_col_8"], - generation_section["transcribe_btn"], - ] - ) - - # Also update codes hints when batch_size changes - generation_section["batch_size_input"].change( - fn=update_codes_hints_visibility, - inputs=[ - generation_section["src_audio"], - generation_section["allow_lm_batch"], - generation_section["batch_size_input"] - ], - outputs=[ - generation_section["codes_single_row"], - generation_section["codes_batch_row"], - generation_section["codes_batch_row_2"], - # Row 1 - generation_section["codes_col_1"], - generation_section["codes_col_2"], - generation_section["codes_col_3"], - generation_section["codes_col_4"], - # Row 2 - generation_section["codes_col_5"], - generation_section["codes_col_6"], - generation_section["codes_col_7"], - generation_section["codes_col_8"], - generation_section["transcribe_btn"], - ] - ) - - # Convert src audio to codes - def convert_src_audio_to_codes_wrapper(src_audio): - """Wrapper for converting src audio to codes""" - codes_string = dit_handler.convert_src_audio_to_codes(src_audio) - return codes_string - - generation_section["convert_src_to_codes_btn"].click( - fn=convert_src_audio_to_codes_wrapper, - inputs=[generation_section["src_audio"]], - outputs=[generation_section["text2music_audio_code_string"]] - ) - - # Update instruction and UI visibility based on task type - def update_instruction_ui( - task_type_value: str, - track_name_value: Optional[str], - complete_track_classes_value: list, - audio_codes_content: str = "", - init_llm_checked: bool = False - ) -> tuple: - """Update instruction and UI visibility based on task type.""" - instruction = dit_handler.generate_instruction( - task_type=task_type_value, - track_name=track_name_value, - complete_track_classes=complete_track_classes_value - ) - - # Show track_name for lego and extract - track_name_visible = task_type_value in ["lego", "extract"] - # Show complete_track_classes for complete - complete_visible = task_type_value == "complete" - # Show audio_cover_strength for cover OR when LM is initialized - audio_cover_strength_visible = (task_type_value == "cover") or init_llm_checked - # Determine label and info based on context - if init_llm_checked and task_type_value != "cover": - audio_cover_strength_label = "LM codes strength" - audio_cover_strength_info = "Control how many denoising steps use LM-generated codes" - else: - audio_cover_strength_label = "Audio Cover Strength" - audio_cover_strength_info = "Control how many denoising steps use cover mode" - # Show repainting controls for repaint and lego - repainting_visible = task_type_value in ["repaint", "lego"] - # Show text2music_audio_codes if task is text2music OR if it has content - # This allows it to stay visible even if user switches task type but has codes - has_audio_codes = audio_codes_content and str(audio_codes_content).strip() - text2music_audio_codes_visible = task_type_value == "text2music" or has_audio_codes - - return ( - instruction, # instruction_display_gen - gr.update(visible=track_name_visible), # track_name - gr.update(visible=complete_visible), # complete_track_classes - gr.update(visible=audio_cover_strength_visible, 
-    # Update instruction and UI visibility based on task type
-    def update_instruction_ui(
-        task_type_value: str,
-        track_name_value: Optional[str],
-        complete_track_classes_value: list,
-        audio_codes_content: str = "",
-        init_llm_checked: bool = False
-    ) -> tuple:
-        """Update instruction and UI visibility based on task type."""
-        instruction = dit_handler.generate_instruction(
-            task_type=task_type_value,
-            track_name=track_name_value,
-            complete_track_classes=complete_track_classes_value
-        )
-
-        # Show track_name for lego and extract
-        track_name_visible = task_type_value in ["lego", "extract"]
-        # Show complete_track_classes for complete
-        complete_visible = task_type_value == "complete"
-        # Show audio_cover_strength for cover OR when LM is initialized
-        audio_cover_strength_visible = (task_type_value == "cover") or init_llm_checked
-        # Determine label and info based on context
-        if init_llm_checked and task_type_value != "cover":
-            audio_cover_strength_label = "LM codes strength"
-            audio_cover_strength_info = "Control how many denoising steps use LM-generated codes"
-        else:
-            audio_cover_strength_label = "Audio Cover Strength"
-            audio_cover_strength_info = "Control how many denoising steps use cover mode"
-        # Show repainting controls for repaint and lego
-        repainting_visible = task_type_value in ["repaint", "lego"]
-        # Show text2music_audio_codes if task is text2music OR if it has content.
-        # This keeps it visible even if the user switches task type but already has codes.
-        has_audio_codes = audio_codes_content and str(audio_codes_content).strip()
-        text2music_audio_codes_visible = task_type_value == "text2music" or has_audio_codes
-
-        return (
-            instruction,  # instruction_display_gen
-            gr.update(visible=track_name_visible),  # track_name
-            gr.update(visible=complete_visible),  # complete_track_classes
-            gr.update(visible=audio_cover_strength_visible,
-                      label=audio_cover_strength_label, info=audio_cover_strength_info),  # audio_cover_strength
-            gr.update(visible=repainting_visible),  # repainting_group
-            gr.update(visible=text2music_audio_codes_visible),  # text2music_audio_codes_group
-        )
-
-    # Bind update_instruction_ui to task_type, track_name, and complete_track_classes changes
-    generation_section["task_type"].change(
-        fn=update_instruction_ui,
-        inputs=[
-            generation_section["task_type"],
-            generation_section["track_name"],
-            generation_section["complete_track_classes"],
-            generation_section["text2music_audio_code_string"],
-            generation_section["init_llm_checkbox"]
-        ],
-        outputs=[
-            generation_section["instruction_display_gen"],
-            generation_section["track_name"],
-            generation_section["complete_track_classes"],
-            generation_section["audio_cover_strength"],
-            generation_section["repainting_group"],
-            generation_section["text2music_audio_codes_group"],
-        ]
-    )
-
-    # Also update instruction when track_name changes (for lego/extract tasks)
-    generation_section["track_name"].change(
-        fn=update_instruction_ui,
-        inputs=[
-            generation_section["task_type"],
-            generation_section["track_name"],
-            generation_section["complete_track_classes"],
-            generation_section["text2music_audio_code_string"],
-            generation_section["init_llm_checkbox"]
-        ],
-        outputs=[
-            generation_section["instruction_display_gen"],
-            generation_section["track_name"],
-            generation_section["complete_track_classes"],
-            generation_section["audio_cover_strength"],
-            generation_section["repainting_group"],
-            generation_section["text2music_audio_codes_group"],
-        ]
-    )
-
-    # Also update instruction when complete_track_classes changes (for complete task)
-    generation_section["complete_track_classes"].change(
-        fn=update_instruction_ui,
-        inputs=[
-            generation_section["task_type"],
-            generation_section["track_name"],
-            generation_section["complete_track_classes"],
-            generation_section["text2music_audio_code_string"],
-            generation_section["init_llm_checkbox"]
-        ],
-        outputs=[
-            generation_section["instruction_display_gen"],
-            generation_section["track_name"],
-            generation_section["complete_track_classes"],
-            generation_section["audio_cover_strength"],
-            generation_section["repainting_group"],
-            generation_section["text2music_audio_codes_group"],
-        ]
-    )
-    # Send generated audio to src_audio and populate metadata
-    def send_audio_to_src_with_metadata(audio_file, lm_metadata):
-        """Send generated audio file to src_audio input and populate metadata fields
-
-        Args:
-            audio_file: Audio file path
-            lm_metadata: Dictionary containing LM-generated metadata
-
-        Returns:
-            Tuple of (audio_file, bpm, caption, lyrics, duration, key_scale, language,
-            time_signature, is_format_caption)
-        """
-        if audio_file is None:
-            return None, None, None, None, None, None, None, None, True  # Keep is_format_caption as True
-
-        # Extract metadata fields if available
-        bpm_value = None
-        caption_value = None
-        lyrics_value = None
-        duration_value = None
-        key_scale_value = None
-        language_value = None
-        time_signature_value = None
-
-        if lm_metadata:
-            # BPM
-            if lm_metadata.get('bpm'):
-                bpm_str = lm_metadata.get('bpm')
-                if bpm_str and bpm_str != "N/A":
-                    try:
-                        bpm_value = int(bpm_str)
-                    except (ValueError, TypeError):
-                        pass
-
-            # Caption (Rewritten Caption)
-            if lm_metadata.get('caption'):
-                caption_value = lm_metadata.get('caption')
-
-            # Lyrics
-            if lm_metadata.get('lyrics'):
-                lyrics_value = lm_metadata.get('lyrics')
-
-            # Duration
-            if lm_metadata.get('duration'):
-                duration_str = lm_metadata.get('duration')
-                if duration_str and duration_str != "N/A":
-                    try:
-                        duration_value = float(duration_str)
-                    except (ValueError, TypeError):
-                        pass
-
-            # KeyScale
-            if lm_metadata.get('keyscale'):
-                key_scale_str = lm_metadata.get('keyscale')
-                if key_scale_str and key_scale_str != "N/A":
-                    key_scale_value = key_scale_str
-
-            # Language
-            if lm_metadata.get('language'):
-                language_str = lm_metadata.get('language')
-                if language_str and language_str != "N/A":
-                    language_value = language_str
-
-            # Time Signature
-            if lm_metadata.get('timesignature'):
-                time_sig_str = lm_metadata.get('timesignature')
-                if time_sig_str and time_sig_str != "N/A":
-                    time_signature_value = time_sig_str
-
-        return (
-            audio_file,
-            bpm_value,
-            caption_value,
-            lyrics_value,
-            duration_value,
-            key_scale_value,
-            language_value,
-            time_signature_value,
-            True  # Set is_format_caption to True (from LM-generated metadata)
-        )
-
-    results_section["send_to_src_btn_1"].click(
-        fn=send_audio_to_src_with_metadata,
-        inputs=[
-            results_section["generated_audio_1"],
-            results_section["lm_metadata_state"]
-        ],
-        outputs=[
-            generation_section["src_audio"],
-            generation_section["bpm"],
-            generation_section["captions"],
-            generation_section["lyrics"],
-            generation_section["audio_duration"],
-            generation_section["key_scale"],
-            generation_section["vocal_language"],
-            generation_section["time_signature"],
-            results_section["is_format_caption_state"]
-        ]
-    )
-
-    results_section["send_to_src_btn_2"].click(
-        fn=send_audio_to_src_with_metadata,
-        inputs=[
-            results_section["generated_audio_2"],
-            results_section["lm_metadata_state"]
-        ],
-        outputs=[
-            generation_section["src_audio"],
-            generation_section["bpm"],
-            generation_section["captions"],
-            generation_section["lyrics"],
-            generation_section["audio_duration"],
-            generation_section["key_scale"],
-            generation_section["vocal_language"],
-            generation_section["time_signature"],
-            results_section["is_format_caption_state"]
-        ]
-    )
-
-    # Sample button - smart sample (uses LM if initialized, otherwise examples)
-    # Need to add is_format_caption return value to sample_example_smart
-    def sample_example_smart_with_flag(task_type: str, constrained_decoding_debug: bool):
-        """Wrapper for sample_example_smart that adds is_format_caption flag"""
-        result = sample_example_smart(task_type, constrained_decoding_debug)
-        # Add True at the end to set is_format_caption
-        return result + (True,)
-
-    generation_section["sample_btn"].click(
-        fn=sample_example_smart_with_flag,
-        inputs=[
-            generation_section["task_type"],
-            generation_section["constrained_decoding_debug"]
-        ],
-        outputs=[
-            generation_section["captions"],
-            generation_section["lyrics"],
-            generation_section["think_checkbox"],
-            generation_section["bpm"],
-            generation_section["audio_duration"],
-            generation_section["key_scale"],
-            generation_section["vocal_language"],
-            generation_section["time_signature"],
-            results_section["is_format_caption_state"]  # Set is_format_caption to True (from Sample/LM)
-        ]
-    )
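-    # The field-by-field extraction above repeats one pattern: skip missing or
-    # "N/A" values, otherwise coerce to the target type. A minimal helper sketch
-    # (hypothetical name, not used by the handlers above) that captures it:
-    def parse_meta_field(metadata, key, cast=str):
-        """Return cast(metadata[key]), or None if the field is missing, "N/A", or uncastable."""
-        value = (metadata or {}).get(key)
-        if value in (None, "", "N/A"):
-            return None
-        try:
-            return cast(value)
-        except (ValueError, TypeError):
-            return None
-    # e.g. parse_meta_field(lm_metadata, "bpm", int) and
-    #      parse_meta_field(lm_metadata, "duration", float)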
-    # Transcribe audio codes to metadata (or generate example if empty)
-    def transcribe_audio_codes(audio_code_string, constrained_decoding_debug):
-        """
-        Transcribe audio codes to metadata using LLM understanding.
-        If audio_code_string is empty, generate a sample example instead.
-
-        Args:
-            audio_code_string: String containing audio codes (or empty for example generation)
-            constrained_decoding_debug: Whether to enable debug logging for constrained decoding
-
-        Returns:
-            Tuple of (status_message, caption, lyrics, bpm, duration, keyscale, language,
-            timesignature, is_format_caption)
-        """
-        if not llm_handler.llm_initialized:
-            return t("messages.lm_not_initialized"), "", "", None, None, "", "", "", False  # 9 values to match outputs
-
-        # If codes are empty, this becomes a "generate example" task
-        # Use "NO USER INPUT" as the input to generate a sample
-        if not audio_code_string or not audio_code_string.strip():
-            audio_code_string = "NO USER INPUT"
-
-        # Call LLM understanding
-        metadata, status = llm_handler.understand_audio_from_codes(
-            audio_codes=audio_code_string,
-            use_constrained_decoding=True,
-            constrained_decoding_debug=constrained_decoding_debug,
-        )
-
-        # Extract fields for UI update
-        caption = metadata.get('caption', '')
-        lyrics = metadata.get('lyrics', '')
-        bpm = metadata.get('bpm')
-        duration = metadata.get('duration')
-        keyscale = metadata.get('keyscale', '')
-        language = metadata.get('language', '')
-        timesignature = metadata.get('timesignature', '')
-
-        # Convert to appropriate types
-        try:
-            bpm = int(bpm) if bpm and bpm != 'N/A' else None
-        except (ValueError, TypeError):
-            bpm = None
-
-        try:
-            duration = float(duration) if duration and duration != 'N/A' else None
-        except (ValueError, TypeError):
-            duration = None
-
-        return (
-            status,
-            caption,
-            lyrics,
-            bpm,
-            duration,
-            keyscale,
-            language,
-            timesignature,
-            True  # Set is_format_caption to True (from Transcribe/LM understanding)
-        )
-
-    # Update transcribe button text based on whether codes are present
-    def update_transcribe_button_text(audio_code_string):
-        """
-        Update the transcribe button text based on input content:
-        "Generate Example" when empty, "Transcribe" when codes are present.
-        """
-        if not audio_code_string or not audio_code_string.strip():
-            return gr.update(value="Generate Example")
-        else:
-            return gr.update(value="Transcribe")
-
-    # Update button text when codes change
-    generation_section["text2music_audio_code_string"].change(
-        fn=update_transcribe_button_text,
-        inputs=[generation_section["text2music_audio_code_string"]],
-        outputs=[generation_section["transcribe_btn"]]
-    )
-
-    generation_section["transcribe_btn"].click(
-        fn=transcribe_audio_codes,
-        inputs=[
-            generation_section["text2music_audio_code_string"],
-            generation_section["constrained_decoding_debug"]
-        ],
-        outputs=[
-            results_section["status_output"],  # Show status
-            generation_section["captions"],  # Update caption field
-            generation_section["lyrics"],  # Update lyrics field
-            generation_section["bpm"],  # Update BPM field
-            generation_section["audio_duration"],  # Update duration field
-            generation_section["key_scale"],  # Update keyscale field
-            generation_section["vocal_language"],  # Update language field
-            generation_section["time_signature"],  # Update time signature field
-            results_section["is_format_caption_state"]  # Set is_format_caption to True
-        ]
-    )
-
-    # Reset is_format_caption to False when user manually edits fields
-    def reset_format_caption_flag():
-        """Reset is_format_caption to False when user manually edits caption/metadata"""
-        return False
-
-    # Connect reset function to all user-editable metadata fields
-    generation_section["captions"].change(
-        fn=reset_format_caption_flag,
-        inputs=[],
-        outputs=[results_section["is_format_caption_state"]]
-    )
-
-    generation_section["lyrics"].change(
-        fn=reset_format_caption_flag,
-        inputs=[],
-        outputs=[results_section["is_format_caption_state"]]
-    )
-    generation_section["bpm"].change(
-        fn=reset_format_caption_flag,
-        inputs=[],
-        outputs=[results_section["is_format_caption_state"]]
-    )
-
-    generation_section["key_scale"].change(
-        fn=reset_format_caption_flag,
-        inputs=[],
-        outputs=[results_section["is_format_caption_state"]]
-    )
-
-    generation_section["time_signature"].change(
-        fn=reset_format_caption_flag,
-        inputs=[],
-        outputs=[results_section["is_format_caption_state"]]
-    )
-
-    generation_section["vocal_language"].change(
-        fn=reset_format_caption_flag,
-        inputs=[],
-        outputs=[results_section["is_format_caption_state"]]
-    )
-
-    generation_section["audio_duration"].change(
-        fn=reset_format_caption_flag,
-        inputs=[],
-        outputs=[results_section["is_format_caption_state"]]
-    )
-
-    # Auto-expand Audio Uploads accordion when audio is uploaded
-    def update_audio_uploads_accordion(reference_audio, src_audio):
-        """Update Audio Uploads accordion open state based on whether audio files are present"""
-        has_audio = (reference_audio is not None) or (src_audio is not None)
-        return gr.update(open=has_audio)
-
-    # Bind to both audio components' change events
-    generation_section["reference_audio"].change(
-        fn=update_audio_uploads_accordion,
-        inputs=[generation_section["reference_audio"], generation_section["src_audio"]],
-        outputs=[generation_section["audio_uploads_accordion"]]
-    )
-
-    generation_section["src_audio"].change(
-        fn=update_audio_uploads_accordion,
-        inputs=[generation_section["reference_audio"], generation_section["src_audio"]],
-        outputs=[generation_section["audio_uploads_accordion"]]
-    )
-
-    # Save audio and metadata handlers - downloads as zip package
-    results_section["save_btn_1"].click(
-        fn=save_audio_and_metadata,
-        inputs=[
-            results_section["generated_audio_1"],
-            generation_section["task_type"],
-            generation_section["captions"],
-            generation_section["lyrics"],
-            generation_section["vocal_language"],
-            generation_section["bpm"],
-            generation_section["key_scale"],
-            generation_section["time_signature"],
-            generation_section["audio_duration"],
-            generation_section["batch_size_input"],
-            generation_section["inference_steps"],
-            generation_section["guidance_scale"],
-            generation_section["seed"],
-            generation_section["random_seed_checkbox"],
-            generation_section["use_adg"],
-            generation_section["cfg_interval_start"],
-            generation_section["cfg_interval_end"],
-            generation_section["audio_format"],
-            generation_section["lm_temperature"],
-            generation_section["lm_cfg_scale"],
-            generation_section["lm_top_k"],
-            generation_section["lm_top_p"],
-            generation_section["lm_negative_prompt"],
-            generation_section["use_cot_caption"],
-            generation_section["use_cot_language"],
-            generation_section["audio_cover_strength"],
-            generation_section["think_checkbox"],
-            generation_section["text2music_audio_code_string"],
-            generation_section["repainting_start"],
-            generation_section["repainting_end"],
-            generation_section["track_name"],
-            generation_section["complete_track_classes"],
-            results_section["lm_metadata_state"],
-        ],
-        outputs=[gr.File(label="Download Package", visible=False)]
-    )
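-    # save_btn_1 and save_btn_2 differ only in which audio component they pass; a
-    # minimal sketch of how the shared inputs list could be factored (hypothetical
-    # helper, shown for illustration):
-    def make_save_inputs(audio_component):
-        """Inputs list for save_audio_and_metadata, varying only the audio slot."""
-        return [audio_component] + [
-            generation_section[key] for key in (
-                "task_type", "captions", "lyrics", "vocal_language", "bpm",
-                "key_scale", "time_signature", "audio_duration", "batch_size_input",
-                "inference_steps", "guidance_scale", "seed", "random_seed_checkbox",
-                "use_adg", "cfg_interval_start", "cfg_interval_end", "audio_format",
-                "lm_temperature", "lm_cfg_scale", "lm_top_k", "lm_top_p",
-                "lm_negative_prompt", "use_cot_caption", "use_cot_language",
-                "audio_cover_strength", "think_checkbox",
-                "text2music_audio_code_string", "repainting_start", "repainting_end",
-                "track_name", "complete_track_classes",
-            )
-        ] + [results_section["lm_metadata_state"]]
-    # e.g. inputs=make_save_inputs(results_section["generated_audio_2"]) in the
-    # save_btn_2 binding below.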
generation_section["audio_duration"], - generation_section["batch_size_input"], - generation_section["inference_steps"], - generation_section["guidance_scale"], - generation_section["seed"], - generation_section["random_seed_checkbox"], - generation_section["use_adg"], - generation_section["cfg_interval_start"], - generation_section["cfg_interval_end"], - generation_section["audio_format"], - generation_section["lm_temperature"], - generation_section["lm_cfg_scale"], - generation_section["lm_top_k"], - generation_section["lm_top_p"], - generation_section["lm_negative_prompt"], - generation_section["use_cot_caption"], - generation_section["use_cot_language"], - generation_section["audio_cover_strength"], - generation_section["think_checkbox"], - generation_section["text2music_audio_code_string"], - generation_section["repainting_start"], - generation_section["repainting_end"], - generation_section["track_name"], - generation_section["complete_track_classes"], - results_section["lm_metadata_state"], - ], - outputs=[gr.File(label="Download Package", visible=False)] - ) - - # Load metadata handler - triggered when file is uploaded via UploadButton - generation_section["load_file"].upload( - fn=load_metadata, - inputs=[generation_section["load_file"]], - outputs=[ - generation_section["task_type"], - generation_section["captions"], - generation_section["lyrics"], - generation_section["vocal_language"], - generation_section["bpm"], - generation_section["key_scale"], - generation_section["time_signature"], - generation_section["audio_duration"], - generation_section["batch_size_input"], - generation_section["inference_steps"], - generation_section["guidance_scale"], - generation_section["seed"], - generation_section["random_seed_checkbox"], - generation_section["use_adg"], - generation_section["cfg_interval_start"], - generation_section["cfg_interval_end"], - generation_section["audio_format"], - generation_section["lm_temperature"], - generation_section["lm_cfg_scale"], - generation_section["lm_top_k"], - generation_section["lm_top_p"], - generation_section["lm_negative_prompt"], - generation_section["use_cot_caption"], - generation_section["use_cot_language"], - generation_section["audio_cover_strength"], - generation_section["think_checkbox"], - generation_section["text2music_audio_code_string"], - generation_section["repainting_start"], - generation_section["repainting_end"], - generation_section["track_name"], - generation_section["complete_track_classes"], - results_section["is_format_caption_state"] - ] - ) - - # Instrumental checkbox handler - auto-fill [Instrumental] when checked - def handle_instrumental_checkbox(instrumental_checked, current_lyrics): - """ - Handle instrumental checkbox changes. 
-    # Instrumental checkbox handler - auto-fill [Instrumental] when checked
-    def handle_instrumental_checkbox(instrumental_checked, current_lyrics):
-        """
-        Handle instrumental checkbox changes.
-
-        When checked: if no lyrics, fill with [Instrumental]
-        When unchecked: if lyrics is [Instrumental], clear it
-        """
-        if instrumental_checked:
-            # If checked and no lyrics, fill with [Instrumental]
-            if not current_lyrics or not current_lyrics.strip():
-                return "[Instrumental]"
-            else:
-                # Has lyrics, don't change
-                return current_lyrics
-        else:
-            # If unchecked and lyrics is exactly [Instrumental], clear it
-            if current_lyrics and current_lyrics.strip() == "[Instrumental]":
-                return ""
-            else:
-                # Has other lyrics, don't change
-                return current_lyrics
-
-    generation_section["instrumental_checkbox"].change(
-        fn=handle_instrumental_checkbox,
-        inputs=[generation_section["instrumental_checkbox"], generation_section["lyrics"]],
-        outputs=[generation_section["lyrics"]]
-    )
-
-    # Score calculation handlers
-    def update_batch_score(current_batch_index, batch_queue, sample_idx, score_display):
-        """Update score for a specific sample in the current batch"""
-        if current_batch_index in batch_queue:
-            if "scores" not in batch_queue[current_batch_index]:
-                batch_queue[current_batch_index]["scores"] = [""] * 8
-            batch_queue[current_batch_index]["scores"][sample_idx - 1] = score_display
-        return batch_queue
-
-    def calculate_score_handler_with_selection(
-        sample_idx,
-        score_scale,
-        current_batch_index,
-        batch_queue
-    ):
-        """
-        Calculate PMI-based quality score - REFACTORED to read from batch_queue only.
-        This ensures scoring uses the actual generation parameters, not current UI values.
-
-        Args:
-            sample_idx: Which sample to score (1-8)
-            score_scale: Sensitivity scale parameter (tool setting, can be from UI)
-            current_batch_index: Current batch index
-            batch_queue: Batch queue containing historical generation data
-        """
-        if current_batch_index not in batch_queue:
-            return t("messages.scoring_failed"), batch_queue
-
-        batch_data = batch_queue[current_batch_index]
-        params = batch_data.get("generation_params", {})
-
-        # Read ALL parameters from historical batch data
-        caption = params.get("captions", "")
-        lyrics = params.get("lyrics", "")
-        bpm = params.get("bpm")
-        key_scale = params.get("key_scale", "")
-        time_signature = params.get("time_signature", "")
-        audio_duration = params.get("audio_duration", -1)
-        vocal_language = params.get("vocal_language", "")
-
-        # Get LM metadata from batch_data (if it was saved during generation)
-        lm_metadata = batch_data.get("lm_generated_metadata", None)
-
-        # Get codes from batch_data
-        stored_codes = batch_data.get("codes", "")
-        stored_allow_lm_batch = batch_data.get("allow_lm_batch", False)
-
-        # Select correct codes for this sample
-        audio_codes_str = ""
-        if stored_allow_lm_batch and isinstance(stored_codes, list):
-            # Batch mode: use specific sample's codes
-            if 0 <= sample_idx - 1 < len(stored_codes):
-                audio_codes_str = stored_codes[sample_idx - 1]
-        else:
-            # Single mode: all samples use same codes
-            audio_codes_str = stored_codes if isinstance(stored_codes, str) else ""
-
-        # Calculate score using historical parameters
-        score_display = calculate_score_handler(
-            audio_codes_str, caption, lyrics, lm_metadata,
-            bpm, key_scale, time_signature, audio_duration, vocal_language,
-            score_scale
-        )
-
-        # Update batch_queue with the calculated score
-        batch_queue = update_batch_score(current_batch_index, batch_queue, sample_idx, score_display)
-
-        return score_display, batch_queue
-    def calculate_score_handler(audio_codes_str, caption, lyrics, lm_metadata, bpm, key_scale, time_signature, audio_duration, vocal_language, score_scale):
-        """
-        Calculate PMI-based quality score for generated audio.
-
-        PMI (Pointwise Mutual Information) removes condition bias:
-            score = log P(condition|codes) - log P(condition)
-
-        Args:
-            audio_codes_str: Generated audio codes string
-            caption: Caption text used for generation
-            lyrics: Lyrics text used for generation
-            lm_metadata: LM-generated metadata dictionary (from CoT generation)
-            bpm: BPM value
-            key_scale: Key scale value
-            time_signature: Time signature value
-            audio_duration: Audio duration value
-            vocal_language: Vocal language value
-            score_scale: Sensitivity scale parameter
-
-        Returns:
-            Score display string
-        """
-        from acestep.test_time_scaling import calculate_pmi_score_per_condition
-
-        if not llm_handler.llm_initialized:
-            return t("messages.lm_not_initialized")
-
-        if not audio_codes_str or not audio_codes_str.strip():
-            return t("messages.no_codes")
-
-        try:
-            # Build metadata dictionary from both LM metadata and user inputs
-            metadata = {}
-
-            # Priority 1: Use LM-generated metadata if available
-            if lm_metadata and isinstance(lm_metadata, dict):
-                metadata.update(lm_metadata)
-
-            # Priority 2: Add user-provided metadata (if not already in LM metadata)
-            if bpm is not None and 'bpm' not in metadata:
-                try:
-                    metadata['bpm'] = int(bpm)
-                except (ValueError, TypeError):
-                    pass
-
-            if caption and 'caption' not in metadata:
-                metadata['caption'] = caption
-
-            if audio_duration is not None and audio_duration > 0 and 'duration' not in metadata:
-                try:
-                    metadata['duration'] = int(audio_duration)
-                except (ValueError, TypeError):
-                    pass
-
-            if key_scale and key_scale.strip() and 'keyscale' not in metadata:
-                metadata['keyscale'] = key_scale.strip()
-
-            if vocal_language and vocal_language.strip() and 'language' not in metadata:
-                metadata['language'] = vocal_language.strip()
-
-            if time_signature and time_signature.strip() and 'timesignature' not in metadata:
-                metadata['timesignature'] = time_signature.strip()
-
-            # Calculate per-condition scores with appropriate metrics:
-            # - Metadata fields (bpm, duration, etc.): Top-k recall
-            # - Caption and lyrics: PMI (normalized)
-            scores_per_condition, global_score, status = calculate_pmi_score_per_condition(
-                llm_handler=llm_handler,
-                audio_codes=audio_codes_str,
-                caption=caption or "",
-                lyrics=lyrics or "",
-                metadata=metadata if metadata else None,
-                temperature=1.0,
-                topk=10,
-                score_scale=score_scale
-            )
-
-            # Format display string with per-condition breakdown
-            if global_score == 0.0 and not scores_per_condition:
-                return t("messages.score_failed", error=status)
-            else:
-                # Build per-condition scores display
-                condition_lines = []
-                for condition_name, score_value in sorted(scores_per_condition.items()):
-                    condition_lines.append(
-                        f"  • {condition_name}: {score_value:.4f}"
-                    )
-
-                conditions_display = "\n".join(condition_lines) if condition_lines else "  (no conditions)"
-
-                return (
-                    f"✅ Global Quality Score: {global_score:.4f} (0-1, higher=better)\n\n"
-                    f"📊 Per-Condition Scores (0-1):\n{conditions_display}\n\n"
-                    f"Note: Metadata uses Top-k Recall, Caption/Lyrics use PMI\n"
-                )
-
-        except Exception as e:
-            import traceback
-            error_msg = t("messages.score_error", error=str(e)) + f"\n{traceback.format_exc()}"
-            return error_msg
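-    # The PMI formula from the docstring above, as a minimal self-contained sketch
-    # (toy log-probabilities; not the calculate_pmi_score_per_condition implementation):
-    def pmi_score(logp_condition_given_codes, logp_condition):
-        """PMI = log P(condition|codes) - log P(condition); positive means the codes
-        made the condition more likely than its prior."""
-        return logp_condition_given_codes - logp_condition
-    # e.g. pmi_score(-2.0, -5.0) == 3.0: a caption that is unlikely a priori but well
-    # explained by the codes scores high, which is how condition bias is removed.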
results_section["batch_queue"], - ] - - results_section["score_btn_1"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(1), - outputs=[results_section["score_display_1"], results_section["batch_queue"]] - ) - - results_section["score_btn_2"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(2), - outputs=[results_section["score_display_2"], results_section["batch_queue"]] - ) - - results_section["score_btn_3"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(3), - outputs=[results_section["score_display_3"], results_section["batch_queue"]] - ) - - results_section["score_btn_4"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(4), - outputs=[results_section["score_display_4"], results_section["batch_queue"]] - ) - - results_section["score_btn_5"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(5), - outputs=[results_section["score_display_5"], results_section["batch_queue"]] - ) - - results_section["score_btn_6"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(6), - outputs=[results_section["score_display_6"], results_section["batch_queue"]] - ) - - results_section["score_btn_7"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(7), - outputs=[results_section["score_display_7"], results_section["batch_queue"]] - ) - - results_section["score_btn_8"].click( - fn=calculate_score_handler_with_selection, - inputs=get_score_btn_inputs(8), - outputs=[results_section["score_display_8"], results_section["batch_queue"]] - ) - - # Send to src handlers for audio 3 and 4 - results_section["send_to_src_btn_3"].click( - fn=send_audio_to_src_with_metadata, - inputs=[ - results_section["generated_audio_3"], - results_section["lm_metadata_state"] - ], - outputs=[ - generation_section["src_audio"], - generation_section["bpm"], - generation_section["captions"], - generation_section["lyrics"], - generation_section["audio_duration"], - generation_section["key_scale"], - generation_section["vocal_language"], - generation_section["time_signature"], - results_section["is_format_caption_state"] - ] - ) - - results_section["send_to_src_btn_4"].click( - fn=send_audio_to_src_with_metadata, - inputs=[ - results_section["generated_audio_4"], - results_section["lm_metadata_state"] - ], - outputs=[ - generation_section["src_audio"], - generation_section["bpm"], - generation_section["captions"], - generation_section["lyrics"], - generation_section["audio_duration"], - generation_section["key_scale"], - generation_section["vocal_language"], - generation_section["time_signature"], - results_section["is_format_caption_state"] - ] - ) - - # Send to src handlers for audio 5-8 - results_section["send_to_src_btn_5"].click( - fn=send_audio_to_src_with_metadata, - inputs=[results_section["generated_audio_5"], results_section["lm_metadata_state"]], - outputs=[ - generation_section["src_audio"], generation_section["bpm"], generation_section["captions"], - generation_section["lyrics"], generation_section["audio_duration"], generation_section["key_scale"], - generation_section["vocal_language"], generation_section["time_signature"], results_section["is_format_caption_state"] - ] - ) - - results_section["send_to_src_btn_6"].click( - fn=send_audio_to_src_with_metadata, - inputs=[results_section["generated_audio_6"], results_section["lm_metadata_state"]], - outputs=[ - generation_section["src_audio"], 
generation_section["bpm"], generation_section["captions"], - generation_section["lyrics"], generation_section["audio_duration"], generation_section["key_scale"], - generation_section["vocal_language"], generation_section["time_signature"], results_section["is_format_caption_state"] - ] - ) - - results_section["send_to_src_btn_7"].click( - fn=send_audio_to_src_with_metadata, - inputs=[results_section["generated_audio_7"], results_section["lm_metadata_state"]], - outputs=[ - generation_section["src_audio"], generation_section["bpm"], generation_section["captions"], - generation_section["lyrics"], generation_section["audio_duration"], generation_section["key_scale"], - generation_section["vocal_language"], generation_section["time_signature"], results_section["is_format_caption_state"] - ] - ) - - results_section["send_to_src_btn_8"].click( - fn=send_audio_to_src_with_metadata, - inputs=[results_section["generated_audio_8"], results_section["lm_metadata_state"]], - outputs=[ - generation_section["src_audio"], generation_section["bpm"], generation_section["captions"], - generation_section["lyrics"], generation_section["audio_duration"], generation_section["key_scale"], - generation_section["vocal_language"], generation_section["time_signature"], results_section["is_format_caption_state"] - ] - ) - - # Navigation button handlers - REFACTORED: Only update results, never touch input UI - def navigate_to_previous_batch( - current_batch_index, - batch_queue, - ): - """Navigate to previous batch (Result View Only - Never touches Input UI)""" - if current_batch_index <= 0: - gr.Warning(t("messages.at_first_batch")) - return [gr.update()] * 24 - - # Move to previous batch - new_batch_index = current_batch_index - 1 - - # Load batch data from queue - if new_batch_index not in batch_queue: - gr.Warning(t("messages.batch_not_found", n=new_batch_index + 1)) - return [gr.update()] * 24 - - batch_data = batch_queue[new_batch_index] - audio_paths = batch_data.get("audio_paths", []) - generation_info_text = batch_data.get("generation_info", "") - - # Prepare audio outputs (up to 8) - audio_outputs = [None] * 8 - for idx in range(min(len(audio_paths), 8)): - audio_outputs[idx] = audio_paths[idx] - - # Update batch indicator - total_batches = len(batch_queue) - batch_indicator_text = update_batch_indicator(new_batch_index, total_batches) - - # Update button states - can_go_previous, can_go_next = update_navigation_buttons(new_batch_index, total_batches) - - # Restore score displays from batch queue - stored_scores = batch_data.get("scores", [""] * 8) - score_displays = stored_scores if stored_scores else [""] * 8 - - return ( - audio_outputs[0], # generated_audio_1 - audio_outputs[1], # generated_audio_2 - audio_outputs[2], # generated_audio_3 - audio_outputs[3], # generated_audio_4 - audio_outputs[4], # generated_audio_5 - audio_outputs[5], # generated_audio_6 - audio_outputs[6], # generated_audio_7 - audio_outputs[7], # generated_audio_8 - audio_paths, # generated_audio_batch - generation_info_text, # generation_info - new_batch_index, # current_batch_index - batch_indicator_text, # batch_indicator - gr.update(interactive=can_go_previous), # prev_batch_btn - gr.update(interactive=can_go_next), # next_batch_btn - t("messages.viewing_batch", n=new_batch_index + 1), # status_output - score_displays[0], # score_display_1 - score_displays[1], # score_display_2 - score_displays[2], # score_display_3 - score_displays[3], # score_display_4 - score_displays[4], # score_display_5 - score_displays[5], # score_display_6 
-    def navigate_to_next_batch(
-        autogen_enabled,
-        current_batch_index,
-        total_batches,
-        batch_queue,
-    ):
-        """Navigate to next batch (Result View Only - Never touches Input UI)"""
-        if current_batch_index >= total_batches - 1:
-            gr.Warning(t("messages.at_last_batch"))
-            return [gr.update()] * 25
-
-        # Move to next batch
-        new_batch_index = current_batch_index + 1
-
-        # Load batch data from queue
-        if new_batch_index not in batch_queue:
-            gr.Warning(t("messages.batch_not_found", n=new_batch_index + 1))
-            return [gr.update()] * 25
-
-        batch_data = batch_queue[new_batch_index]
-        audio_paths = batch_data.get("audio_paths", [])
-        generation_info_text = batch_data.get("generation_info", "")
-
-        # Prepare audio outputs (up to 8)
-        audio_outputs = [None] * 8
-        for idx in range(min(len(audio_paths), 8)):
-            audio_outputs[idx] = audio_paths[idx]
-
-        # Update batch indicator
-        batch_indicator_text = update_batch_indicator(new_batch_index, total_batches)
-
-        # Update button states
-        can_go_previous, can_go_next = update_navigation_buttons(new_batch_index, total_batches)
-
-        # Prepare next batch status message
-        next_batch_status_text = ""
-        is_latest_view = (new_batch_index == total_batches - 1)
-        if autogen_enabled and is_latest_view:
-            next_batch_status_text = "🔄 AutoGen will generate next batch in background..."
-
-        # Restore score displays from batch queue
-        stored_scores = batch_data.get("scores", [""] * 8)
-        score_displays = stored_scores if stored_scores else [""] * 8
-
-        return (
-            audio_outputs[0],  # generated_audio_1
-            audio_outputs[1],  # generated_audio_2
-            audio_outputs[2],  # generated_audio_3
-            audio_outputs[3],  # generated_audio_4
-            audio_outputs[4],  # generated_audio_5
-            audio_outputs[5],  # generated_audio_6
-            audio_outputs[6],  # generated_audio_7
-            audio_outputs[7],  # generated_audio_8
-            audio_paths,  # generated_audio_batch
-            generation_info_text,  # generation_info
-            new_batch_index,  # current_batch_index
-            batch_indicator_text,  # batch_indicator
-            gr.update(interactive=can_go_previous),  # prev_batch_btn
-            gr.update(interactive=can_go_next),  # next_batch_btn
-            t("messages.viewing_batch", n=new_batch_index + 1),  # status_output
-            next_batch_status_text,  # next_batch_status
-            score_displays[0],  # score_display_1
-            score_displays[1],  # score_display_2
-            score_displays[2],  # score_display_3
-            score_displays[3],  # score_display_4
-            score_displays[4],  # score_display_5
-            score_displays[5],  # score_display_6
-            score_displays[6],  # score_display_7
-            score_displays[7],  # score_display_8
-            gr.update(interactive=True),  # restore_params_btn - enable when viewing a batch
-            # NO generation_section outputs - Input UI remains untouched!
-        )
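-    # Both navigators share the same state rule over the dict-keyed queue; a
-    # minimal sketch of that rule in isolation (pure function, illustrative only):
-    def batch_nav_state(index, queue):
-        """Return (can_go_previous, can_go_next, batch_data_or_None) for a view index."""
-        total = len(queue)
-        return index > 0, index < total - 1, queue.get(index)
-    # e.g. with queue = {0: {...}, 1: {...}}: batch_nav_state(0, queue) gives
-    # (False, True, {...}); at index 1 the next button stays disabled until the
-    # background generation stores another batch in the queue.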
- """ - if current_batch_index not in batch_queue: - gr.Warning(t("messages.no_batch_data")) - return [gr.update()] * 29 # Match number of outputs - - batch_data = batch_queue[current_batch_index] - params = batch_data.get("generation_params", {}) - - # Extract all parameters with defaults - captions = params.get("captions", "") - lyrics = params.get("lyrics", "") - bpm = params.get("bpm", None) - key_scale = params.get("key_scale", "") - time_signature = params.get("time_signature", "") - vocal_language = params.get("vocal_language", "unknown") - audio_duration = params.get("audio_duration", -1) - batch_size_input = params.get("batch_size_input", 2) - inference_steps = params.get("inference_steps", 8) - lm_temperature = params.get("lm_temperature", 0.85) - lm_cfg_scale = params.get("lm_cfg_scale", 2.0) - lm_top_k = params.get("lm_top_k", 0) - lm_top_p = params.get("lm_top_p", 0.9) - think_checkbox = params.get("think_checkbox", True) - use_cot_caption = params.get("use_cot_caption", True) - use_cot_language = params.get("use_cot_language", True) - allow_lm_batch = params.get("allow_lm_batch", True) - track_name = params.get("track_name", None) - complete_track_classes = params.get("complete_track_classes", []) - - # Extract and process codes (prefer actual codes from batch_data over params) - stored_codes = batch_data.get("codes", "") - stored_allow_lm_batch = params.get("allow_lm_batch", False) - - codes_outputs = [""] * 9 # [Main, 1-8] - if stored_codes: - if stored_allow_lm_batch and isinstance(stored_codes, list): - # Batch mode: populate codes 1-8, main shows first - codes_outputs[0] = stored_codes[0] if stored_codes else "" - for idx in range(min(len(stored_codes), 8)): - codes_outputs[idx + 1] = stored_codes[idx] - else: - # Single mode: populate main, clear 1-8 - codes_outputs[0] = stored_codes if isinstance(stored_codes, str) else (stored_codes[0] if stored_codes else "") - - gr.Info(t("messages.params_restored", n=current_batch_index + 1)) - - return ( - codes_outputs[0], # text2music_audio_code_string - codes_outputs[1], # text2music_audio_code_string_1 - codes_outputs[2], # text2music_audio_code_string_2 - codes_outputs[3], # text2music_audio_code_string_3 - codes_outputs[4], # text2music_audio_code_string_4 - codes_outputs[5], # text2music_audio_code_string_5 - codes_outputs[6], # text2music_audio_code_string_6 - codes_outputs[7], # text2music_audio_code_string_7 - codes_outputs[8], # text2music_audio_code_string_8 - captions, - lyrics, - bpm, - key_scale, - time_signature, - vocal_language, - audio_duration, - batch_size_input, - inference_steps, - lm_temperature, - lm_cfg_scale, - lm_top_k, - lm_top_p, - think_checkbox, - use_cot_caption, - use_cot_language, - allow_lm_batch, - track_name, - complete_track_classes - ) - - # Wire up navigation buttons - REFACTORED: Results-only outputs - results_section["prev_batch_btn"].click( - fn=navigate_to_previous_batch, - inputs=[ - results_section["current_batch_index"], - results_section["batch_queue"], - ], - outputs=[ - results_section["generated_audio_1"], - results_section["generated_audio_2"], - results_section["generated_audio_3"], - results_section["generated_audio_4"], - results_section["generated_audio_5"], - results_section["generated_audio_6"], - results_section["generated_audio_7"], - results_section["generated_audio_8"], - results_section["generated_audio_batch"], - results_section["generation_info"], - results_section["current_batch_index"], - results_section["batch_indicator"], - results_section["prev_batch_btn"], - 
results_section["next_batch_btn"], - results_section["status_output"], - results_section["score_display_1"], - results_section["score_display_2"], - results_section["score_display_3"], - results_section["score_display_4"], - results_section["score_display_5"], - results_section["score_display_6"], - results_section["score_display_7"], - results_section["score_display_8"], - results_section["restore_params_btn"], # Enable restore button - # NO generation_section outputs - Input UI preserved across navigation! - ] - ) - - # REFACTORED: Capture->Navigate->Generate chain with Input/Result decoupling - results_section["next_batch_btn"].click( - # Step 1: Capture current UI parameters (user's modifications like BS=8) - fn=capture_current_params, - inputs=[ - generation_section["captions"], - generation_section["lyrics"], - generation_section["bpm"], - generation_section["key_scale"], - generation_section["time_signature"], - generation_section["vocal_language"], - generation_section["inference_steps"], - generation_section["guidance_scale"], - generation_section["random_seed_checkbox"], - generation_section["seed"], - generation_section["reference_audio"], - generation_section["audio_duration"], - generation_section["batch_size_input"], - generation_section["src_audio"], - generation_section["text2music_audio_code_string"], - generation_section["repainting_start"], - generation_section["repainting_end"], - generation_section["instruction_display_gen"], - generation_section["audio_cover_strength"], - generation_section["task_type"], - generation_section["use_adg"], - generation_section["cfg_interval_start"], - generation_section["cfg_interval_end"], - generation_section["audio_format"], - generation_section["lm_temperature"], - generation_section["think_checkbox"], - generation_section["lm_cfg_scale"], - generation_section["lm_top_k"], - generation_section["lm_top_p"], - generation_section["lm_negative_prompt"], - generation_section["use_cot_metas"], - generation_section["use_cot_caption"], - generation_section["use_cot_language"], - generation_section["constrained_decoding_debug"], - generation_section["allow_lm_batch"], - generation_section["auto_score"], - generation_section["score_scale"], - generation_section["lm_batch_chunk_size"], - generation_section["track_name"], - generation_section["complete_track_classes"], - ], - outputs=[results_section["generation_params_state"]] - ).then( - # Step 2: Navigate to next batch (updates results only, preserves input UI) - fn=navigate_to_next_batch, - inputs=[ - generation_section["autogen_checkbox"], - results_section["current_batch_index"], - results_section["total_batches"], - results_section["batch_queue"], - ], - outputs=[ - results_section["generated_audio_1"], - results_section["generated_audio_2"], - results_section["generated_audio_3"], - results_section["generated_audio_4"], - results_section["generated_audio_5"], - results_section["generated_audio_6"], - results_section["generated_audio_7"], - results_section["generated_audio_8"], - results_section["generated_audio_batch"], - results_section["generation_info"], - results_section["current_batch_index"], - results_section["batch_indicator"], - results_section["prev_batch_btn"], - results_section["next_batch_btn"], - results_section["status_output"], - results_section["next_batch_status"], - results_section["score_display_1"], - results_section["score_display_2"], - results_section["score_display_3"], - results_section["score_display_4"], - results_section["score_display_5"], - 
results_section["score_display_6"], - results_section["score_display_7"], - results_section["score_display_8"], - results_section["restore_params_btn"], # Enable restore button - # NO generation_section outputs - Input UI preserved across navigation! - ] - ).then( - # Step 3: Generate next batch in background (uses captured params from Step 1) - fn=generate_next_batch_background, - inputs=[ - generation_section["autogen_checkbox"], - results_section["generation_params_state"], # Uses Step 1 captured params - results_section["current_batch_index"], - results_section["total_batches"], - results_section["batch_queue"], - results_section["is_format_caption_state"], - ], - outputs=[ - results_section["batch_queue"], - results_section["total_batches"], - results_section["next_batch_status"], - results_section["next_batch_btn"], - ] - ) - - # Bind restore parameters button - Bridge between Result View and Input View - results_section["restore_params_btn"].click( - fn=restore_batch_parameters, - inputs=[ - results_section["current_batch_index"], - results_section["batch_queue"] - ], - outputs=[ - generation_section["text2music_audio_code_string"], - generation_section["text2music_audio_code_string_1"], - generation_section["text2music_audio_code_string_2"], - generation_section["text2music_audio_code_string_3"], - generation_section["text2music_audio_code_string_4"], - generation_section["text2music_audio_code_string_5"], - generation_section["text2music_audio_code_string_6"], - generation_section["text2music_audio_code_string_7"], - generation_section["text2music_audio_code_string_8"], - generation_section["captions"], - generation_section["lyrics"], - generation_section["bpm"], - generation_section["key_scale"], - generation_section["time_signature"], - generation_section["vocal_language"], - generation_section["audio_duration"], - generation_section["batch_size_input"], - generation_section["inference_steps"], - generation_section["lm_temperature"], - generation_section["lm_cfg_scale"], - generation_section["lm_top_k"], - generation_section["lm_top_p"], - generation_section["think_checkbox"], - generation_section["use_cot_caption"], - generation_section["use_cot_language"], - generation_section["allow_lm_batch"], - generation_section["track_name"], - generation_section["complete_track_classes"], - ] - ) -