ai_qc/backend/api_server.py

#!/usr/bin/env python3
"""
API server for Visual AI QC application.
Provides API endpoints for visual quality control checks without web UI.
"""
import os
import sys
import json
import base64
import collections
import html
import importlib
import traceback
import re
import threading
import time
from concurrent.futures import ThreadPoolExecutor, as_completed
from datetime import datetime, timedelta
from pathlib import Path
from flask import Flask, request, jsonify, Response, make_response, g, redirect
from dotenv import load_dotenv

# Determine environment and load appropriate config
def load_environment_config():
    """Load environment-specific configuration"""
    # Check for environment variable first
    environment = os.environ.get('ENVIRONMENT', 'development')

    # Determine config file path based on environment
    base_dir = os.path.dirname(os.path.abspath(__file__))

    # Try new config structure first
    config_path = os.path.join(base_dir, 'config', f'{environment}.env')

    # Fall back to old config.env if new structure doesn't exist
    if not os.path.exists(config_path):
        old_config_path = os.path.join(base_dir, 'config.env')
        if os.path.exists(old_config_path):
            config_path = old_config_path
            environment = 'production'  # Assume production for backward compatibility
            print(f"Using legacy config file: {config_path}")
        else:
            print(f"No configuration file found. Checked: {config_path} and {old_config_path}")
            return environment

    # Load the configuration
    load_dotenv(config_path)
    print(f"Environment: {environment}")
    print(f"Loaded configuration from: {config_path}")
    print(f"OPENAI_API_KEY set: {'OPENAI_API_KEY' in os.environ}")
    print(f"GOOGLE_API_KEY set: {'GOOGLE_API_KEY' in os.environ}")
    print(f"Port: {os.environ.get('PORT', 'not set')}")

    return environment

# Load environment configuration
current_environment = load_environment_config()

# Add the parent directory to the Python path to ensure imports work correctly
sys.path.append(os.path.dirname(os.path.abspath(__file__)))

# Import QC utilities and model configuration
from visual_qc_apps.utils import get_image_from_asset
from llm_config import run_visual_qc, get_model_info
from profile_config import QC_CHECKS, PROFILES, get_profile, get_check_llm_map
from brand_guidelines_db import BrandGuidelinesDB
from auth_middleware import AuthMiddleware
from technical_check import inspect as technical_inspect, format_for_llm_prompt as technical_to_prompt
import box_jwt_client
from PIL import Image
import io

# Create Flask app
app = Flask(__name__)

# Configure app based on environment
upload_folder = os.environ.get('UPLOAD_FOLDER', 'uploads')
output_folder = os.environ.get('OUTPUT_FOLDER', 'output')
debug_mode = os.environ.get('DEBUG_MODE', 'false').lower() == 'true'

app.config['UPLOAD_FOLDER'] = upload_folder
app.config['OUTPUT_FOLDER'] = output_folder
app.config['MAX_CONTENT_LENGTH'] = 100 * 1024 * 1024  # 100MB max file size
app.config['SECRET_KEY'] = os.environ.get('SECRET_KEY', 'default-secret-change-this')
app.debug = debug_mode

print(f"Upload folder: {upload_folder}")
print(f"Output folder: {output_folder}")
print(f"Debug mode: {debug_mode}")

# Ensure directories exist
os.makedirs(app.config['UPLOAD_FOLDER'], exist_ok=True)
os.makedirs(app.config['OUTPUT_FOLDER'], exist_ok=True)

# Initialize authentication middleware
auth = AuthMiddleware(app)

# Initialize brand guidelines database
brand_db = BrandGuidelinesDB()

# Initialize media plans storage
MEDIA_PLANS_DIR = os.path.join(os.path.dirname(os.path.abspath(__file__)), 'media_plans')
os.makedirs(MEDIA_PLANS_DIR, exist_ok=True)
MEDIA_PLANS_DB_FILE = os.path.join(MEDIA_PLANS_DIR, 'plans_db.json')

def _load_media_plans_db():
    if os.path.exists(MEDIA_PLANS_DB_FILE):
        try:
            with open(MEDIA_PLANS_DB_FILE, 'r') as f:
                return json.load(f)
        except (json.JSONDecodeError, FileNotFoundError):
            pass
    return {}

def _save_media_plans_db(db):
    with open(MEDIA_PLANS_DB_FILE, 'w') as f:
        json.dump(db, f, indent=2)

def _get_active_media_plan(client_id):
    """Get the parsed media plan data for a client, or None."""
    db = _load_media_plans_db()
    plan_info = db.get(client_id)
    if not plan_info:
        return None
    json_path = plan_info.get('json_path')
    if json_path and os.path.exists(json_path):
        try:
            with open(json_path, 'r') as f:
                return json.load(f)
        except (json.JSONDecodeError, FileNotFoundError):
            pass
    return None

# Global progress tracking
progress_tracker = {}

# Dictionary to store QC app instances and prompts
qc_apps = {}

# Define QC checks that require reference assets
REFERENCE_ASSET_REQUIRED_CHECKS = {'brand_assets_visibility', 'visual_hierarchy', 'logo_visibility'}

def extract_json_from_response(response_text):
    """Extract JSON objects from the LLM's response"""
    # First, try to find JSON blocks (```json ... ```)
    json_pattern = r'```json\s*(.*?)\s*```'
    json_matches = re.finditer(json_pattern, response_text, re.DOTALL)

    # Get all JSON blocks as a list
    json_objects = []
    for match in json_matches:
        try:
            json_data = json.loads(match.group(1).strip())
            json_objects.append(json_data)
        except Exception as e:
            print(f"Could not parse JSON block: {e}")

    # If we found multiple JSON blocks, merge them (later blocks override earlier blocks)
    if json_objects:
        merged_json = {}
        for json_obj in json_objects:
            if json_obj:  # If not empty
                merged_json.update(json_obj)
        if merged_json:
            return merged_json

    # If we couldn't extract JSON blocks or they were empty, look for JSON directly
    try:
        # Try to find pure JSON in response (without code blocks)
        # Remove markdown code formatting first
        clean_response = re.sub(r'```.*?```', '', response_text, flags=re.DOTALL)

        # Look for text that looks like JSON (between { and })
        json_pattern = r'\{.*\}'
        json_match = re.search(json_pattern, clean_response, re.DOTALL)
        if json_match:
            try:
                json_data = json.loads(json_match.group(0))
                return json_data
            except json.JSONDecodeError:
                pass
    except Exception as e:
        print(f"Failed to extract direct JSON: {e}")

    # If we couldn't find valid JSON, return an empty dict
    return {}

def detect_and_crop_main_element(image_path, file_type_hint=None):
    """Detect main element in POS files and return cropped region coordinates"""
    try:
        if not file_type_hint or 'pos' not in file_type_hint.lower():
            return None

        # Create a prompt to detect the main marketing element
        crop_detection_prompt = """
        This appears to be a POS (Point of Sale) material. Please identify the main marketing element that should be used for QC analysis.

        Look for the primary branded content area (usually the center panel or main marketing message) and ignore peripheral elements like:
        - Side panels with fine print
        - Edge decorations
        - Background patterns
        - Border elements

        Respond with JSON format:
        {
            "main_element_detected": true/false,
            "crop_coordinates": {
                "x": left_position_percentage,
                "y": top_position_percentage,
                "width": width_percentage,
                "height": height_percentage
            },
            "description": "description of the main element found"
        }

        Coordinates should be percentages (0-100) of the total image dimensions.
        """

        # Run AI analysis to detect main element
        result = run_visual_qc(
            prompt=crop_detection_prompt,
            asset_path=image_path,
            model_name="Gemini"
        )

        # Extract crop coordinates
        crop_data = extract_json_from_response(result['response'])

        if crop_data.get('main_element_detected') and 'crop_coordinates' in crop_data:
            return crop_data['crop_coordinates']

        return None

    except Exception as e:
        print(f"Error detecting main element: {e}")
        return None

def apply_crop_to_analysis(image_path, crop_coordinates):
    """Apply cropping to image for analysis (if coordinates provided)"""
    if not crop_coordinates:
        return image_path

    try:
        from PIL import Image
        import os

        # Load original image
        with Image.open(image_path) as img:
            width, height = img.size

            # Convert percentage coordinates to pixels
            x = int((crop_coordinates['x'] / 100) * width)
            y = int((crop_coordinates['y'] / 100) * height)
            crop_width = int((crop_coordinates['width'] / 100) * width)
            crop_height = int((crop_coordinates['height'] / 100) * height)

            # Ensure coordinates are within image bounds
            x = max(0, min(x, width))
            y = max(0, min(y, height))
            crop_width = min(crop_width, width - x)
            crop_height = min(crop_height, height - y)

            # Crop the image
            cropped_img = img.crop((x, y, x + crop_width, y + crop_height))

            # Save cropped version
            filename, ext = os.path.splitext(image_path)
            cropped_path = f"{filename}_cropped{ext}"
            cropped_img.save(cropped_path)

            return cropped_path

    except Exception as e:
        print(f"Error applying crop: {e}")
        return image_path

    return image_path

def extract_score_from_result(result, profile_config=None, check_name=None):
    """Extract score from LLM result response with Unilever-specific logic"""
    score = None
    try:
        # Use our extraction function to get score from JSON blocks
        json_data = extract_json_from_response(result['response'])

        # Unilever Key Visual profile specific logic
        if (profile_config and
            ((hasattr(profile_config, 'name') and profile_config.name == 'Unilever Key Visual') or
             (hasattr(profile_config, 'get') and profile_config.get('name') == 'Unilever Key Visual')) and
            check_name in ['face_visibility', 'new_visibility', 'face_gaze_direction']):

            # Check for zero score conditions based on missing elements
            if check_name == 'face_visibility' and json_data.get('face_present') == False:
                print(f"Unilever profile: No face detected for {check_name}, setting score to 0")
                return 0

            elif check_name == 'new_visibility' and json_data.get('new_present') == False:
                print(f"Unilever profile: No 'new' element detected for {check_name}, setting score to 0")
                return 0

            elif check_name == 'face_gaze_direction' and json_data.get('face_present') == False:
                print(f"Unilever profile: No face detected for {check_name}, setting score to 0")
                return 0

        # Standard scoring logic
        if 'score' in json_data:
            score = json_data.get('score')
            print(f"Extracted score from JSON block: {score}")

        # If we still don't have a score, look for any score in text
        if score is None:
            # Try to find a score pattern in the text
            score_pattern = r'["\']score["\']\s*:\s*(\d+)'
            score_match = re.search(score_pattern, result['response'])
            if score_match:
                score = int(score_match.group(1))
                print(f"Extracted score from regex: {score}")
            else:
                # Look for descriptive scores in text
                descriptive_score_pattern = r'score(?:\s+is|\s*:\s*|\s+of\s+)(?:\s*)(\d+)(?:\s*out\s*of\s*10)?'
                descriptive_match = re.search(descriptive_score_pattern, result['response'].lower())
                if descriptive_match:
                    score = int(descriptive_match.group(1))
                    print(f"Extracted score from descriptive text: {score}")
                else:
                    # Try to determine score from pass/fail status (legacy mode)
                    result_text = result.get('response', '').upper()
                    if "PASS" in result_text:
                        score = 10  # Pass = 10/10
                        print("Detected PASS keyword, setting score to 10")
                    elif "FAIL" in result_text:
                        score = 3   # Fail = 3/10
                        print("Detected FAIL keyword, setting score to 3")
                    else:
                        score = 5  # Default middle score
                        print(f"Could not extract score, using default of 5")
    except Exception as parse_error:
        print(f"Error parsing score from response: {parse_error}")
        score = 5  # Default to middle score

    return score if score is not None else 5

def determine_grade(overall_score):
    """Determine Pass/Fail based on overall score"""
    # Convert overall score to individual check average (1-10 scale)
    avg_individual_score = overall_score / 10
    if avg_individual_score >= 6:
        return 'Pass'
    else:
        return 'Fail'

def _run_dj_file_naming_check(check_name, file_path, profile_weights):
    """
    Deterministic file-naming check for the Dow Jones / OLIVER convention.
    Bypasses the LLM dispatch entirely; returns a result dict shaped like an LLM check
    so it slots into the existing scoring + report pipeline.
    """
    from file_naming_validator import validate_filename
    filename = os.path.basename(file_path) if file_path else ''
    validation = validate_filename(filename)
    weight = profile_weights.get(check_name, 0.1)
    score = validation['score']
    weighted_score = score * weight
    return {
        'check_name': check_name,
        'status': 'success',
        'response': validation['explanation'],
        'json_data': validation,
        'score': score,
        'weight': weight,
        'weighted_score': weighted_score,
        'model_used': {'model': 'deterministic', 'provider': 'internal'},
        'token_usage': {'input_tokens': 0, 'output_tokens': 0},
        'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
        'display_name': 'DJ File Naming',
        'brand_guidelines_status': None,
        'requires_brand_guidelines': False,
    }


def process_single_check(check_name, qc_apps, profile_config, profile_weights, file_path,
                        analysis_reference_asset, brand_db, progress_tracker, session_id,
                        check_index, total_checks, model_version=None, media_plan_context=None,
                        ocr_context=None):
    """Process a single QC check - designed to run in parallel"""
    try:
        # Deterministic file-naming check — short-circuit before any LLM dispatch.
        if check_name == 'dj_file_naming':
            return _run_dj_file_naming_check(check_name, file_path, profile_weights)

        # Check if this check requires a reference asset but none is provided
        if check_name in REFERENCE_ASSET_REQUIRED_CHECKS and not analysis_reference_asset:
            # Return automatic fail with score 0
            fail_response = f"Reference asset is required for the '{check_name}' QC check but was not provided."
            return {
                'check_name': check_name,
                'status': 'success',
                'score': 0,
                'result': 'Fail',
                'response': fail_response,
                'json_data': {},
                'requires_brand_guidelines': False,
                'brand_guidelines_status': None
            }
        check_prompt = qc_apps[check_name]['prompt']
        llm_model = profile_config.get_check_llm(check_name)

        # Handle brand guidelines if needed
        requires_brand_guidelines = any(keyword in check_prompt.lower() for keyword in [
            'brand guideline', 'brand standard', 'brand requirement', 'brand specification',
            'brand compliance', 'brand rule', 'brand policy'
        ])

        brand_guidelines_status = None
        detected_brand = None
        # Since we skip triage, we won't have detected_brand automatically
        # Could be enhanced with direct brand detection if needed

        if requires_brand_guidelines and detected_brand:
            brand_guidelines = brand_db.get_brand_guidelines(detected_brand)
            if brand_guidelines:
                brand_guidelines_status = f"Brand guidelines found for {detected_brand} ({len(brand_guidelines)} files)."
                # Add guidelines to prompt (simplified version)
                check_prompt += f"\n\nBrand Analysis Context: Using brand guidelines for {detected_brand}."
            else:
                brand_guidelines_status = f"INFO: Brand detected as '{detected_brand}' but no brand guidelines found."

        # Add pre-analysis instructions if available
        final_prompt = check_prompt
        if profile_config.pre_analysis_instructions:
            final_prompt = profile_config.pre_analysis_instructions + "\n\n" + check_prompt

        # Add reference asset content if selected
        reference_image_path = None
        if analysis_reference_asset:
            reference_content = get_reference_asset_content(analysis_reference_asset)
            if reference_content:
                final_prompt = reference_content + "\n\n" + final_prompt
                print(f"Added reference asset {analysis_reference_asset} to {check_name} prompt")

            # Also get the actual reference image path for LLM
            reference_image_path = get_reference_asset_image_path(analysis_reference_asset)

        # Add media plan context if available
        if media_plan_context:
            final_prompt = final_prompt + "\n" + media_plan_context

        # Add OCR measurement context for checks that evaluate spatial layout
        try:
            from ocr_measurement import OCR_RELEVANT_CHECKS as _ocr_checks
            ocr_enabled = check_name in _ocr_checks
        except ImportError:
            ocr_enabled = False
        if ocr_context and ocr_enabled:
            final_prompt = final_prompt + "\n" + ocr_context

        tech_report = progress_tracker.get(session_id, {}).get('technical_report')
        if tech_report:
            try:
                final_prompt = technical_to_prompt(tech_report) + "\n\n" + final_prompt
            except Exception:
                pass  # Pre-flight context is best-effort; never block the check on it.

        print(f"Running check {check_index + 1}/{total_checks}: {check_name}")

        result = run_visual_qc(
            prompt=final_prompt,
            asset_path=file_path,
            reference_path=reference_image_path,
            model_name=llm_model,
            model_version=model_version
        )

        # Extract score and data
        json_data = extract_json_from_response(result['response'])
        score = extract_score_from_result(result, profile_config, check_name)
        weight = profile_weights.get(check_name, 0.1)
        weighted_score = score * weight if score is not None else 0

        return {
            'check_name': check_name,
            'status': 'success',
            'result': result,
            'response': result['response'],
            'brand_guidelines_status': brand_guidelines_status,
            'requires_brand_guidelines': requires_brand_guidelines,
            'json_data': json_data,
            'score': score,
            'weight': weight,
            'weighted_score': weighted_score,
            'model_used': result.get('model_info', {}),
            'token_usage': result.get('token_usage', {}),
            'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
            'display_name': check_name.replace('_', ' ').title()
        }

    except Exception as e:
        print(f"Error in check {check_name}: {str(e)}")
        weight = profile_weights.get(check_name, 0.1)
        return {
            'check_name': check_name,
            'status': 'error',
            'error': str(e),
            'weight': weight,
            'score': 0,
            'weighted_score': 0
        }

def process_checks_in_batches(enabled_checks, qc_apps, profile_config, profile_weights,
                             file_path, analysis_reference_asset, brand_db, progress_tracker,
                             session_id, batch_size=15, media_plan_context=None, ocr_context=None):
    """Process QC checks in parallel batches"""
    check_results = {}
    total_checks = len(enabled_checks)
    completed_checks = 0

    print(f"Processing {total_checks} checks in batches of {batch_size}")

    # Split checks into batches
    for batch_start in range(0, total_checks, batch_size):
        batch_end = min(batch_start + batch_size, total_checks)
        batch_checks = enabled_checks[batch_start:batch_end]
        batch_number = (batch_start // batch_size) + 1
        total_batches = (total_checks + batch_size - 1) // batch_size

        print(f"Processing batch {batch_number}/{total_batches} ({len(batch_checks)} checks)")

        # Update progress for batch start
        progress_tracker[session_id].update({
            'current_batch': batch_number,
            'total_batches': total_batches,
            'current_check': f"Batch {batch_number}",
            'current_check_display': f"Processing batch {batch_number}/{total_batches}",
            'percentage': 10 + ((completed_checks / total_checks) * 80)
        })

        # Process batch in parallel
        with ThreadPoolExecutor(max_workers=batch_size) as executor:
            # Submit all checks in the batch
            future_to_check = {}
            for i, check_name in enumerate(batch_checks):
                future = executor.submit(
                    process_single_check,
                    check_name, qc_apps, profile_config, profile_weights, file_path,
                    analysis_reference_asset, brand_db, progress_tracker, session_id,
                    batch_start + i, total_checks, None, media_plan_context, ocr_context
                )
                future_to_check[future] = check_name

            # Collect results as they complete
            batch_results = {}
            for future in as_completed(future_to_check):
                check_name = future_to_check[future]
                try:
                    result = future.result()
                    batch_results[result['check_name']] = result
                    completed_checks += 1

                    # Update progress for each completed check
                    progress_tracker[session_id].update({
                        'completed_checks': completed_checks,
                        'percentage': 10 + ((completed_checks / total_checks) * 80)
                    })

                    print(f"Completed check: {check_name} ({completed_checks}/{total_checks})")

                except Exception as e:
                    print(f"Error getting result for check {check_name}: {str(e)}")
                    weight = profile_weights.get(check_name, 0.1)
                    batch_results[check_name] = {
                        'check_name': check_name,
                        'status': 'error',
                        'error': str(e),
                        'weight': weight,
                        'score': 0,
                        'weighted_score': 0
                    }
                    completed_checks += 1

            # Add batch results to main results
            check_results.update(batch_results)

        print(f"Completed batch {batch_number}/{total_batches}")

        # Small delay between batches to avoid overwhelming the APIs
        if batch_number < total_batches:
            time.sleep(0.5)

    print(f"Completed all {total_checks} checks in {total_batches} batches")
    return check_results

def process_single_check_with_triage(check_name, qc_apps, profile_config, profile_weights, file_path,
                                    reference_asset, brand_db, progress_tracker, session_id,
                                    check_index, total_checks, model_version=None):
    """Process a single QC check with triage logic - designed to run in parallel"""
    try:
        # Deterministic file-naming check — short-circuit before any LLM dispatch.
        if check_name == 'dj_file_naming':
            return _run_dj_file_naming_check(check_name, file_path, profile_weights)

        # Check if this check requires a reference asset but none is provided
        if check_name in REFERENCE_ASSET_REQUIRED_CHECKS and not reference_asset:
            # Return automatic fail with score 0
            fail_response = f"Reference asset is required for the '{check_name}' QC check but was not provided."
            return {
                'check_name': check_name,
                'status': 'success',
                'score': 0,
                'result': 'Fail',
                'response': fail_response,
                'json_data': {},
                'requires_brand_guidelines': False,
                'brand_guidelines_status': None
            }
        check_prompt = qc_apps[check_name]['prompt']
        llm_model = profile_config.get_check_llm(check_name)

        # Check if this check requires brand guidelines
        requires_brand_guidelines = any(keyword in check_prompt.lower() for keyword in [
            'brand guideline', 'brand standard', 'brand requirement', 'brand specification',
            'brand compliance', 'brand rule', 'brand policy'
        ])

        brand_guidelines_status = None
        # Try to extract brand from triage results or detection
        detected_brand = None
        # Since we skip triage, we won't have detected_brand automatically
        # Could be enhanced with direct brand detection if needed

        if requires_brand_guidelines:
            if detected_brand:
                brand_guidelines = brand_db.get_brand_guidelines(detected_brand)
                if not brand_guidelines:
                    brand_guidelines_status = f"INFO: Brand detected as '{detected_brand}' but no brand guidelines found. Performing generic brand analysis."
                    check_prompt += f"\n\nBrand Analysis Context: The detected brand is '{detected_brand}'. While specific brand guidelines are not available, please analyze the visual content for general brand consistency, professional appearance, and adherence to common branding best practices for this brand if you're familiar with it."
                else:
                    brand_guidelines_status = f"Brand guidelines found for {detected_brand} ({len(brand_guidelines)} files)."

                    # Add brand guidelines content to the prompt
                    guidelines_content = "\n\n=== BRAND GUIDELINES REFERENCE ===\n"
                    guidelines_content += f"The following brand guidelines have been provided for {detected_brand}:\n\n"

                    for guideline in brand_guidelines:
                        guidelines_content += f"**Guideline File: {guideline.get('original_filename', 'Unknown')}**\n"
                        if guideline.get('description'):
                            guidelines_content += f"Description: {guideline['description']}\n"
                        if guideline.get('tags'):
                            guidelines_content += f"Tags: {', '.join(guideline['tags'])}\n"

                        # Try to read file content if it's a text-based file
                        guideline_file_path = guideline.get('file_path')
                        if guideline_file_path and os.path.exists(guideline_file_path):
                            try:
                                file_ext = os.path.splitext(guideline_file_path)[1].lower()
                                if file_ext in ['.txt', '.md', '.json']:
                                    with open(guideline_file_path, 'r', encoding='utf-8') as f:
                                        content = f.read()
                                        if len(content) > 2000:  # Limit content length
                                            content = content[:2000] + "... [content truncated]"
                                        guidelines_content += f"Content:\n{content}\n\n"
                                else:
                                    guidelines_content += f"[File type {file_ext} - content not directly readable, but file is available as reference]\n\n"
                            except Exception as e:
                                guidelines_content += f"[Error reading file content: {str(e)}]\n\n"
                        else:
                            guidelines_content += "[File path not found]\n\n"

                    guidelines_content += "Please use these brand guidelines as reference when performing your analysis. Pay special attention to brand colors, fonts, logo usage, tone of voice, and any specific requirements mentioned in the guidelines.\n"
                    guidelines_content += "=== END BRAND GUIDELINES REFERENCE ===\n"

                    check_prompt += guidelines_content
            else:
                brand_guidelines_status = "INFO: Brand could not be determined. Performing generic analysis."
                check_prompt += "\n\nGeneric Analysis: Since the brand could not be determined from the image, please analyze the visual content for general quality, professional appearance, and adherence to common design best practices."

        # Add pre-analysis instructions if available
        final_prompt = check_prompt
        if profile_config.pre_analysis_instructions:
            final_prompt = profile_config.pre_analysis_instructions + "\n\n" + check_prompt

        # Add reference asset content if selected
        reference_image_path = None
        if reference_asset:
            reference_content = get_reference_asset_content(reference_asset)
            if reference_content:
                final_prompt = reference_content + "\n\n" + final_prompt
                print(f"Added reference asset {reference_asset} to {check_name} prompt")

            # Also get the actual reference image path for LLM
            reference_image_path = get_reference_asset_image_path(reference_asset)

        print(f"Running check {check_index + 1}/{total_checks}: {check_name}")

        result = run_visual_qc(
            prompt=final_prompt,
            asset_path=file_path,
            reference_path=reference_image_path,
            model_name=llm_model,
            model_version=model_version
        )

        # Extract score and data
        json_data = extract_json_from_response(result['response'])
        score = extract_score_from_result(result, profile_config, check_name)
        weight = profile_weights.get(check_name, 0.1)
        weighted_score = score * weight if score is not None else 0

        return {
            'check_name': check_name,
            'status': 'completed',
            'response': result['response'],
            'brand_guidelines_status': brand_guidelines_status,
            'requires_brand_guidelines': requires_brand_guidelines,
            'json_data': json_data,
            'score': score,
            'weight': weight,
            'weighted_score': weighted_score,
            'model_used': result.get('model_info', {}),
            'token_usage': result.get('token_usage', {}),
            'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S')
        }

    except Exception as e:
        print(f"Error in check {check_name}: {str(e)}")
        weight = profile_weights.get(check_name, 0.1)
        return {
            'check_name': check_name,
            'status': 'error',
            'error': str(e),
            'weight': weight,
            'score': 0,
            'weighted_score': 0
        }

def process_checks_in_batches_with_triage(enabled_checks, qc_apps, profile_config, profile_weights,
                                         file_path, reference_asset, brand_db, progress_tracker,
                                         session_id, batch_size=15, base_percentage=10, percentage_range=80):
    """Process QC checks in parallel batches with triage logic"""
    check_results = {}
    total_checks = len(enabled_checks)
    completed_checks = 0

    print(f"Processing {total_checks} checks in batches of {batch_size}")

    # Split checks into batches
    for batch_start in range(0, total_checks, batch_size):
        batch_end = min(batch_start + batch_size, total_checks)
        batch_checks = enabled_checks[batch_start:batch_end]
        batch_number = (batch_start // batch_size) + 1
        total_batches = (total_checks + batch_size - 1) // batch_size

        print(f"Processing batch {batch_number}/{total_batches} ({len(batch_checks)} checks)")

        # Update progress for batch start
        progress_tracker[session_id].update({
            'current_batch': batch_number,
            'total_batches': total_batches,
            'current_check': f"Batch {batch_number}",
            'current_check_display': f"Processing batch {batch_number}/{total_batches}",
            'percentage': base_percentage + ((completed_checks / total_checks) * percentage_range)
        })

        # Process batch in parallel
        with ThreadPoolExecutor(max_workers=batch_size) as executor:
            # Submit all checks in the batch
            future_to_check = {}
            for i, check_name in enumerate(batch_checks):
                future = executor.submit(
                    process_single_check_with_triage,
                    check_name, qc_apps, profile_config, profile_weights, file_path,
                    reference_asset, brand_db, progress_tracker, session_id,
                    batch_start + i, total_checks
                )
                future_to_check[future] = check_name

            # Collect results as they complete
            batch_results = {}
            for future in as_completed(future_to_check):
                check_name = future_to_check[future]
                try:
                    result = future.result()
                    batch_results[result['check_name']] = result
                    completed_checks += 1

                    # Update progress for each completed check
                    progress_tracker[session_id].update({
                        'completed_checks': completed_checks,
                        'percentage': base_percentage + ((completed_checks / total_checks) * percentage_range)
                    })

                    print(f"Completed check: {check_name} ({completed_checks}/{total_checks})")

                except Exception as e:
                    print(f"Error getting result for check {check_name}: {str(e)}")
                    weight = profile_weights.get(check_name, 0.1)
                    batch_results[check_name] = {
                        'check_name': check_name,
                        'status': 'error',
                        'error': str(e),
                        'weight': weight,
                        'score': 0,
                        'weighted_score': 0
                    }
                    completed_checks += 1

            # Add batch results to main results
            check_results.update(batch_results)

        print(f"Completed batch {batch_number}/{total_batches}")

        # Small delay between batches to avoid overwhelming the APIs
        if batch_number < total_batches:
            time.sleep(0.5)

    print(f"Completed all {total_checks} checks in {total_batches} batches")
    return check_results

def create_thumbnail_base64(file_path, max_size=(300, 300)):
    """Create a base64 encoded thumbnail of the input file"""
    try:
        # Get the image using the existing utility
        pil_image = get_image_from_asset(file_path)
        if not pil_image:
            return None

        # Create thumbnail
        thumbnail = pil_image.copy()
        thumbnail.thumbnail(max_size, Image.Resampling.LANCZOS)

        # Convert to base64
        buffer = io.BytesIO()
        # Convert to RGB if necessary (for PNG with transparency)
        if thumbnail.mode in ('RGBA', 'LA'):
            background = Image.new('RGB', thumbnail.size, (255, 255, 255))
            background.paste(thumbnail, mask=thumbnail.split()[-1] if thumbnail.mode == 'RGBA' else None)
            thumbnail = background

        thumbnail.save(buffer, format='JPEG', quality=85)
        img_str = base64.b64encode(buffer.getvalue()).decode()
        return f"data:image/jpeg;base64,{img_str}"

    except Exception as e:
        print(f"Error creating thumbnail: {e}")
        return None

def get_client_from_profile(profile_id):
    """Determine client from profile ID"""
    if not profile_id:
        return 'general'

    profile_lower = profile_id.lower()
    if profile_lower.startswith('loreal'):
        return 'loreal'
    elif profile_lower.startswith('diageo'):
        return 'diageo'
    elif profile_lower.startswith('unilever'):
        return 'unilever'
    elif profile_lower.startswith('amazon'):
        return 'amazon'
    elif profile_lower.startswith('boots'):
        return 'boots'
    elif profile_lower.startswith('hp_'):
        return 'hp'
    elif profile_lower.startswith(('dow_jones', 'dj_', 'marketwatch', 'mw_', 'wsj')):
        return 'dow_jones'
    else:
        return 'general'

def ensure_client_output_folder(client):
    """Ensure client-specific output folder exists"""
    client_folder = os.path.join(app.config['OUTPUT_FOLDER'], client)
    os.makedirs(client_folder, exist_ok=True)
    return client_folder

def cleanup_old_files(max_age_days=14):
    """Delete files older than max_age_days from all client folders"""
    import time
    cutoff_time = time.time() - (max_age_days * 24 * 60 * 60)
    deleted_count = 0

    try:
        output_folder = app.config['OUTPUT_FOLDER']

        # Check root output folder
        for item in os.listdir(output_folder):
            item_path = os.path.join(output_folder, item)

            if os.path.isdir(item_path):
                # Check files in client subfolders
                for filename in os.listdir(item_path):
                    file_path = os.path.join(item_path, filename)
                    if os.path.isfile(file_path):
                        if os.path.getctime(file_path) < cutoff_time:
                            os.remove(file_path)
                            deleted_count += 1
                            print(f"Deleted old file: {file_path}")
            elif os.path.isfile(item_path):
                # Check files in root output folder (for migration)
                if os.path.getctime(item_path) < cutoff_time:
                    os.remove(item_path)
                    deleted_count += 1
                    print(f"Deleted old file: {item_path}")

        if deleted_count > 0:
            print(f"Cleaned up {deleted_count} files older than {max_age_days} days")
    except Exception as e:
        print(f"Error during cleanup: {e}")

    return deleted_count

def save_results_to_file(report_data, filename, output_mode='html', session_id=None, file_path=None):
    """Save analysis results to file and return file path"""
    print(f"DEBUG: save_results_to_file called with output_mode: '{output_mode}'")

    if not session_id:
        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')

    # Determine client from profile
    profile_id = report_data.get('profile_id') or report_data.get('profiles', [None])[0]
    client = get_client_from_profile(profile_id)
    print(f"DEBUG: Detected client '{client}' from profile '{profile_id}'")

    # Ensure client-specific folder exists
    client_folder = ensure_client_output_folder(client)

    # Create filename base
    base_filename = f"{session_id}_{filename.replace(' ', '_')}"

    if output_mode == 'html':
        print(f"DEBUG: Creating HTML file because output_mode == 'html'")
        # Save HTML file in client-specific folder
        output_filename = f"{base_filename}_report.html"
        output_path = os.path.join(client_folder, output_filename)

        html_content = generate_html_content(report_data, filename, file_path)
        with open(output_path, 'w', encoding='utf-8') as f:
            f.write(html_content)

        return output_path
    else:
        print(f"DEBUG: Creating JSON file because output_mode != 'html' (it's '{output_mode}')")
        # Save JSON file in client-specific folder
        output_filename = f"{base_filename}_data.json"
        output_path = os.path.join(client_folder, output_filename)

        with open(output_path, 'w', encoding='utf-8') as f:
            json.dump(report_data, f, indent=2, ensure_ascii=False)

        return output_path

def generate_html_content(report_data, filename, file_path=None):
    """Generate HTML content for report data with expandable sections"""
    # Define a function to get color based on score
    def get_score_result(score):
        if score >= 6:
            return "Pass", "#28a745"  # Green for pass
        else:
            return "Fail", "#dc3545"  # Red for fail

    # Get reference asset information from profile selection
    profile_selection = report_data.get('profile_selection', {})
    reference_asset = profile_selection.get('reference_asset', None)
    reference_asset_used = profile_selection.get('reference_asset_used', False)

    # Build HTML for each check result with expandable sections
    check_results_html = ""
    for check_name, check_data in report_data['results'].items():
        if check_data['status'] == 'success':
            display_name = check_data.get('display_name', check_name)
            score = check_data.get('score', 0)
            result_text, score_color = get_score_result(score)
            weight = check_data.get('weight', 0)
            weighted_score = check_data.get('weighted_score', 0)

            # Extract response text - try to get detailed info from JSON data first
            json_data = check_data.get('json_data', {})
            response_text = ""

            # Structured findings (e.g. hp_copy_review) render as a table
            # instead of the default response-text block. If absent, falls
            # back to the existing text rendering below.
            findings = (json_data or {}).get('findings') if isinstance(json_data, dict) else None
            findings_html = _render_findings_table(findings) if findings is not None else None

            # Try to extract detailed analysis from JSON data
            if json_data:
                # Look for common detailed fields in the JSON
                analysis_details = json_data.get('analysis_details', '')
                explanation = json_data.get('explanation', '')
                issues_found = json_data.get('issues_found', [])
                recommendations = json_data.get('recommendations', '')
                elements_checked = json_data.get('elements_checked', {})
                elements_found = json_data.get('elements_found', {})
                marketing_text_found = json_data.get('marketing_text_found', [])
                recommended_adjustments = json_data.get('recommended_adjustments', '')

                # Build detailed response text from JSON fields
                if analysis_details:
                    response_text += f"<strong>Analysis:</strong><br>{analysis_details}<br><br>"
                elif explanation:
                    response_text += f"<strong>Analysis:</strong><br>{explanation}<br><br>"

                if elements_checked:
                    response_text += "<strong>Elements Checked:</strong><br>"
                    for element, status in elements_checked.items():
                        response_text += f"• <em>{element.replace('_', ' ').title()}:</em> {status}<br>"
                    response_text += "<br>"
                elif elements_found:
                    response_text += "<strong>Elements Found:</strong><br>"
                    for element, found in elements_found.items():
                        status_icon = "Present" if found else "Missing"
                        response_text += f"• <em>{element.replace('_', ' ').title()}:</em> {status_icon}<br>"
                    response_text += "<br>"

                if marketing_text_found:
                    response_text += "<strong>Marketing Text Found:</strong><br>"
                    for text in marketing_text_found:
                        response_text += f"• {text}<br>"
                    response_text += "<br>"

                if issues_found:
                    response_text += "<strong>Issues Found:</strong><br>"
                    if isinstance(issues_found, list):
                        for issue in issues_found:
                            response_text += f"• {issue}<br>"
                    else:
                        response_text += f"{issues_found}<br>"
                    response_text += "<br>"

                if recommendations:
                    if isinstance(recommendations, list):
                        response_text += "<strong>Recommendations:</strong><br>"
                        for rec in recommendations:
                            response_text += f"• {rec}<br>"
                    else:
                        response_text += f"<strong>Recommendation:</strong><br>{recommendations}<br>"

                if recommended_adjustments:
                    if isinstance(recommended_adjustments, list):
                        response_text += "<br><strong>Suggested Adjustments:</strong><br>"
                        for adj in recommended_adjustments:
                            response_text += f"• {adj}<br>"
                    elif isinstance(recommended_adjustments, str) and recommended_adjustments.lower() not in ['none', 'n/a']:
                        response_text += f"<br><strong>Suggested Adjustments:</strong><br>{recommended_adjustments}"

                # If still no response text from known fields, build summary from all JSON data
                if not response_text and json_data:
                    skip_keys = {'score', 'weight', 'weighted_score', 'status'}
                    summary_parts = []
                    for key, value in json_data.items():
                        if key in skip_keys:
                            continue
                        display_key = key.replace('_', ' ').title()
                        if isinstance(value, bool):
                            summary_parts.append(f"• <em>{display_key}:</em> {'Yes' if value else 'No'}")
                        elif isinstance(value, dict):
                            summary_parts.append(f"<strong>{display_key}:</strong>")
                            for sub_key, sub_val in value.items():
                                sub_display = sub_key.replace('_', ' ').title()
                                if isinstance(sub_val, bool):
                                    summary_parts.append(f"&nbsp;&nbsp;• <em>{sub_display}:</em> {'Yes' if sub_val else 'No'}")
                                else:
                                    summary_parts.append(f"&nbsp;&nbsp;• <em>{sub_display}:</em> {sub_val}")
                        elif isinstance(value, list):
                            if value:
                                summary_parts.append(f"<strong>{display_key}:</strong>")
                                for item in value:
                                    summary_parts.append(f"&nbsp;&nbsp;• {item}")
                        elif isinstance(value, str) and value and value.lower() not in ['none', 'n/a', '']:
                            summary_parts.append(f"• <em>{display_key}:</em> {value}")
                        elif isinstance(value, (int, float)):
                            summary_parts.append(f"• <em>{display_key}:</em> {value}")
                    if summary_parts:
                        response_text = "<br>".join(summary_parts)

            # If no detailed JSON data was found, fall back to original response
            if not response_text:
                response_text = check_data.get('response', '')
                # Remove JSON code blocks for cleaner reading
                response_text = re.sub(r'```json.*?```', '', response_text, flags=re.DOTALL)
                response_text = response_text.strip()

            # If still empty, provide a basic fallback
            if not response_text:
                score = check_data.get('score', 0)
                result_text, _ = get_score_result(score)
                if score == 0 and check_name in REFERENCE_ASSET_REQUIRED_CHECKS:
                    response_text = f"Reference asset is required for the '{display_name}' QC check but was not provided."
                else:
                    response_text = f"QC check result: {result_text} (Score: {score}/10)"

            # Create expandable section for each check
            check_results_html += f"""
            <div class="expandable-section">
                <div class="expandable-header" onclick="toggleSection('{check_name}')">
                    <div class="check-title">
                        <h3>{display_name}</h3>
                        <span class="score-badge" style="background-color: {score_color};">{result_text}</span>
                    </div>
                    <div class="chevron" id="chevron-{check_name}">▼</div>
                </div>
                <div class="expandable-content" id="content-{check_name}">
                    <div class="check-metadata">
                        <p><strong>Score:</strong> {score}/10 | <strong>Weight:</strong> {weight:.1%} | <strong>Weighted Score:</strong> {weighted_score:.2f}</p>
                        {'<p><strong>⭐ Bonus Check:</strong> If missing required element, this scores 0</p>' if check_name in ['face_gaze_direction', 'face_visibility', 'new_visibility'] else ''}
                        <p><strong>Reference Asset:</strong> {'✅ Used' if check_name in REFERENCE_ASSET_REQUIRED_CHECKS and reference_asset_used else ('🚨 Required but missing' if check_name in REFERENCE_ASSET_REQUIRED_CHECKS else '➖ Not required')}</p>
                        {f'<p><strong>Reference Asset Details:</strong> {reference_asset}</p>' if check_name in REFERENCE_ASSET_REQUIRED_CHECKS and reference_asset_used and reference_asset else ''}
                    </div>
                    <div class="analysis-section">
                        <h4>Analysis Details:</h4>
                        {f'<div class="response-text">{html.escape(json_data.get("summary", "") or "") if isinstance(json_data, dict) else ""}</div>{findings_html}' if findings_html is not None else f'<div class="response-text">{response_text.replace(chr(10), "<br>")}</div>'}
                    </div>
                </div>
            </div>
            """

    # Get summary score result
    overall_score = report_data['summary']['overall_score']
    overall_result, overall_color = get_score_result(overall_score/10)  # Normalize to 0-10 scale

    # Determine the correct total score based on profile
    profile_id = report_data.get('profile_id', '')
    if profile_id == 'unilever_key_visual':
        score_total = 120
    else:
        score_total = 100

    technical_html = _render_technical_section_html(report_data.get('technical_report', {}))

    html_content = f"""
    <!DOCTYPE html>
    <html lang="en">
    <head>
        <meta charset="UTF-8">
        <meta name="viewport" content="width=device-width, initial-scale=1.0">
        <title>Visual AI QC Results for {filename}</title>
        <link rel="preconnect" href="https://fonts.googleapis.com">
        <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
        <link href="https://fonts.googleapis.com/css2?family=Montserrat:wght@400;500;600;700&display=swap" rel="stylesheet">
        <style>
            body {{ font-family: 'Montserrat', -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; margin: 20px; padding: 0; background: linear-gradient(135deg, #1a1a1a 0%, #000000 100%); min-height: 100vh; }}
            .container {{ max-width: 1200px; margin: 0 auto; background-color: white; padding: 30px; border-radius: 20px; box-shadow: 0 20px 40px rgba(0,0,0,0.1); }}
            h1, h2, h3 {{ color: #2c3e50; }}
            h1 {{ margin-bottom: 10px; font-size: 2.5em; text-align: center; }}
            .file-preview {{ background: linear-gradient(135deg, #f8f9fa 0%, #e9ecef 100%); padding: 20px; border-radius: 15px; margin: 20px 0; border-left: 5px solid #FFC407; }}
            .file-info {{ display: flex; align-items: center; gap: 20px; }}
            .thumbnail {{ max-width: 150px; max-height: 150px; border-radius: 8px; box-shadow: 0 4px 8px rgba(0,0,0,0.1); border: 2px solid #dee2e6; }}
            .file-details {{ flex: 1; }}
            .filename {{ font-size: 1.2em; font-weight: bold; color: #495057; margin-bottom: 5px; word-break: break-all; overflow-wrap: break-word; }}
            .file-meta {{ color: #6c757d; font-size: 0.9em; }}
            .summary {{ background: linear-gradient(135deg, #FFF9E6 0%, #FFFBF0 100%); padding: 25px; border-radius: 15px; margin: 30px 0; border-left: 5px solid #FFC407; }}
            .summary-grid {{ display: grid; grid-template-columns: repeat(auto-fit, minmax(200px, 1fr)); gap: 20px; margin-top: 15px; }}
            .summary-item {{ background: white; padding: 15px; border-radius: 10px; text-align: center; box-shadow: 0 2px 4px rgba(0,0,0,0.05); }}
            .technical {{ background: linear-gradient(135deg, #e3f2fd 0%, #f0f7ff 100%); padding: 25px; border-radius: 15px; margin: 30px 0; border-left: 5px solid #1565c0; }}
            .technical-grid {{ display: grid; grid-template-columns: repeat(auto-fit, minmax(280px, 1fr)); gap: 8px 24px; margin-top: 12px; }}
            .tech-row {{ padding: 4px 0; color: #495057; font-size: 0.95em; word-break: break-word; }}
            .score-display {{ font-size: 2.5em; font-weight: bold; color: {overall_color}; margin-bottom: 5px; }}
            .grade {{ font-size: 1.3em; font-weight: bold; color: #495057; }}
            .expandable-section {{ margin-bottom: 15px; border: 2px solid #e9ecef; border-radius: 12px; overflow: hidden; background: white; }}
            .expandable-header {{ background: #f8f9fa; padding: 20px; cursor: pointer; display: flex; justify-content: space-between; align-items: center; transition: background-color 0.3s ease; }}
            .expandable-header:hover {{ background: #e9ecef; }}
            .check-title {{ display: flex; align-items: center; gap: 15px; }}
            .check-title h3 {{ margin: 0; color: #495057; }}
            .score-badge {{ padding: 8px 12px; border-radius: 20px; color: white; font-weight: bold; font-size: 0.9em; }}
            .chevron {{ font-size: 1.2em; transition: transform 0.3s ease; color: #FFC407; }}
            .chevron.expanded {{ transform: rotate(180deg); }}
            .expandable-content {{ padding: 0; max-height: 0; overflow: hidden; transition: all 0.3s ease; }}
            .expandable-content.expanded {{ padding: 20px; max-height: 1000px; }}
            .check-metadata {{ background: #f8f9fa; padding: 15px; border-radius: 8px; margin-bottom: 15px; }}
            .analysis-section h4 {{ color: #495057; margin-bottom: 10px; }}
            .response-text {{ background: #f8f9fa; padding: 15px; border-radius: 8px; line-height: 1.6; font-family: 'Montserrat', Georgia, serif; }}
            .json-toggle {{ cursor: pointer; color: #FFC407; text-decoration: underline; padding: 15px; text-align: center; font-weight: bold; }}
            .json-view {{ display: none; margin-top: 20px; }}
            .json-view pre {{ background-color: #2d3748; color: #e2e8f0; padding: 20px; border-radius: 10px; overflow-x: auto; font-size: 0.9em; }}
            .findings-table {{ width: 100%; border-collapse: collapse; margin-top: 12px; font-size: 0.92em; }}
            .findings-table th {{ background: #f1f3f5; color: #495057; text-align: left; padding: 8px 10px; border-bottom: 2px solid #dee2e6; font-weight: 600; }}
            .findings-table td {{ padding: 8px 10px; border-bottom: 1px solid #e9ecef; vertical-align: top; word-break: break-word; }}
            .findings-table tr:last-child td {{ border-bottom: none; }}
            .findings-table code {{ background: #f8f9fa; padding: 2px 5px; border-radius: 4px; font-family: 'SFMono-Regular', Consolas, Menlo, monospace; font-size: 0.9em; color: #c7254e; }}
            .priority-pill {{ display: inline-block; padding: 3px 8px; border-radius: 10px; color: white; font-weight: 600; font-size: 0.78em; letter-spacing: 0.03em; }}
            .priority-high {{ background-color: #dc3545; }}
            .priority-medium {{ background-color: #fd7e14; }}
            .priority-low {{ background-color: #28a745; }}
            .muted {{ color: #6c757d; font-size: 0.9em; }}
        </style>
    </head>
    <body>
        <div class="container">
            <h1>🤖 Visual AI QC Results</h1>
            <p style="text-align: center; color: #6c757d; font-size: 1.1em;">
                Analysis completed on: {report_data['timestamp']}
            </p>

            <div class="file-preview">
                <h3>📎 Analyzed File</h3>
                <div class="file-info">
                    <img src="{create_thumbnail_base64(file_path) if file_path else 'data:image/svg+xml;base64,PHN2ZyB3aWR0aD0iMTUwIiBoZWlnaHQ9IjE1MCIgdmlld0JveD0iMCAwIDE1MCAxNTAiIGZpbGw9Im5vbmUiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyI+CjxyZWN0IHdpZHRoPSIxNTAiIGhlaWdodD0iMTUwIiBmaWxsPSIjZjhmOWZhIiBzdHJva2U9IiNkZWUyZTYiIHN0cm9rZS13aWR0aD0iMiIvPgo8dGV4dCB4PSI3NSIgeT0iNzUiIHRleHQtYW5jaG9yPSJtaWRkbGUiIGZpbGw9IiM2Yzc1N2QiIGZvbnQtZmFtaWx5PSJBcmlhbCIgZm9udC1zaXplPSIxNCIgZHk9IjAuMzVlbSI+4p2MIEZpbGU8L3RleHQ+Cjx0ZXh0IHg9Ijc1IiB5PSI5NSIgdGV4dC1hbmNob3I9Im1pZGRsZSIgZmlsbD0iIzZjNzU3ZCIgZm9udC1mYW1pbHk9IkFyaWFsIiBmb250LXNpemU9IjEyIiBkeT0iMC4zNWVtIj5UaHVtYm5haWw8L3RleHQ+Cjwvc3ZnPg=='}" alt="File thumbnail" class="thumbnail" id="fileThumbnail">
                    <div class="file-details">
                        <div class="filename">{filename}</div>
                        <div class="file-meta">Original file processed for quality control analysis</div>
                    </div>
                </div>
            </div>

            <div class="summary">
                <h2>📊 Analysis Summary</h2>
                <div class="summary-grid">
                    <div class="summary-item">
                        <div class="score-display">{overall_score}/{score_total}</div>
                        <div>Overall Score</div>
                    </div>
                    <div class="summary-item">
                        <div class="grade">{report_data['summary']['grade']}</div>
                        <div>Grade</div>
                    </div>
                    <div class="summary-item">
                        <div style="font-size: 1.5em; font-weight: bold; color: #495057;">{report_data['summary']['checks_count']}</div>
                        <div>Checks Performed</div>
                    </div>
                    <div class="summary-item">
                        <div style="font-size: 1.2em; color: #FFC407; font-weight: bold;">{report_data['profile_name']}</div>
                        <div>Profile Used</div>
                    </div>
                    <div class="summary-item">
                        <div style="font-size: 1.2em; color: {'#28a745' if reference_asset_used else '#6c757d'}; font-weight: bold;">{'✅ Used' if reference_asset_used else '➖ None'}</div>
                        <div>Reference Asset</div>
                    </div>
                </div>
            </div>

            {technical_html}

            <h2>🔍 Detailed Analysis Results</h2>
            <p style="color: #6c757d; margin-bottom: 20px; font-style: italic;">
                Click on any section below to expand and view detailed analysis
            </p>
            {check_results_html}

            <div class="json-toggle" onclick="document.getElementById('json-data').style.display = document.getElementById('json-data').style.display === 'none' ? 'block' : 'none';">
                📄 Show/Hide Raw JSON Data
            </div>
            <div id="json-data" class="json-view">
                <pre>{json.dumps(report_data, indent=2)}</pre>
            </div>
        </div>

        <script>
            function toggleSection(checkName) {{
                const content = document.getElementById('content-' + checkName);
                const chevron = document.getElementById('chevron-' + checkName);

                if (content.classList.contains('expanded')) {{
                    content.classList.remove('expanded');
                    chevron.classList.remove('expanded');
                }} else {{
                    content.classList.add('expanded');
                    chevron.classList.add('expanded');
                }}
            }}

        </script>
    </body>
    </html>
    """
    return html_content

def generate_html_response(report_data, filename, save_to_file=False, session_id=None, file_path=None):
    """Generate HTML response for report data with optional file saving"""
    html_content = generate_html_content(report_data, filename, file_path)

    if save_to_file:
        # Save to file and return file path info
        output_path = save_results_to_file(report_data, filename, 'html', session_id, file_path)
        return Response(html_content, mimetype='text/html'), output_path
    else:
        return Response(html_content, mimetype='text/html')

def _render_findings_table(findings):
    """Render an hp_copy_review-style findings array as an HTML table.

    Each finding dict is expected to carry: priority (high|medium|low),
    category, quote, issue, suggested_fix, source_reference. All string
    fields are HTML-escaped before interpolation. An empty/None findings
    list renders a friendly "clean copy" note instead of an empty table.
    """
    if not findings:
        return '<p class="muted">No findings — copy is clean.</p>'
    rows = []
    for f in findings:
        priority = (f.get('priority') or 'low').lower()
        pri_class = {
            'high': 'priority-high',
            'medium': 'priority-medium',
            'low': 'priority-low',
        }.get(priority, 'priority-low')
        quote_raw = (f.get('quote') or '')[:200]
        rows.append(
            '<tr>'
            f'<td><span class="priority-pill {pri_class}">{html.escape(priority.upper())}</span></td>'
            f'<td><code>{html.escape(f.get("category", "") or "")}</code></td>'
            f'<td><code>{html.escape(quote_raw)}</code></td>'
            f'<td>{html.escape(f.get("issue", "") or "")}</td>'
            f'<td>{html.escape(f.get("suggested_fix", "") or "")}</td>'
            f'<td class="muted">{html.escape(f.get("source_reference", "") or "")}</td>'
            '</tr>'
        )
    return (
        '<table class="findings-table"><thead><tr>'
        '<th>Priority</th><th>Category</th><th>Quote</th>'
        '<th>Issue</th><th>Suggested fix</th><th>Source</th>'
        '</tr></thead><tbody>'
        + ''.join(rows) +
        '</tbody></table>'
    )


def _render_technical_section_html(report):
    """Render the technical pre-flight report as an HTML block. Empty string if no report."""
    if not report or report.get('kind') in (None, 'unknown'):
        return ''
    kind = report['kind']
    rows = []
    size_mb = report.get('file_size_mb')
    if size_mb is not None:
        rows.append(f'<div class="tech-row"><strong>File size:</strong> {size_mb} MB</div>')
    dims = report.get('dimensions')
    if dims:
        rows.append(f'<div class="tech-row"><strong>Dimensions:</strong> {dims["width"]} × {dims["height"]}</div>')
    fmt = report.get('format')
    if fmt:
        rows.append(f'<div class="tech-row"><strong>Format:</strong> {fmt}</div>')
    dpi = report.get('dpi')
    if dpi:
        rows.append(f'<div class="tech-row"><strong>DPI:</strong> {dpi[0]} × {dpi[1]}</div>')
    mode = report.get('mode')
    if mode:
        rows.append(f'<div class="tech-row"><strong>Color mode:</strong> {mode}</div>')
    pc = report.get('page_count')
    if pc is not None:
        rows.append(f'<div class="tech-row"><strong>Pages:</strong> {pc}</div>')
    pdf_ver = report.get('pdf_version')
    if pdf_ver:
        rows.append(f'<div class="tech-row"><strong>PDF version:</strong> {pdf_ver}</div>')
    duration = report.get('duration_seconds')
    if duration is not None:
        rows.append(f'<div class="tech-row"><strong>Duration:</strong> {duration}s</div>')
    codec = report.get('video_codec')
    if codec:
        rows.append(f'<div class="tech-row"><strong>Video codec:</strong> {codec}</div>')
    fps = report.get('fps')
    if fps:
        rows.append(f'<div class="tech-row"><strong>Frame rate:</strong> {fps} fps</div>')
    fonts = report.get('embedded_fonts')
    if fonts:
        suffix = ' …' if len(fonts) > 8 else ''
        rows.append(f'<div class="tech-row"><strong>Embedded fonts:</strong> {", ".join(fonts[:8])}{suffix}</div>')
    fm = report.get('filename_match')
    if fm:
        if fm['match']:
            badge = '<span style="background:#28a745;color:white;padding:4px 10px;border-radius:12px;font-size:0.85em;">✓ Matches filename</span>'
        else:
            badge = '<span style="background:#dc3545;color:white;padding:4px 10px;border-radius:12px;font-size:0.85em;">⚠ Filename mismatch</span>'
        rows.append(f'<div class="tech-row" style="margin-top:8px;">{badge} <span style="color:#6c757d;font-size:0.9em;margin-left:8px;">{fm["detail"]}</span></div>')
    errors = report.get('errors', [])
    if errors:
        rows.append(f'<div class="tech-row" style="color:#856404;font-style:italic;"><strong>Inspection notes:</strong> {"; ".join(errors)}</div>')
    if not rows:
        return ''
    return f'''
        <div class="technical">
            <h2>🔧 Technical Details <small style="color:#6c757d;font-size:0.6em;font-weight:normal;">(machine-inspected, no AI)</small></h2>
            <div class="technical-grid">{''.join(rows)}</div>
        </div>
        '''


def generate_comprehensive_html_report(analysis_result, filename, file_path=None):
    """Generate comprehensive HTML report similar to the web UI format"""
    summary = analysis_result.get('summary', {})
    qc_analysis = analysis_result.get('qc_analysis', {})
    profile_selection = analysis_result.get('profile_selection', {})
    check_results = qc_analysis.get('check_results', {})

    timestamp = datetime.now().strftime('%Y-%m-%d %H:%M:%S')
    overall_score = summary.get('overall_score', 0)
    profile_name = profile_selection.get('suggested_profile', 'Unknown Profile')
    total_checks = qc_analysis.get('total_checks', 0)
    completed_checks = qc_analysis.get('completed_checks', 0)
    reference_asset = profile_selection.get('reference_asset', None)
    reference_asset_used = profile_selection.get('reference_asset_used', False)

    # Generate check results HTML
    check_results_html = ''
    for check_name, result in check_results.items():
        if result.get('status') in ('success', 'completed'):
            score = result.get('score', 0)
            result_text = "Pass" if score >= 6 else "Fail"
            score_color = '#28a745' if score >= 6 else '#dc3545'
            response = result.get('response', 'No response available')
            display_name = check_name.replace('_', ' ').replace(chr(32).join([w.capitalize() for w in check_name.split('_')]), check_name.replace('_', ' ').title())

            # Structured findings (e.g. hp_copy_review) render as a table
            # instead of the default response-text block. Fallback to the
            # existing response rendering when 'findings' is absent.
            json_data = result.get('json_data') if isinstance(result, dict) else None
            findings = json_data.get('findings') if isinstance(json_data, dict) else None
            findings_html = _render_findings_table(findings) if findings is not None else None

            # Remove JSON blocks for cleaner display and handle empty responses
            response = re.sub(r'```json.*?```', '', response, flags=re.DOTALL).strip()
            if not response:
                if score == 0 and check_name in REFERENCE_ASSET_REQUIRED_CHECKS:
                    response = f"Reference asset is required for the '{display_name}' QC check but was not provided."
                else:
                    response = f"QC check result: {result_text} (Score: {score}/10)"

            check_results_html += f'''
                <div class="expandable-section">
                    <div class="expandable-header" onclick="toggleSection('{check_name}')">
                        <div class="check-title">
                            <h3>{display_name}</h3>
                            <span class="score-badge" style="background-color: {score_color};">{result_text}</span>
                        </div>
                        <div class="chevron" id="chevron-{check_name}">▼</div>
                    </div>
                    <div class="expandable-content" id="content-{check_name}">
                        <div class="check-metadata">
                            <p><strong>Score:</strong> {score}/10 | <strong>Weight:</strong> {result.get('weight', 0):.1%} | <strong>Weighted Score:</strong> {result.get('weighted_score', 0):.2f}</p>
                            {'<p><strong>⭐ Bonus Check:</strong> If missing required element, this scores 0</p>' if check_name in ['face_gaze_direction', 'face_visibility', 'new_visibility'] else ''}
                            <p><strong>Reference Asset:</strong> {'✅ Used' if check_name in REFERENCE_ASSET_REQUIRED_CHECKS and reference_asset_used else ('🚨 Required but missing' if check_name in REFERENCE_ASSET_REQUIRED_CHECKS else '➖ Not required')}</p>
                            {f'<p><strong>Reference Asset Details:</strong> {reference_asset}</p>' if check_name in REFERENCE_ASSET_REQUIRED_CHECKS and reference_asset_used and reference_asset else ''}
                        </div>
                        <div class="analysis-section">
                            <h4>Analysis Details:</h4>
                            {f'<div class="response-text">{html.escape(json_data.get("summary", "") or "") if isinstance(json_data, dict) else ""}</div>{findings_html}' if findings_html is not None else f'<div class="response-text">{response.replace(chr(10), "<br>")}</div>'}
                        </div>
                    </div>
                </div>
            '''

    # Convert overall score to pass/fail based on average of individual check scores
    avg_individual_score = overall_score / 10  # Normalize to 1-10 scale
    grade_text = 'Pass' if avg_individual_score >= 6 else 'Fail'
    score_color = '#28a745' if avg_individual_score >= 6 else '#dc3545'

    technical_html = _render_technical_section_html(analysis_result.get('technical_report', {}))

    return f'''<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Visual AI QC Results for {filename}</title>
    <link rel="preconnect" href="https://fonts.googleapis.com">
    <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
    <link href="https://fonts.googleapis.com/css2?family=Montserrat:wght@400;500;600;700&display=swap" rel="stylesheet">
    <style>
        body {{ font-family: 'Montserrat', -apple-system, BlinkMacSystemFont, 'Segoe UI', Roboto, sans-serif; margin: 20px; padding: 0; background: linear-gradient(135deg, #1a1a1a 0%, #000000 100%); min-height: 100vh; }}
        .container {{ max-width: 1200px; margin: 0 auto; background-color: white; padding: 30px; border-radius: 20px; box-shadow: 0 20px 40px rgba(0,0,0,0.1); }}
        h1, h2, h3 {{ color: #2c3e50; }}
        h1 {{ margin-bottom: 10px; font-size: 2.5em; text-align: center; }}
        .file-preview {{ background: linear-gradient(135deg, #f8f9fa 0%, #e9ecef 100%); padding: 20px; border-radius: 15px; margin: 20px 0; border-left: 5px solid #FFC407; }}
        .file-info {{ display: flex; align-items: center; gap: 20px; }}
        .thumbnail {{ max-width: 150px; max-height: 150px; border-radius: 8px; box-shadow: 0 4px 8px rgba(0,0,0,0.1); border: 2px solid #dee2e6; }}
        .file-details {{ flex: 1; }}
        .filename {{ font-size: 1.2em; font-weight: bold; color: #495057; margin-bottom: 5px; word-break: break-all; overflow-wrap: break-word; }}
        .file-meta {{ color: #6c757d; font-size: 0.9em; }}
        .summary {{ background: linear-gradient(135deg, #FFF9E6 0%, #FFFBF0 100%); padding: 25px; border-radius: 15px; margin: 30px 0; border-left: 5px solid #FFC407; }}
        .summary-grid {{ display: grid; grid-template-columns: repeat(auto-fit, minmax(200px, 1fr)); gap: 20px; margin-top: 15px; }}
        .summary-item {{ background: white; padding: 15px; border-radius: 10px; text-align: center; box-shadow: 0 2px 4px rgba(0,0,0,0.05); }}
        .technical {{ background: linear-gradient(135deg, #e3f2fd 0%, #f0f7ff 100%); padding: 25px; border-radius: 15px; margin: 30px 0; border-left: 5px solid #1565c0; }}
        .technical-grid {{ display: grid; grid-template-columns: repeat(auto-fit, minmax(280px, 1fr)); gap: 8px 24px; margin-top: 12px; }}
        .tech-row {{ padding: 4px 0; color: #495057; font-size: 0.95em; word-break: break-word; }}
        .score-display {{ font-size: 2.5em; font-weight: bold; color: {score_color}; margin-bottom: 5px; }}
        .grade {{ font-size: 1.3em; font-weight: bold; color: #495057; }}
        .expandable-section {{ margin-bottom: 15px; border: 2px solid #e9ecef; border-radius: 12px; overflow: hidden; background: white; }}
        .expandable-header {{ background: #f8f9fa; padding: 20px; cursor: pointer; display: flex; justify-content: space-between; align-items: center; transition: background-color 0.3s ease; }}
        .expandable-header:hover {{ background: #e9ecef; }}
        .check-title {{ display: flex; align-items: center; gap: 15px; }}
        .check-title h3 {{ margin: 0; color: #495057; }}
        .score-badge {{ padding: 8px 12px; border-radius: 20px; color: white; font-weight: bold; font-size: 0.9em; }}
        .chevron {{ font-size: 1.2em; transition: transform 0.3s ease; color: #FFC407; }}
        .chevron.expanded {{ transform: rotate(180deg); }}
        .expandable-content {{ padding: 0; max-height: 0; overflow: hidden; transition: all 0.3s ease; }}
        .expandable-content.expanded {{ padding: 20px; max-height: 1000px; }}
        .check-metadata {{ background: #f8f9fa; padding: 15px; border-radius: 8px; margin-bottom: 15px; }}
        .analysis-section h4 {{ color: #495057; margin-bottom: 10px; }}
        .response-text {{ background: #f8f9fa; padding: 15px; border-radius: 8px; line-height: 1.6; font-family: 'Montserrat', Georgia, serif; }}
        .findings-table {{ width: 100%; border-collapse: collapse; margin-top: 12px; font-size: 0.92em; }}
        .findings-table th {{ background: #f1f3f5; color: #495057; text-align: left; padding: 8px 10px; border-bottom: 2px solid #dee2e6; font-weight: 600; }}
        .findings-table td {{ padding: 8px 10px; border-bottom: 1px solid #e9ecef; vertical-align: top; word-break: break-word; }}
        .findings-table tr:last-child td {{ border-bottom: none; }}
        .findings-table code {{ background: #f8f9fa; padding: 2px 5px; border-radius: 4px; font-family: 'SFMono-Regular', Consolas, Menlo, monospace; font-size: 0.9em; color: #c7254e; }}
        .priority-pill {{ display: inline-block; padding: 3px 8px; border-radius: 10px; color: white; font-weight: 600; font-size: 0.78em; letter-spacing: 0.03em; }}
        .priority-high {{ background-color: #dc3545; }}
        .priority-medium {{ background-color: #fd7e14; }}
        .priority-low {{ background-color: #28a745; }}
        .muted {{ color: #6c757d; font-size: 0.9em; }}
    </style>
</head>
<body>
    <div class="container">
        <h1>🤖 Visual AI QC Results</h1>
        <p style="text-align: center; color: #6c757d; font-size: 1.1em;">
            Analysis completed on: {timestamp}
        </p>

        <div class="file-preview">
            <h3>📎 Analyzed File</h3>
            <div class="file-info">
                <img src="{create_thumbnail_base64(file_path) if file_path else 'data:image/svg+xml;base64,PHN2ZyB3aWR0aD0iMTUwIiBoZWlnaHQ9IjE1MCIgdmlld0JveD0iMCAwIDE1MCAxNTAiIGZpbGw9Im5vbmUiIHhtbG5zPSJodHRwOi8vd3d3LnczLm9yZy8yMDAwL3N2ZyI+CjxyZWN0IHdpZHRoPSIxNTAiIGhlaWdodD0iMTUwIiBmaWxsPSIjZjhmOWZhIiBzdHJva2U9IiNkZWUyZTYiIHN0cm9rZS13aWR0aD0iMiIvPgo8dGV4dCB4PSI3NSIgeT0iNzUiIHRleHQtYW5jaG9yPSJtaWRkbGUiIGZpbGw9IiM2Yzc1N2QiIGZvbnQtZmFtaWx5PSJBcmlhbCIgZm9udC1zaXplPSIxNCIgZHk9IjAuMzVlbSI+4p2MIEZpbGU8L3RleHQ+Cjx0ZXh0IHg9Ijc1IiB5PSI5NSIgdGV4dC1hbmNob3I9Im1pZGRsZSIgZmlsbD0iIzZjNzU3ZCIgZm9udC1mYW1pbHk9IkFyaWFsIiBmb250LXNpemU9IjEyIiBkeT0iMC4zNWVtIj5UaHVtYm5haWw8L3RleHQ+Cjwvc3ZnPg=='}" alt="File thumbnail" class="thumbnail" id="fileThumbnail">
                <div class="file-details">
                    <div class="filename">{filename}</div>
                    <div class="file-meta">Original file processed for quality control analysis</div>
                </div>
            </div>
        </div>

        <div class="summary">
            <h2>📊 Analysis Summary</h2>
            <div class="summary-grid">
                <div class="summary-item">
                    <div class="score-display">{overall_score}/100</div>
                    <div>Overall Score</div>
                </div>
                <div class="summary-item">
                    <div class="grade">{grade_text}</div>
                    <div>Grade</div>
                </div>
                <div class="summary-item">
                    <div style="font-size: 1.5em; font-weight: bold; color: #495057;">{completed_checks}</div>
                    <div>Checks Performed</div>
                </div>
                <div class="summary-item">
                    <div style="font-size: 1.2em; color: #FFC407; font-weight: bold;">{profile_name}</div>
                    <div>Profile Used</div>
                </div>
                <div class="summary-item">
                    <div style="font-size: 1.2em; color: {'#28a745' if reference_asset_used else '#6c757d'}; font-weight: bold;">{'✅ Used' if reference_asset_used else '➖ None'}</div>
                    <div>Reference Asset</div>
                </div>
            </div>
        </div>

        {technical_html}

        <h2>🔍 Detailed Analysis Results</h2>
        <p style="color: #6c757d; margin-bottom: 20px; font-style: italic;">
            Click on any section below to expand and view detailed analysis
        </p>

        {check_results_html}
    </div>

    <script>
        function toggleSection(checkName) {{
            const content = document.getElementById('content-' + checkName);
            const chevron = document.getElementById('chevron-' + checkName);

            if (content.classList.contains('expanded')) {{
                content.classList.remove('expanded');
                chevron.classList.remove('expanded');
            }} else {{
                content.classList.add('expanded');
                chevron.classList.add('expanded');
            }}
        }}
    </script>
</body>
</html>'''

def get_reference_image_path(check_name):
    """Find a matching reference image - deprecated function, returns None"""
    # This function is deprecated since numbered criteria images are no longer used
    # Reference assets are now handled through the brand guidelines system
    return None

def get_reference_asset_image_path(reference_asset_id):
    """
    Get the actual file path for a reference asset image to send to LLM.

    Args:
        reference_asset_id: ID of the reference asset to retrieve

    Returns:
        File path to the reference image, or None if not found or not an image
    """
    if not reference_asset_id or not reference_asset_id.strip():
        return None

    try:
        # Get the reference asset file information from brand guidelines DB
        file_record = brand_db.db["files"].get(reference_asset_id)
        if not file_record:
            print(f"DEBUG: Reference asset not found: {reference_asset_id}")
            return None

        file_path = file_record.get("stored_path", "")
        if not file_path or not os.path.exists(file_path):
            print(f"DEBUG: Reference asset file not found at path: {file_path}")
            return None

        image_extensions = ['.png', '.jpg', '.jpeg', '.bmp', '.webp', '.gif', '.tiff']
        file_ext = os.path.splitext(file_path)[1].lower()

        if file_ext in image_extensions:
            print(f"DEBUG: Found reference image at: {file_path}")
            return file_path
        elif file_ext == '.pdf':
            # Check for pre-extracted cover image
            cover_path = brand_db.get_cover_image_path(reference_asset_id)
            if cover_path:
                print(f"DEBUG: Found PDF cover image at: {cover_path}")
                return cover_path
            # Fallback: extract cover on the fly
            try:
                from pdf_processor import extract_cover_image
                fallback_cover = os.path.splitext(file_path)[0] + "_cover.png"
                result = extract_cover_image(file_path, fallback_cover)
                if result:
                    print(f"DEBUG: Extracted PDF cover on-the-fly: {result}")
                    return result
            except Exception as e:
                print(f"DEBUG: Could not extract PDF cover: {e}")
            return None
        else:
            print(f"DEBUG: Reference asset is not an image: {file_path}")
            return None

    except Exception as e:
        print(f"DEBUG: Error getting reference asset image path: {e}")
        return None

def get_reference_asset_content(reference_asset_id):
    """
    Retrieve and format reference asset content for use in QC prompts.

    Args:
        reference_asset_id: ID of the reference asset to retrieve

    Returns:
        Formatted string with reference asset information, or empty string if not found
    """
    if not reference_asset_id or not reference_asset_id.strip():
        return ""

    try:
        # Get the reference asset file information from brand guidelines DB
        file_record = brand_db.db["files"].get(reference_asset_id)
        if not file_record:
            print(f"Reference asset not found: {reference_asset_id}")
            return ""

        brand_name = file_record["brand_name"]
        description = file_record.get("description", "")
        file_path = file_record.get("stored_path", "")
        original_filename = file_record.get("original_filename", "")

        # Build reference asset context for the prompt
        reference_content = "\n\n=== REFERENCE ASSET GUIDELINES ===\n"
        reference_content += f"Brand: {brand_name}\n"
        reference_content += f"Reference File: {original_filename}\n"

        if description:
            reference_content += f"Description: {description}\n"

        reference_content += "\nPlease use this reference asset as your guideline for analysis. "
        reference_content += "Compare the uploaded image against these brand standards and requirements. "
        reference_content += "Pay special attention to brand consistency, visual standards, and any specific "
        reference_content += "requirements shown in the reference material.\n"

        # Read reference content based on file type
        if file_path and os.path.exists(file_path):
            try:
                file_ext = os.path.splitext(file_path)[1].lower()
                if file_ext in ['.txt', '.md', '.json']:
                    with open(file_path, 'r', encoding='utf-8') as f:
                        content = f.read()
                        if len(content) > 3000:
                            content = content[:3000] + "... [content truncated]"
                        reference_content += f"\nReference Content:\n{content}\n"
                elif file_ext == '.pdf':
                    # Check for pre-computed summary
                    summary_path = brand_db.get_summary_path(reference_asset_id)
                    if summary_path:
                        with open(summary_path, 'r', encoding='utf-8') as f:
                            summary = f.read()
                        reference_content += f"\nBrand Guidelines Summary (extracted from {original_filename}):\n{summary}\n"
                    else:
                        # Fallback: extract text inline
                        try:
                            from pdf_processor import extract_text_from_pdf
                            raw_text = extract_text_from_pdf(file_path)
                            if raw_text and len(raw_text) > 100:
                                if len(raw_text) > 5000:
                                    raw_text = raw_text[:5000] + "... [content truncated]"
                                reference_content += f"\nExtracted PDF Content:\n{raw_text}\n"
                            else:
                                reference_content += f"\nReference PDF contains mostly images with limited extractable text.\n"
                        except Exception:
                            reference_content += f"\nReference file (.pdf) is available for visual comparison.\n"
                elif file_ext in ['.xlsx', '.xls']:
                    # For localization matrices, the context is built separately via localization_processor
                    if file_record.get('asset_type') == 'localization_matrix':
                        loc_messages = file_record.get('localization_messages', [])
                        loc_countries = file_record.get('localization_countries', [])
                        reference_content += f"\nLocalization Matrix: Contains {', '.join(loc_messages)} "
                        reference_content += f"for {len(loc_countries)} markets ({', '.join(loc_countries[:10])}).\n"
                        reference_content += "Expected copy will be cross-referenced with the media plan during analysis.\n"
                    elif file_record.get('summary_path'):
                        # Source-messaging Excel (HP and similar) — inject the Gemini-generated Markdown summary
                        try:
                            with open(file_record['summary_path'], 'r', encoding='utf-8') as f:
                                summary = f.read()
                            reference_content += f"\nSource Messaging Summary (extracted from {original_filename}):\n{summary}\n"
                        except Exception as e:
                            print(f"Failed to read source-messaging summary at {file_record['summary_path']}: {e}")
                            reference_content += f"\nReference file ({file_ext}) uploaded but summary unreadable.\n"
                    else:
                        reference_content += f"\nReference file ({file_ext}) uploaded as reference.\n"
                else:
                    reference_content += f"\nReference file ({file_ext}) is available for visual comparison.\n"
            except Exception as e:
                print(f"Error reading reference asset content: {e}")
                reference_content += "\n[Reference file available but content could not be read]\n"

        reference_content += "=== END REFERENCE ASSET GUIDELINES ===\n"

        return reference_content

    except Exception as e:
        print(f"Error retrieving reference asset {reference_asset_id}: {e}")
        return ""

def load_qc_apps():
    """Load all QC apps and their prompts"""
    for check_name in QC_CHECKS:
        try:
            # Import the app module
            try:
                module_path = f"visual_qc_apps.{check_name}.app"
                module = importlib.import_module(module_path)

                # Get app class name
                app_class_name = None
                for key in dir(module):
                    if key.endswith('App') and key != 'FlaskAppTemplate':
                        app_class_name = key
                        break
            except ImportError as e:
                print(f"Import error for {check_name}: {e}")
                continue

            if app_class_name:
                # Get the app class
                app_class = getattr(module, app_class_name)
                # Create an instance to get the prompt
                app_instance = app_class()

                # Find reference image for this check
                reference_image = get_reference_image_path(check_name)

                # Store the prompt, app class, and reference image
                qc_apps[check_name] = {
                    "name": app_class_name,
                    "prompt": app_instance.prompt,
                    "instance": app_instance,
                    "display_name": app_class_name.replace("App", "").replace("_", " "),
                    "reference_image": reference_image
                }
                print(f"Loaded QC check: {check_name}" + (f" with reference image" if reference_image else ""))
            else:
                print(f"No app class found in {module_path}")
        except Exception as e:
            print(f"Error loading {check_name} app: {e}")
            traceback.print_exc()

@app.route('/', methods=['GET'])
def serve_web_ui():
    """Serve the web UI"""
    try:
        # Use absolute path to web_ui.html (located in parent directory)
        base_dir = os.path.dirname(os.path.abspath(__file__))
        web_ui_path = os.path.join(os.path.dirname(base_dir), 'web_ui.html')
        with open(web_ui_path, 'r') as f:
            html_content = f.read()
        return Response(html_content, mimetype='text/html')
    except FileNotFoundError:
        return jsonify({'error': 'Web UI not found'}), 404

@app.route('/health', methods=['GET'])
def health_check():
    """Simple health check endpoint"""
    return jsonify({
        'status': 'healthy',
        'timestamp': datetime.now().isoformat()
    })

@app.route('/api/health/folders', methods=['GET'])
def health_check_folders():
    """Check if required folders exist and are writable"""
    try:
        upload_folder = app.config.get('UPLOAD_FOLDER', 'uploads')
        output_folder = app.config.get('OUTPUT_FOLDER', 'output')

        # Test if folders exist
        upload_exists = os.path.exists(upload_folder)
        output_exists = os.path.exists(output_folder)

        # Test if we can create directories (if they don't exist)
        upload_writable = False
        output_writable = False

        try:
            os.makedirs(upload_folder, exist_ok=True)
            upload_writable = True
        except Exception as e:
            upload_error = str(e)

        try:
            os.makedirs(output_folder, exist_ok=True)
            output_writable = True
        except Exception as e:
            output_error = str(e)

        # Test writing a file
        test_file_path = os.path.join(upload_folder, 'test_write.tmp')
        can_write_files = False
        try:
            with open(test_file_path, 'w') as f:
                f.write('test')
            os.remove(test_file_path)
            can_write_files = True
        except Exception as e:
            write_error = str(e)

        return jsonify({
            'status': 'success',
            'folders': {
                'upload_folder': upload_folder,
                'upload_exists': upload_exists,
                'upload_writable': upload_writable,
                'output_folder': output_folder,
                'output_exists': output_exists,
                'output_writable': output_writable,
                'can_write_files': can_write_files
            },
            'errors': {
                'upload_error': locals().get('upload_error'),
                'output_error': locals().get('output_error'),
                'write_error': locals().get('write_error')
            }
        })

    except Exception as e:
        import traceback
        return jsonify({
            'status': 'error',
            'message': str(e),
            'traceback': traceback.format_exc()
        }), 500

@app.route('/api/progress/<session_id>', methods=['GET'])
def get_progress(session_id):
    """Get current progress for a session"""
    if session_id not in progress_tracker:
        return jsonify({'status': 'error', 'message': 'Session not found'}), 404

    return jsonify({
        'status': 'success',
        'progress': progress_tracker[session_id]
    })

@app.route('/api/start_analysis', methods=['POST'])
@auth.require_auth
def start_analysis():
    """Start analysis and return session ID immediately"""
    import threading

    try:
        # Check if file is in request
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file part'}), 400

        file = request.files['file']

        # Check if file was selected
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No selected file'}), 400

        # Get parameters
        profile = request.form.get('profile', 'general').lower()
        brand = request.form.get('brand', 'general').lower()
        output_mode = request.form.get('mode', 'json').lower()
        model = request.form.get('model', 'profile')
        reference_asset = request.form.get('reference_asset', '')
        model_version = request.form.get('model_version', None)  # Optional model override
        use_media_plan = request.form.get('use_media_plan', 'false').lower() == 'true'

        # Use profile if provided, otherwise fall back to brand
        if profile and profile != 'general':
            brand = profile.split('_')[0] if '_' in profile else profile

        print(f"Starting analysis with profile: {profile}, brand: {brand}, mode: {output_mode}")
        print(f"DEBUG: Raw mode parameter from request: '{request.form.get('mode')}'")
        print(f"DEBUG: Processed output_mode: '{output_mode}'")

        # Create unique session ID and save file
        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        os.makedirs(session_folder, exist_ok=True)

        file_path = os.path.join(session_folder, file.filename)
        file.save(file_path)

        # Machine-side technical pre-flight (PIL/PyMuPDF/ffprobe, no LLM).
        # Stored on progress_tracker so process_single_check can prepend it to
        # every LLM prompt, and surfaced in result_data for the UI.
        technical_report = technical_inspect(file_path)

        # Derive client from profile if not provided
        client = request.form.get('client_id', request.form.get('client', 'general')).lower()
        if not client or client == 'general':
            if profile.startswith('diageo_'):
                client = 'diageo'
            elif profile.startswith('unilever_'):
                client = 'unilever'
            elif profile.startswith('loreal_'):
                client = 'loreal'
            elif profile.startswith('amazon_'):
                client = 'amazon'
            elif profile.startswith('boots_'):
                client = 'boots'
            elif profile.startswith(('dow_jones_', 'dj_', 'marketwatch_', 'mw_', 'wsj_')):
                client = 'dow_jones'
            else:
                client = 'general'

        access_err = _require_client_access(client)
        if access_err:
            return access_err

        # Log analysis start
        try:
            from usage_tracker import log_analysis_start
            file_info = {
                'filename': file.filename,
                'size': os.path.getsize(file_path) if os.path.exists(file_path) else 0
            }
            # Check if g.user is set, otherwise use a default user info
            user_info = getattr(g, 'user', {'user_id': 'unknown', 'email': 'unknown', 'name': 'unknown'})
            print(f"DEBUG: user_info = {user_info}")
            log_analysis_start(session_id, client, profile, user_info, file_info)
        except Exception as log_error:
            # Log the error but don't fail the analysis
            print(f"WARNING: Failed to log analysis start: {log_error}")
            import traceback
            traceback.print_exc()

        # Initialize progress tracking with estimated total checks
        # We'll update this with the actual number once we determine the profile
        estimated_checks = 25  # Reasonable estimate for most profiles
        progress_tracker[session_id] = {
            'total_checks': estimated_checks,
            'completed_checks': 0,
            'current_check': 'Initializing',
            'current_check_display': 'Initializing Analysis',
            'stage': 'setup',
            'percentage': 0,
            'session_id': session_id,
            'status': 'started',
            'technical_report': technical_report,
        }

        # Start analysis in background thread with explicit parameters
        def run_analysis(session_id, file_path, filename, brand, profile, output_mode, reference_asset, user_info):
            print(f"Background thread started for session: {session_id}")
            print(f"Parameters: brand={brand}, profile={profile}, mode={output_mode}")

            try:
                # Force reload QC apps to ensure they're available
                if not qc_apps:
                    load_qc_apps()

                # Use the explicitly passed parameters
                analysis_brand = brand
                analysis_profile = profile
                analysis_mode = output_mode
                analysis_reference_asset = reference_asset

                print(f"DEBUG: analysis_mode = '{analysis_mode}'")

                # Write debug info to file for easier debugging
                with open('debug_mode.txt', 'a') as f:
                    f.write(f"Session {session_id}: analysis_mode = '{analysis_mode}'\n")

                # Validate brand
                if not analysis_brand or analysis_brand.strip() == '':
                    analysis_brand = 'general'

                # Validate output mode
                print(f"DEBUG: Before validation, analysis_mode = '{analysis_mode}'")
                if analysis_mode not in ['json', 'html']:
                    print(f"DEBUG: analysis_mode '{analysis_mode}' not valid, defaulting to 'json'")
                    analysis_mode = 'json'
                else:
                    print(f"DEBUG: analysis_mode '{analysis_mode}' is valid")
                print(f"DEBUG: After validation, analysis_mode = '{analysis_mode}'")

                # Use the directly specified profile (no triage needed)
                suggested_profile = analysis_profile if analysis_profile and analysis_profile.strip() else 'general'
                print(f"Using specified profile: {suggested_profile}")

                # Update progress to show starting QC analysis
                progress_tracker[session_id].update({
                    'stage': 'qc_analysis',
                    'current_check': 'initializing',
                    'current_check_display': 'Preparing Quality Analysis',
                    'completed_checks': 0,
                    'percentage': 5
                })

                # STEP 1: Run Quality Control Analysis
                print(f"Step 1: Running QC analysis with profile '{suggested_profile}'")

                # Get the profile configuration
                profile_config = get_profile(suggested_profile)
                if not profile_config:
                    raise Exception(f'Profile {suggested_profile} not found')

                # Get enabled checks from profile
                enabled_checks = profile_config.get_enabled_checks()
                profile_weights = profile_config.get_check_weights()

                # Filter to only include checks that exist in qc_apps
                enabled_checks = [check for check in enabled_checks if check in qc_apps]

                if not enabled_checks:
                    raise Exception(f'No enabled checks found for profile {suggested_profile}')

                # Update progress tracker with total checks
                progress_tracker[session_id].update({
                    'total_checks': len(enabled_checks),
                    'stage': 'qc_analysis',
                    'percentage': 10
                })

                # Build media plan context if selected by user
                mp_context = None
                mp_match_data = None
                try:
                    if use_media_plan:
                        mp_data = _get_active_media_plan(client)
                    else:
                        mp_data = None
                    if mp_data:
                        from media_plan_processor import find_matching_asset, build_media_plan_context
                        mp_match = find_matching_asset(file.filename, mp_data)
                        if mp_match:
                            mp_match_data = mp_match['match']
                            mp_context = build_media_plan_context(mp_match_data)
                except Exception as mp_err:
                    print(f"Media plan context build error: {mp_err}")

                # Build localization context if reference asset is a localization matrix
                localization_context = ""
                try:
                    if analysis_reference_asset and mp_match_data:
                        file_record = brand_db.db.get("files", {}).get(analysis_reference_asset)
                        if file_record and file_record.get('asset_type') == 'localization_matrix':
                            loc_path = file_record.get('localization_path')
                            if loc_path and os.path.exists(loc_path):
                                with open(loc_path, 'r', encoding='utf-8') as f:
                                    loc_data = json.load(f)
                                from localization_processor import detect_message_type, build_localization_context
                                creative_name = mp_match_data.get('creative_name', '')
                                msg_type = detect_message_type(creative_name)
                                country_code = mp_match_data.get('country', '')
                                if msg_type and country_code:
                                    localization_context = build_localization_context(loc_data, msg_type, country_code)
                                    if localization_context:
                                        print(f"Localization context built: {msg_type} / {country_code}")
                                    else:
                                        print(f"No localization data for {msg_type} / {country_code}")
                                else:
                                    print(f"No message type detected from creative_name: '{creative_name}'")
                except Exception as loc_err:
                    print(f"Localization context build error: {loc_err}")

                # Combine media plan and localization contexts
                if localization_context and mp_context:
                    mp_context = mp_context + "\n" + localization_context
                elif localization_context:
                    mp_context = localization_context

                # OCR layout measurement - provides pixel-level data to supplement LLM visual checks
                ocr_ctx = None
                try:
                    from ocr_measurement import OCR_RELEVANT_CHECKS
                    ocr_check_names = set(enabled_checks) & set(OCR_RELEVANT_CHECKS)
                    if ocr_check_names:
                        from ocr_measurement import run_ocr_measurement
                        print(f"Running OCR layout measurement for {len(ocr_check_names)} checks...")
                        ocr_result = run_ocr_measurement(file_path)
                        if ocr_result and ocr_result.get('context'):
                            ocr_ctx = ocr_result['context']
                            print(f"OCR measurements computed successfully")
                            print(ocr_ctx)
                        else:
                            print("OCR measurement returned no results")
                except Exception as ocr_err:
                    print(f"OCR measurement error (non-fatal, continuing without): {ocr_err}")

                # Run QC checks in parallel batches
                check_results = process_checks_in_batches(
                    enabled_checks, qc_apps, profile_config, profile_weights,
                    file_path, analysis_reference_asset, brand_db, progress_tracker,
                    session_id, batch_size=15, media_plan_context=mp_context,
                    ocr_context=ocr_ctx
                )

                # STEP 4: Calculate Overall Score
                print(f"Step 4: Calculating overall score")

                total_weighted_score = 0
                total_weight = 0
                completed_checks = 0
                failed_checks = 0

                for check_name, result in check_results.items():
                    weight = result.get('weight', 0.1)
                    total_weight += weight

                    if result['status'] == 'success':
                        completed_checks += 1
                        score = result.get('score')
                        if score is not None:
                            total_weighted_score += score * weight
                    else:
                        failed_checks += 1

                # Calculate overall score
                # For profiles with total_weight = 10.0 (like General Check), use direct weighted score
                # For profiles with total_weight = 1.0, multiply by 10 to scale to 100
                if total_weight >= 10.0:
                    overall_score = min(total_weighted_score, 100)  # Cap at 100
                else:
                    overall_score = min(total_weighted_score * 10, 100)  # Scale to 100-point system, cap at 100

                # STEP 5: Prepare Combined Response
                print(f"Step 5: Preparing response")

                # Create comprehensive response with all data
                result_data = {
                    'status': 'success',
                    'session_id': session_id,
                    'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
                    'filename': file.filename,
                    'profile': suggested_profile,
                    'profile_id': suggested_profile,
                    'profile_name': profile_config.name,
                    'model': 'Profile-based selection',
                    'results': check_results,
                    'triage_analysis': {
                        'status': 'skipped',
                        'results': {'primary_format': 'unknown', 'specific_type': 'user_selected', 'confidence_score': 10, 'recommended_qc_profile': suggested_profile},
                        'raw_response': 'Triage skipped - using user-selected profile directly'
                    },
                    'profile_selection': {
                        'selected_profile': suggested_profile,
                        'profile_source': 'user_selected',
                        'brand': analysis_brand,
                        'format_suffix': suggested_profile,
                        'reference_asset': analysis_reference_asset if analysis_reference_asset else None,
                        'reference_asset_used': bool(analysis_reference_asset)
                    },
                    'qc_analysis': {
                        'profile_used': suggested_profile,
                        'total_checks': len(enabled_checks),
                        'completed_checks': completed_checks,
                        'failed_checks': failed_checks,
                        'check_results': check_results
                    },
                    'summary': {
                        'overall_score': round(overall_score, 1),
                        'profile': profile_config.name,
                        'checks_count': completed_checks,
                        'total_checks': len(enabled_checks),
                        'total_weighted_score': total_weighted_score,
                        'total_weight': total_weight,
                        'grade': determine_grade(overall_score)
                    },
                    'technical_report': progress_tracker[session_id].get('technical_report', {}),
                }

                # L'Oreal Static override: fail if ANY individual check fails (score < 6)
                if suggested_profile == 'loreal_static':
                    for cn, cd in check_results.items():
                        if cd.get('status') == 'success':
                            cs = cd.get('score', 0)
                            if cs is not None and cs < 6:
                                result_data['summary']['grade'] = 'Fail'
                                break

                # Amazon Static override: fail if ANY individual check fails (score < 6)
                if suggested_profile == 'amazon_static':
                    for cn, cd in check_results.items():
                        if cd.get('status') == 'success':
                            cs = cd.get('score', 0)
                            if cs is not None and cs < 6:
                                result_data['summary']['grade'] = 'Fail'
                                break

                # Boots Static override: fail if ANY individual check fails (score < 6)
                if suggested_profile == 'boots_static':
                    for cn, cd in check_results.items():
                        if cd.get('status') == 'success':
                            cs = cd.get('score', 0)
                            if cs is not None and cs < 6:
                                result_data['summary']['grade'] = 'Fail'
                                break

                # Log analysis completion
                from usage_tracker import log_analysis_complete
                results_summary = {
                    'checks_completed': completed_checks,
                    'overall_score': overall_score,
                    'status': 'success',
                    'check_results': check_results
                }
                log_analysis_complete(session_id, client, suggested_profile, user_info, results_summary)

                print(f"Analysis completed successfully")

                # Save results to file
                try:
                    print(f"DEBUG: Saving file with mode: '{analysis_mode}'")
                    output_path = save_results_to_file(result_data, file.filename, analysis_mode, session_id, file_path)
                    result_data['output_file'] = {
                        'path': output_path,
                        'filename': os.path.basename(output_path),
                        'url': f'{request.environ.get("SCRIPT_NAME", "")}/output/{os.path.basename(output_path)}'
                    }
                    print(f"Results saved to: {output_path}")
                except Exception as save_error:
                    print(f"Error saving results to file: {save_error}")

                # Store result in progress tracker
                print(f"Analysis result status: {result_data.get('status')}")
                if session_id in progress_tracker:
                    progress_tracker[session_id]['result'] = result_data
                    progress_tracker[session_id]['status'] = 'completed'
                    progress_tracker[session_id]['stage'] = 'complete'
                    progress_tracker[session_id]['percentage'] = 100
                    print(f"Results stored in progress tracker for session: {session_id}")
                else:
                    print(f"ERROR: Session {session_id} not found in progress tracker!")

            except Exception as e:
                print(f"ERROR in background thread for session {session_id}: {str(e)}")
                print(f"Exception type: {type(e)}")
                import traceback
                print(f"Traceback: {traceback.format_exc()}")
                if session_id in progress_tracker:
                    progress_tracker[session_id]['status'] = 'error'
                    progress_tracker[session_id]['stage'] = 'error'
                    progress_tracker[session_id]['error'] = str(e)
                    progress_tracker[session_id]['current_check'] = 'Error'
                    progress_tracker[session_id]['current_check_display'] = 'Analysis Failed'

        # Start background thread with explicit parameters
        # Get user_info before starting thread (g is request-scoped and won't be available in thread)
        user_info = getattr(g, 'user', {'user_id': 'unknown', 'email': 'unknown', 'name': 'unknown'})
        threading.Thread(
            target=run_analysis,
            args=(session_id, file_path, file.filename, brand, profile, output_mode, reference_asset, user_info),
            daemon=True
        ).start()

        # Return session ID immediately
        return jsonify({
            'status': 'success',
            'session_id': session_id,
            'message': 'Analysis started'
        })

    except Exception as e:
        print(f"ERROR in start_analysis: {type(e).__name__}: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500


@app.route('/api/document/start_analysis', methods=['POST'])
@auth.require_auth
def start_document_analysis():
    """Start a document-mode analysis (multi-page PDF as QC target).

    Mirrors /api/start_analysis but routes through document_mode.dispatcher.
    Reuses the same progress_tracker dict, output folder convention, and
    /api/progress polling endpoint, so the frontend integration is minimal.
    """
    import threading

    try:
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file part'}), 400

        file = request.files['file']
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No selected file'}), 400

        if not file.filename.lower().endswith('.pdf'):
            return jsonify({'status': 'error', 'message': 'Document mode requires a PDF file'}), 400

        profile_id = request.form.get('profile', '').lower()
        if not profile_id:
            return jsonify({'status': 'error', 'message': 'profile is required'}), 400

        output_mode = request.form.get('mode', 'both').lower()
        if output_mode not in ('json', 'html', 'both'):
            output_mode = 'both'

        reference_asset = request.form.get('reference_asset', '') or None
        client = request.form.get('client_id', request.form.get('client', '')).lower()
        if not client:
            return jsonify({'status': 'error', 'message': 'client is required for document mode'}), 400

        access_err = _require_client_access(client)
        if access_err:
            return access_err

        # Resolve and validate the profile is document-mode
        profile_config = get_profile(profile_id)
        if not profile_config:
            return jsonify({'status': 'error', 'message': f'Profile "{profile_id}" not found'}), 404
        if getattr(profile_config, 'mode', 'asset') != 'document':
            return jsonify({
                'status': 'error',
                'message': f'Profile "{profile_id}" is not a document-mode profile. Use /api/start_analysis instead.'
            }), 400

        # Save the uploaded PDF
        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        os.makedirs(session_folder, exist_ok=True)
        file_path = os.path.join(session_folder, file.filename)
        file.save(file_path)

        # Machine-side technical pre-flight (PyMuPDF for PDFs, no LLM).
        technical_report = technical_inspect(file_path)

        # Pre-render directory for per-page PNGs lives alongside the PDF
        pages_dir = os.path.join(session_folder, 'pages')

        # Log start
        try:
            from usage_tracker import log_analysis_start
            file_info = {
                'filename': file.filename,
                'size': os.path.getsize(file_path) if os.path.exists(file_path) else 0,
                'mode': 'document',
            }
            user_info = getattr(g, 'user', {'user_id': 'unknown', 'email': 'unknown', 'name': 'unknown'})
            log_analysis_start(session_id, client, profile_id, user_info, file_info)
        except Exception as log_error:
            print(f"WARNING: Failed to log document analysis start: {log_error}")
            user_info = getattr(g, 'user', {'user_id': 'unknown', 'email': 'unknown', 'name': 'unknown'})

        # Initialize progress
        progress_tracker[session_id] = {
            'total_checks': 0,
            'completed_checks': 0,
            'current_check': 'Initializing',
            'current_check_display': 'Initializing document analysis',
            'stage': 'setup',
            'percentage': 0,
            'session_id': session_id,
            'status': 'started',
            'mode': 'document',
            'technical_report': technical_report,
        }

        def run_document(session_id, file_path, filename, profile_id, client, output_mode, reference_asset, user_info):
            try:
                if not qc_apps:
                    load_qc_apps()

                profile_config_local = get_profile(profile_id)
                # Document-mode checks may live in qc_apps (legacy LLM checks)
                # OR in document_mode.checks registry (new deterministic checks).
                # Accept either as a valid enabled check.
                from document_mode.checks import is_document_scope_check
                enabled_checks = [
                    c for c in profile_config_local.get_enabled_checks()
                    if c in qc_apps or is_document_scope_check(c)
                ]
                profile_weights = profile_config_local.get_check_weights()

                if not enabled_checks:
                    raise Exception(f'No enabled checks found for profile {profile_id}')

                from document_mode.dispatcher import run_document_analysis
                from document_mode.ingest import ingest_pdf
                from document_mode.result_writer import write_document_report

                doc_result = run_document_analysis(
                    pdf_path=file_path,
                    profile_config=profile_config_local,
                    profile_id=profile_id,
                    profile_weights=profile_weights,
                    enabled_checks=enabled_checks,
                    qc_apps=qc_apps,
                    brand_db=brand_db,
                    analysis_reference_asset=reference_asset,
                    media_plan_context=None,
                    ocr_context=None,
                    progress_tracker=progress_tracker,
                    session_id=session_id,
                    process_checks_in_batches=process_checks_in_batches,
                    ingest_pdf_fn=ingest_pdf,
                    pages_output_dir=os.path.join(os.path.dirname(file_path), 'pages'),
                )

                # Write JSON + HTML to the client-scoped output folder
                client_folder = ensure_client_output_folder(client)
                paths = write_document_report(
                    doc_result,
                    original_filename=filename,
                    session_id=session_id,
                    output_dir=client_folder,
                    output_mode=output_mode,
                )

                # Wrap doc_result in a frontend-compatible envelope
                summary = doc_result.get('document_summary', {})
                result_data = {
                    'status': 'success',
                    'session_id': session_id,
                    'timestamp': doc_result.get('timestamp'),
                    'filename': filename,
                    'profile': profile_id,
                    'profile_id': profile_id,
                    'profile_name': profile_config_local.name,
                    'mode': 'document',
                    'document_result': doc_result,
                    'summary': {
                        'overall_score': summary.get('overall_score', 0),
                        'profile': profile_config_local.name,
                        'grade': summary.get('grade', ''),
                        'pages_processed': doc_result.get('pages_processed', 0),
                        'page_count': doc_result.get('page_count', 0),
                    },
                    'technical_report': progress_tracker[session_id].get('technical_report', {}),
                }

                if paths.get('html'):
                    result_data['output_file'] = {
                        'path': paths['html'],
                        'filename': os.path.basename(paths['html']),
                        'url': f'/output/{client}/{os.path.basename(paths["html"])}',
                    }
                if paths.get('json'):
                    result_data['output_data_file'] = {
                        'path': paths['json'],
                        'filename': os.path.basename(paths['json']),
                        'url': f'/output/{client}/{os.path.basename(paths["json"])}',
                    }

                # Log completion
                try:
                    from usage_tracker import log_analysis_complete
                    completed = sum(
                        1 for page in doc_result.get('pages', [])
                        for r in (page.get('results') or {}).values()
                        if r.get('status') == 'success'
                    )
                    log_analysis_complete(
                        session_id, client, profile_id, user_info,
                        {
                            'checks_completed': completed,
                            'overall_score': summary.get('overall_score', 0),
                            'status': 'success',
                            'mode': 'document',
                            'pages_processed': doc_result.get('pages_processed', 0),
                        },
                    )
                except Exception as log_err:
                    print(f"WARNING: failed to log doc-mode analysis completion: {log_err}")

                progress_tracker[session_id]['result'] = result_data
                progress_tracker[session_id]['status'] = 'completed'
                progress_tracker[session_id]['stage'] = 'complete'
                progress_tracker[session_id]['percentage'] = 100

            except Exception as e:
                print(f"ERROR in document run for session {session_id}: {e}")
                import traceback
                traceback.print_exc()
                if session_id in progress_tracker:
                    progress_tracker[session_id]['status'] = 'error'
                    progress_tracker[session_id]['stage'] = 'error'
                    progress_tracker[session_id]['error'] = str(e)
                    progress_tracker[session_id]['current_check_display'] = 'Document analysis failed'

        threading.Thread(
            target=run_document,
            args=(session_id, file_path, file.filename, profile_id, client, output_mode, reference_asset, user_info),
            daemon=True,
        ).start()

        return jsonify({
            'status': 'success',
            'session_id': session_id,
            'mode': 'document',
            'message': 'Document analysis started',
        })

    except Exception as e:
        print(f"ERROR in start_document_analysis: {type(e).__name__}: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/document/start_diff', methods=['POST'])
@auth.require_auth
def start_document_diff_analysis():
    """Start an old-vs-new PDF diff analysis (Phase 3).

    Accepts two PDFs as 'old_file' and 'new_file' multipart fields.
    Routes through document_mode.diff_engine.run_document_diff_analysis.
    """
    import threading

    try:
        if 'old_file' not in request.files or 'new_file' not in request.files:
            return jsonify({'status': 'error', 'message': "Both 'old_file' and 'new_file' are required"}), 400

        old_file = request.files['old_file']
        new_file = request.files['new_file']
        if not old_file.filename or not new_file.filename:
            return jsonify({'status': 'error', 'message': 'Both files must be selected'}), 400
        if not old_file.filename.lower().endswith('.pdf') or not new_file.filename.lower().endswith('.pdf'):
            return jsonify({'status': 'error', 'message': 'Both old and new must be PDFs'}), 400

        profile_id = request.form.get('profile', '').lower()
        if not profile_id:
            return jsonify({'status': 'error', 'message': 'profile is required'}), 400

        output_mode = request.form.get('mode', 'both').lower()
        if output_mode not in ('json', 'html', 'both'):
            output_mode = 'both'

        client = request.form.get('client_id', request.form.get('client', '')).lower()
        if not client:
            return jsonify({'status': 'error', 'message': 'client is required for diff mode'}), 400

        access_err = _require_client_access(client)
        if access_err:
            return access_err

        profile_config = get_profile(profile_id)
        if not profile_config:
            return jsonify({'status': 'error', 'message': f'Profile "{profile_id}" not found'}), 404
        if getattr(profile_config, 'mode', 'asset') != 'document_diff':
            return jsonify({
                'status': 'error',
                'message': f'Profile "{profile_id}" is not a document_diff profile.'
            }), 400

        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        os.makedirs(session_folder, exist_ok=True)
        old_path = os.path.join(session_folder, f'old_{old_file.filename}')
        new_path = os.path.join(session_folder, f'new_{new_file.filename}')
        old_file.save(old_path)
        new_file.save(new_path)

        try:
            from usage_tracker import log_analysis_start
            user_info = getattr(g, 'user', {'user_id': 'unknown', 'email': 'unknown', 'name': 'unknown'})
            log_analysis_start(session_id, client, profile_id, user_info, {
                'filename': f'{old_file.filename} vs {new_file.filename}',
                'mode': 'document_diff',
            })
        except Exception as log_error:
            print(f"WARNING: failed to log diff start: {log_error}")
            user_info = getattr(g, 'user', {'user_id': 'unknown', 'email': 'unknown', 'name': 'unknown'})

        progress_tracker[session_id] = {
            'total_checks': 0,
            'completed_checks': 0,
            'current_check': 'Initializing diff',
            'current_check_display': 'Initializing diff analysis',
            'stage': 'setup',
            'percentage': 0,
            'session_id': session_id,
            'status': 'started',
            'mode': 'document_diff',
        }

        def run_diff():
            try:
                profile_config_local = get_profile(profile_id)
                from document_mode.diff_engine import run_document_diff_analysis
                from document_mode.ingest import ingest_pdf
                from document_mode.diff_report_writer import write_diff_report
                from llm_config import call_gemini_vision

                doc_result = run_document_diff_analysis(
                    old_pdf_path=old_path,
                    new_pdf_path=new_path,
                    old_filename=old_file.filename,
                    new_filename=new_file.filename,
                    profile_config=profile_config_local,
                    profile_id=profile_id,
                    progress_tracker=progress_tracker,
                    session_id=session_id,
                    ingest_pdf_fn=ingest_pdf,
                    call_gemini_vision_fn=call_gemini_vision,
                    pages_output_dir_old=os.path.join(session_folder, 'pages_old'),
                    pages_output_dir_new=os.path.join(session_folder, 'pages_new'),
                )

                client_folder = ensure_client_output_folder(client)
                paths = write_diff_report(
                    doc_result,
                    old_filename=old_file.filename,
                    new_filename=new_file.filename,
                    session_id=session_id,
                    output_dir=client_folder,
                    output_mode=output_mode,
                )

                summary = doc_result.get('document_summary', {})
                result_data = {
                    'status': 'success',
                    'session_id': session_id,
                    'timestamp': doc_result.get('timestamp'),
                    'filename': f'{old_file.filename} vs {new_file.filename}',
                    'profile': profile_id,
                    'profile_id': profile_id,
                    'profile_name': profile_config_local.name,
                    'mode': 'document_diff',
                    'document_result': doc_result,
                    'summary': {
                        'overall_score': summary.get('overall_score', 0),
                        'profile': profile_config_local.name,
                        'grade': summary.get('grade', ''),
                    },
                }
                if paths.get('html'):
                    result_data['output_file'] = {
                        'path': paths['html'],
                        'filename': os.path.basename(paths['html']),
                        'url': f'/output/{client}/{os.path.basename(paths["html"])}',
                    }
                if paths.get('json'):
                    result_data['output_data_file'] = {
                        'path': paths['json'],
                        'filename': os.path.basename(paths['json']),
                        'url': f'/output/{client}/{os.path.basename(paths["json"])}',
                    }

                try:
                    from usage_tracker import log_analysis_complete
                    log_analysis_complete(
                        session_id, client, profile_id, user_info,
                        {
                            'checks_completed': len(doc_result.get('pair_diffs', {})),
                            'overall_score': summary.get('overall_score', 0),
                            'status': 'success',
                            'mode': 'document_diff',
                            'token_usage': doc_result.get('token_usage', {}),
                        },
                    )
                except Exception as log_err:
                    print(f"WARNING: failed to log diff completion: {log_err}")

                progress_tracker[session_id]['result'] = result_data
                progress_tracker[session_id]['status'] = 'completed'
                progress_tracker[session_id]['stage'] = 'complete'
                progress_tracker[session_id]['percentage'] = 100

            except Exception as e:
                print(f"ERROR in diff run for session {session_id}: {e}")
                import traceback
                traceback.print_exc()
                if session_id in progress_tracker:
                    progress_tracker[session_id]['status'] = 'error'
                    progress_tracker[session_id]['stage'] = 'error'
                    progress_tracker[session_id]['error'] = str(e)
                    progress_tracker[session_id]['current_check_display'] = 'Diff analysis failed'

        threading.Thread(target=run_diff, daemon=True).start()

        return jsonify({
            'status': 'success',
            'session_id': session_id,
            'mode': 'document_diff',
            'message': 'Diff analysis started',
        })

    except Exception as e:
        print(f"ERROR in start_document_diff_analysis: {type(e).__name__}: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/output/<client>/<filename>', methods=['GET'])
@auth.require_auth
def serve_client_output_file(client, filename):
    """Serve saved output files from client-specific folders"""
    access_err = _require_client_access(client)
    if access_err:
        return access_err
    try:
        file_path = os.path.join(app.config['OUTPUT_FOLDER'], client, filename)
        if os.path.exists(file_path):
            if filename.endswith('.html'):
                with open(file_path, 'r', encoding='utf-8') as f:
                    content = f.read()
                return Response(content, mimetype='text/html')
            elif filename.endswith('.json'):
                with open(file_path, 'r', encoding='utf-8') as f:
                    content = f.read()
                return Response(content, mimetype='application/json')
            else:
                return Response(open(file_path, 'rb').read(), mimetype='application/octet-stream')
        else:
            return jsonify({'error': 'File not found'}), 404
    except Exception as e:
        return jsonify({'error': str(e)}), 500

@app.route('/output/<filename>', methods=['GET'])
def serve_output_file(filename):
    """Serve saved output files (legacy route for backward compatibility)"""
    try:
        # First try to find file in root output folder
        file_path = os.path.join(app.config['OUTPUT_FOLDER'], filename)
        if os.path.exists(file_path):
            if filename.endswith('.html'):
                with open(file_path, 'r', encoding='utf-8') as f:
                    content = f.read()
                return Response(content, mimetype='text/html')
            elif filename.endswith('.json'):
                with open(file_path, 'r', encoding='utf-8') as f:
                    content = f.read()
                return Response(content, mimetype='application/json')
            else:
                return Response(open(file_path, 'rb').read(), mimetype='application/octet-stream')
        else:
            return jsonify({'error': 'File not found'}), 404
    except Exception as e:
        return jsonify({'error': str(e)}), 500

@app.route('/api/output_files', methods=['GET'])
@auth.require_auth
def list_output_files():
    """List saved output files filtered by client, sorted by creation date (newest first)"""
    try:
        # Get client parameter (optional)
        client_filter = request.args.get('client', None)
        print(f"DEBUG: list_output_files called with client_filter='{client_filter}'")

        if client_filter:
            access_err = _require_client_access(client_filter)
            if access_err:
                return access_err

        # Run cleanup of files older than 14 days
        cleanup_old_files(max_age_days=14)

        files = []
        output_folder = app.config['OUTPUT_FOLDER']

        if os.path.exists(output_folder):
            # If client filter is provided, only check that client's folder
            if client_filter:
                client_folder = os.path.join(output_folder, client_filter)
                if os.path.exists(client_folder):
                    for filename in os.listdir(client_folder):
                        if filename.endswith(('.html', '.json')):
                            file_path = os.path.join(client_folder, filename)
                            if os.path.isfile(file_path):
                                file_stats = os.stat(file_path)
                                files.append({
                                    'filename': filename,
                                    'size': file_stats.st_size,
                                    'created': datetime.fromtimestamp(file_stats.st_ctime).strftime('%Y-%m-%d %H:%M:%S'),
                                    'created_timestamp': file_stats.st_ctime,
                                    'url': f'{request.environ.get("SCRIPT_NAME", "")}/output/{client_filter}/{filename}',
                                    'client': client_filter
                                })
            else:
                # No client filter - check all client folders
                for item in os.listdir(output_folder):
                    item_path = os.path.join(output_folder, item)
                    if os.path.isdir(item_path):
                        # This is a client folder
                        client_name = item
                        for filename in os.listdir(item_path):
                            if filename.endswith(('.html', '.json')):
                                file_path = os.path.join(item_path, filename)
                                if os.path.isfile(file_path):
                                    file_stats = os.stat(file_path)
                                    files.append({
                                        'filename': filename,
                                        'size': file_stats.st_size,
                                        'created': datetime.fromtimestamp(file_stats.st_ctime).strftime('%Y-%m-%d %H:%M:%S'),
                                        'created_timestamp': file_stats.st_ctime,
                                        'url': f'{request.environ.get("SCRIPT_NAME", "")}/output/{client_name}/{filename}',
                                        'client': client_name
                                    })

        # Sort files by creation time (newest first)
        files.sort(key=lambda x: x['created_timestamp'], reverse=True)

        # Remove the timestamp field from response (not needed by frontend)
        for file in files:
            del file['created_timestamp']

        print(f"DEBUG: Returning {len(files)} files for client_filter='{client_filter}'")
        if files:
            print(f"DEBUG: Sample file clients: {[f.get('client', 'unknown') for f in files[:3]]}")

        return jsonify({'files': files})
    except Exception as e:
        print(f"Error listing output files: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({'error': str(e)}), 500

@app.route('/api/delete_output_files', methods=['POST'])
@auth.require_auth
def delete_output_files():
    """Delete selected output files"""
    try:
        data = request.get_json()
        filenames = data.get('filenames', [])
        client = data.get('client', '')

        if not filenames or not client:
            return jsonify({'error': 'Missing filenames or client'}), 400

        output_folder = app.config['OUTPUT_FOLDER']
        deleted = []
        errors = []

        for filename in filenames:
            # Sanitize filename to prevent path traversal
            safe_filename = os.path.basename(filename)
            file_path = os.path.join(output_folder, client, safe_filename)

            if os.path.isfile(file_path):
                try:
                    os.remove(file_path)
                    deleted.append(safe_filename)
                    print(f"Deleted output file: {file_path}")
                except Exception as e:
                    errors.append({'filename': safe_filename, 'error': str(e)})
            else:
                errors.append({'filename': safe_filename, 'error': 'File not found'})

        return jsonify({
            'deleted': deleted,
            'errors': errors,
            'deleted_count': len(deleted)
        })
    except Exception as e:
        print(f"Error deleting output files: {e}")
        return jsonify({'error': str(e)}), 500

@app.route('/api/profiles', methods=['GET'])
def get_available_profiles():
    """Get all available profiles grouped by type, optionally filtered by client"""
    from profile_config import get_profile_summary, get_profile
    from client_config import get_profiles_with_visibility

    # Check if client parameter is provided
    client_id = request.args.get('client', None)

    # Force reload profiles to ensure they're up to date
    from profile_config import load_profiles
    load_profiles()

    profiles_summary = get_profile_summary()

    # Filter by client if specified (using visibility-aware function)
    if client_id:
        allowed_profiles = get_profiles_with_visibility(client_id)
        profiles_summary = {
            pid: pinfo for pid, pinfo in profiles_summary.items()
            if pid in allowed_profiles
        }

    # Group profiles by type
    triage_profiles = {}
    format_profiles = {}

    # Build detailed profile data including checks
    all_profiles_detailed = {}
    for profile_id, profile_info in profiles_summary.items():
        # Get full profile data
        try:
            profile = get_profile(profile_id)

            # Load the raw profile JSON to get weight_scale if it exists
            profile_path = os.path.join('profiles', f'{profile_id}.json')
            weight_scale = 100  # Default to 100
            if os.path.exists(profile_path):
                with open(profile_path, 'r') as f:
                    profile_data = json.load(f)
                    weight_scale = profile_data.get('weight_scale', 100)

            all_profiles_detailed[profile_id] = {
                'name': profile.name,
                'description': profile.description,
                'enabled_checks': profile.get_enabled_checks(),
                'total_checks': len(profile.checks),
                'enabled_count': len(profile.get_enabled_checks()),
                'weight_scale': weight_scale,
                'mode': getattr(profile, 'mode', 'asset'),
                'checks': {check_name: {'weight': config.weight, 'llm': config.llm, 'enabled': config.enabled}
                          for check_name, config in profile.checks.items()}
            }
        except:
            # Fallback to summary if full profile can't be loaded
            all_profiles_detailed[profile_id] = profile_info

        if '_triage' in profile_id:
            brand = profile_id.replace('_triage', '')
            triage_profiles[brand] = {
                'id': profile_id,
                'name': profile_info['name'],
                'description': profile_info['description']
            }
        elif any(suffix in profile_id for suffix in ['_print', '_digital', '_ooh', '_packaging', '_event', '_indoor']):
            format_profiles[profile_id] = {
                'id': profile_id,
                'name': profile_info['name'],
                'description': profile_info['description'],
                'enabled_checks': profile_info['enabled_checks'],
                'total_checks': profile_info['total_checks']
            }

    response_data = {
        'status': 'success',
        'triage_profiles': triage_profiles,
        'format_profiles': format_profiles,
        'all_profiles': all_profiles_detailed
    }

    # Include client info if filtered
    if client_id:
        response_data['client'] = client_id

    return jsonify(response_data)

@app.route('/api/clients', methods=['GET'])
def get_clients_endpoint():
    """Get clients visible to the current user. Admins see all; others see only their grants."""
    from client_config import get_all_clients
    from user_access import get_user_clients, is_admin

    try:
        all_clients = get_all_clients()

        # Resolve the current user's email if authenticated. Unauthenticated
        # callers get an empty list so the UI can prompt for sign-in without
        # leaking the full client catalogue.
        user_email = ''
        try:
            auth_result = app.auth_middleware.is_authenticated()
            if auth_result.get('authenticated'):
                user_email = auth_result.get('user', {}).get('email', '')
        except Exception:
            pass

        if not user_email:
            return jsonify({'status': 'success', 'clients': {}, 'is_admin': False})

        allowed_ids = get_user_clients(user_email)
        filtered = {cid: all_clients[cid] for cid in allowed_ids if cid in all_clients}

        return jsonify({
            'status': 'success',
            'clients': filtered,
            'is_admin': is_admin(user_email)
        })
    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500


@app.route('/api/all_clients', methods=['GET'])
@auth.require_auth
def list_all_clients_endpoint():
    """
    Full client catalogue (auth required). Used by the Request Access form so
    users can pick clients they don't currently have access to.
    """
    try:
        from client_config import get_all_clients
        return jsonify({'status': 'success', 'clients': get_all_clients()})
    except Exception as e:
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/clients/<client_id>/default_profile', methods=['GET'])
@auth.require_auth
def get_client_default_profile_endpoint(client_id):
    """Return the effective default profile for a client (override or static).

    Auth-required (any signed-in user) — read-only, no admin gate.
    """
    try:
        from client_config import get_all_clients, get_default_profile, get_client_profiles
        clients = get_all_clients()
        if client_id not in clients:
            return jsonify({'status': 'error', 'message': f'unknown client: {client_id}'}), 404
        access_err = _require_client_access(client_id)
        if access_err:
            return access_err
        return jsonify({
            'status': 'success',
            'client_id': client_id,
            'profiles': get_client_profiles(client_id),
            'default_profile': get_default_profile(client_id),
            'static_default': clients[client_id].get('default_profile'),
        })
    except Exception as e:
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/clients/<client_id>/default_profile', methods=['PUT'])
@auth.require_auth
def set_client_default_profile_endpoint(client_id):
    """Admin-only: set the default profile for a client (persisted as a runtime override).

    Body: {"profile_id": "<id>"}. The profile must already be in the client's
    `profiles` list — we don't allow defaulting to a profile the client can't see.
    Posts to backend/client_defaults.json so a bad write can never break server boot.
    """
    actor_email, err = _require_admin()
    if err:
        return err
    try:
        body = request.get_json(silent=True) or {}
        profile_id = (body.get('profile_id') or '').strip()
        if not profile_id:
            return jsonify({'status': 'error', 'message': 'profile_id is required'}), 400
        from client_config import set_default_profile
        ok, reason = set_default_profile(client_id, profile_id)
        if not ok:
            return jsonify({'status': 'error', 'message': reason}), 400
        print(f'Admin {actor_email}: set default_profile for {client_id} → {profile_id}')
        return jsonify({
            'status': 'success',
            'client_id': client_id,
            'default_profile': profile_id,
        })
    except Exception as e:
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/clients/<client_id>/default_profile', methods=['DELETE'])
@auth.require_auth
def clear_client_default_profile_endpoint(client_id):
    """Admin-only: clear the runtime override so the static default applies again."""
    actor_email, err = _require_admin()
    if err:
        return err
    try:
        from client_config import clear_default_profile_override, get_default_profile
        clear_default_profile_override(client_id)
        print(f'Admin {actor_email}: cleared default_profile override for {client_id}')
        return jsonify({
            'status': 'success',
            'client_id': client_id,
            'default_profile': get_default_profile(client_id),
        })
    except Exception as e:
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/access_request', methods=['POST'])
@auth.require_auth
def request_client_access():
    """
    Signed-in users request access to additional clients. Sends an email to all
    admins with the requester's identity (taken from the verified session, never
    the request body) and the clients they want.
    """
    from html import escape as _html_escape
    try:
        payload = request.get_json(silent=True) or {}
        requested_clients = payload.get('clients') or []
        reason = (payload.get('reason') or '').strip()

        if not isinstance(requested_clients, list) or not requested_clients:
            return jsonify({'status': 'error', 'message': 'Select at least one client'}), 400

        # Always source identity from the verified session, not the body.
        user_email = getattr(g, 'user', {}).get('email', '')
        user_name = getattr(g, 'user', {}).get('name', '') or user_email
        if not user_email:
            return jsonify({'status': 'error', 'message': 'Authentication required'}), 401

        from client_config import get_all_clients
        all_clients = get_all_clients()
        invalid = [c for c in requested_clients if c not in all_clients]
        if invalid:
            return jsonify({'status': 'error',
                            'message': f'Unknown client(s): {", ".join(invalid)}'}), 400

        client_labels = [all_clients[c].get('display_name', c) for c in requested_clients]

        from user_access import list_access_entries
        access_data = list_access_entries()
        admin_recipients = [e['email'] for e in access_data.get('entries', [])
                            if e.get('is_admin') and e.get('email')]
        if not admin_recipients:
            return jsonify({'status': 'error',
                            'message': 'No admin recipients configured'}), 500

        subject = f'AI QC: Client access request from {user_name}'
        text_body_lines = [
            f'{user_name} ({user_email}) has requested access to:',
            '',
        ] + [f'  - {label}' for label in client_labels]
        if reason:
            text_body_lines += ['', 'Reason / context:', reason]
        text_body_lines += ['', 'Review and grant access via the Admin panel > User Access tab.']
        text_body = '\n'.join(text_body_lines)

        html_clients = ''.join(f'<li>{_html_escape(label)}</li>' for label in client_labels)
        html_reason = ''
        if reason:
            html_reason = (
                '<p><strong>Reason / context:</strong><br>'
                + _html_escape(reason).replace('\n', '<br>')
                + '</p>'
            )
        html_body = (
            f'<p><strong>{_html_escape(user_name)}</strong> '
            f'({_html_escape(user_email)}) has requested access to:</p>'
            f'<ul>{html_clients}</ul>'
            f'{html_reason}'
            '<p>Review and grant access via the Admin panel &gt; User Access tab.</p>'
        )

        from email_service import send_email
        ok, err = send_email(
            to_addresses=admin_recipients,
            subject=subject,
            body=text_body,
            html_body=html_body,
            reply_to=user_email,
        )

        try:
            from usage_tracker import log_access_request
            log_access_request({
                'user_email': user_email,
                'user_name': user_name,
                'requested_clients': requested_clients,
                'reason': reason,
                'recipients': admin_recipients,
                'email_sent': ok,
                'email_error': err,
            })
        except Exception as log_err:
            print(f'[access_request] log failed: {log_err}')

        if not ok:
            return jsonify({'status': 'error',
                            'message': f'Could not send email: {err}'}), 502

        return jsonify({
            'status': 'success',
            'message': 'Request sent — an admin will review it shortly.',
            'recipients_count': len(admin_recipients),
        })

    except Exception as e:
        print(f'Error in /api/access_request: {e}')
        import traceback
        traceback.print_exc()
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/models', methods=['GET'])
def get_models_endpoint():
    """Get all available LLM models for selection"""
    from llm_config import get_available_models, get_model_info

    try:
        available_models = get_available_models()
        model_info = get_model_info()

        return jsonify({
            'status': 'success',
            'models': available_models,
            'model_info': model_info
        })
    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/run_check', methods=['POST'])
def run_check():
    """API endpoint to run a single QC check"""
    data = request.json

    # Validate inputs
    if not data or 'check_name' not in data or 'file_path' not in data:
        return jsonify({'status': 'error', 'message': 'Missing required parameters'}), 400

    check_name = data['check_name']
    file_path = data['file_path']
    model_name = data.get('model_name', 'Gemini')  # Default to Gemini if not specified
    output_mode = data.get('mode', 'json').lower()  # Get output mode, default to JSON

    # Validate check exists
    if check_name not in qc_apps:
        return jsonify({'status': 'error', 'message': f'QC check "{check_name}" not found'}), 404

    # Validate file exists
    if not os.path.exists(file_path):
        return jsonify({'status': 'error', 'message': 'File not found'}), 404

    try:
        # Get the prompt
        prompt = qc_apps[check_name]['prompt']

        # Get reference image if available
        reference_path = qc_apps[check_name].get('reference_image')

        # Run the QC check with reference image if available
        result = run_visual_qc(
            prompt=prompt,
            asset_path=file_path,
            reference_path=reference_path,
            model_name=model_name
        )

        # Extract score from result if possible
        score = None
        try:
            # Use our extraction function to get score from JSON blocks
            json_data = extract_json_from_response(result['response'])
            if 'score' in json_data:
                score = json_data.get('score')
                print(f"Extracted score from JSON block: {score}")

            # If we still don't have a score, look for any score in text
            if score is None:
                # Try to find a score pattern in the text
                score_pattern = r'["\']score["\']\s*:\s*(\d+)'
                score_match = re.search(score_pattern, result['response'])
                if score_match:
                    score = int(score_match.group(1))
                    print(f"Extracted score from regex: {score}")
                else:
                    # Look for visual evidence of actual scores in text like "score: 7", "score is 8", "score of 9 out of 10"
                    descriptive_score_pattern = r'score(?:\s+is|\s*:\s*|\s+of\s+)(?:\s*)(\d+)(?:\s*out\s*of\s*10)?'
                    descriptive_match = re.search(descriptive_score_pattern, result['response'].lower())
                    if descriptive_match:
                        score = int(descriptive_match.group(1))
                        print(f"Extracted score from descriptive text: {score}")
                    else:
                        # Try to determine score from pass/fail status (legacy mode)
                        result_text = result.get('response', '').upper()
                        if "PASS" in result_text:
                            score = 10  # Pass = 10/10
                            print("Detected PASS keyword, setting score to 10")
                        elif "FAIL" in result_text:
                            score = 3   # Fail = 3/10
                            print("Detected FAIL keyword, setting score to 3")
                        else:
                            print(f"Could not extract score, using default of 5")
                            score = 5  # Default middle score
        except Exception as parse_error:
            print(f"Error parsing score from response: {parse_error}")
            score = 5  # Default to middle score

        # Add the score to the result
        result['score'] = score if score is not None else 5  # Default to middle score if extraction fails

        # Process result for JSON mode
        if output_mode == 'json':
            # For JSON mode, we update the response to be ONLY the JSON part
            json_data = extract_json_from_response(result['response'])
            if json_data:
                # If we found JSON in the response, replace the full text with just the extracted JSON
                result['original_response'] = result['response']  # Save original for debugging
                result['response'] = json.dumps(json_data, indent=2)  # Pretty print the JSON

        # Add metadata but don't save to file
        output_json = {
            "timestamp": datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
            "check_name": check_name,
            "display_name": qc_apps[check_name]['display_name'],
            "model": model_name,
            "file_analyzed": os.path.basename(file_path),
            "result": result,
            "score": result['score'],
            "has_reference": reference_path is not None
        }

        return jsonify(output_json)

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e),
            'traceback': traceback.format_exc()
        }), 500

@app.route('/api/triage_file', methods=['POST'])
def api_triage_file():
    """API endpoint to perform file type triage detection"""
    try:
        # Force reload QC apps to ensure triage app is available
        if not qc_apps:
            load_qc_apps()

        # Check if file is in request
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file part'}), 400

        file = request.files['file']

        # Check if file was selected
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No selected file'}), 400

        # Get the brand/profile base name for triage routing
        brand = request.form.get('brand', 'default')

        # Create unique session ID and save file
        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        os.makedirs(session_folder, exist_ok=True)

        file_path = os.path.join(session_folder, file.filename)
        file.save(file_path)

        # Run file type triage detection
        if 'file_type_triage' not in qc_apps:
            return jsonify({'status': 'error', 'message': 'File type triage app not available'}), 500

        # Get the triage prompt
        prompt = qc_apps['file_type_triage']['prompt']

        # Run the triage check
        result = run_visual_qc(
            prompt=prompt,
            asset_path=file_path,
            model_name='Gemini'  # Use Gemini for triage
        )

        # Extract the triage results
        triage_data = extract_json_from_response(result['response'])

        if not triage_data:
            return jsonify({
                'status': 'error',
                'message': 'Could not extract triage results',
                'raw_response': result['response']
            }), 500

        # Generate the suggested profile name
        format_suffix = triage_data.get('recommended_qc_profile', '_digital')
        suggested_profile = f"{brand}{format_suffix}"

        # Return triage results
        return jsonify({
            'status': 'success',
            'session_id': session_id,
            'file_path': file_path,
            'filename': file.filename,
            'triage_results': triage_data,
            'suggested_profile': suggested_profile,
            'brand': brand,
            'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S')
        })

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e),
            'traceback': traceback.format_exc()
        }), 500

@app.route('/api/process_triaged_file', methods=['POST'])
@auth.require_auth
def api_process_triaged_file():
    """API endpoint to process a file that has already been triaged"""
    try:
        data = request.json

        # Validate required parameters
        if not data or 'session_id' not in data or 'profile' not in data:
            return jsonify({'status': 'error', 'message': 'Missing required parameters: session_id and profile'}), 400

        session_id = data['session_id']
        profile_name = data['profile']
        output_mode = data.get('mode', 'json').lower()

        # Reconstruct file path from session
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        if not os.path.exists(session_folder):
            return jsonify({'status': 'error', 'message': 'Session not found'}), 404

        # Find the file in the session folder
        files = os.listdir(session_folder)
        if not files:
            return jsonify({'status': 'error', 'message': 'No file found in session'}), 404

        filename = files[0]  # Use the first file found
        file_path = os.path.join(session_folder, filename)

        # Validate profile exists
        if profile_name not in PROFILES:
            available_profiles = list(PROFILES.keys())
            return jsonify({
                'status': 'error',
                'message': f'Invalid profile: {profile_name}. Available profiles: {available_profiles}'
            }), 400

        # Get profile and process checks
        profile = get_profile(profile_name)
        selected_checks = profile.get_enabled_checks()
        profile_weights = profile.get_check_weights()

        if not selected_checks:
            return jsonify({'status': 'error', 'message': 'No QC checks available for the selected profile'}), 400

        # Process each check (same logic as original process_file)
        check_results = {}
        overall_weighted_score = 0
        total_weight = 0

        for i, check_name in enumerate(selected_checks):
            print(f"Processing check {i+1}/{len(selected_checks)}: {check_name}")

            # Skip if check is not available
            if check_name not in qc_apps:
                check_results[check_name] = {
                    'status': 'error',
                    'message': f'QC check not found'
                }
                continue

            # Get LLM preference for this check
            ai_model = profile.get_check_llm(check_name)

            # Get the prompt and reference image
            prompt = qc_apps[check_name]['prompt']
            reference_path = qc_apps[check_name].get('reference_image')

            try:
                # Run the QC check
                result = run_visual_qc(
                    prompt=prompt,
                    asset_path=file_path,
                    reference_path=reference_path,
                    model_name=ai_model
                )

                # Extract score from result
                score = extract_score_from_result(result, profile, check_name)
                result['score'] = score

                # Process result for JSON mode
                if output_mode == 'json':
                    json_data = extract_json_from_response(result['response'])
                    if json_data:
                        result['original_response'] = result['response']
                        result['response'] = json.dumps(json_data, indent=2)

                # Calculate weighted score
                weight = profile_weights.get(check_name, 1.0 / len(selected_checks))
                weighted_score = result['score'] * weight
                overall_weighted_score += weighted_score
                total_weight += weight

                # Store result
                check_results[check_name] = {
                    'status': 'success',
                    'display_name': qc_apps[check_name]['display_name'],
                    'score': result['score'],
                    'weight': weight,
                    'weighted_score': weighted_score,
                    'has_reference': reference_path is not None,
                    'result': result
                }

            except Exception as e:
                check_results[check_name] = {
                    'status': 'error',
                    'message': str(e),
                    'traceback': traceback.format_exc()
                }

        # Calculate overall score
        overall_score = 0
        if total_weight > 0:
            # Special case for Unilever key visual profile - show percentage of 120
            if profile_name == 'unilever_key_visual':
                # For Unilever profile, calculate as percentage of 120
                # Maximum possible score is 10 * 1.2 = 12, so scale to 120
                max_possible_score = 10 * total_weight  # 10 * 1.2 = 12
                overall_score = min(round((overall_weighted_score / max_possible_score) * 120, 1), 120)
            else:
                # Maximum possible score is 10 * total_weight, so normalize to 100%
                max_possible_score = 10 * total_weight
                overall_score = min(round((overall_weighted_score / max_possible_score) * 100, 1), 100)
        else:
            successful_checks = [r for r in check_results.values() if r.get('status') == 'success']
            if successful_checks:
                sum_scores = sum(r.get('score', 0) for r in successful_checks)
                overall_score = min(round((sum_scores / len(successful_checks)) * 10, 1), 100)

        # Generate report data
        report_data = {
            'session_id': session_id,
            'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
            'filename': filename,
            'profile': profile_name,
            'profile_id': profile_name,  # Store the profile ID for HTML detection
            'profile_name': profile.name,
            'model': 'Profile-based selection',
            'results': check_results,
            'summary': {
                'overall_score': overall_score,
                'profile': profile.name,
                'checks_count': len([r for r in check_results.values() if r.get('status') == 'success']),
                'total_checks': len(check_results),
                'total_weighted_score': overall_weighted_score,
                'total_weight': total_weight
            }
        }

        # Determine overall grade
        grade = determine_grade(overall_score)

        # L'Oreal Static override: fail if ANY individual check fails (score < 6)
        if profile_name == 'loreal_static':
            for check_name, check_data in check_results.items():
                if check_data.get('status') == 'success':
                    check_score = check_data.get('score', 0)
                    if check_score is not None and check_score < 6:
                        grade = 'Fail'
                        break

        # Boots Static override: fail if ANY individual check fails (score < 6)
        if profile_name == 'boots_static':
            for check_name, check_data in check_results.items():
                if check_data.get('status') == 'success':
                    check_score = check_data.get('score', 0)
                    if check_score is not None and check_score < 6:
                        grade = 'Fail'
                        break

        report_data['summary']['grade'] = grade

        # Save results to file regardless of output mode
        output_path = save_results_to_file(report_data, filename, output_mode, session_id, file_path)

        # Return results based on output mode
        if output_mode == 'html':
            html_response = generate_html_response(report_data, filename)
            # Add file path info to the response
            return html_response
        else:
            # For JSON mode, return the data with file path info
            report_data['output_file'] = {
                'path': output_path,
                'filename': os.path.basename(output_path),
                'url': f'{request.environ.get("SCRIPT_NAME", "")}/output/{os.path.basename(output_path)}'
            }
            return jsonify(report_data)

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e),
            'traceback': traceback.format_exc()
        }), 500

@app.route('/api/process_file', methods=['POST'])
@auth.require_auth
def api_process_file():
    """API endpoint to process a file with specified profiles and checks"""
    try:
        # Force reload QC apps to ensure they're available for this request
        if not qc_apps:
            load_qc_apps()
        print(f"API: Loaded {len(qc_apps)} QC apps for processing")

        # Check if file is in request
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file part'}), 400

        file = request.files['file']

        # Check if file was selected
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No selected file'}), 400

        # Get output mode (json or html)
        output_mode = request.form.get('mode', 'json').lower()
        if output_mode not in ['json', 'html']:
            output_mode = 'json'  # Default to JSON if invalid mode

        # Get selected profiles from request (can be single or multiple)
        # Support both single profile parameter and multiple profiles array
        selected_profiles = []
        if 'profiles[]' in request.form:
            selected_profiles = request.form.getlist('profiles[]')
        elif 'profile' in request.form:
            selected_profiles = [request.form.get('profile')]

        if not selected_profiles:
            selected_profiles = ['default']  # Use default if none specified

        # Validate profiles
        for profile_id in selected_profiles:
            if profile_id != 'custom' and profile_id not in PROFILES:
                available_profiles = list(PROFILES.keys())
                return jsonify({
                    'status': 'error',
                    'message': f'Invalid profile: {profile_id}. Available profiles: {available_profiles}'
                }), 400

        # Track all selected checks and weights from all profiles
        all_selected_checks = set()
        combined_profile_weights = {}
        selected_profile_names = []
        custom_selection = False

        # Process each selected profile
        for profile_id in selected_profiles:
            if profile_id == 'custom':
                # Custom selection
                custom_checks = request.form.getlist('checks')
                if not custom_checks:
                    return jsonify({'status': 'error', 'message': 'Custom profile selected but no checks were specified'}), 400

                all_selected_checks.update(custom_checks)
                custom_selection = True
            else:
                # Standard profile
                profile = get_profile(profile_id)
                selected_profile_names.append(profile.name)
                profile_checks = profile.get_enabled_checks()
                all_selected_checks.update(profile_checks)

                # Add profile weights (we'll normalize later)
                profile_weights = profile.get_check_weights()
                for check, weight in profile_weights.items():
                    if check in combined_profile_weights:
                        # If a check is in multiple profiles, use the higher weight
                        combined_profile_weights[check] = max(combined_profile_weights[check], weight)
                    else:
                        combined_profile_weights[check] = weight

        # Convert to list for consistency with the rest of the code
        selected_checks = list(all_selected_checks)
        profile_weights = combined_profile_weights

        if not selected_checks:
            return jsonify({'status': 'error', 'message': 'No QC checks available for the selected profile'}), 400

        # Create unique session ID and save file
        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')

        # Create session folder and save file
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        os.makedirs(session_folder, exist_ok=True)

        file_path = os.path.join(session_folder, file.filename)
        file.save(file_path)

        # Process each check
        check_results = {}
        overall_weighted_score = 0
        total_weight = 0

        # Track progress for client
        progress = {
            'total_checks': len(selected_checks),
            'completed_checks': 0,
            'current_check': ''
        }

        for i, check_name in enumerate(selected_checks):
            # Update progress
            progress['current_check'] = check_name
            progress['completed_checks'] = i
            print(f"API Progress: {i+1}/{len(selected_checks)} - Processing {check_name}")

            # Skip if check is not available
            if check_name not in qc_apps:
                check_results[check_name] = {
                    'status': 'error',
                    'message': f'QC check not found'
                }
                continue

            # Determine which LLM to use based on the selected profiles
            # Default to Gemini
            ai_model = 'Gemini'

            # Check each profile's LLM preference for this check
            for profile_id in selected_profiles:
                if profile_id != 'custom':  # Skip custom profile
                    check_llm_map = get_check_llm_map(profile_id)
                    if check_name in check_llm_map:
                        # If any profile uses OpenAI for this check, prioritize OpenAI
                        if check_llm_map[check_name] == 'OpenAI':
                            ai_model = 'OpenAI'
                            break

            # Get the prompt
            prompt = qc_apps[check_name]['prompt']

            # Get reference image if available
            reference_path = qc_apps[check_name].get('reference_image')

            try:
                # Run the QC check
                result = run_visual_qc(
                    prompt=prompt,
                    asset_path=file_path,
                    reference_path=reference_path,
                    model_name=ai_model
                )

                # Extract score from result
                score = None
                try:
                    # Use our extraction function to get score from JSON blocks
                    json_data = extract_json_from_response(result['response'])
                    if 'score' in json_data:
                        score = json_data.get('score')
                        print(f"Extracted score from JSON block: {score}")

                    # If we still don't have a score, look for any score in text
                    if score is None:
                        # Try to find a score pattern in the text
                        score_pattern = r'["\']score["\']\s*:\s*(\d+)'
                        score_match = re.search(score_pattern, result['response'])
                        if score_match:
                            score = int(score_match.group(1))
                            print(f"Extracted score from regex: {score}")
                        else:
                            # Look for descriptive scores in text
                            descriptive_score_pattern = r'score(?:\s+is|\s*:\s*|\s+of\s+)(?:\s*)(\d+)(?:\s*out\s*of\s*10)?'
                            descriptive_match = re.search(descriptive_score_pattern, result['response'].lower())
                            if descriptive_match:
                                score = int(descriptive_match.group(1))
                                print(f"Extracted score from descriptive text: {score}")
                            else:
                                # Try to determine score from pass/fail status (legacy mode)
                                result_text = result.get('response', '').upper()
                                if "PASS" in result_text:
                                    score = 10  # Pass = 10/10
                                    print("Detected PASS keyword, setting score to 10")
                                elif "FAIL" in result_text:
                                    score = 3   # Fail = 3/10
                                    print("Detected FAIL keyword, setting score to 3")
                                else:
                                    score = 5  # Default middle score
                                    print(f"Could not extract score, using default of 5")
                except Exception as parse_error:
                    print(f"Error parsing score from response: {parse_error}")
                    score = 5  # Default to middle score

                # Add the score to the result
                result['score'] = score if score is not None else 5

                # Process result for JSON mode
                if output_mode == 'json':
                    # For JSON mode, we update the response to be ONLY the JSON part
                    json_data = extract_json_from_response(result['response'])
                    if json_data:
                        # If we found JSON in the response, replace the full text with just the extracted JSON
                        result['original_response'] = result['response']  # Save original for debugging
                        result['response'] = json.dumps(json_data, indent=2)  # Pretty print the JSON

                # Calculate weighted score
                weight = profile_weights.get(check_name, 0)
                if weight == 0 and ('default' in selected_profiles or len(selected_profiles) == 0):
                    weight = 1.0 / len(selected_checks)

                weighted_score = result['score'] * weight
                overall_weighted_score += weighted_score
                total_weight += weight

                # Store result
                check_results[check_name] = {
                    'status': 'success',
                    'display_name': qc_apps[check_name]['display_name'],
                    'score': result['score'],
                    'weight': weight,
                    'weighted_score': weighted_score,
                    'has_reference': reference_path is not None,
                    'result': result
                }

                # Update progress after successful check
                progress['completed_checks'] = i + 1

            except Exception as e:
                check_results[check_name] = {
                    'status': 'error',
                    'message': str(e),
                    'traceback': traceback.format_exc()
                }

        # Calculate overall score
        overall_score = 0
        if total_weight > 0:
            # Special case for Unilever key visual profile - show percentage of 120
            if len(selected_profiles) == 1 and selected_profiles[0] == 'unilever_key_visual':
                # For Unilever profile, calculate as percentage of 120
                # Maximum possible score is 10 * 1.2 = 12, so scale to 120
                max_possible_score = 10 * total_weight  # 10 * 1.2 = 12
                overall_score = min(round((overall_weighted_score / max_possible_score) * 120, 1), 120)
            else:
                # Maximum possible score is 10 * total_weight, so normalize to 100%
                max_possible_score = 10 * total_weight
                overall_score = min(round((overall_weighted_score / max_possible_score) * 100, 1), 100)
        else:
            # Simple average if no weights
            successful_checks = [r for r in check_results.values() if r.get('status') == 'success']
            if successful_checks:
                sum_scores = sum(r.get('score', 0) for r in successful_checks)
                overall_score = min(round((sum_scores / len(successful_checks)) * 10, 1), 100)

        # Generate report data
        report_data = {
            'session_id': session_id,
            'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
            'filename': file.filename,
            'profiles': selected_profiles,
            'profile_id': selected_profiles[0] if len(selected_profiles) == 1 else None,  # Store single profile ID for HTML detection
            'profile_name': ", ".join(selected_profile_names) or "Multiple Profiles",
            'model': 'Profile-based selection',
            'results': check_results,
            'summary': {
                'overall_score': overall_score,
                'profile': ", ".join(selected_profile_names) or "Multiple Profiles",
                'checks_count': len([r for r in check_results.values() if r.get('status') == 'success']),
                'total_checks': len(check_results),
                'total_weighted_score': overall_weighted_score,
                'total_weight': total_weight
            }
        }

        # Determine overall grade based on score (Pass/Fail)
        avg_individual_score = overall_score / 10  # Convert to 1-10 scale
        grade = 'Pass' if avg_individual_score >= 6 else 'Fail'

        # Add grade to summary
        report_data['summary']['grade'] = grade

        # Save results to file regardless of output mode
        output_path = save_results_to_file(report_data, file.filename, output_mode, session_id, file_path)

        # Return data based on output mode
        if output_mode == 'html':
            # Create a more interactive HTML view with formatted results
            # Define a function to get color based on score
            def get_score_result(score):
                if score >= 6:
                    return "Pass", "#28a745"  # Green for pass
                else:
                    return "Fail", "#dc3545"  # Red for fail

            # Build HTML for each check result
            check_results_html = ""
            for check_name, check_data in report_data['results'].items():
                if check_data['status'] == 'success':
                    display_name = check_data.get('display_name', check_name)
                    score = check_data.get('score', 0)
                    result_text, score_color = get_score_result(score)

                    # Extract response text (strip JSON blocks for cleaner display)
                    response_text = check_data['response']
                    # Remove JSON code blocks for cleaner reading
                    import re
                    response_text = re.sub(r'```json.*?```', '', response_text, flags=re.DOTALL)
                    response_text = response_text.strip()

                    check_results_html += f"""
                    <div class="check-result">
                        <h3>{display_name} <span class="score" style="color: {score_color}">{result_text}</span></h3>
                        <div class="response">{response_text.replace(chr(10), '<br>')}</div>
                    </div>
                    <hr>
                    """

            # Get summary score result
            overall_score = report_data['summary']['overall_score']
            overall_result, overall_color = get_score_result(overall_score/10)  # Normalize to 0-10 scale

            html_content = f"""
            <!DOCTYPE html>
            <html lang="en">
            <head>
                <meta charset="UTF-8">
                <meta name="viewport" content="width=device-width, initial-scale=1.0">
                <title>Visual AI QC Results for {file.filename}</title>
                <style>
                    body {{ font-family: Arial, sans-serif; margin: 20px; padding: 0; background-color: #f8f9fa; }}
                    .container {{ max-width: 1200px; margin: 0 auto; background-color: white; padding: 20px; border-radius: 8px; box-shadow: 0 0 10px rgba(0,0,0,0.1); }}
                    h1, h2, h3 {{ color: #333; }}
                    h1 {{ margin-bottom: 5px; }}
                    .summary {{ background-color: #e9ecef; padding: 15px; border-radius: 5px; margin: 20px 0; }}
                    .score {{ font-weight: normal; margin-left: 10px; }}
                    .check-result {{ margin-bottom: 20px; }}
                    .response {{ margin-top: 10px; line-height: 1.5; }}
                    hr {{ border: 0; height: 1px; background-color: #ddd; margin: 30px 0; }}
                    .grade {{ font-size: 1.2em; font-weight: bold; }}
                    pre {{ background-color: #f5f5f5; padding: 15px; border-radius: 5px; overflow-x: auto; }}
                    .json-toggle {{ cursor: pointer; color: #007bff; text-decoration: underline; }}
                    .json-view {{ display: none; margin-top: 20px; }}
                </style>
            </head>
            <body>
                <div class="container">
                    <h1>Visual AI QC Results</h1>
                    <p>File analyzed: <strong>{file.filename}</strong> | Timestamp: {report_data['timestamp']}</p>

                    <div class="summary">
                        <h2>Summary</h2>
                        <p>Overall Result: <span style="color: {overall_color}; font-weight: bold; font-size: 1.2em;">{overall_result}</span></p>
                        <p>Status: <span class="grade">{report_data['summary']['grade']}</span></p>
                        <p>Profile: {report_data['profile_name']}</p>
                        <p>Total Checks: {report_data['summary']['checks_count']}</p>
                    </div>

                    <h2>Detailed Results</h2>
                    {check_results_html}

                    <p class="json-toggle" onclick="document.getElementById('json-data').style.display = document.getElementById('json-data').style.display === 'none' ? 'block' : 'none';">
                        Show/Hide Raw JSON Data
                    </p>
                    <div id="json-data" class="json-view">
                        <pre>{json.dumps(report_data, indent=2)}</pre>
                    </div>
                </div>
            </body>
            </html>
            """
            # For HTML mode, redirect to the saved file
            return Response(html_content, mimetype='text/html')
        else:
            # For JSON mode, return the data with file path info
            report_data['output_file'] = {
                'path': output_path,
                'filename': os.path.basename(output_path),
                'url': f'{request.environ.get("SCRIPT_NAME", "")}/output/{os.path.basename(output_path)}'
            }
            return jsonify(report_data)

    except Exception as e:
        # Include progress information in error response
        error_progress = progress.get('completed_checks', 0) if 'progress' in locals() else 0
        total_checks = progress.get('total_checks', 0) if 'progress' in locals() else 0
        if not total_checks and 'selected_checks' in locals():
            total_checks = len(selected_checks)

        error_data = {
            'status': 'error',
            'message': str(e),
            'traceback': traceback.format_exc(),
            'progress': {
                'total_checks': total_checks,
                'completed_checks': error_progress,
                'percentage': (error_progress / total_checks * 100) if total_checks else 0
            }
        }

        # Get output mode if possible, default to JSON if not defined or in case of error
        output_mode = request.form.get('mode', 'json').lower() if 'mode' in request.form else 'json'

        if output_mode == 'html':
            # Create a more user-friendly error page
            html_content = f"""
            <!DOCTYPE html>
            <html lang="en">
            <head>
                <meta charset="UTF-8">
                <meta name="viewport" content="width=device-width, initial-scale=1.0">
                <title>Visual AI QC Error</title>
                <style>
                    body {{ font-family: Arial, sans-serif; margin: 20px; padding: 0; background-color: #f8f9fa; }}
                    .container {{ max-width: 1200px; margin: 0 auto; background-color: white; padding: 20px; border-radius: 8px; box-shadow: 0 0 10px rgba(0,0,0,0.1); }}
                    h1 {{ color: #dc3545; margin-bottom: 5px; }}
                    .error-box {{ background-color: #f8d7da; border: 1px solid #f5c6cb; color: #721c24; padding: 15px; border-radius: 5px; margin: 20px 0; }}
                    .progress-box {{ background-color: #cce5ff; border: 1px solid #b8daff; color: #004085; padding: 15px; border-radius: 5px; margin: 20px 0; }}
                    pre {{ background-color: #f5f5f5; padding: 15px; border-radius: 5px; overflow-x: auto; }}
                    .json-toggle {{ cursor: pointer; color: #007bff; text-decoration: underline; }}
                    .json-view {{ display: none; margin-top: 20px; }}
                    .progress-bar {{ height: 20px; background-color: #e9ecef; border-radius: 5px; margin-top: 10px; }}
                    .progress-bar-fill {{ height: 100%; background-color: #007bff; border-radius: 5px; width: {error_data['progress']['percentage']}%; }}
                </style>
            </head>
            <body>
                <div class="container">
                    <h1>Error Processing Request</h1>

                    <div class="error-box">
                        <h3>Error Message</h3>
                        <p>{error_data['message']}</p>
                    </div>

                    <div class="progress-box">
                        <h3>Processing Progress</h3>
                        <p>Completed {error_data['progress']['completed_checks']} of {error_data['progress']['total_checks']} checks</p>
                        <div class="progress-bar">
                            <div class="progress-bar-fill"></div>
                        </div>
                    </div>

                    <p class="json-toggle" onclick="document.getElementById('error-data').style.display = document.getElementById('error-data').style.display === 'none' ? 'block' : 'none';">
                        Show/Hide Technical Details
                    </p>
                    <div id="error-data" class="json-view">
                        <pre>{json.dumps(error_data, indent=2)}</pre>
                    </div>
                </div>
            </body>
            </html>
            """
            return Response(html_content, mimetype='text/html'), 500
        else:
            # Default JSON mode
            return jsonify(error_data), 500

@app.route('/analyze', methods=['POST'])
@app.route('/api/analyze', methods=['POST'])
@auth.require_auth
def api_analyze_with_triage():
    """
    Smart analysis endpoint that combines triage and profile-based QC.

    This endpoint:
    1. Runs triage to determine file type
    2. Automatically selects appropriate profile based on brand + file type
    3. Runs full QC analysis with selected profile
    4. Returns combined results showing both triage and QC analysis

    Parameters:
    - file: Image file to analyze
    - brand: Brand name (diageo, unilever, general) - defaults to 'general'
    - mode: Output mode (json, html) - defaults to 'json'
    - return_file: Whether to return file info (true/false) - defaults to 'false'
    """
    try:
        # Force reload QC apps to ensure they're available
        if not qc_apps:
            load_qc_apps()

        # Check if file is in request
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file part'}), 400

        file = request.files['file']

        # Check if file was selected
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No selected file'}), 400

        # Get parameters
        brand = request.form.get('brand', 'general').lower()
        profile = request.form.get('profile', '').lower()
        output_mode = request.form.get('mode', 'json').lower()
        return_file = request.form.get('return_file', 'false').lower() == 'true'

        # Validate brand - allow any brand name now that users can create custom profiles
        # The old validation was too restrictive for custom profiles
        if not brand or brand.strip() == '':
            brand = 'general'

        # Validate output mode
        if output_mode not in ['json', 'html']:
            output_mode = 'json'

        # Create unique session ID and save file
        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        os.makedirs(session_folder, exist_ok=True)

        file_path = os.path.join(session_folder, file.filename)
        file.save(file_path)

        # Initialize progress tracking for this session
        progress_tracker[session_id] = {
            'total_checks': 0,
            'completed_checks': 0,
            'current_check': 'Initializing',
            'current_check_display': 'Initializing Analysis',
            'stage': 'setup',
            'percentage': 0,
            'session_id': session_id
        }

        # STEP 1: Run Triage Analysis
        print(f"Step 1: Running triage analysis for {file.filename}")

        # Update progress
        progress_tracker[session_id].update({
            'stage': 'triage',
            'current_check': 'file_type_triage',
            'current_check_display': 'File Type Detection',
            'percentage': 10
        })

        if 'file_type_triage' not in qc_apps:
            return jsonify({'status': 'error', 'message': 'File type triage app not available'}), 500

        # Get the triage prompt and run triage
        triage_prompt = qc_apps['file_type_triage']['prompt']
        triage_result = run_visual_qc(
            prompt=triage_prompt,
            asset_path=file_path,
            model_name='Gemini'
        )

        # Extract triage results
        triage_data = extract_json_from_response(triage_result['response'])
        if not triage_data:
            return jsonify({
                'status': 'error',
                'message': 'Could not extract triage results',
                'raw_triage_response': triage_result['response']
            }), 500

        # STEP 2: Determine Appropriate Profile
        print(f"Step 2: Determining profile based on {'direct profile parameter' if profile else 'triage results'}")

        if profile and profile.strip():
            # Use the directly specified profile
            suggested_profile = profile
            print(f"Using directly specified profile: {suggested_profile}")
        else:
            # Get format suffix from triage results
            format_suffix = triage_data.get('recommended_qc_profile', '_digital')

            # Construct profile name
            suggested_profile = f"{brand}{format_suffix}"

            # Check if the suggested profile exists, fallback to main brand profile if not
            if suggested_profile not in PROFILES:
                suggested_profile = brand
                if suggested_profile not in PROFILES:
                    suggested_profile = 'general'  # Final fallback

            print(f"Profile constructed from triage: {suggested_profile}")

        print(f"Final selected profile: {suggested_profile}")

        # STEP 3: Run Full QC Analysis with Selected Profile
        print(f"Step 3: Running QC analysis with profile '{suggested_profile}'")

        # Get the profile configuration
        profile_config = get_profile(suggested_profile)
        if not profile_config:
            return jsonify({
                'status': 'error',
                'message': f'Profile {suggested_profile} not found'
            }), 400

        # Get enabled checks from profile using Profile object methods
        enabled_checks = profile_config.get_enabled_checks()
        profile_weights = profile_config.get_check_weights()

        # Filter to only include checks that exist in qc_apps
        enabled_checks = [check for check in enabled_checks if check in qc_apps]

        if not enabled_checks:
            return jsonify({
                'status': 'error',
                'message': f'No enabled checks found for profile {suggested_profile}'
            }), 400

        # Run QC checks in parallel batches
        # Update progress tracker with total checks
        progress_tracker[session_id].update({
            'total_checks': len(enabled_checks),
            'stage': 'qc_analysis',
            'percentage': 20
        })

        # Get reference asset from form for this endpoint
        reference_asset = request.form.get('reference_asset', '')

        # Use the parallel processing function
        check_results = process_checks_in_batches_with_triage(
            enabled_checks, qc_apps, profile_config, profile_weights,
            file_path, reference_asset, brand_db, progress_tracker,
            session_id, batch_size=15, base_percentage=20, percentage_range=70
        )

        # STEP 4: Calculate Overall Score
        print(f"Step 4: Calculating overall score")

        total_weighted_score = 0
        total_weight = 0
        completed_checks = 0
        failed_checks = 0

        for check_name, result in check_results.items():
            weight = result.get('weight', 0.1)
            total_weight += weight

            if result['status'] == 'completed':
                completed_checks += 1
                score = result.get('score')
                if score is not None:
                    total_weighted_score += score * weight
            else:
                failed_checks += 1

        # Calculate overall score - sum of weighted scores scaled to 100
        # For profiles with total_weight = 10.0 (like General Check), use direct weighted score
        # For profiles with total_weight = 1.0, multiply by 10 to scale to 100
        if total_weight >= 10.0:
            overall_score = min(total_weighted_score, 100)  # Cap at 100
        elif total_weight > 0:
            overall_score = min(total_weighted_score * 10, 100)  # Scale to 100-point system, cap at 100
        else:
            overall_score = 0

        # STEP 5: Prepare Combined Response
        print(f"Step 5: Preparing response")

        # Update progress to completion
        progress_tracker[session_id].update({
            'stage': 'complete',
            'current_check': 'Finalizing',
            'current_check_display': 'Finalizing Report',
            'percentage': 100,
            'completed_checks': len(enabled_checks)
        })

        # Since triage is skipped, set default triage data
        triage_data = {
            'primary_format': 'user_specified',
            'specific_type': 'profile_based_analysis',
            'confidence_score': 10,
            'format_indicators': 'User selected profile directly',
            'secondary_format': '',
            'recommended_qc_profile': suggested_profile
        }
        triage_result = {'response': 'Triage skipped - using user-selected profile directly'}

        # Build comprehensive response
        response_data = {
            'status': 'success',
            'session_id': session_id,
            'filename': file.filename,
            'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),

            # Triage Results Section
            'triage_analysis': {
                'primary_format': triage_data.get('primary_format', 'unknown'),
                'specific_type': triage_data.get('specific_type', 'unknown'),
                'confidence_score': triage_data.get('confidence_score', 0),
                'format_indicators': triage_data.get('format_indicators', ''),
                'secondary_format': triage_data.get('secondary_format', ''),
                'recommended_qc_profile': triage_data.get('recommended_qc_profile', ''),
                'full_triage_response': triage_result['response']
            },

            # Profile Selection Section
            'profile_selection': {
                'requested_brand': brand,
                'suggested_profile': suggested_profile,
                'profile_used': suggested_profile,
                'profile_name': profile_config.name,
                'profile_description': profile_config.description,
                'reference_asset': reference_asset if reference_asset else None,
                'reference_asset_used': bool(reference_asset)
            },

            # QC Analysis Results Section
            'qc_analysis': {
                'overall_score': round(overall_score, 2),
                'total_checks': len(enabled_checks),
                'completed_checks': completed_checks,
                'failed_checks': failed_checks,
                'total_weight': round(total_weight, 2),
                'check_results': check_results
            },

            # Summary Section
            'summary': {
                'file_type_detected': f"{triage_data.get('primary_format', 'unknown')} - {triage_data.get('specific_type', 'unknown')}",
                'profile_applied': profile_config.name,
                'overall_score': round(overall_score, 2),
                'score_percentage': f"{round(overall_score, 1)}%",
                'checks_passed': completed_checks,
                'checks_failed': failed_checks,
                'confidence': triage_data.get('confidence_score', 0)
            }
        }

        # Add file info if requested
        if return_file:
            response_data['file_info'] = {
                'path': file_path,
                'size': os.path.getsize(file_path),
                'session_folder': session_folder
            }

        # Media plan matching
        try:
            media_plan_data = _get_active_media_plan(client)
            if media_plan_data:
                from media_plan_processor import find_matching_asset, validate_asset_specs
                match_result = find_matching_asset(file.filename, media_plan_data)
                if match_result:
                    validation = validate_asset_specs(file_path, match_result['match'])
                    response_data['media_plan_match'] = {
                        'matched': True,
                        'confidence': match_result['confidence'],
                        'match_type': match_result['match_type'],
                        'asset_id': match_result['match']['asset_id'],
                        'spec': match_result['match'],
                        'validation': validation,
                    }
                else:
                    response_data['media_plan_match'] = {'matched': False}
        except Exception as mp_err:
            print(f"Media plan matching error: {mp_err}")

        # Auto-save HTML report to output directory (regardless of output_mode)
        try:
            # Generate comprehensive HTML report using the same format as the web UI
            html_report_content = generate_comprehensive_html_report(response_data, file.filename, file_path)

            # Create output filename in client-specific folder
            safe_filename = re.sub(r'[^a-zA-Z0-9.-]', '_', file.filename)
            output_filename = f"{session_id}_{safe_filename}_report.html"
            client_output_folder = ensure_client_output_folder(client)
            output_path = os.path.join(client_output_folder, output_filename)

            # Save HTML report to output directory
            with open(output_path, 'w', encoding='utf-8') as f:
                f.write(html_report_content)

            print(f"HTML report auto-saved to: {output_path}")

            # Add output file info to response
            response_data['output_file'] = {
                'path': output_path,
                'filename': output_filename,
                'auto_saved': True
            }

        except Exception as e:
            print(f"Error auto-saving HTML report: {str(e)}")
            # Don't fail the entire request if auto-save fails

        # Return appropriate format
        if output_mode == 'html':
            # Create HTML response with both triage and QC results
            triage_html = f"""
            <div class="triage-section">
                <h2>📋 File Type Analysis (Triage)</h2>
                <div class="triage-results">
                    <div class="result-item">
                        <strong>Detected Format:</strong> {triage_data.get('primary_format', 'unknown').title()} - {triage_data.get('specific_type', 'unknown')}
                    </div>
                    <div class="result-item">
                        <strong>Confidence:</strong> {triage_data.get('confidence_score', 0)}/10
                    </div>
                    <div class="result-item">
                        <strong>Key Indicators:</strong> {triage_data.get('format_indicators', 'N/A')}
                    </div>
                    <div class="result-item">
                        <strong>Recommended Profile:</strong> {triage_data.get('recommended_qc_profile', 'N/A')}
                    </div>
                </div>
            </div>
            """

            profile_html = f"""
            <div class="profile-section">
                <h2>🎯 Profile Selection</h2>
                <div class="profile-results">
                    <div class="result-item">
                        <strong>Brand:</strong> {brand.title()}
                    </div>
                    <div class="result-item">
                        <strong>Profile Used:</strong> {profile_config.name}
                    </div>
                    <div class="result-item">
                        <strong>Description:</strong> {profile_config.description}
                    </div>
                </div>
            </div>
            """

            # Generate QC results HTML
            check_results_html = ""
            for check_name, result in check_results.items():
                score = result.get('score', 0) if result.get('score') is not None else 0
                status_class = "pass" if result['status'] == 'completed' and score >= 6 else "fail"
                result_display = "Pass" if score >= 6 else "Fail" if score > 0 else "N/A"

                check_results_html += f"""
                <div class="check-result {status_class}">
                    <h3>{check_name.replace('_', ' ').title()}</h3>
                    <div class="score">Result: {result_display}</div>
                    <div class="weight">Weight: {result.get('weight', 0.1)}</div>
                    <div class="response">{result.get('response', 'No response')[:500]}...</div>
                </div>
                """

            html_content = f"""
            <!DOCTYPE html>
            <html lang="en">
            <head>
                <meta charset="UTF-8">
                <meta name="viewport" content="width=device-width, initial-scale=1.0">
                <title>Visual AI QC Analysis Results</title>
                <style>
                    body {{ font-family: Arial, sans-serif; margin: 20px; background-color: #f8f9fa; }}
                    .container {{ max-width: 1200px; margin: 0 auto; background: white; padding: 20px; border-radius: 8px; box-shadow: 0 2px 10px rgba(0,0,0,0.1); }}
                    .header {{ text-align: center; margin-bottom: 30px; border-bottom: 2px solid #007bff; padding-bottom: 20px; }}
                    .summary {{ background: #e3f2fd; padding: 20px; border-radius: 8px; margin-bottom: 30px; }}
                    .triage-section, .profile-section {{ background: #f0f8f0; padding: 20px; border-radius: 8px; margin-bottom: 20px; }}
                    .result-item {{ margin: 10px 0; padding: 10px; background: white; border-left: 4px solid #007bff; }}
                    .check-result {{ margin: 15px 0; padding: 15px; border-radius: 8px; border-left: 4px solid #ccc; }}
                    .check-result.pass {{ border-left-color: #28a745; background-color: #d4edda; }}
                    .check-result.fail {{ border-left-color: #dc3545; background-color: #f8d7da; }}
                    .score {{ font-weight: bold; color: #007bff; }}
                    .json-toggle {{ cursor: pointer; color: #007bff; text-decoration: underline; margin: 20px 0; }}
                    .json-view {{ background: #f8f9fa; padding: 15px; border-radius: 5px; overflow-x: auto; display: none; }}
                </style>
            </head>
            <body>
                <div class="container">
                    <div class="header">
                        <h1>🤖 Visual AI QC Analysis Results</h1>
                        <p>File: {file.filename} | Analyzed: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}</p>
                    </div>

                    <div class="summary">
                        <h2>📊 Summary</h2>
                        <div style="display: grid; grid-template-columns: repeat(auto-fit, minmax(200px, 1fr)); gap: 15px;">
                            <div><strong>Overall Result:</strong> {'Pass' if overall_score/10 >= 6 else 'Fail'}</div>
                            <div><strong>File Type:</strong> {triage_data.get('primary_format', 'unknown').title()}</div>
                            <div><strong>Profile Used:</strong> {profile_config.name}</div>
                            <div><strong>Checks Performed:</strong> {completed_checks}/{len(enabled_checks)}</div>
                        </div>
                    </div>

                    {triage_html}
                    {profile_html}

                    <div class="qc-section">
                        <h2>🔍 Quality Control Analysis</h2>
                        {check_results_html}
                    </div>

                    <p class="json-toggle" onclick="document.getElementById('json-data').style.display = document.getElementById('json-data').style.display === 'none' ? 'block' : 'none';">
                        Show/Hide Raw JSON Data
                    </p>
                    <div id="json-data" class="json-view">
                        <pre>{json.dumps(response_data, indent=2)}</pre>
                    </div>
                </div>
            </body>
            </html>
            """
            return Response(html_content, mimetype='text/html')
        else:
            # Add session_id to response for progress tracking
            response_data['session_id'] = session_id
            # Return JSON response
            return jsonify(response_data)

    except Exception as e:
        # Update progress to error state if session exists
        if 'session_id' in locals() and session_id in progress_tracker:
            progress_tracker[session_id].update({
                'stage': 'error',
                'current_check': 'Error',
                'current_check_display': 'Analysis Failed',
                'percentage': 0
            })

        return jsonify({
            'status': 'error',
            'message': str(e),
            'traceback': traceback.format_exc()
        }), 500

    finally:
        # Schedule cleanup of progress tracker after 5 minutes
        import threading
        import time

        def cleanup_progress():
            time.sleep(300)  # 5 minutes
            if 'session_id' in locals() and session_id in progress_tracker:
                del progress_tracker[session_id]

        if 'session_id' in locals():
            threading.Thread(target=cleanup_progress, daemon=True).start()

def _update_client_config_for_profile(profile_id, client_ids, action='add'):
    """
    Update client_config.py to add or remove a profile from client configurations

    Args:
        profile_id: Profile ID to add/remove
        client_ids: List of client IDs to update
        action: 'add' or 'remove'
    """
    try:
        client_config_path = os.path.join(os.path.dirname(__file__), 'client_config.py')

        # Read current client_config.py
        with open(client_config_path, 'r') as f:
            config_content = f.read()

        # Parse CLIENT_PROFILES dictionary
        # This is a simple approach - we'll reload the module and update it
        from client_config import CLIENT_PROFILES
        import copy

        updated_config = copy.deepcopy(CLIENT_PROFILES)

        # Update each client
        for client_id in client_ids:
            if client_id in updated_config:
                current_profiles = updated_config[client_id].get('profiles', [])

                if action == 'add' and profile_id not in current_profiles:
                    current_profiles.append(profile_id)
                    updated_config[client_id]['profiles'] = current_profiles
                elif action == 'remove' and profile_id in current_profiles:
                    current_profiles.remove(profile_id)
                    updated_config[client_id]['profiles'] = current_profiles

        # Write updated config back to file
        config_lines = [
            "#!/usr/bin/env python3",
            '"""',
            "Client configuration module for managing client-profile relationships",
            '"""',
            "",
            "CLIENT_PROFILES = {",
        ]

        for client_id, client_data in updated_config.items():
            config_lines.append(f"    '{client_id}': {{")
            config_lines.append(f"        'name': '{client_data['name']}',")
            profiles_str = ", ".join([f"'{p}'" for p in client_data['profiles']])
            config_lines.append(f"        'profiles': [{profiles_str}],")
            config_lines.append(f"        'display_name': '{client_data['display_name']}',")
            config_lines.append(f"        'description': '{client_data['description']}'")
            config_lines.append("    },")

        config_lines.append("}")
        config_lines.append("")
        config_lines.append("def get_client_profiles(client_id):")
        config_lines.append('    """Get profiles available for a specific client"""')
        config_lines.append("    return CLIENT_PROFILES.get(client_id, {}).get('profiles', [])")
        config_lines.append("")
        config_lines.append("def get_all_clients():")
        config_lines.append('    """Get all available clients"""')
        config_lines.append("    return CLIENT_PROFILES")
        config_lines.append("")
        config_lines.append("def validate_client_profile(client_id, profile_id):")
        config_lines.append('    """Validate that a profile belongs to a client"""')
        config_lines.append("    client_profiles = get_client_profiles(client_id)")
        config_lines.append("    return profile_id in client_profiles")
        config_lines.append("")

        with open(client_config_path, 'w') as f:
            f.write('\n'.join(config_lines))

        # Reload the client_config module to pick up changes
        import importlib
        import client_config
        importlib.reload(client_config)

        return True

    except Exception as e:
        print(f"Error updating client_config: {str(e)}")
        return False

@app.route('/api/profiles', methods=['POST'])
@auth.require_auth
def create_profile():
    """Create a new QC profile"""
    try:
        data = request.get_json()

        if not data:
            return jsonify({'status': 'error', 'message': 'No data provided'}), 400

        profile_name = data.get('name', '').strip()
        if not profile_name:
            return jsonify({'status': 'error', 'message': 'Profile name is required'}), 400

        # Create profile filename (sanitize name)
        import re
        safe_name = re.sub(r'[^a-zA-Z0-9_-]', '_', profile_name.lower())
        profile_filename = f"{safe_name}.json"
        profile_path = os.path.join('profiles', profile_filename)

        # Check if profile already exists
        if os.path.exists(profile_path):
            return jsonify({'status': 'error', 'message': 'Profile already exists'}), 400

        # Get visibility settings
        visibility = data.get('visibility', 'all')  # 'all' or 'client_specific'
        visible_to_clients = data.get('visible_to_clients', [])  # List of client IDs

        # Create profile data structure
        profile_data = {
            "name": profile_name,
            "description": data.get('description', ''),
            "pass_threshold": data.get('pass_threshold', 85),
            "visibility": visibility,
            "visible_to_clients": visible_to_clients,
            "created_at": datetime.now().isoformat(),
            "created_by": g.user.get('email', 'unknown'),
            "version": 1,
            "checks": data.get('checks', {})
        }

        # Save profile to file
        with open(profile_path, 'w') as f:
            json.dump(profile_data, f, indent=2)

        # Update client_config if client_specific visibility
        if visibility == 'client_specific' and visible_to_clients:
            _update_client_config_for_profile(safe_name, visible_to_clients, action='add')
        elif visibility == 'all':
            # Add to all clients in client_config
            from client_config import get_all_clients
            all_clients = list(get_all_clients().keys())
            _update_client_config_for_profile(safe_name, all_clients, action='add')

        return jsonify({
            'status': 'success',
            'message': f'Profile "{profile_name}" created successfully',
            'profile_id': safe_name,
            'profile_path': profile_path,
            'visibility': visibility
        })

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/profiles/<profile_id>', methods=['PUT'])
@auth.require_auth
def update_profile(profile_id):
    """Update an existing QC profile by creating a new version"""
    try:
        data = request.get_json()

        if not data:
            return jsonify({'status': 'error', 'message': 'No data provided'}), 400

        profile_filename = f"{profile_id}.json"
        profile_path = os.path.join('profiles', profile_filename)

        # Check if profile exists
        if not os.path.exists(profile_path):
            return jsonify({'status': 'error', 'message': 'Profile not found'}), 404

        # Load existing profile
        with open(profile_path, 'r') as f:
            existing_profile = json.load(f)

        # Determine if profile has been modified (check if any field changed)
        has_changes = False
        fields_to_check = ['name', 'description', 'pass_threshold', 'checks', 'visibility', 'visible_to_clients']
        for field in fields_to_check:
            if field in data and data[field] != existing_profile.get(field):
                has_changes = True
                break

        if not has_changes:
            return jsonify({
                'status': 'success',
                'message': 'No changes detected',
                'profile_id': profile_id
            })

        # Find next version number
        current_version = existing_profile.get('version', 1)
        next_version = current_version + 1

        # Create new versioned profile ID
        # Remove any existing version suffix (e.g., my_profile_v2 -> my_profile)
        base_profile_id = re.sub(r'_v\d+$', '', profile_id)
        new_profile_id = f"{base_profile_id}_v{next_version}"
        new_profile_filename = f"{new_profile_id}.json"
        new_profile_path = os.path.join('profiles', new_profile_filename)

        # Check if new version already exists (shouldn't happen, but be safe)
        counter = 0
        while os.path.exists(new_profile_path) and counter < 100:
            next_version += 1
            new_profile_id = f"{base_profile_id}_v{next_version}"
            new_profile_filename = f"{new_profile_id}.json"
            new_profile_path = os.path.join('profiles', new_profile_filename)
            counter += 1

        # Create new profile version with updated data
        new_profile_data = existing_profile.copy()
        new_profile_data.update({
            "name": data.get('name', existing_profile.get('name')),
            "description": data.get('description', existing_profile.get('description', '')),
            "pass_threshold": data.get('pass_threshold', existing_profile.get('pass_threshold', 85)),
            "checks": data.get('checks', existing_profile.get('checks', {})),
            "visibility": data.get('visibility', existing_profile.get('visibility', 'all')),
            "visible_to_clients": data.get('visible_to_clients', existing_profile.get('visible_to_clients', [])),
            "version": next_version,
            "modified_at": datetime.now().isoformat(),
            "modified_by": g.user.get('email', 'unknown'),
            "previous_version": profile_id
        })

        # Save new versioned profile
        with open(new_profile_path, 'w') as f:
            json.dump(new_profile_data, f, indent=2)

        # Update client_config to use new version
        visibility = new_profile_data.get('visibility', 'all')
        visible_to_clients = new_profile_data.get('visible_to_clients', [])

        # Remove old version from client configs
        from client_config import get_all_clients
        all_clients = list(get_all_clients().keys())
        _update_client_config_for_profile(profile_id, all_clients, action='remove')

        # Add new version to appropriate client configs
        if visibility == 'client_specific' and visible_to_clients:
            _update_client_config_for_profile(new_profile_id, visible_to_clients, action='add')
        elif visibility == 'all':
            _update_client_config_for_profile(new_profile_id, all_clients, action='add')

        return jsonify({
            'status': 'success',
            'message': f'Profile updated to version {next_version}. Original kept as "{profile_id}"',
            'profile_id': new_profile_id,
            'previous_profile_id': profile_id,
            'version': next_version
        })

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/profiles/<profile_id>', methods=['DELETE'])
@auth.require_auth
def delete_profile(profile_id):
    """Delete a QC profile"""
    try:
        profile_filename = f"{profile_id}.json"
        profile_path = os.path.join('profiles', profile_filename)

        # Check if profile exists
        if not os.path.exists(profile_path):
            return jsonify({'status': 'error', 'message': 'Profile not found'}), 404

        # Load profile to get name for response
        with open(profile_path, 'r') as f:
            profile_data = json.load(f)

        profile_name = profile_data.get('name', profile_id)

        # Delete profile file
        os.remove(profile_path)

        return jsonify({
            'status': 'success',
            'message': f'Profile "{profile_name}" deleted successfully'
        })

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/brand_guidelines', methods=['GET'])
def get_brand_guidelines():
    """Get all brand guidelines, optionally filtered by brand or client"""
    try:
        brand_name = request.args.get('brand')
        client_id = request.args.get('client')

        if brand_name:
            guidelines = brand_db.get_brand_guidelines(brand_name)
            return jsonify({
                'status': 'success',
                'guidelines': guidelines,
                'brands': brand_db.get_all_brands()
            })
        elif client_id:
            # Filter by client
            filtered = brand_db.get_guidelines_by_client(client_id)
            return jsonify({
                'status': 'success',
                'brands': filtered['brands'],
                'files': filtered['files']
            })
        else:
            # Return full database structure that frontend expects
            return jsonify({
                'status': 'success',
                'brands': brand_db.db['brands'],
                'files': brand_db.db['files']
            })

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/brand_guidelines', methods=['POST'])
@auth.require_auth
def upload_brand_guideline():
    """Upload a new brand guideline file"""
    try:
        # Check if file is in request
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file provided'}), 400

        file = request.files['file']
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No file selected'}), 400

        # Get brand name and other metadata
        brand_name = request.form.get('brand_name', '').strip()
        description = request.form.get('description', '').strip()
        tags = request.form.get('tags', '').strip().split(',') if request.form.get('tags') else []
        client_id = request.form.get('client_id', 'general').strip()

        if not brand_name:
            return jsonify({'status': 'error', 'message': 'Brand name is required'}), 400

        # Save uploaded file temporarily
        temp_filename = f"temp_{datetime.now().strftime('%Y%m%d_%H%M%S')}_{file.filename}"
        temp_path = os.path.join(app.config['UPLOAD_FOLDER'], temp_filename)
        file.save(temp_path)

        try:
            # Add to brand guidelines database
            file_record = brand_db.add_brand_guideline(
                brand_name=brand_name,
                file_path=temp_path,
                description=description,
                tags=[tag.strip() for tag in tags if tag.strip()],
                client_id=client_id
            )

            # Remove temporary file
            os.remove(temp_path)

            # Trigger background PDF processing if applicable
            if file_record.get('file_type') == '.pdf':
                import threading
                def _process_pdf_bg(fid, spath, bname, fdir):
                    try:
                        from pdf_processor import process_pdf_guideline
                        result = process_pdf_guideline(spath, fid, bname, fdir)
                        brand_db.update_file_record(fid, result)
                        print(f"PDF processing complete for {fid}")
                    except Exception as e:
                        print(f"PDF processing failed for {fid}: {e}")
                        brand_db.update_file_record(fid, {
                            'processed': 'error',
                            'processing_error': str(e)
                        })

                threading.Thread(
                    target=_process_pdf_bg,
                    args=(file_record['id'], file_record['stored_path'],
                          brand_name, str(brand_db.files_dir)),
                    daemon=True
                ).start()
                file_record['processing_status'] = 'processing'

            # Trigger Excel processing: try localization matrix first (existing
            # clients), fall back to Source Messaging summary (HP and similar).
            elif file_record.get('file_type') in ('.xlsx', '.xls'):
                import threading
                def _process_excel_bg(fid, spath, fdir):
                    try:
                        from localization_processor import parse_localization_matrix
                        parsed = parse_localization_matrix(spath)
                        if parsed:
                            json_path = os.path.join(fdir, f"{fid}_localization.json")
                            with open(json_path, 'w', encoding='utf-8') as f:
                                json.dump(parsed, f, indent=2, ensure_ascii=False)
                            brand_db.update_file_record(fid, {
                                'processed': True,
                                'processed_at': datetime.now().isoformat(),
                                'localization_path': json_path,
                                'localization_messages': list(parsed.get('messages', {}).keys()),
                                'localization_countries': parsed.get('countries', []),
                                'asset_type': 'localization_matrix',
                            })
                            print(f"Localization matrix parsing complete for {fid}: "
                                  f"{len(parsed.get('messages', {}))} messages, "
                                  f"{len(parsed.get('countries', []))} countries")
                            return

                        # Not a localization matrix — process as Source Messaging
                        # (HP-style structured Markdown summary via Gemini).
                        from excel_processor import process_excel_file
                        summary_text, summary_path = process_excel_file(spath, fid)
                        brand_db.update_file_record(fid, {
                            'processed': True,
                            'processed_at': datetime.now().isoformat(),
                            'summary_path': summary_path,
                            'summary_length': len(summary_text),
                            'cover_image_path': None,
                            'asset_type': 'source_messaging',
                        })
                        print(f"Source-messaging summary complete for {fid}: "
                              f"{len(summary_text)} chars")
                    except Exception as e:
                        print(f"Excel processing failed for {fid}: {e}")
                        brand_db.update_file_record(fid, {
                            'processed': 'error',
                            'processing_error': str(e),
                        })

                threading.Thread(
                    target=_process_excel_bg,
                    args=(file_record['id'], file_record['stored_path'],
                          str(brand_db.files_dir)),
                    daemon=True,
                ).start()
                file_record['processing_status'] = 'processing'

            return jsonify({
                'status': 'success',
                'message': f'Brand guideline uploaded successfully for {brand_name}',
                'file_record': file_record
            })

        except Exception as e:
            # Clean up temp file on error
            if os.path.exists(temp_path):
                os.remove(temp_path)
            raise e

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/brand_guidelines/<file_id>', methods=['DELETE'])
@auth.require_auth
def delete_brand_guideline(file_id):
    """Delete a brand guideline file"""
    try:
        success = brand_db.delete_guideline(file_id)

        if success:
            return jsonify({
                'status': 'success',
                'message': 'Brand guideline deleted successfully'
            })
        else:
            return jsonify({
                'status': 'error',
                'message': 'Brand guideline not found'
            }), 404

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/brand_guidelines/<file_id>/status', methods=['GET'])
def get_guideline_processing_status(file_id):
    """Check processing status of a brand guideline"""
    file_record = brand_db.db["files"].get(file_id)
    if not file_record:
        return jsonify({'status': 'error', 'message': 'Not found'}), 404
    return jsonify({
        'status': 'success',
        'processed': file_record.get('processed', False),
        'processing_error': file_record.get('processing_error'),
        'page_count': file_record.get('page_count'),
        'summary_length': file_record.get('summary_length'),
        'processed_at': file_record.get('processed_at')
    })


@app.route('/api/brand_guidelines/<file_id>/reprocess', methods=['POST'])
@auth.require_auth
def reprocess_guideline(file_id):
    """Re-process a PDF brand guideline (re-extract and re-summarize)"""
    file_record = brand_db.db["files"].get(file_id)
    if not file_record:
        return jsonify({'status': 'error', 'message': 'Not found'}), 404
    if file_record.get('file_type') != '.pdf':
        return jsonify({'status': 'error', 'message': 'Only PDF files can be reprocessed'}), 400

    import threading
    def _reprocess_bg(fid, spath, bname, fdir):
        try:
            from pdf_processor import process_pdf_guideline
            result = process_pdf_guideline(spath, fid, bname, fdir)
            brand_db.update_file_record(fid, result)
            print(f"PDF reprocessing complete for {fid}")
        except Exception as e:
            print(f"PDF reprocessing failed for {fid}: {e}")
            brand_db.update_file_record(fid, {
                'processed': 'error',
                'processing_error': str(e)
            })

    threading.Thread(
        target=_reprocess_bg,
        args=(file_id, file_record['stored_path'],
              file_record['brand_name'], str(brand_db.files_dir)),
        daemon=True
    ).start()

    return jsonify({'status': 'success', 'message': 'Reprocessing started'})


@app.route('/api/media_plan', methods=['POST'])
@auth.require_auth
def upload_media_plan():
    """Upload a media plan Excel file for a client"""
    try:
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file provided'}), 400

        file = request.files['file']
        if not file.filename:
            return jsonify({'status': 'error', 'message': 'No file selected'}), 400

        client_id = request.form.get('client_id', 'general').strip().lower()
        if not client_id:
            return jsonify({'status': 'error', 'message': 'client_id is required'}), 400

        access_err = _require_client_access(client_id)
        if access_err:
            return access_err

        display_name = (request.form.get('display_name') or '').strip()

        # Save the Excel file
        timestamp = datetime.now().strftime('%Y%m%d_%H%M%S')
        safe_name = re.sub(r'[^a-zA-Z0-9._-]', '_', file.filename)
        excel_filename = f"{client_id}_{timestamp}_{safe_name}"
        excel_path = os.path.join(MEDIA_PLANS_DIR, excel_filename)
        file.save(excel_path)

        # Parse the media plan
        from media_plan_processor import parse_media_plan
        parsed = parse_media_plan(excel_path)

        # Save parsed JSON for fast lookup
        json_filename = f"{client_id}_{timestamp}.json"
        json_path = os.path.join(MEDIA_PLANS_DIR, json_filename)
        with open(json_path, 'w') as f:
            json.dump(parsed, f, indent=2)

        # Remove old plan files for this client
        db = _load_media_plans_db()
        old_plan = db.get(client_id)
        if old_plan:
            for key in ('excel_path', 'json_path'):
                old_path = old_plan.get(key)
                if old_path and os.path.exists(old_path):
                    try:
                        os.remove(old_path)
                    except Exception:
                        pass

        # Save to DB
        db[client_id] = {
            'client_id': client_id,
            'original_filename': file.filename,
            'display_name': display_name or file.filename,
            'excel_path': excel_path,
            'json_path': json_path,
            'upload_date': datetime.now().isoformat(),
            'total_assets': parsed['total_assets'],
            'channels': parsed['channels'],
        }
        _save_media_plans_db(db)

        return jsonify({
            'status': 'success',
            'message': f'Media plan uploaded with {parsed["total_assets"]} assets across {len(parsed["channels"])} channels',
            'total_assets': parsed['total_assets'],
            'channels': parsed['channels'],
        })

    except Exception as e:
        print(f"Error uploading media plan: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/media_plan', methods=['GET'])
@auth.require_auth
def get_media_plan():
    """Get the active media plan for a client"""
    client_id = request.args.get('client', '').strip().lower()
    if not client_id:
        return jsonify({'status': 'error', 'message': 'client parameter required'}), 400

    access_err = _require_client_access(client_id)
    if access_err:
        return access_err

    db = _load_media_plans_db()
    plan_info = db.get(client_id)
    if not plan_info:
        return jsonify({'status': 'success', 'plan': None})

    return jsonify({
        'status': 'success',
        'plan': {
            'original_filename': plan_info.get('original_filename'),
            'upload_date': plan_info.get('upload_date'),
            'total_assets': plan_info.get('total_assets'),
            'channels': plan_info.get('channels'),
        }
    })


@app.route('/api/media_plan/<client_id>', methods=['DELETE'])
@auth.require_auth
def delete_media_plan(client_id):
    """Delete the media plan for a client"""
    access_err = _require_client_access(client_id)
    if access_err:
        return access_err
    db = _load_media_plans_db()
    plan_info = db.get(client_id)
    if not plan_info:
        return jsonify({'status': 'error', 'message': 'No media plan found'}), 404

    # Delete files
    for key in ('excel_path', 'json_path'):
        path = plan_info.get(key)
        if path and os.path.exists(path):
            try:
                os.remove(path)
            except Exception:
                pass

    del db[client_id]
    _save_media_plans_db(db)

    return jsonify({'status': 'success', 'message': 'Media plan deleted'})


@app.route('/api/detect_brand', methods=['POST'])
def detect_brand_from_file():
    """Detect brand from uploaded file using AI analysis"""
    try:
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file provided'}), 400

        file = request.files['file']
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No file selected'}), 400

        # Save file temporarily for analysis
        temp_filename = f"brand_detect_{datetime.now().strftime('%Y%m%d_%H%M%S')}_{file.filename}"
        temp_path = os.path.join(app.config['UPLOAD_FOLDER'], temp_filename)
        file.save(temp_path)

        try:
            # Get available brands
            available_brands = brand_db.get_all_brands()

            # Create brand detection prompt - works whether brands are available or not
            if available_brands:
                brands_list = ', '.join(available_brands)
                brand_detection_prompt = f"""
                Analyze this image and determine:
                1. Which brand this belongs to from the following options: {brands_list}
                2. Whether this is a Key Visual or POS (Point of Sale) material
                3. Your confidence level (0-100%)

                Look for brand logos, colors, typography, and other brand elements.
                If the brand is not in the provided list, still attempt to identify it.

                Respond with JSON format:
                {{
                    "detected_brand": "brand_name or null if uncertain",
                    "file_type": "Key Visual" or "POS",
                    "confidence": confidence_percentage,
                    "reasoning": "explanation of detection"
                }}
                """
            else:
                brand_detection_prompt = """
                Analyze this image and determine:
                1. What brand this belongs to (identify any visible brand names, logos, or distinctive brand elements)
                2. Whether this is a Key Visual or POS (Point of Sale) material
                3. Your confidence level (0-100%)

                Look for brand logos, colors, typography, and other brand elements.
                Even if no brand guidelines are available, attempt to identify the brand from visual elements.

                Respond with JSON format:
                {
                    "detected_brand": "brand_name or null if uncertain",
                    "file_type": "Key Visual" or "POS",
                    "confidence": confidence_percentage,
                    "reasoning": "explanation of detection"
                }
                """

            # Run AI analysis
            result = run_visual_qc(
                prompt=brand_detection_prompt,
                asset_path=temp_path,
                model_name="Gemini"
            )

            # Extract JSON from response
            detection_data = extract_json_from_response(result['response'])

            # Clean up temp file
            os.remove(temp_path)

            return jsonify({
                'status': 'success',
                'detection': {
                    'detected_brand': detection_data.get('detected_brand'),
                    'file_type': detection_data.get('file_type', 'unknown'),
                    'confidence': detection_data.get('confidence', 0),
                    'reasoning': detection_data.get('reasoning', ''),
                    'available_brands': available_brands
                }
            })

        except Exception as e:
            # Clean up temp file on error
            if os.path.exists(temp_path):
                os.remove(temp_path)
            raise e

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/profile_usage_stats', methods=['GET'])
def get_profile_usage_stats():
    """Get usage statistics for a specific profile over a time period"""
    try:
        profile_id = request.args.get('profile', '')
        days = int(request.args.get('days', 30))

        if not profile_id:
            return jsonify({'status': 'error', 'message': 'Profile parameter required'}), 400

        # Import load_logs from generate_usage_report
        from generate_usage_report import load_logs

        start_date = (datetime.now() - timedelta(days=days)).strftime('%Y-%m-%d')
        end_date = datetime.now().strftime('%Y-%m-%d')

        entries = load_logs(start_date=start_date, end_date=end_date)

        # Filter to analysis_complete events for this profile
        profile_entries = [
            e for e in entries
            if e.get('event') == 'analysis_complete'
            and e.get('profile_id', '') == profile_id
        ]

        total_analyses = len(profile_entries)
        total_checks = sum(e.get('checks_run', e.get('checks_completed', 0)) for e in profile_entries)
        total_cost = sum(e.get('total_cost_usd', e.get('estimated_cost_usd', 0)) for e in profile_entries)
        scores = [e.get('overall_score', 0) for e in profile_entries if e.get('overall_score') is not None]
        avg_score = round(sum(scores) / len(scores), 1) if scores else 0

        # Build recent analyses list (last 50)
        recent = []
        for e in sorted(profile_entries, key=lambda x: x.get('timestamp', ''), reverse=True)[:50]:
            recent.append({
                'date': e.get('timestamp', '')[:19],
                'user': e.get('user_email', 'Unknown'),
                'client': e.get('client', ''),
                'checks': e.get('checks_run', e.get('checks_completed', 0)),
                'score': round(e.get('overall_score', 0), 2),
                'cost': round(e.get('total_cost_usd', e.get('estimated_cost_usd', 0)), 4)
            })

        return jsonify({
            'status': 'success',
            'total_analyses': total_analyses,
            'total_checks': total_checks,
            'total_cost_usd': round(total_cost, 4),
            'avg_score': avg_score,
            'recent': recent
        })

    except Exception as e:
        print(f"Error getting profile usage stats: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500


@app.route('/api/client_usage_stats', methods=['GET'])
@auth.require_auth
def get_client_usage_stats():
    """Get usage statistics scoped to a specific client with date filtering"""
    try:
        client = request.args.get('client')
        if not client:
            return jsonify({'status': 'error', 'message': 'client parameter required'}), 400

        access_err = _require_client_access(client)
        if access_err:
            return access_err

        start_date = request.args.get('start_date')
        end_date = request.args.get('end_date')

        # Default to last 30 days
        if not start_date:
            start_date = (datetime.now() - timedelta(days=30)).strftime('%Y-%m-%d')
        if not end_date:
            end_date = datetime.now().strftime('%Y-%m-%d')

        from generate_usage_report import load_logs
        entries = load_logs(start_date=start_date, end_date=end_date)

        # Filter to analysis_complete events for this client
        client_entries = [
            e for e in entries
            if e.get('event') == 'analysis_complete' and e.get('client') == client
        ]

        unique_users = set(e.get('user_email', 'unknown') for e in client_entries)
        total_checks = sum(e.get('checks_run', e.get('checks_completed', 0)) for e in client_entries)
        total_cost = sum(e.get('total_cost_usd', e.get('estimated_cost_usd', 0)) for e in client_entries)
        scores = [e.get('overall_score', 0) for e in client_entries if e.get('overall_score') is not None]
        avg_score = round(sum(scores) / len(scores), 1) if scores else 0

        total_input_tokens = 0
        total_output_tokens = 0
        by_provider = {}
        for e in client_entries:
            tu = e.get('token_usage') or {}
            total_input_tokens += tu.get('total_prompt_tokens', 0)
            total_output_tokens += tu.get('total_completion_tokens', 0)
            for provider, pstats in (tu.get('by_provider') or {}).items():
                agg = by_provider.setdefault(provider, {
                    'input_tokens': 0,
                    'output_tokens': 0,
                    'cost_usd': 0.0
                })
                agg['input_tokens'] += pstats.get('prompt_tokens', 0)
                agg['output_tokens'] += pstats.get('completion_tokens', 0)
                agg['cost_usd'] += pstats.get('cost', 0)
        for agg in by_provider.values():
            agg['cost_usd'] = round(agg['cost_usd'], 4)

        # Build recent analyses list (last 50)
        recent = []
        for e in sorted(client_entries, key=lambda x: x.get('timestamp', ''), reverse=True)[:50]:
            tu = e.get('token_usage') or {}
            recent.append({
                'date': e.get('timestamp', '')[:19],
                'user': e.get('user_email', 'Unknown'),
                'profile': e.get('profile_id', e.get('profile', '')),
                'checks': e.get('checks_run', e.get('checks_completed', 0)),
                'score': round(e.get('overall_score', 0), 2),
                'cost': round(e.get('total_cost_usd', e.get('estimated_cost_usd', 0)), 4),
                'input_tokens': tu.get('total_prompt_tokens', 0),
                'output_tokens': tu.get('total_completion_tokens', 0)
            })

        return jsonify({
            'status': 'success',
            'client': client,
            'start_date': start_date,
            'end_date': end_date,
            'total_analyses': len(client_entries),
            'unique_users': len(unique_users),
            'total_checks': total_checks,
            'estimated_cost_usd': round(total_cost, 4),
            'total_input_tokens': total_input_tokens,
            'total_output_tokens': total_output_tokens,
            'by_provider': by_provider,
            'avg_score': avg_score,
            'recent': recent
        })

    except Exception as e:
        print(f"Error getting client usage stats: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/admin/check', methods=['GET'])
@auth.require_auth
def check_admin():
    """Check if the current user is an admin"""
    from user_access import is_admin
    user_email = getattr(g, 'user', {}).get('email', '')
    return jsonify({'is_admin': is_admin(user_email)})


@app.route('/api/admin/users', methods=['GET'])
@auth.require_auth
def get_admin_users():
    """Get all users who have accessed the platform (admin only)"""
    from user_access import is_admin
    user_email = getattr(g, 'user', {}).get('email', '')
    if not is_admin(user_email):
        return jsonify({'status': 'error', 'message': 'Admin access required'}), 403

    try:
        from generate_usage_report import load_logs
        entries = load_logs()  # All time

        users = {}
        total_platform_analyses = 0
        total_platform_cost = 0
        total_platform_input_tokens = 0
        total_platform_output_tokens = 0

        for e in entries:
            event_type = e.get('event', '')
            email = e.get('user_email', 'unknown')
            if not email or email == 'unknown':
                continue

            # Track user from any event type (login visits + analyses)
            if email not in users:
                users[email] = {
                    'name': e.get('user_name', ''),
                    'email': email,
                    'total_analyses': 0,
                    'total_checks': 0,
                    'clients': set(),
                    'last_active': '',
                    'total_cost': 0,
                    'input_tokens': 0,
                    'output_tokens': 0
                }

            # Update last active from any event
            ts = e.get('timestamp', '')
            if ts > users[email]['last_active']:
                users[email]['last_active'] = ts

            # Update name if we have a better one
            name = e.get('user_name', '')
            if name and not users[email]['name']:
                users[email]['name'] = name

            # Only count analysis stats from analysis_complete events
            if event_type == 'analysis_complete':
                total_platform_analyses += 1
                cost = e.get('total_cost_usd', e.get('estimated_cost_usd', 0))
                total_platform_cost += cost

                tu = e.get('token_usage') or {}
                input_tokens = tu.get('total_prompt_tokens', 0)
                output_tokens = tu.get('total_completion_tokens', 0)
                total_platform_input_tokens += input_tokens
                total_platform_output_tokens += output_tokens

                users[email]['total_analyses'] += 1
                users[email]['total_checks'] += e.get('checks_run', e.get('checks_completed', 0))
                client = e.get('client', '')
                if client:
                    users[email]['clients'].add(client)
                users[email]['total_cost'] += cost
                users[email]['input_tokens'] += input_tokens
                users[email]['output_tokens'] += output_tokens

        # Convert sets to lists for JSON serialization
        user_list = []
        for u in users.values():
            u['clients'] = sorted(list(u['clients']))
            u['total_cost'] = round(u['total_cost'], 4)
            user_list.append(u)

        # Sort by last active descending
        user_list.sort(key=lambda x: x['last_active'], reverse=True)

        return jsonify({
            'status': 'success',
            'users': user_list,
            'total_unique_users': len(users),
            'total_platform_analyses': total_platform_analyses,
            'total_platform_cost': round(total_platform_cost, 4),
            'total_platform_input_tokens': total_platform_input_tokens,
            'total_platform_output_tokens': total_platform_output_tokens
        })

    except Exception as e:
        print(f"Error getting admin users: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({'status': 'error', 'message': str(e)}), 500


def _require_admin():
    """Return (user_email, None) if admin, else (None, error_response)."""
    from user_access import is_admin
    user_email = getattr(g, 'user', {}).get('email', '')
    if not is_admin(user_email):
        return None, (jsonify({'status': 'error', 'message': 'Admin access required'}), 403)
    return user_email, None


def _require_client_access(client_id):
    """
    Validate the authed user can access `client_id`.
    Returns None on success, or a (response, status) tuple to short-circuit the endpoint.
    """
    if not client_id:
        return None  # endpoint didn't scope by client
    from user_access import get_user_clients
    user_email = getattr(g, 'user', {}).get('email', '')
    if not user_email:
        return jsonify({'status': 'error', 'message': 'Authentication required'}), 401
    allowed = get_user_clients(user_email)
    if client_id not in allowed:
        return jsonify({
            'status': 'error',
            'code': 'client_access_denied',
            'message': f'You do not have access to client "{client_id}"'
        }), 403
    return None


@app.route('/api/admin/user_access', methods=['GET'])
@auth.require_auth
def get_user_access_list():
    """List all users with their client grants. Joins login-log users with explicit grants."""
    _, err = _require_admin()
    if err:
        return err

    try:
        from user_access import list_access_entries
        from generate_usage_report import load_logs

        access = list_access_entries()
        entries_by_email = {e['email'].lower(): e for e in access['entries']}

        # Enrich with login-log data (name + last_active) for users who have signed in
        login_users = {}
        for log_entry in load_logs():
            email = log_entry.get('user_email')
            if not email:
                continue
            lower = email.lower()
            ts = log_entry.get('timestamp', '')
            if lower not in login_users or ts > login_users[lower].get('last_active', ''):
                login_users[lower] = {
                    'email': email,
                    'name': log_entry.get('user_name', ''),
                    'last_active': ts
                }

        # Merge: everyone in login logs + everyone with an explicit grant
        all_emails = set(login_users.keys()) | set(entries_by_email.keys())
        merged = []
        for lower in all_emails:
            entry = entries_by_email.get(lower, {
                'email': login_users.get(lower, {}).get('email', lower),
                'clients': access['default_clients'],
                'is_admin': False,
                'updated_at': None,
                'updated_by': None
            })
            login = login_users.get(lower, {})
            merged.append({
                **entry,
                'name': login.get('name', ''),
                'last_active': login.get('last_active', ''),
                'has_explicit_grant': lower in entries_by_email
            })

        merged.sort(key=lambda x: (not x.get('is_admin'), x.get('email', '').lower()))

        return jsonify({
            'status': 'success',
            'default_clients': access['default_clients'],
            'users': merged
        })
    except Exception as e:
        print(f"Error listing user access: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/admin/user_access/<path:target_email>', methods=['PUT'])
@auth.require_auth
def set_user_access(target_email):
    """Set the list of clients a user can see. Body: {"clients": ["general", ...]}"""
    actor_email, err = _require_admin()
    if err:
        return err

    data = request.get_json(silent=True) or {}
    clients = data.get('clients')
    if not isinstance(clients, list):
        return jsonify({'status': 'error', 'message': 'clients must be a list'}), 400

    try:
        from user_access import set_user_clients
        from usage_tracker import log_access_change
        audit = set_user_clients(target_email, clients, actor_email)
        log_access_change(audit)
        return jsonify({'status': 'success', 'audit': audit})
    except ValueError as ve:
        return jsonify({'status': 'error', 'message': str(ve)}), 400
    except Exception as e:
        print(f"Error setting user access: {e}")
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/admin/user_access/<path:target_email>/promote', methods=['POST'])
@auth.require_auth
def promote_user_admin(target_email):
    """Promote a user to admin."""
    actor_email, err = _require_admin()
    if err:
        return err

    try:
        from user_access import promote_admin
        from usage_tracker import log_access_change
        audit = promote_admin(target_email, actor_email)
        log_access_change(audit)
        return jsonify({'status': 'success', 'audit': audit})
    except ValueError as ve:
        return jsonify({'status': 'error', 'message': str(ve)}), 400
    except Exception as e:
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/admin/user_access/<path:target_email>/demote', methods=['POST'])
@auth.require_auth
def demote_user_admin(target_email):
    """Remove admin role from a user. Blocked if it would leave zero admins."""
    actor_email, err = _require_admin()
    if err:
        return err

    try:
        from user_access import demote_admin
        from usage_tracker import log_access_change
        audit = demote_admin(target_email, actor_email)
        log_access_change(audit)
        return jsonify({'status': 'success', 'audit': audit})
    except ValueError as ve:
        return jsonify({'status': 'error', 'message': str(ve)}), 400
    except Exception as e:
        return jsonify({'status': 'error', 'message': str(e)}), 500


@app.route('/api/consolidate_reports', methods=['POST'])
@auth.require_auth
def consolidate_reports():
    """Generate a consolidated HTML summary from multiple saved reports"""
    try:
        data = request.get_json()
        if not data or 'files' not in data:
            return jsonify({'status': 'error', 'message': 'files list required'}), 400

        files_list = data['files']
        if len(files_list) < 2:
            return jsonify({'status': 'error', 'message': 'At least 2 files required'}), 400

        output_folder = app.config['OUTPUT_FOLDER']
        reports = []

        for file_info in files_list:
            filename = file_info.get('filename', '')
            client = file_info.get('client', '')
            file_path = os.path.join(output_folder, client, filename) if client else os.path.join(output_folder, filename)

            if not os.path.exists(file_path) or not file_path.endswith('.html'):
                continue

            with open(file_path, 'r') as f:
                html_content = f.read()

            # Extract embedded JSON from <div id="json-data"><pre>...</pre></div>
            json_match = re.search(r'<div id="json-data"[^>]*>\s*<pre>(.*?)</pre>\s*</div>', html_content, re.DOTALL)
            if json_match:
                try:
                    report_data = json.loads(json_match.group(1))
                    reports.append({
                        'filename': filename,
                        'client': client,
                        'data': report_data
                    })
                except json.JSONDecodeError:
                    continue

        if len(reports) < 2:
            return jsonify({'status': 'error', 'message': 'Could not extract data from enough reports (need at least 2)'}), 400

        # Build consolidated HTML
        timestamp = datetime.now().strftime('%Y-%m-%d %H:%M:%S')

        # Summary table rows
        summary_rows = ''
        all_failed_checks = []
        for r in reports:
            rd = r['data']
            summary = rd.get('summary', {})
            score = summary.get('overall_score', 0)
            # Use the grade from the report (respects profile-specific grading overrides)
            grade = summary.get('grade', rd.get('grade', determine_grade(score) if score else 'N/A'))
            profile_name = rd.get('profile_name', rd.get('profile', 'Unknown'))
            fname = rd.get('filename', r['filename'])
            pass_fail_color = '#2e7d32' if grade == 'Pass' else '#c62828'
            summary_rows += f'''
                <tr>
                    <td style="padding: 10px; border-bottom: 1px solid #dee2e6;">{fname}</td>
                    <td style="padding: 10px; border-bottom: 1px solid #dee2e6;">{profile_name}</td>
                    <td style="padding: 10px; border-bottom: 1px solid #dee2e6; text-align: center;">{round(score, 1) if score else 'N/A'}</td>
                    <td style="padding: 10px; border-bottom: 1px solid #dee2e6; text-align: center; color: {pass_fail_color}; font-weight: 700;">{grade}</td>
                </tr>'''

            # Collect failed checks
            results = rd.get('results', {})
            for check_name, check_data in results.items():
                if check_data.get('status') != 'success':
                    continue
                check_score = check_data.get('score', 0)
                if check_score is not None and check_score < 6:
                    # Extract human-readable explanation from json_data
                    json_data = check_data.get('json_data', {})
                    explanation = json_data.get('explanation', '')
                    recommendations = json_data.get('recommendations', [])

                    # Build issue summary from explanation + recommendations
                    issue_parts = []
                    if explanation:
                        issue_parts.append(explanation)
                    if recommendations:
                        rec_text = ' | '.join(r for r in recommendations if r)
                        if rec_text:
                            issue_parts.append(f'Recommendations: {rec_text}')

                    issue_summary = ' '.join(issue_parts) if issue_parts else 'No details available'
                    # Truncate if very long
                    if len(issue_summary) > 500:
                        issue_summary = issue_summary[:497] + '...'

                    all_failed_checks.append({
                        'filename': fname,
                        'check': check_data.get('display_name', check_name.replace('_', ' ').title()),
                        'score': check_score,
                        'summary': issue_summary
                    })

        # Failed checks rows
        failed_rows = ''
        if all_failed_checks:
            for fc in all_failed_checks:
                failed_rows += f'''
                    <tr style="background: #fff5f5;">
                        <td style="padding: 10px; border-bottom: 1px solid #dee2e6;">{fc['filename']}</td>
                        <td style="padding: 10px; border-bottom: 1px solid #dee2e6;">{fc['check']}</td>
                        <td style="padding: 10px; border-bottom: 1px solid #dee2e6; text-align: center; color: #c62828; font-weight: 700;">{fc['score']}/10</td>
                        <td style="padding: 10px; border-bottom: 1px solid #dee2e6; font-size: 0.85em; color: #555;">{fc['summary']}</td>
                    </tr>'''
        else:
            failed_rows = '<tr><td colspan="4" style="padding: 20px; text-align: center; color: #2e7d32;">No failed checks found across all reports!</td></tr>'

        consolidated_html = f'''<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Consolidated QC Report - {timestamp}</title>
    <link href="https://fonts.googleapis.com/css2?family=Montserrat:wght@400;600;700&display=swap" rel="stylesheet">
    <style>
        body {{ font-family: 'Montserrat', sans-serif; margin: 0; padding: 20px; background: #f5f5f5; color: #333; }}
        .container {{ max-width: 1000px; margin: 0 auto; background: white; border-radius: 12px; box-shadow: 0 2px 12px rgba(0,0,0,0.1); padding: 30px; }}
        h1 {{ color: #1a1a2e; margin-bottom: 5px; }}
        h2 {{ color: #495057; border-bottom: 2px solid #dee2e6; padding-bottom: 8px; margin-top: 30px; }}
        .meta {{ color: #6c757d; font-size: 0.9em; margin-bottom: 25px; }}
        table {{ width: 100%; border-collapse: collapse; margin: 15px 0; table-layout: fixed; }}
        th {{ background: #f8f9fa; padding: 12px 10px; text-align: left; border-bottom: 2px solid #dee2e6; font-weight: 700; font-size: 0.9em; }}
        td {{ font-size: 0.9em; word-break: break-word; overflow-wrap: break-word; }}
    </style>
</head>
<body>
    <div class="container">
        <h1>Consolidated QC Report</h1>
        <p class="meta">Generated: {timestamp} | Reports: {len(reports)}</p>

        <h2>Summary</h2>
        <table>
            <thead>
                <tr>
                    <th>File</th>
                    <th>Profile</th>
                    <th style="text-align: center;">Score</th>
                    <th style="text-align: center;">Result</th>
                </tr>
            </thead>
            <tbody>{summary_rows}</tbody>
        </table>

        <h2>Failed Checks</h2>
        <table>
            <thead>
                <tr>
                    <th>File</th>
                    <th>Check</th>
                    <th style="text-align: center;">Score</th>
                    <th>Issue Summary</th>
                </tr>
            </thead>
            <tbody>{failed_rows}</tbody>
        </table>
    </div>
</body>
</html>'''

        # Save consolidated report
        consolidated_filename = f"consolidated_{datetime.now().strftime('%Y%m%d_%H%M%S')}.html"
        # Determine client folder - use the first report's client or 'general'
        client_folder = reports[0].get('client', 'general') or 'general'
        client_output_dir = os.path.join(output_folder, client_folder)
        os.makedirs(client_output_dir, exist_ok=True)
        consolidated_path = os.path.join(client_output_dir, consolidated_filename)

        with open(consolidated_path, 'w') as f:
            f.write(consolidated_html)

        url = f"{request.environ.get('SCRIPT_NAME', '')}/output/{client_folder}/{consolidated_filename}"

        return jsonify({
            'status': 'success',
            'filename': consolidated_filename,
            'url': url
        })

    except Exception as e:
        print(f"Error consolidating reports: {e}")
        import traceback
        traceback.print_exc()
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500


@app.route('/api/qc-apps', methods=['GET'])
def get_qc_apps():
    """Get list of all QC applications with their metadata"""
    try:
        # User-friendly descriptions for each QC tool
        tool_descriptions = {
            'accessibility': 'Evaluates color contrast, text legibility, and accessibility compliance to ensure content is usable by people with visual impairments and meets WCAG standards.',
            'animation_transitions': 'Checks animation quality, smoothness, timing, and transitions in video or animated content to ensure professional motion design.',
            'aspect_ratio': 'Verifies the image or video aspect ratio matches intended display formats (16:9, 4:3, 1:1, etc.) to prevent stretching or cropping issues.',
            'background_contrast': 'Analyzes contrast between background and foreground elements to ensure text and important content remain clearly visible and readable.',
            'brand_assets_visibility': 'Validates that required brand assets (logos, trademarks, brand elements) are present, visible, and properly positioned according to brand guidelines.',
            'call_to_action': 'Evaluates the presence, clarity, and prominence of call-to-action (CTA) elements to ensure they effectively guide user behavior.',
            'color_format': 'Checks color space and format (RGB, CMYK, etc.) to ensure correct color reproduction for the intended output medium (digital, print).',
            'crop_marks': 'Verifies presence and correct placement of crop marks, bleeds, and trim marks for print-ready files to ensure accurate cutting and finishing.',
            'curved_edges': 'Checks for smooth, professional curved edges and rounded corners in design elements, ensuring consistent styling across the creative.',
            'curved_edges_digital': 'Evaluates curved edges specifically for digital displays, checking for anti-aliasing and smooth rendering on screens.',
            'curved_edges_print': 'Validates curved edges for print output, ensuring clean vector paths and proper resolution for physical reproduction.',
            'dark_mode_legibility': 'Tests content legibility in dark mode or low-light environments, ensuring text remains readable with appropriate contrast.',
            'element_alignment': 'Checks alignment of design elements (text, images, buttons) to ensure professional layout and visual consistency.',
            'face_gaze_direction': 'Analyzes the direction people in images are looking to ensure gaze guides viewer attention toward key content or CTAs.',
            'face_visibility': 'Checks for clear, well-lit, and unobscured faces in imagery, ensuring people are properly featured when human connection is important.',
            'file_naming': 'Validates file naming conventions for proper organization, version control, and asset management in production workflows.',
            'image_resolution': 'Verifies image resolution and quality to ensure crisp, professional output without pixelation or blur at intended display size.',
            'imperative_verb': 'Checks that CTAs use strong imperative verbs ("Get," "Start," "Join") to create clear, action-oriented messaging.',
            'inclusive': 'Evaluates representation and inclusivity in imagery and messaging to ensure diverse, respectful, and welcoming content.',
            'layer_organization': 'Reviews file layer structure and organization for clean, maintainable design files that other team members can easily work with.',
            'logo_visibility': 'Ensures brand logos are present, properly sized, clearly visible, and positioned according to brand guidelines.',
            'lowercase_text': 'Checks for improper use of all-lowercase text where standard capitalization would improve readability and professionalism.',
            'new_visibility': 'Validates presence and visibility of "NEW" badges or indicators when promoting new products, features, or offerings.',
            'print_bleed': 'Verifies correct bleed area setup for print files to prevent white edges and ensure full-coverage printing to the trim edge.',
            'product_visibility': 'Ensures product imagery is clear, well-lit, properly featured, and showcases key product attributes effectively.',
            'responsiveness': 'Checks how design elements adapt across different screen sizes and devices to ensure consistent experience on mobile, tablet, and desktop.',
            'safety_area': 'Validates that important content (text, logos, CTAs) stays within safe zones to avoid cutoff on various display formats and aspect ratios.',
            'supporting_images': 'Evaluates quality, relevance, and composition of supporting images to ensure they enhance the message and maintain visual interest.',
            'text_readability': 'Analyzes text size, font choice, spacing, and contrast to ensure copy is easily readable across different viewing conditions.',
            'visual_elements_count': 'Checks for appropriate number of visual elements to avoid cluttered or empty designs, ensuring balanced composition.',
            'visual_hierarchy': 'Evaluates the logical flow and priority of visual elements to guide viewer attention from most to least important information.',
            'visuals_left_text_right': 'Validates proper layout convention (visuals left, text right) for left-to-right reading audiences to optimize information flow.',
            'word_count': 'Checks text length to ensure messaging is concise and appropriate for the medium, avoiding over-crowding or insufficient information.'
        }

        qc_apps_data = {}

        # Build QC apps data from loaded QC checks
        for check_name in qc_apps.keys():
            # Get display name
            display_name = qc_apps[check_name].get('display_name', check_name.replace('_', ' ').title())

            # Get description from mapping, or fall back to auto-generated description
            description = tool_descriptions.get(check_name)
            if not description:
                # Fallback: Extract from prompt if custom description not available
                prompt = qc_apps[check_name].get('prompt', '')
                description_lines = prompt.split('\n\n')
                description = description_lines[0][:300] if description_lines else f'{display_name} quality check'

            # Default weights - can be customized
            qc_apps_data[check_name] = {
                'display_name': display_name,
                'enabled': True,
                'required_weight': 0.1,  # Default weight
                'optional_weight': 0.0,
                'description': description,
                'full_prompt': qc_apps[check_name].get('prompt', '')  # Include full prompt for detailed view
            }

        return jsonify({
            'status': 'success',
            'qc_apps': qc_apps_data,
            'total_apps': len(qc_apps_data)
        })

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/generate_report', methods=['POST'])
def api_generate_report():
    """Generate HTML report from existing session data"""
    try:
        # Get parameters
        session_id = request.form.get('session_id')
        if not session_id:
            return jsonify({'status': 'error', 'message': 'Session ID required'}), 400

        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        if not os.path.exists(session_folder):
            return jsonify({'status': 'error', 'message': 'Session not found'}), 404

        # Find the analysis result file
        result_files = [f for f in os.listdir(session_folder) if f.endswith('_results.json')]
        if not result_files:
            return jsonify({'status': 'error', 'message': 'No analysis results found for session'}), 404

        # Load the most recent results file
        result_file = sorted(result_files)[-1]
        result_path = os.path.join(session_folder, result_file)

        with open(result_path, 'r') as f:
            report_data = json.load(f)

        # Find the original file
        files = [f for f in os.listdir(session_folder) if not f.endswith('_results.json')]
        if not files:
            return jsonify({'status': 'error', 'message': 'Original file not found'}), 404

        original_file = files[0]
        file_path = os.path.join(session_folder, original_file)

        # Generate HTML using existing function
        html_content = generate_html_content(report_data, original_file, file_path)

        return html_content, 200, {'Content-Type': 'text/html'}

    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

# Authentication endpoints
@app.route('/auth/login', methods=['POST'])
def auth_login():
    """Process authentication tokens from MSAL popup."""
    try:
        # Get token from request
        data = request.get_json()
        if not data or 'token' not in data:
            return jsonify({
                'success': False,
                'error': 'Token is required',
                'authenticated': False
            }), 400

        token = data['token']

        # Validate and set authentication token - returns response with cookie set
        return auth.set_auth_token(token)

    except Exception as e:
        return jsonify({
            'success': False,
            'error': f'Authentication failed: {str(e)}',
            'authenticated': False
        }), 500

@app.route('/auth/logout', methods=['POST'])
def auth_logout():
    """Clear authentication session."""
    try:
        return auth.clear_auth_token()
    except Exception as e:
        return jsonify({
            'success': False,
            'error': f'Logout failed: {str(e)}'
        }), 500

@app.route('/auth/status', methods=['GET'])
def auth_status():
    """Get current authentication status and log user visit."""
    try:
        status = auth.get_auth_status()

        # Log user visit if authenticated
        if status.get('authenticated') and status.get('user'):
            try:
                from usage_tracker import log_user_login
                log_user_login(status['user'])
            except Exception as log_err:
                print(f"Warning: Failed to log user visit: {log_err}")

        return jsonify(status)
    except Exception as e:
        return jsonify({
            'authenticated': False,
            'error': f'Status check failed: {str(e)}'
        }), 500


# ---------------------------------------------------------------------------
# Box.com OAuth (per-creator user authentication for automation folders).
# Flow:
#   1. User (signed into the QC tool via MSAL) hits GET /auth/box/login.
#      We generate a JWT-signed state encoding their email and 302 to Box.
#   2. Box redirects back to GET /auth/box/callback with ?code=...&state=...
#      We verify the state, exchange the code for tokens, fetch the Box user,
#      and persist via box_tokens.save_tokens.
# Tokens are then used by background workers (PR3) and on-demand calls.
#
# The Box redirect URI is computed per-request (not a fixed env var) so the
# same code works on laptop, dev, and prod. When BOX_REDIRECT_URI is set in
# the env it wins (escape hatch).
# ---------------------------------------------------------------------------

def _box_redirect_uri():
    """
    Compute the public OAuth callback URL.

    Resolution order:
      1. BOX_REDIRECT_URI env var if set (escape hatch / unusual deploys).
      2. X-Forwarded-Host header if Apache sets it (some setups do).
      3. Otherwise, infer from request.host: anything that isn't localhost
         is treated as being behind the Apache proxy at /ai_qc/ over HTTPS
         (this matches optical-dev / optical-prod where Apache uses
         ProxyPreserveHost so request.host is already the public hostname,
         but the backend connection is plain http and Flask sees no prefix).
    """
    explicit = (os.environ.get('BOX_REDIRECT_URI') or '').strip()
    if explicit:
        return explicit

    forwarded_host = request.headers.get('X-Forwarded-Host')
    if forwarded_host:
        host = forwarded_host.split(',')[0].strip()
        proto = request.headers.get('X-Forwarded-Proto', 'https')
        return f'{proto}://{host}/ai_qc/auth/box/callback'

    host = (request.host or '').strip()
    is_local = (not host) or 'localhost' in host or host.startswith('127.0.0.1')
    if not is_local:
        # Behind the optical-dev / optical-prod Apache proxy, mounted at /ai_qc/.
        return f'https://{host}/ai_qc/auth/box/callback'
    return f'{request.scheme}://{host}/auth/box/callback'


# ---------- Box JWT service-account: webhook ingestion + workflow helper ----------

# Bounded in-memory dedup for box-delivery-id. Box uses at-least-once delivery;
# a 200 from us tells it not to retry, so duplicates are rare. The maxlen keeps
# memory tiny while still catching the common retry window.
_box_recent_deliveries = collections.deque(maxlen=500)
_box_recent_deliveries_set = set()
_box_recent_deliveries_lock = threading.Lock()

# Extensions accepted from a Box upload. Keeps the webhook from kicking off QC
# on Word docs, ZIPs, etc. Mirrors what technical_check.inspect knows how to read.
_BOX_QC_EXTS = {
    '.jpg', '.jpeg', '.png', '.gif', '.bmp', '.tiff', '.tif', '.webp',
    '.pdf',
    '.mp4', '.avi', '.mov', '.mkv', '.wmv', '.flv', '.webm',
}


def _box_remember_delivery(delivery_id):
    """Return True if first time seeing this delivery_id; False if duplicate."""
    with _box_recent_deliveries_lock:
        if delivery_id in _box_recent_deliveries_set:
            return False
        _box_recent_deliveries.append(delivery_id)
        _box_recent_deliveries_set.add(delivery_id)
        if len(_box_recent_deliveries_set) > _box_recent_deliveries.maxlen:
            _box_recent_deliveries_set.clear()
            _box_recent_deliveries_set.update(_box_recent_deliveries)
        return True


def _run_box_triggered_analysis(client_id, profile_id, file_id, filename, session_id):
    """Background worker for the Box webhook flow.

    Downloads the Box file, runs the technical pre-flight + LLM check pipeline,
    writes the HTML report to disk under output/<client>/, and uploads the same
    report back to the client's box_reports_folder_id (or box_folder_id as a
    fallback). Uses a synthetic 'box_webhook' user for usage tracking.

    Skips media-plan and localization context — those are user-UI concepts that
    don't have a meaningful source in a webhook-triggered run.
    """
    try:
        from client_config import get_all_clients as _get_all_clients
        client_cfg = _get_all_clients().get(client_id, {})
        session_folder = os.path.join(app.config['UPLOAD_FOLDER'], session_id)
        os.makedirs(session_folder, exist_ok=True)
        file_path = os.path.join(session_folder, filename)

        # 1. Download the asset from Box.
        box_jwt_client.download_file(file_id, file_path)
        print(f'Box webhook: downloaded {filename} → {file_path}')

        # 2. Technical pre-flight (same as user-uploaded flow).
        technical_report = technical_inspect(file_path)

        # 3. Init progress tracker.
        progress_tracker[session_id] = {
            'total_checks': 25,
            'completed_checks': 0,
            'current_check': 'Initializing',
            'current_check_display': 'Box-triggered analysis',
            'stage': 'setup',
            'percentage': 0,
            'session_id': session_id,
            'status': 'started',
            'source': 'box_webhook',
            'box_file_id': file_id,
            'technical_report': technical_report,
        }

        # 4. Log analysis start with a synthetic system user.
        try:
            from usage_tracker import log_analysis_start
            log_analysis_start(
                session_id, client_id, profile_id,
                {'user_id': 'box_webhook', 'email': 'box_webhook@system', 'name': 'Box Webhook'},
                {'filename': filename, 'size': os.path.getsize(file_path)},
            )
        except Exception as log_err:
            print(f'WARNING: usage log_analysis_start failed: {log_err}')

        # 5. Resolve profile + enabled checks.
        profile_config = get_profile(profile_id)
        if not profile_config:
            raise Exception(f'Profile {profile_id} not found')
        enabled_checks = [c for c in profile_config.get_enabled_checks() if c in qc_apps]
        if not enabled_checks:
            raise Exception(f'No enabled checks for profile {profile_id}')
        profile_weights = profile_config.get_check_weights()
        progress_tracker[session_id].update({
            'total_checks': len(enabled_checks),
            'stage': 'qc_analysis',
            'percentage': 10,
        })

        # 6. Run check batches (no media plan / localization / OCR in webhook MVP).
        check_results = process_checks_in_batches(
            enabled_checks, qc_apps, profile_config, profile_weights,
            file_path, None, brand_db, progress_tracker,
            session_id, batch_size=15, media_plan_context=None, ocr_context=None,
        )

        # 7. Score aggregation.
        total_weighted_score = 0
        total_weight = 0
        completed_checks = 0
        failed_checks = 0
        for _check_name, result in check_results.items():
            w = result.get('weight', 0.1)
            total_weight += w
            if result.get('status') == 'success':
                completed_checks += 1
                s = result.get('score')
                if s is not None:
                    total_weighted_score += s * w
            else:
                failed_checks += 1
        if total_weight >= 10.0:
            overall_score = min(total_weighted_score, 100)
        else:
            overall_score = min(total_weighted_score * 10, 100)

        # 8. Result envelope matching the user-flow shape.
        result_data = {
            'status': 'success',
            'session_id': session_id,
            'timestamp': datetime.now().strftime('%Y-%m-%d %H:%M:%S'),
            'filename': filename,
            'profile': profile_id,
            'profile_id': profile_id,
            'profile_name': profile_config.name,
            'model': 'Profile-based selection',
            'results': check_results,
            'profile_selection': {
                'selected_profile': profile_id,
                'profile_source': 'box_webhook',
                'brand': client_id,
                'format_suffix': profile_id,
                'reference_asset': None,
                'reference_asset_used': False,
            },
            'qc_analysis': {
                'profile_used': profile_id,
                'total_checks': len(enabled_checks),
                'completed_checks': completed_checks,
                'failed_checks': failed_checks,
                'check_results': check_results,
            },
            'summary': {
                'overall_score': round(overall_score, 1),
                'profile': profile_config.name,
                'checks_count': completed_checks,
                'total_checks': len(enabled_checks),
                'total_weighted_score': total_weighted_score,
                'total_weight': total_weight,
                'grade': determine_grade(overall_score),
            },
            'technical_report': progress_tracker[session_id].get('technical_report', {}),
            'source': 'box_webhook',
            'box_file_id': file_id,
        }

        # Strict-grade override applies the same way for webhook-triggered runs.
        if getattr(profile_config, 'strict_grade', False):
            for _cn, cd in check_results.items():
                if cd.get('status') == 'success':
                    cs = cd.get('score', 0)
                    if cs is not None and cs < 6:
                        result_data['summary']['grade'] = 'Fail'
                        break

        # 9. Write HTML report to disk so the UI's saved-files listing shows it.
        report_filename = f'QC_Report_{session_id}_{os.path.splitext(filename)[0]}.html'
        client_folder = ensure_client_output_folder(client_id)
        report_path = os.path.join(client_folder, report_filename)
        with open(report_path, 'w', encoding='utf-8') as f:
            f.write(generate_comprehensive_html_report(result_data, filename, file_path=file_path))
        result_data['output_file'] = {
            'path': report_path,
            'filename': report_filename,
            'url': f'/output/{client_id}/{report_filename}',
        }

        # 10. Upload the report back to Box. Prefer the dedicated reports folder if
        # configured; fall back to the same folder the source lived in.
        reports_folder = client_cfg.get('box_reports_folder_id') or client_cfg.get('box_folder_id')
        report_uploaded_ok = False
        if reports_folder:
            try:
                uploaded = box_jwt_client.upload_file(report_path, str(reports_folder), name=report_filename)
                result_data['box_report_upload'] = {
                    'box_file_id': uploaded.get('id'),
                    'box_file_name': uploaded.get('name'),
                    'box_folder_id': str(reports_folder),
                }
                report_uploaded_ok = True
                print(f"Box webhook: uploaded report {report_filename} → folder {reports_folder} (id={uploaded.get('id')})")
            except Exception as up_err:
                print(f'WARNING: failed to upload report to Box: {up_err}')
                result_data['box_report_upload_error'] = str(up_err)
        else:
            print(f'Box webhook: no box_reports_folder_id (or box_folder_id) on client {client_id}; report stays local only')

        # 10b. Move the source file out of INCOMING into a `_PROCESSED` subfolder so the
        # next upload of the same filename triggers a fresh FILE.UPLOADED event (Box's
        # V2 webhook doesn't fire on same-name version replacements; freeing the name
        # is the cleanest workaround). Only runs if the report made it back to Box —
        # if upload failed, we want the source to stay so the user can retry by simply
        # re-uploading. Failures here are non-fatal: log, record, continue.
        source_folder_id = client_cfg.get('box_folder_id')
        if report_uploaded_ok and source_folder_id:
            try:
                processed_folder_id = box_jwt_client.find_or_create_subfolder(
                    str(source_folder_id), '_PROCESSED'
                )
                processed_name = f'{session_id}_{filename}'
                moved = box_jwt_client.move_file(file_id, processed_folder_id, new_name=processed_name)
                result_data['box_source_moved'] = {
                    'box_file_id': moved.get('id'),
                    'box_folder_id': processed_folder_id,
                    'box_file_name': moved.get('name'),
                }
                print(f'Box webhook: moved source → _PROCESSED/{processed_name} (folder {processed_folder_id})')
            except Exception as mv_err:
                print(f'WARNING: failed to move source file to _PROCESSED: {mv_err}')
                result_data['box_source_move_error'] = str(mv_err)

        # 11. Mark complete on progress_tracker for /api/progress consumers.
        progress_tracker[session_id]['result'] = result_data
        progress_tracker[session_id]['status'] = 'completed'
        progress_tracker[session_id]['stage'] = 'complete'
        progress_tracker[session_id]['percentage'] = 100

        # 12. Usage tracker completion event.
        try:
            from usage_tracker import log_analysis_complete
            log_analysis_complete(
                session_id, client_id, profile_id,
                {'user_id': 'box_webhook', 'email': 'box_webhook@system', 'name': 'Box Webhook'},
                {'checks_completed': completed_checks, 'overall_score': overall_score,
                 'status': 'success', 'source': 'box_webhook'},
            )
        except Exception as log_err:
            print(f'WARNING: usage log_analysis_complete failed: {log_err}')

        print(f'Box webhook: analysis complete for session {session_id}, score {overall_score}')

    except Exception as e:
        print(f'ERROR in Box-triggered analysis (session {session_id}): {e}')
        import traceback
        traceback.print_exc()
        if session_id in progress_tracker:
            progress_tracker[session_id]['status'] = 'error'
            progress_tracker[session_id]['stage'] = 'error'
            progress_tracker[session_id]['error'] = str(e)


@app.route('/api/box/webhook', methods=['POST'])
def box_webhook():
    """Receive a Box V2 webhook. Authenticated by HMAC signature on every request.

    Box expects a 200 within ~10 seconds. We verify the signature, ack, and run
    the analysis on a background thread.
    """
    raw_body = request.get_data(cache=True)
    headers = {k.lower(): v for k, v in request.headers.items()}

    primary_key = os.environ.get('BOX_WEBHOOK_PRIMARY_KEY')
    secondary_key = os.environ.get('BOX_WEBHOOK_SECONDARY_KEY')
    if not primary_key and not secondary_key:
        print('Box webhook: no signing keys in env (set BOX_WEBHOOK_PRIMARY_KEY); refusing all deliveries')
        return jsonify({'status': 'error', 'message': 'webhook signing not configured'}), 503

    if not box_jwt_client.verify_webhook_signature(raw_body, headers, primary_key, secondary_key):
        print('Box webhook: signature verification failed')
        return jsonify({'status': 'error', 'message': 'invalid signature'}), 401

    delivery_id = headers.get('box-delivery-id', '')
    if delivery_id and not _box_remember_delivery(delivery_id):
        return jsonify({'status': 'ok', 'message': 'duplicate'}), 200

    try:
        payload = json.loads(raw_body.decode('utf-8'))
    except Exception:
        return jsonify({'status': 'error', 'message': 'invalid JSON'}), 400

    trigger = payload.get('trigger', '')
    if trigger != 'FILE.UPLOADED':
        return jsonify({'status': 'ok', 'message': f'ignored trigger {trigger}'}), 200

    source = payload.get('source') or {}
    if source.get('type') != 'file':
        return jsonify({'status': 'ok', 'message': 'not a file event'}), 200

    file_id = str(source.get('id', ''))
    filename = source.get('name', '')
    parent = source.get('parent') or {}
    parent_folder_id = str(parent.get('id', ''))
    if not file_id or not parent_folder_id or not filename:
        return jsonify({'status': 'error', 'message': 'malformed payload'}), 400

    ext = os.path.splitext(filename)[1].lower()
    if ext not in _BOX_QC_EXTS:
        print(f'Box webhook: skipping non-QC extension {ext} ({filename})')
        return jsonify({'status': 'ok', 'message': f'unsupported extension {ext}'}), 200

    from client_config import get_client_by_box_folder, get_all_clients, get_default_profile
    client_id = get_client_by_box_folder(parent_folder_id)
    if not client_id:
        print(f'Box webhook: no client configured for Box folder {parent_folder_id}')
        return jsonify({'status': 'ok', 'message': 'no client mapping'}), 200

    client_cfg = get_all_clients().get(client_id, {})
    profile_id = get_default_profile(client_id) or (client_cfg.get('profiles') or ['static_general'])[0]

    session_id = datetime.now().strftime('%Y%m%d_%H%M%S')
    print(f'Box webhook: dispatching session={session_id} client={client_id} profile={profile_id} file_id={file_id} name={filename}')

    threading.Thread(
        target=_run_box_triggered_analysis,
        args=(client_id, profile_id, file_id, filename, session_id),
        daemon=True,
    ).start()

    return jsonify({
        'status': 'ok',
        'session_id': session_id,
        'client_id': client_id,
        'profile_id': profile_id,
    }), 200


@app.route('/auth/box/login', methods=['GET'])
@auth.require_auth
def box_login():
    """Kick off the Box OAuth flow for the signed-in user."""
    import box_client

    if not box_client.is_configured():
        return jsonify({'status': 'error',
                        'message': 'Box integration is not configured (BOX_CLIENT_ID / BOX_CLIENT_SECRET missing).'}), 503

    user_email = getattr(g, 'user', {}).get('email', '')
    if not user_email:
        return jsonify({'status': 'error', 'message': 'Authentication required'}), 401

    redirect_uri = _box_redirect_uri()
    state = box_client.make_state(user_email)
    return redirect(box_client.build_authorize_url(state, redirect_uri))


@app.route('/auth/box/callback', methods=['GET'])
def box_callback():
    """Handle Box's redirect back after the user approves the app."""
    import box_client
    import box_tokens

    error = request.args.get('error')
    if error:
        # User cancelled, or Box rejected the request — surface a friendly page.
        description = request.args.get('error_description', '')
        return _box_callback_html('Box connection cancelled or failed.',
                                  detail=f'{error}: {description}', success=False), 400

    code = request.args.get('code')
    state = request.args.get('state')
    if not code or not state:
        return _box_callback_html('Missing code or state in callback.',
                                  success=False), 400

    user_email = box_client.verify_state(state)
    if not user_email:
        return _box_callback_html('Invalid or expired state — please start the connection from the QC tool again.',
                                  success=False), 400

    redirect_uri = _box_redirect_uri()
    try:
        tokens = box_client.exchange_code_for_tokens(code, redirect_uri)
    except Exception as e:
        print(f'[box_callback] code exchange failed: {e}')
        return _box_callback_html('Could not complete the Box token exchange.',
                                  detail=str(e), success=False), 502

    box_user = None
    try:
        box_user = box_client.get_box_user(tokens['access_token'])
    except Exception as e:
        # Non-fatal — we still got tokens, just couldn't read the Box identity.
        print(f'[box_callback] /users/me failed: {e}')

    box_tokens.save_tokens(user_email, tokens, box_user=box_user)

    return _box_callback_html('Box connected.',
                              detail=(box_user or {}).get('login') or user_email,
                              success=True)


def _box_callback_html(message, detail='', success=True):
    """Tiny self-contained HTML response for the OAuth callback."""
    color = '#28a745' if success else '#dc3545'
    detail_html = f'<p style="color:#6c757d;font-size:0.95em;">{detail}</p>' if detail else ''
    body = f"""
<!doctype html>
<html><head><meta charset="utf-8"><title>Box connection</title></head>
<body style="font-family: -apple-system, Segoe UI, Roboto, Helvetica, Arial, sans-serif; padding: 60px 30px; text-align: center; color: #212529;">
  <h1 style="color: {color}; margin-bottom: 12px;">{message}</h1>
  {detail_html}
  <p style="margin-top: 24px;"><a href="../" style="color: #007bff; text-decoration: none;">Return to AI QC →</a></p>
  <script>
    // If this was opened in a popup, close it and let the opener refresh status.
    if (window.opener && !window.opener.closed) {{
      try {{ window.opener.postMessage({{ type: 'box-oauth-result', success: {str(success).lower()} }}, '*'); }} catch (e) {{}}
      setTimeout(function() {{ window.close(); }}, 1200);
    }}
  </script>
</body></html>
"""
    return Response(body, mimetype='text/html')


@app.route('/api/box/status', methods=['GET'])
@auth.require_auth
def box_status():
    """Whether the current user has connected their Box account."""
    import box_client
    import box_tokens

    user_email = getattr(g, 'user', {}).get('email', '')
    record = box_tokens.get_tokens(user_email)

    if not record:
        return jsonify({
            'status': 'success',
            'connected': False,
            'configured': box_client.is_configured(),
        })

    return jsonify({
        'status': 'success',
        'connected': True,
        'configured': True,
        'box_user_login': record.get('box_user_login'),
        'box_user_name': record.get('box_user_name'),
        'connected_at': record.get('connected_at'),
        'access_token_expires_at': record.get('access_token_expires_at'),
    })


@app.route('/api/box/disconnect', methods=['POST'])
@auth.require_auth
def box_disconnect():
    """Forget the current user's Box tokens. Best-effort revoke at Box too."""
    import box_client
    import box_tokens

    user_email = getattr(g, 'user', {}).get('email', '')
    record = box_tokens.get_tokens(user_email)
    if record and record.get('refresh_token'):
        try:
            box_client.revoke_tokens(record['refresh_token'])
        except Exception as e:
            print(f'[box_disconnect] revoke failed for {user_email}: {e}')

    box_tokens.delete_tokens(user_email)
    return jsonify({'status': 'success', 'message': 'Box disconnected'})


@app.route('/api/box/test_folder', methods=['GET'])
@auth.require_auth
def box_test_folder():
    """
    Smoke-test endpoint: list a Box folder's items using the current user's
    stored tokens. Used to prove the OAuth round-trip works end-to-end before
    we wire the watcher in PR3. Folder ID '0' is the user's All Files root.
    """
    import box_client

    user_email = getattr(g, 'user', {}).get('email', '')
    folder_id = (request.args.get('folder_id') or '0').strip()

    access_token = box_client.get_valid_access_token(user_email)
    if not access_token:
        return jsonify({'status': 'error',
                        'code': 'box_not_connected',
                        'message': 'Connect your Box account first via /auth/box/login'}), 401

    try:
        result = box_client.list_folder_items(access_token, folder_id)
    except Exception as e:
        print(f'[box_test_folder] list failed: {e}')
        return jsonify({'status': 'error', 'message': str(e)}), 502

    items = [
        {
            'id': it.get('id'),
            'name': it.get('name'),
            'type': it.get('type'),
            'size': it.get('size'),
            'created_at': it.get('created_at'),
            'created_by_login': (it.get('created_by') or {}).get('login'),
        }
        for it in (result.get('entries') or [])
    ]
    return jsonify({
        'status': 'success',
        'folder_id': folder_id,
        'total_count': result.get('total_count'),
        'items': items,
    })


@app.route('/api/usage/stats', methods=['GET'])
@auth.require_auth
def get_usage_stats_endpoint():
    """Get usage statistics (admin endpoint)"""
    from usage_tracker import get_usage_stats

    # Get query parameters
    start_date = request.args.get('start_date')
    end_date = request.args.get('end_date')
    client = request.args.get('client')
    user_id = request.args.get('user_id')

    try:
        stats = get_usage_stats(
            start_date=start_date,
            end_date=end_date,
            client=client,
            user_id=user_id
        )

        return jsonify({
            'status': 'success',
            'stats': stats
        })
    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/usage/export', methods=['GET'])
@auth.require_auth
def export_usage_logs_endpoint():
    """Export usage logs as CSV (admin endpoint)"""
    import csv
    import io
    from usage_tracker import USAGE_LOG_DIR

    # Get date range
    start_date = request.args.get('start_date')
    end_date = request.args.get('end_date')

    try:
        # Collect all log entries
        import glob
        log_files = glob.glob(os.path.join(USAGE_LOG_DIR, '*.jsonl'))

        # Create CSV
        output = io.StringIO()
        fieldnames = ['timestamp', 'event', 'session_id', 'client', 'profile',
                      'user_email', 'checks_completed', 'overall_score', 'estimated_cost_usd']
        writer = csv.DictWriter(output, fieldnames=fieldnames)
        writer.writeheader()

        for log_file in sorted(log_files):
            with open(log_file, 'r') as f:
                for line in f:
                    try:
                        entry = json.loads(line.strip())
                        if entry.get('event') == 'analysis_complete':
                            writer.writerow({
                                'timestamp': entry.get('timestamp'),
                                'event': entry.get('event'),
                                'session_id': entry.get('session_id'),
                                'client': entry.get('client'),
                                'profile': entry.get('profile'),
                                'user_email': entry.get('user_email'),
                                'checks_completed': entry.get('checks_completed'),
                                'overall_score': entry.get('overall_score'),
                                'estimated_cost_usd': entry.get('estimated_cost_usd')
                            })
                    except:
                        continue

        # Return as downloadable CSV
        output.seek(0)
        return Response(
            output.getvalue(),
            mimetype='text/csv',
            headers={'Content-Disposition': 'attachment; filename=usage_export.csv'}
        )
    except Exception as e:
        return jsonify({
            'status': 'error',
            'message': str(e)
        }), 500

@app.route('/api/debug/test_file_upload', methods=['POST'])
@auth.require_auth
def debug_test_file_upload():
    """Debug endpoint to test file upload handling"""
    try:
        # Check if file is in request
        if 'file' not in request.files:
            return jsonify({'status': 'error', 'message': 'No file part', 'files_in_request': list(request.files.keys())}), 400

        file = request.files['file']

        # Check if file was selected
        if file.filename == '':
            return jsonify({'status': 'error', 'message': 'No selected file'}), 400

        # Get parameters
        profile = request.form.get('profile', 'general').lower()

        # Create session ID
        session_id = datetime.now().strftime('%Y%m%d_%H%M%S')

        # Check upload folder configuration
        upload_folder = app.config.get('UPLOAD_FOLDER', 'uploads')

        return jsonify({
            'status': 'success',
            'message': 'File upload test successful',
            'session_id': session_id,
            'filename': file.filename,
            'profile': profile,
            'upload_folder': upload_folder,
            'upload_folder_exists': os.path.exists(upload_folder),
            'form_data': dict(request.form),
            'files': list(request.files.keys())
        })

    except Exception as e:
        import traceback
        return jsonify({
            'status': 'error',
            'message': str(e),
            'traceback': traceback.format_exc()
        }), 500

# Initialize application
if not qc_apps:
    load_qc_apps()
    print(f"Initialized app with {len(qc_apps)} QC apps")
    print(f"Brand Guidelines DB initialized: {len(brand_db.get_all_brands())} brands")

# Backfill: process any existing unprocessed PDF guidelines
def _backfill_unprocessed_pdfs():
    import threading
    unprocessed = []
    for file_id, record in brand_db.db.get("files", {}).items():
        if record.get("file_type") == ".pdf" and not record.get("processed"):
            stored_path = record.get("stored_path", "")
            if stored_path and os.path.exists(stored_path):
                unprocessed.append((file_id, stored_path, record.get("brand_name", ""), str(brand_db.files_dir)))

    if unprocessed:
        print(f"Found {len(unprocessed)} unprocessed PDF guidelines - starting background processing")
        def _process_all():
            for fid, spath, bname, fdir in unprocessed:
                try:
                    from pdf_processor import process_pdf_guideline
                    result = process_pdf_guideline(spath, fid, bname, fdir)
                    brand_db.update_file_record(fid, result)
                    print(f"Backfill complete for {fid}")
                except Exception as e:
                    print(f"Backfill failed for {fid}: {e}")
                    brand_db.update_file_record(fid, {'processed': 'error', 'processing_error': str(e)})
        threading.Thread(target=_process_all, daemon=True).start()

_backfill_unprocessed_pdfs()

# When run directly
if __name__ == "__main__":
    import argparse

    # Get default port from environment, fallback to 7183
    default_port = int(os.environ.get('PORT', 7183))
    default_debug = debug_mode  # Use the debug setting from environment

    parser = argparse.ArgumentParser(description='Run Visual AI QC API server')
    parser.add_argument('--host', type=str, default='0.0.0.0', help='Host to bind to')
    parser.add_argument('--port', type=int, default=default_port, help=f'Port to listen on (default: {default_port} from environment)')
    parser.add_argument('--debug', action='store_true', default=default_debug, help=f'Run in debug mode (default: {default_debug} from environment)')

    args = parser.parse_args()

    print(f"Environment: {current_environment}")
    print(f"Starting Flask API server on {args.host}:{args.port}")
    print(f"Debug mode: {args.debug}")
    app.run(host=args.host, port=args.port, debug=args.debug)