Spaces:

shiva0013
/

pdftools

Sleeping

File size: 104,422 Bytes

"""
LocalTools Server - PDF Editor & Image Scraper
FastAPI backend with async operations, logging, and cleanup
"""

import asyncio
import io
import json
import logging
import re
import uuid
import zipfile
from contextlib import asynccontextmanager
from datetime import datetime, timedelta
from pathlib import Path
from typing import Optional, List
from urllib.parse import urljoin, urlparse

import aiohttp
import fitz  # PyMuPDF
from PIL import Image
from pydantic import BaseModel, Field, HttpUrl
from pydantic_settings import BaseSettings

from fastapi import FastAPI, HTTPException, UploadFile, File, Form, BackgroundTasks
from fastapi.responses import FileResponse, HTMLResponse, JSONResponse
from fastapi.staticfiles import StaticFiles
from fastapi.middleware.cors import CORSMiddleware


# =============== Configuration ===============

class Settings(BaseSettings):
    """Application settings with environment variable support.

    Built on pydantic-settings' ``BaseSettings`` with the environment prefix
    ``LOCALTOOLS_`` (see ``Config.env_prefix``). The values below are the
    defaults used when nothing overrides them.
    """
    app_name: str = "LocalTools"  # used as the FastAPI title and in the startup log line
    debug: bool = False  # selects DEBUG instead of INFO as the root log level
    
    # Paths (each is joined onto the directory that contains this file)
    work_dir: str = "work"
    output_dir: str = "outputs"
    static_dir: str = "static"
    
    # Limits
    max_pdf_size_mb: int = 100  # checked by validate_pdf_upload()
    max_image_size_mb: int = 50  # NOTE(review): not referenced in the visible code - confirm it is enforced
    min_image_dimension: int = 50  # scraped images narrower or shorter than this (pixels) are dropped
    request_timeout: int = 60  # passed as aiohttp.ClientTimeout(total=...), i.e. seconds
    
    # Cleanup
    cleanup_interval_hours: int = 24  # pause between runs of periodic_cleanup()
    file_retention_hours: int = 48  # files with an older mtime are deleted by cleanup_old_files()
    
    class Config:
        # Prefix applied to the environment variable names of the fields above.
        env_prefix = "LOCALTOOLS_"


# Single settings instance, built once at import time and shared by the module.
settings = Settings()


# =============== Logging Setup ===============

# Root logging configuration: DEBUG when settings.debug is true, INFO otherwise.
logging.basicConfig(
    level=logging.DEBUG if settings.debug else logging.INFO,
    format="%(asctime)s | %(levelname)-8s | %(name)s | %(message)s",
    datefmt="%Y-%m-%d %H:%M:%S"
)
# Logger used by every function in this module.
logger = logging.getLogger("localtools")


# =============== Path Setup ===============

# All directories are resolved relative to the directory holding this file.
APP_DIR = Path(__file__).parent
STATIC_DIR = APP_DIR / settings.static_dir
WORK_DIR = APP_DIR / settings.work_dir
OUT_DIR = APP_DIR / settings.output_dir
SCRAPE_DIR = WORK_DIR / "scrape_jobs"  # one sub-directory per scrape job

# Create the writable directories at import time. WORK_DIR comes before
# SCRAPE_DIR in the list, so the parent exists when the child is created.
# STATIC_DIR is not created here.
for directory in [WORK_DIR, OUT_DIR, SCRAPE_DIR]:
    directory.mkdir(exist_ok=True)


# =============== Constants ===============

# Default headers for the aiohttp sessions opened in the visible code.
UA_HEADERS = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36"
}

# Image MIME types. NOTE(review): not referenced in the visible part of the file.
ALLOWED_IMAGE_TYPES = {"image/jpeg", "image/png", "image/gif", "image/webp", "image/bmp"}


# =============== Response Models ===============

class ScrapeResult(BaseModel):
    """Shape of a scrape result.

    The field names match the keys of the dict returned by ``scrape_images``.
    NOTE(review): no visible route declares this as its ``response_model``.
    """
    job_id: str  # identifier of the scrape job directory
    images: List[dict]  # one metadata dict per stored image
    total_found: int  # number of unique image URLs discovered
    filtered_count: int  # images dropped for being below the minimum dimension


class HealthResponse(BaseModel):
    """Response body of the ``/api/health`` endpoint."""
    status: str  # the health endpoint sends "healthy"
    version: str = "1.0.0"
    uptime_seconds: float  # seconds elapsed since ``startup_time``


# =============== Cleanup Task ===============

# Moment this module was imported; the health endpoint derives uptime from it.
startup_time = datetime.now()

async def cleanup_old_files():
    """Remove files and scrape jobs older than the retention period.

    Deletes regular files directly inside ``WORK_DIR`` and ``OUT_DIR`` and
    whole job directories inside ``SCRAPE_DIR`` whose modification time is
    older than ``settings.file_retention_hours``.

    Cleanup is best effort: a path that cannot be inspected or removed
    (for example because it vanished while the scan was running) is logged
    as a warning and skipped, and the scan continues with the next entry.
    """
    # Local import: shutil is not part of this module's import header.
    import shutil

    cutoff = datetime.now() - timedelta(hours=settings.file_retention_hours)
    removed = 0

    def is_expired(path: Path) -> bool:
        # stat() can raise OSError if the path disappears; callers guard it.
        return datetime.fromtimestamp(path.stat().st_mtime) < cutoff

    for directory in (WORK_DIR, OUT_DIR):
        for file_path in directory.glob("*"):
            try:
                if file_path.is_file() and is_expired(file_path):
                    file_path.unlink()
                    removed += 1
            except OSError as e:
                logger.warning(f"Failed to remove {file_path}: {e}")

    # Clean old scrape jobs
    for job_dir in SCRAPE_DIR.glob("*"):
        try:
            if job_dir.is_dir() and is_expired(job_dir):
                # rmtree also copes with nested content, which a flat
                # unlink-then-rmdir pass cannot remove.
                shutil.rmtree(job_dir)
                removed += 1
        except OSError as e:
            logger.warning(f"Failed to remove job {job_dir}: {e}")

    if removed > 0:
        logger.info(f"Cleanup: removed {removed} old files/directories")


async def periodic_cleanup():
    """Run cleanup periodically, forever.

    Sleeps ``settings.cleanup_interval_hours`` between runs. An unexpected
    error in one run is logged and does not end the loop; cancellation
    (``asyncio.CancelledError``) still propagates so the task can be stopped.
    """
    while True:
        await asyncio.sleep(settings.cleanup_interval_hours * 3600)
        try:
            await cleanup_old_files()
        except Exception:
            # Keep the background task alive; the next interval retries.
            logger.exception("Periodic cleanup failed")


# =============== Lifespan ===============

@asynccontextmanager
async def lifespan(app: FastAPI):
    """Startup and shutdown events.

    On startup: launches the periodic cleanup task and runs one cleanup
    immediately. On shutdown (or if startup itself fails): cancels the
    background task and waits for it to finish before returning.
    """
    logger.info(f"Starting {settings.app_name}")

    # Start cleanup task
    cleanup_task = asyncio.create_task(periodic_cleanup())

    try:
        # Run initial cleanup
        await cleanup_old_files()

        yield
    finally:
        # Shutdown: cancel and then await, so the task is really finished
        # and its outcome is consumed instead of being left pending.
        cleanup_task.cancel()
        try:
            await cleanup_task
        except asyncio.CancelledError:
            pass
        except Exception:
            logger.exception("Cleanup task ended with an error")
        logger.info("Shutting down")


# =============== App Setup ===============

# The ASGI application object; `lifespan` supplies the startup/shutdown logic.
app = FastAPI(
    title=settings.app_name,
    description="PDF Editor & Image Scraper API",
    version="1.0.0",
    lifespan=lifespan
)

# CORS middleware
# NOTE(review): every origin, method and header is allowed - confirm this is
# intended for the deployment target.
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],
    allow_methods=["*"],
    allow_headers=["*"],
)

# Static files
# Serves the contents of STATIC_DIR under the /static URL prefix.
app.mount("/static", StaticFiles(directory=str(STATIC_DIR)), name="static")


# =============== PDF Helpers ===============

def to_points(value: float, unit: str) -> float:
    """Convert a length in the given unit to PDF points (72 per inch).

    The unit name is matched case-insensitively after trimming whitespace.
    Raises ValueError when the unit is not one of the known names.
    """
    points_per_cm = 72.0 / 2.54
    points_per_mm = 72.0 / 25.4
    aliases = (
        (("pt", "points"), 1.0),
        (("in", "inch", "inches"), 72.0),
        (("cm", "centimeter", "centimeters"), points_per_cm),
        (("mm", "millimeter", "millimeters"), points_per_mm),
    )
    factor_by_name = {name: factor for names, factor in aliases for name in names}

    key = unit.lower().strip()
    factor = factor_by_name.get(key)
    if factor is None:
        raise ValueError(f"Invalid unit: {unit}. Use: pt, in, cm, or mm")

    return float(value) * factor


def parse_page_spec(spec: str, total_pages: int) -> set[int]:
    """
    Parse page specification string to set of 0-based page indices.
    Input: "1,3,5" or "2-6" or "1,3-5,9" (1-based)
    Output: Set of 0-based indices

    Spaces are ignored, reversed ranges ("5-3") are accepted, and page
    numbers outside 1..total_pages are dropped. Parts that are not numbers
    are logged and skipped. Ranges are clamped to the document before they
    are expanded, so an input like "1-999999999999" costs no more than
    total_pages iterations.
    """
    spec = (spec or "").strip().replace(" ", "")
    if not spec:
        return set()

    result: set[int] = set()
    for part in spec.split(","):
        if not part:
            continue

        try:
            if "-" in part:
                start_str, end_str = part.split("-", 1)
                start, end = int(start_str), int(end_str)
                if start > end:
                    start, end = end, start
                # Clamp first, then expand: the loop bound must depend on
                # the document size, never on the user-supplied numbers.
                first = max(start, 1)
                last = min(end, total_pages)
                result.update(range(first - 1, last))
            else:
                p = int(part)
                if 1 <= p <= total_pages:
                    result.add(p - 1)
        except ValueError:
            logger.warning(f"Invalid page spec part: {part}")
            continue

    return result


def extract_drive_file_id(url: str) -> Optional[str]:
    """Return the Google Drive file ID found in *url*, or None.

    Two URL shapes are tried in order: a ``/file/d/<ID>`` path segment,
    then an ``id=<ID>`` query parameter.
    """
    attempts = (
        re.search(expression, url)
        for expression in (r"/file/d/([^/]+)", r"[?&]id=([^&]+)")
    )
    hit = next((found for found in attempts if found), None)
    return hit.group(1) if hit else None


async def _read_body_limited(resp: aiohttp.ClientResponse, max_mb: int) -> bytes:
    """Read a response body, raising ValueError once it exceeds *max_mb* MiB."""
    max_bytes = max_mb * 1024 * 1024
    too_large = f"File too large. Maximum size: {max_mb}MB"

    # Cheap early exit when the server announces the size up front.
    declared = resp.content_length
    if declared is not None and declared > max_bytes:
        raise ValueError(too_large)

    # Content-Length may be absent or wrong, so the actual bytes are counted.
    chunks = []
    received = 0
    async for chunk in resp.content.iter_chunked(64 * 1024):
        received += len(chunk)
        if received > max_bytes:
            raise ValueError(too_large)
        chunks.append(chunk)
    return b"".join(chunks)


async def download_from_url(url: str, out_path: Path, is_drive: bool = False) -> Path:
    """Download a PDF from *url* with aiohttp and store it at *out_path*.

    Args:
        url: Source URL. With ``is_drive`` it must contain a Google Drive
            file ID, which is turned into a direct-download URL.
        out_path: Destination file; parent directories are created.
        is_drive: Treat *url* as a Google Drive sharing link.

    Returns:
        *out_path*, after the file has been written.

    Raises:
        ValueError: invalid Drive URL, body larger than
            ``settings.max_pdf_size_mb`` (the same limit uploads are held
            to), or content that does not start with the PDF signature.
        aiohttp.ClientError: transport failures and non-2xx responses.
    """
    timeout = aiohttp.ClientTimeout(total=settings.request_timeout)
    limit_mb = settings.max_pdf_size_mb

    async with aiohttp.ClientSession(timeout=timeout, headers=UA_HEADERS) as session:
        if is_drive:
            file_id = extract_drive_file_id(url)
            if not file_id:
                raise ValueError("Invalid Google Drive URL. Use format: /file/d/<ID>/view")

            download_url = f"https://drive.google.com/uc?export=download&id={file_id}"

            async with session.get(download_url) as resp:
                resp.raise_for_status()

                # Check for confirmation token (large files): Drive sets a
                # "download_warning..." cookie whose value must be echoed back.
                confirm_token = None
                for key, cookie in resp.cookies.items():
                    if key.startswith("download_warning"):
                        confirm_token = cookie.value
                        break

                if confirm_token:
                    download_url = f"{download_url}&confirm={confirm_token}"
                    async with session.get(download_url) as resp2:
                        resp2.raise_for_status()
                        content = await _read_body_limited(resp2, limit_mb)
                else:
                    content = await _read_body_limited(resp, limit_mb)
        else:
            async with session.get(url) as resp:
                resp.raise_for_status()
                content = await _read_body_limited(resp, limit_mb)

    # Validate PDF
    if not content.startswith(b"%PDF-"):
        # An HTML page instead of a PDF usually means a login/permission wall.
        head = content[:1000].lower()
        if b"<html" in head or b"sign in" in head:
            raise ValueError("Access denied. For Drive files, set sharing to 'Anyone with link'")
        raise ValueError("Downloaded file is not a valid PDF")

    out_path.parent.mkdir(parents=True, exist_ok=True)
    out_path.write_bytes(content)

    logger.info(f"Downloaded PDF: {out_path.name} ({len(content)} bytes)")
    return out_path


def validate_pdf_upload(data: bytes) -> None:
    """Check uploaded bytes: non-empty, within the size limit, PDF signature.

    Raises ValueError describing the first check that fails.
    """
    if not data:
        raise ValueError("Empty file uploaded")

    limit_bytes = settings.max_pdf_size_mb * 1024 * 1024
    if len(data) > limit_bytes:
        raise ValueError(f"File too large. Maximum size: {settings.max_pdf_size_mb}MB")

    has_pdf_signature = data[:5] == b"%PDF-"
    if not has_pdf_signature:
        raise ValueError("Invalid PDF file")


def add_text_watermark(page: fitz.Page, text: str, font_size: float, rotate: int) -> None:
    """Add a centred, semi-transparent text watermark to a PDF page.

    The text is laid out in a box inset 5% from every page edge.

    Args:
        page: Page to draw on (modified in place).
        text: Watermark text; blank text is a no-op.
        font_size: Font size in points.
        rotate: Rotation in degrees. Multiples of 90 use the text box's
            native ``rotate`` option; any other angle (such as the API
            default of 45) is applied by morphing around the box centre,
            because ``insert_textbox`` only accepts multiples of 90 for
            ``rotate``.
    """
    if not text.strip():
        return

    rect = page.rect
    box = fitz.Rect(
        rect.x0 + rect.width * 0.05,
        rect.y0 + rect.height * 0.05,
        rect.x1 - rect.width * 0.05,
        rect.y1 - rect.height * 0.05,
    )

    angle = int(rotate)
    options = {
        "fontsize": float(font_size),
        "align": fitz.TEXT_ALIGN_CENTER,
        "overlay": True,
    }
    if angle % 90 == 0:
        options["rotate"] = angle
    else:
        # NOTE(review): direction of a positive angle via morph should match
        # `rotate` (anti-clockwise) - confirm visually on a sample page.
        pivot = fitz.Point((box.x0 + box.x1) / 2, (box.y0 + box.y1) / 2)
        options["morph"] = (pivot, fitz.Matrix(angle))

    try:
        page.insert_textbox(
            box, text,
            color=(0.55, 0.55, 0.55),
            fill_opacity=0.18,
            stroke_opacity=0.18,
            **options,
        )
    except TypeError:
        # Fallback for older PyMuPDF versions without the opacity keywords:
        # a lighter grey stands in for transparency.
        page.insert_textbox(
            box, text,
            color=(0.75, 0.75, 0.75),
            **options,
        )


def process_pdf(
    input_path: Path,
    output_path: Path,
    remove_pages: str,
    crop_top: float,
    crop_bottom: float,
    crop_left: float,
    crop_right: float,
    unit: str,
    watermark_text: str,
    watermark_size: float,
    watermark_rotate: int,
) -> dict:
    """Process PDF with cropping, page removal, and watermark.

    Args:
        input_path: Source PDF.
        output_path: Destination PDF; parent directories are created.
        remove_pages: 1-based page spec (see ``parse_page_spec``).
        crop_top, crop_bottom, crop_left, crop_right: Amount trimmed from
            each edge, expressed in *unit*.
        unit: Unit of the crop values (see ``to_points``).
        watermark_text: Text stamped on every kept page; blank disables it.
        watermark_size: Watermark font size.
        watermark_rotate: Watermark rotation in degrees.

    Returns:
        Dict with ``original_pages``, ``output_pages`` and ``removed_pages``.

    Raises:
        ValueError: unknown unit, a crop that leaves no usable page area,
            or a page spec that removes every page.

    Both documents are closed on every exit path, including errors.
    """
    src = fitz.open(str(input_path))
    out = None
    try:
        total = src.page_count
        remove_set = parse_page_spec(remove_pages, total)

        # Convert crop values to points
        top = to_points(crop_top, unit)
        bottom = to_points(crop_bottom, unit)
        left = to_points(crop_left, unit)
        right = to_points(crop_right, unit)

        out = fitz.open()
        kept = 0

        for i in range(total):
            if i in remove_set:
                continue

            # Copy one page, then edit the copy that was just appended.
            out.insert_pdf(src, from_page=i, to_page=i)
            page = out.load_page(out.page_count - 1)

            rect = page.rect
            crop_rect = fitz.Rect(
                rect.x0 + left, rect.y0 + top, rect.x1 - right, rect.y1 - bottom
            )

            if crop_rect.is_empty or crop_rect.width <= 2 or crop_rect.height <= 2:
                raise ValueError(f"Invalid crop on page {i+1}. Reduce crop values.")

            page.set_cropbox(crop_rect)

            if watermark_text.strip():
                add_text_watermark(page, watermark_text, watermark_size, watermark_rotate)

            kept += 1

        if kept == 0:
            raise ValueError("All pages removed. Output would be empty.")

        output_path.parent.mkdir(parents=True, exist_ok=True)
        out.save(str(output_path))
    finally:
        if out is not None:
            out.close()
        src.close()

    logger.info(f"Processed PDF: {kept}/{total} pages kept")

    return {
        "original_pages": total,
        "output_pages": kept,
        "removed_pages": len(remove_set)
    }


# =============== Image Scraper Helpers ===============

def normalize_url(url: str) -> str:
    """Return *url* re-serialised without its ``#fragment`` part."""
    pieces = urlparse(url)
    without_fragment = pieces._replace(fragment="")
    return without_fragment.geturl()


def best_from_srcset(srcset: str, base_url: str) -> Optional[str]:
    """Pick the highest-ranked candidate URL from a ``srcset`` value.

    Width descriptors ("640w") rank by their number, density descriptors
    ("2x") by their number times 10000, anything else ranks 0. Among equal
    ranks the earliest candidate wins. URLs are resolved against *base_url*.
    Returns None when there is no candidate.
    """
    if not srcset:
        return None

    def rank(tokens: list) -> float:
        # Rank comes from the second token only; a missing or malformed
        # descriptor leaves the candidate at 0.
        if len(tokens) < 2:
            return 0.0
        descriptor = tokens[1].lower().strip()
        try:
            if descriptor.endswith("w"):
                return float(descriptor[:-1])
            if descriptor.endswith("x"):
                return float(descriptor[:-1]) * 10000.0
        except ValueError:
            pass
        return 0.0

    ranked = []
    for chunk in srcset.split(","):
        tokens = chunk.split()
        if tokens:
            ranked.append((rank(tokens), urljoin(base_url, tokens[0])))

    if not ranked:
        return None

    # Stable descending sort keeps the first of any tied candidates in front.
    ordered = sorted(ranked, key=lambda pair: pair[0], reverse=True)
    return ordered[0][1]


def safe_filename(url: str, fallback: str) -> str:
    """Derive a filesystem-safe file name from the path of *url*.

    Falls back to *fallback* when the URL path has no final component,
    replaces every run of characters outside ``[a-zA-Z0-9._-]`` with "_",
    appends ".jpg" when the name contains no dot, and caps the result at
    120 characters.
    """
    last_segment = Path(urlparse(url).path).name
    candidate = last_segment if last_segment else fallback
    cleaned = re.sub(r"[^a-zA-Z0-9._-]+", "_", candidate)

    if "." not in cleaned:
        cleaned = cleaned + ".jpg"

    return cleaned[:120]


async def fetch_image(session: aiohttp.ClientSession, img_url: str) -> tuple[bytes, Optional[int], Optional[int], Optional[str]]:
    """Fetch an image and return its bytes together with its dimensions.

    Returns:
        ``(data, width, height, content_type)``. Width and height are None
        when Pillow cannot read the data as an image.

    Raises:
        ValueError: the body is larger than ``settings.max_image_size_mb``.
        aiohttp.ClientError: transport failures and non-2xx responses.
    """
    max_bytes = settings.max_image_size_mb * 1024 * 1024
    too_large = f"Image too large. Maximum size: {settings.max_image_size_mb}MB"

    async with session.get(img_url) as resp:
        resp.raise_for_status()
        content_type = resp.headers.get("Content-Type", "")

        # Reject early when the server announces an oversized body ...
        declared = resp.content_length
        if declared is not None and declared > max_bytes:
            raise ValueError(too_large)

        # ... and count real bytes, since the header may be absent or wrong.
        chunks = []
        received = 0
        async for chunk in resp.content.iter_chunked(64 * 1024):
            received += len(chunk)
            if received > max_bytes:
                raise ValueError(too_large)
            chunks.append(chunk)
        data = b"".join(chunks)

    width = height = None
    try:
        with Image.open(io.BytesIO(data)) as img:
            width, height = img.size
    except Exception as e:
        # Best effort: unreadable data is still returned, just without size.
        logger.debug(f"Could not read image dimensions for {img_url}: {e}")

    return data, width, height, content_type


# Matches one whole <img ...> tag; attributes are searched inside the tag text.
_IMG_TAG_RE = re.compile(r'<img[^>]+>', re.IGNORECASE)

# Attributes that may carry an image URL (lazy-loading variants and standard ones).
_IMG_URL_ATTRS = ("data-src", "data-original", "data-lazy-src", "data-url", "data-image", "data-srcset", "srcset", "src")

# One compiled pattern per attribute. The lookbehind stops "src" and "srcset"
# from matching inside "data-src" / "data-srcset", which would otherwise hide
# the tag's real src value behind the lazy-loading one.
_IMG_ATTR_RES = {
    attr: re.compile(rf'(?<![\w-]){re.escape(attr)}=["\']([^"\']+)["\']', re.IGNORECASE)
    for attr in _IMG_URL_ATTRS
}


def _extract_image_urls(html: str, page_url: str) -> List[str]:
    """Collect absolute candidate image URLs from every <img> tag in *html*."""
    found: List[str] = []
    for tag_match in _IMG_TAG_RE.finditer(html):
        tag = tag_match.group()
        for attr, attr_re in _IMG_ATTR_RES.items():
            attr_match = attr_re.search(tag)
            if not attr_match:
                continue
            value = attr_match.group(1)
            if "srcset" in attr:
                best = best_from_srcset(value, page_url)
                if best:
                    found.append(best)
            else:
                found.append(urljoin(page_url, value))
    return found


async def scrape_images(page_url: str) -> dict:
    """Scrape the images referenced by a web page into a new job directory.

    Downloads the page, extracts image URLs from its <img> tags with regular
    expressions, fetches them (at most 10 at a time), drops images smaller
    than ``settings.min_image_dimension`` on either side, and stores each
    remaining image as ``<id>.bin`` next to a ``meta.json`` inside
    ``SCRAPE_DIR/<job_id>``.

    Returns:
        Dict with ``job_id``, ``images`` (metadata per stored image),
        ``total_found`` (unique URLs discovered) and ``filtered_count``.

    Raises:
        ValueError: *page_url* is blank.
        aiohttp.ClientError: the page itself could not be fetched. Failures
            on individual images are logged at debug level and skipped.
    """
    page_url = page_url.strip()
    if not page_url:
        raise ValueError("Web page URL is required")

    timeout = aiohttp.ClientTimeout(total=settings.request_timeout)

    async with aiohttp.ClientSession(timeout=timeout, headers=UA_HEADERS) as session:
        # Fetch page HTML
        async with session.get(page_url) as resp:
            resp.raise_for_status()
            html = await resp.text()

        # Parse HTML (using regex for simplicity, avoiding lxml dependency issues)
        found_urls = _extract_image_urls(html, page_url)

        # Deduplicate (fragment-insensitive), keeping first-seen order
        seen = set()
        deduped = []
        for url in found_urls:
            normalized = normalize_url(url)
            if normalized not in seen and normalized.startswith("http"):
                seen.add(normalized)
                deduped.append(normalized)

        logger.info(f"Found {len(deduped)} unique image URLs on {page_url}")

        # Create job directory
        job_id = uuid.uuid4().hex[:10]
        job_dir = SCRAPE_DIR / job_id
        job_dir.mkdir(parents=True, exist_ok=True)

        filtered = 0

        async def process_image(idx: int, url: str):
            nonlocal filtered
            try:
                data, width, height, content_type = await fetch_image(session, url)

                # Filter small images (only when the size could be determined)
                if width and height:
                    if width < settings.min_image_dimension or height < settings.min_image_dimension:
                        filtered += 1
                        return None

                img_id = uuid.uuid4().hex[:10]
                filename = safe_filename(url, f"image_{idx}.jpg")

                # Save image data
                (job_dir / f"{img_id}.bin").write_bytes(data)

                return {
                    "id": img_id,
                    "url": url,
                    "filename": filename,
                    "width": width,
                    "height": height,
                    "bytes": len(data),
                }
            except Exception as e:
                # One bad image must not fail the whole scrape.
                logger.debug(f"Failed to fetch {url}: {e}")
                return None

        # Process images with concurrency limit
        semaphore = asyncio.Semaphore(10)

        async def limited_process(idx: int, url: str):
            async with semaphore:
                return await process_image(idx, url)

        tasks = [limited_process(idx, url) for idx, url in enumerate(deduped, 1)]
        results = await asyncio.gather(*tasks)

        images = [r for r in results if r is not None]

        # Save metadata
        meta = {
            "page_url": page_url,
            "scraped_at": datetime.now().isoformat(),
            "images": images
        }
        (job_dir / "meta.json").write_text(
            json.dumps(meta, ensure_ascii=False, indent=2),
            encoding="utf-8"
        )

        logger.info(f"Scraped {len(images)} images, filtered {filtered} small icons")

        return {
            "job_id": job_id,
            "images": images,
            "total_found": len(deduped),
            "filtered_count": filtered
        }


def load_scrape_job(job_id: str) -> dict:
    """Load the metadata of a scrape job.

    Args:
        job_id: Job identifier as issued by the scraper (10 lowercase hex
            characters). It arrives from the client, so anything else -
            in particular path separators or ".." - is rejected before it
            is used to build a filesystem path.

    Returns:
        The parsed content of the job's ``meta.json``.

    Raises:
        HTTPException: 404 when the id is malformed or the job does not
            exist, 500 when the metadata file cannot be read or parsed.
    """
    if not re.fullmatch(r"[0-9a-f]{10}", job_id or ""):
        raise HTTPException(status_code=404, detail="Scrape job not found. Please scrape again.")

    job_dir = SCRAPE_DIR / job_id
    meta_path = job_dir / "meta.json"

    if not job_dir.exists() or not meta_path.exists():
        raise HTTPException(status_code=404, detail="Scrape job not found. Please scrape again.")

    try:
        return json.loads(meta_path.read_text(encoding="utf-8"))
    except (OSError, ValueError) as e:
        # ValueError covers both invalid JSON and invalid UTF-8.
        logger.error(f"Failed to load job {job_id}: {e}")
        raise HTTPException(status_code=500, detail="Corrupted scrape job metadata") from e


# =============== Utility Functions ===============

def sanitize_filename(name: str, default: str = "file") -> str:
    """Return *name* reduced to characters that are safe in a file name.

    A missing name is replaced by *default*; surrounding whitespace is
    trimmed; each run of characters outside ``[a-zA-Z0-9._-]`` becomes "_";
    the result is capped at 200 characters, and *default* is returned if
    nothing is left.
    """
    raw = name if name else default
    cleaned = re.sub(r"[^a-zA-Z0-9._-]+", "_", raw.strip())
    shortened = cleaned[:200]
    return shortened if shortened else default


def generate_job_id() -> str:
    """Return a fresh job identifier: the first 10 hex digits of a random UUID."""
    full_hex = uuid.uuid4().hex
    return full_hex[:10]


# =============== API Routes ===============

@app.get("/", response_class=HTMLResponse)
async def home():
    """Return the frontend's index.html, or a 500 error if it is missing."""
    index_path = STATIC_DIR / "index.html"
    if index_path.exists():
        markup = index_path.read_text(encoding="utf-8")
        return HTMLResponse(markup)
    raise HTTPException(status_code=500, detail="Frontend not found")


@app.get("/api/health", response_model=HealthResponse)
async def health_check():
    """Report that the service is up, with the seconds elapsed since startup."""
    elapsed = datetime.now() - startup_time
    return HealthResponse(status="healthy", uptime_seconds=elapsed.total_seconds())


@app.post("/api/fetch")
async def api_fetch_pdf(
    url: str = Form(""),
    file: UploadFile = File(None),
    output_name: str = Form("original.pdf"),
):
    """Fetch/upload PDF for preview (no processing).

    Takes either an uploaded file or a URL (the upload wins when both are
    given), stores the PDF in ``WORK_DIR`` and sends it back unchanged.

    Error mapping: invalid input or a non-PDF payload -> 400, download
    failure -> 400, download timeout -> 504, anything else -> 500.
    """
    output_name = sanitize_filename(output_name, "original.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    job_id = generate_job_id()
    input_path = WORK_DIR / f"original_{job_id}.pdf"

    try:
        if file is not None and file.filename:
            data = await file.read()
            validate_pdf_upload(data)
            input_path.write_bytes(data)
            logger.info(f"Uploaded PDF: {file.filename}")
        elif url.strip():
            is_drive = "drive.google.com" in url
            await download_from_url(url, input_path, is_drive=is_drive)
        else:
            raise ValueError("Provide a PDF URL or upload a file")

    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e)) from e
    except asyncio.TimeoutError as e:
        # aiohttp's total timeout surfaces as asyncio.TimeoutError, which is
        # not an aiohttp.ClientError and would otherwise become a vague 500.
        logger.error("Download timed out")
        raise HTTPException(status_code=504, detail="Download timed out") from e
    except aiohttp.ClientError as e:
        logger.error(f"Download failed: {e}")
        raise HTTPException(status_code=400, detail=f"Download failed: {str(e)}") from e
    except Exception as e:
        logger.exception("Unexpected error in fetch")
        raise HTTPException(status_code=500, detail="Internal server error") from e

    return FileResponse(
        path=str(input_path),
        media_type="application/pdf",
        filename=output_name
    )


@app.post("/api/process")
async def api_process_pdf(
    url: str = Form(""),
    file: UploadFile = File(None),
    output_name: str = Form("cropped.pdf"),
    remove_pages: str = Form(""),
    unit: str = Form("mm"),
    top: float = Form(0),
    bottom: float = Form(0),
    left: float = Form(0),
    right: float = Form(0),
    watermark_text: str = Form(""),
    watermark_size: float = Form(36),
    watermark_rotate: int = Form(45),
):
    """Process PDF with cropping, page removal, and watermark.

    The input comes from an uploaded file or a URL (the upload wins when
    both are given); the processed PDF is written to ``OUT_DIR`` and
    returned as a download.

    Error mapping: invalid input, non-PDF payload or invalid processing
    parameters -> 400, download failure -> 400, download timeout -> 504,
    unexpected processing failure -> 500.
    """
    output_name = sanitize_filename(output_name, "cropped.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    job_id = generate_job_id()
    input_path = WORK_DIR / f"input_{job_id}.pdf"
    output_path = OUT_DIR / f"{job_id}_{output_name}"

    # Get input PDF
    try:
        if file is not None and file.filename:
            data = await file.read()
            validate_pdf_upload(data)
            input_path.write_bytes(data)
        elif url.strip():
            is_drive = "drive.google.com" in url
            await download_from_url(url, input_path, is_drive=is_drive)
        else:
            raise ValueError("Provide a PDF URL or upload a file")

    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e)) from e
    except asyncio.TimeoutError as e:
        # Not an aiohttp.ClientError, so it needs its own handler.
        logger.error("Download timed out")
        raise HTTPException(status_code=504, detail="Download timed out") from e
    except aiohttp.ClientError as e:
        raise HTTPException(status_code=400, detail=f"Download failed: {str(e)}") from e

    # Process PDF
    try:
        process_pdf(
            input_path=input_path,
            output_path=output_path,
            remove_pages=remove_pages,
            crop_top=top,
            crop_bottom=bottom,
            crop_left=left,
            crop_right=right,
            unit=unit,
            watermark_text=watermark_text,
            watermark_size=watermark_size,
            watermark_rotate=watermark_rotate,
        )
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e)) from e
    except Exception as e:
        logger.exception("PDF processing failed")
        raise HTTPException(status_code=500, detail=f"Processing failed: {str(e)}") from e

    return FileResponse(
        path=str(output_path),
        media_type="application/pdf",
        filename=output_name
    )


@app.post("/api/scrape-images")
async def api_scrape_images(page_url: str = Form(...)):
    """Scrape images from a webpage.

    Returns the dict produced by ``scrape_images`` as JSON.

    Error mapping: blank URL -> 400, page fetch failure -> 400, page fetch
    timeout -> 504, anything else -> 500.
    """
    try:
        result = await scrape_images(page_url)
        return JSONResponse(result)
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e)) from e
    except asyncio.TimeoutError as e:
        # Raised by aiohttp's total timeout; it is not an aiohttp.ClientError.
        logger.error("Timed out fetching page")
        raise HTTPException(status_code=504, detail="Timed out fetching page") from e
    except aiohttp.ClientError as e:
        raise HTTPException(status_code=400, detail=f"Failed to fetch page: {str(e)}") from e
    except Exception as e:
        logger.exception("Scrape failed")
        raise HTTPException(status_code=500, detail="Scraping failed") from e


@app.post("/api/download-zip")
async def api_download_zip(
    job_id: str = Form(...),
    image_ids: str = Form(...),
    zip_name: str = Form("images.zip")
):
    """Download selected images of a scrape job as a ZIP archive.

    Args:
        job_id: Identifier of a previous scrape job.
        image_ids: Comma-separated image ids from that job. Ids that are
            not listed in the job's metadata are ignored, so a
            client-supplied id never reaches the filesystem as a raw path
            component.
        zip_name: Download name of the archive.

    Raises:
        HTTPException: 404/500 from ``load_scrape_job``; 400 when no id is
            given or none of the ids refers to a stored image.
    """
    meta = load_scrape_job(job_id.strip())
    job_dir = SCRAPE_DIR / job_id.strip()

    # dict.fromkeys drops repeated ids while keeping the requested order.
    selected = list(dict.fromkeys(x.strip() for x in image_ids.split(",") if x.strip()))
    if not selected:
        raise HTTPException(status_code=400, detail="No images selected")

    zip_name = sanitize_filename(zip_name, "images.zip")
    if not zip_name.lower().endswith(".zip"):
        zip_name += ".zip"

    output_path = OUT_DIR / f"{generate_job_id()}_{zip_name}"
    id_to_meta = {img["id"]: img for img in meta.get("images", [])}

    written = 0
    used_names = set()
    with zipfile.ZipFile(output_path, "w", compression=zipfile.ZIP_DEFLATED) as zf:
        for img_id in selected:
            info = id_to_meta.get(img_id)
            if info is None:
                continue  # unknown id: not part of this job
            bin_path = job_dir / f"{img_id}.bin"
            if not bin_path.exists():
                continue
            filename = info.get("filename", f"{img_id}.jpg")
            # Different images can share a file name; prefix the id so that
            # every archive member stays unique.
            arcname = filename if filename not in used_names else f"{img_id}_{filename}"
            used_names.add(arcname)
            zf.write(bin_path, arcname)
            written += 1

    if written == 0:
        # Same outcome as the PDF export when nothing usable was selected.
        output_path.unlink(missing_ok=True)
        raise HTTPException(status_code=400, detail="No valid images found")

    logger.info(f"Created ZIP with {written} images")

    return FileResponse(
        path=str(output_path),
        media_type="application/zip",
        filename=zip_name
    )


@app.post("/api/download-pdf")
async def api_download_pdf(
    job_id: str = Form(...),
    image_ids: str = Form(...),
    pdf_name: str = Form("images.pdf")
):
    """Download selected images of a scrape job as a PDF, one image per page.

    Args:
        job_id: Identifier of a previous scrape job.
        image_ids: Comma-separated image ids from that job, in page order.
            Ids that are not listed in the job's metadata are ignored, so
            a client-supplied id never reaches the filesystem as a raw
            path component.
        pdf_name: Download name of the PDF.

    Raises:
        HTTPException: 404/500 from ``load_scrape_job``; 400 when no id is
            given or no selected image can be decoded.
    """
    meta = load_scrape_job(job_id.strip())
    job_dir = SCRAPE_DIR / job_id.strip()

    selected = [x.strip() for x in image_ids.split(",") if x.strip()]
    if not selected:
        raise HTTPException(status_code=400, detail="No images selected")

    pdf_name = sanitize_filename(pdf_name, "images.pdf")
    if not pdf_name.lower().endswith(".pdf"):
        pdf_name += ".pdf"

    known_ids = {img["id"] for img in meta.get("images", [])}

    # Convert images to PDF pages
    pil_pages: List[Image.Image] = []
    for img_id in selected:
        if img_id not in known_ids:
            continue  # unknown id: not part of this job
        bin_path = job_dir / f"{img_id}.bin"
        if not bin_path.exists():
            continue
        try:
            with Image.open(bin_path) as img:
                # convert() yields an independent in-memory image, so the
                # page stays usable after the source file is closed.
                pil_pages.append(img.convert("RGB"))
        except Exception as e:
            logger.warning(f"Failed to process image {img_id}: {e}")
            continue

    if not pil_pages:
        raise HTTPException(status_code=400, detail="No valid images to convert")

    output_path = OUT_DIR / f"{generate_job_id()}_{pdf_name}"

    first, *rest = pil_pages
    first.save(output_path, "PDF", save_all=True, append_images=rest)

    logger.info(f"Created PDF with {len(pil_pages)} images")

    return FileResponse(
        path=str(output_path),
        media_type="application/pdf",
        filename=pdf_name
    )


@app.post("/api/cleanup")
async def api_trigger_cleanup(background_tasks: BackgroundTasks):
    """Queue a cleanup run as a background task and acknowledge at once (admin use)."""
    background_tasks.add_task(cleanup_old_files)
    acknowledgement = {"message": "Cleanup scheduled"}
    return acknowledgement


@app.post("/api/remove-watermark")
async def api_remove_watermark(
    url: str = Form(""),
    file: UploadFile = File(None),
    output_name: str = Form("cleaned.pdf"),
    watermark_text: str = Form("Educated Nepal"),
    method: str = Form("inpaint"),
    intensity: int = Form(50),
    dpi: int = Form(120),
    quality: int = Form(70),
):
    """Remove watermark from PDF using image processing.

    The work is delegated to ``watermark_remover.remove_watermark_from_pdf``,
    imported on demand. ``dpi`` is clamped to 72..200 and ``quality`` to
    30..95 before the call. The response carries the input and output sizes
    in the ``X-Original-Size`` and ``X-Output-Size`` headers.

    Error mapping: processing module or OpenCV unavailable -> 500, invalid
    input or non-PDF payload -> 400, download failure -> 400, download
    timeout -> 504, processing failure -> 500.
    """
    try:
        from watermark_remover import remove_watermark_from_pdf, CV2_AVAILABLE

        if not CV2_AVAILABLE:
            raise HTTPException(
                status_code=500,
                detail="OpenCV not installed. Run: pip install opencv-python-headless"
            )
    except ImportError as e:
        raise HTTPException(status_code=500, detail=str(e)) from e

    output_name = sanitize_filename(output_name, "cleaned.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    job_id = generate_job_id()
    input_path = WORK_DIR / f"input_{job_id}.pdf"
    output_path = OUT_DIR / f"{job_id}_{output_name}"

    # Get input PDF
    try:
        if file is not None and file.filename:
            data = await file.read()
            validate_pdf_upload(data)
            input_path.write_bytes(data)
        elif url.strip():
            is_drive = "drive.google.com" in url
            await download_from_url(url, input_path, is_drive=is_drive)
        else:
            raise ValueError("Provide a PDF URL or upload a file")

    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e)) from e
    except asyncio.TimeoutError as e:
        # Not an aiohttp.ClientError, so it needs its own handler.
        logger.error("Download timed out")
        raise HTTPException(status_code=504, detail="Download timed out") from e
    except aiohttp.ClientError as e:
        raise HTTPException(status_code=400, detail=f"Download failed: {str(e)}") from e

    # Clamp values
    dpi = max(72, min(200, dpi))
    quality = max(30, min(95, quality))

    # Process watermark removal
    try:
        pdf_bytes = input_path.read_bytes()
        original_size = len(pdf_bytes)

        result_bytes = remove_watermark_from_pdf(
            pdf_bytes=pdf_bytes,
            watermark_text=watermark_text,
            method=method,
            intensity=intensity,
            dpi=dpi,
            jpeg_quality=quality
        )
        output_path.write_bytes(result_bytes)

        output_size = len(result_bytes)
        logger.info(f"Watermark removed: {output_name}, {original_size/1024:.0f}KB -> {output_size/1024:.0f}KB")

    except Exception as e:
        logger.exception("Watermark removal failed")
        raise HTTPException(status_code=500, detail=f"Processing failed: {str(e)}") from e

    return FileResponse(
        path=str(output_path),
        media_type="application/pdf",
        filename=output_name,
        headers={
            "X-Original-Size": str(original_size),
            "X-Output-Size": str(output_size)
        }
    )


@app.post("/api/watermark-preview")
async def api_watermark_preview(
    url: str = Form(""),
    file: UploadFile = File(None),
    page: int = Form(0),
    method: str = Form("inpaint"),
    intensity: int = Form(50),
):
    """Preview watermark removal on a single page - returns original and processed images.

    The work is delegated to ``watermark_remover.preview_single_page``,
    imported on demand. The JSON response holds the two PNG images as
    base64 strings under ``original`` and ``processed``, plus ``page``.

    Error mapping: processing module or OpenCV unavailable -> 500, invalid
    input or non-PDF payload -> 400, download failure -> 400, download
    timeout -> 504, preview failure -> 500.
    """
    try:
        from watermark_remover import preview_single_page, CV2_AVAILABLE

        if not CV2_AVAILABLE:
            raise HTTPException(status_code=500, detail="OpenCV not installed")
    except ImportError as e:
        raise HTTPException(status_code=500, detail=str(e)) from e

    # Get input PDF
    try:
        if file is not None and file.filename:
            pdf_bytes = await file.read()
            validate_pdf_upload(pdf_bytes)
        elif url.strip():
            job_id = generate_job_id()
            input_path = WORK_DIR / f"preview_{job_id}.pdf"
            is_drive = "drive.google.com" in url
            try:
                await download_from_url(url, input_path, is_drive=is_drive)
                pdf_bytes = input_path.read_bytes()
            finally:
                # Only the bytes are needed; do not leave the download
                # behind until the next scheduled cleanup.
                input_path.unlink(missing_ok=True)
        else:
            raise ValueError("Provide a PDF URL or upload a file")

    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e)) from e
    except asyncio.TimeoutError as e:
        # Not an aiohttp.ClientError, so it needs its own handler.
        logger.error("Download timed out")
        raise HTTPException(status_code=504, detail="Download timed out") from e
    except aiohttp.ClientError as e:
        # Same mapping as the other PDF endpoints.
        raise HTTPException(status_code=400, detail=f"Download failed: {str(e)}") from e

    # Generate preview
    try:
        import base64
        original_png, processed_png = preview_single_page(
            pdf_bytes=pdf_bytes,
            page_num=page,
            method=method,
            intensity=intensity,
            dpi=100
        )

        return JSONResponse({
            "original": base64.b64encode(original_png).decode(),
            "processed": base64.b64encode(processed_png).decode(),
            "page": page
        })

    except Exception as e:
        logger.exception("Preview generation failed")
        raise HTTPException(status_code=500, detail=f"Preview failed: {str(e)}") from e


# =============== Images to PDF ===============

@app.post("/api/images-to-pdf")
async def api_images_to_pdf(
    files: List[UploadFile] = File(...),
    order: str = Form(""),
    output_name: str = Form("images.pdf"),
    page_size: str = Form("a4"),
    margin: int = Form(20),
):
    """Convert multiple images to a single PDF, optionally re-ordered.

    Args:
        files: Uploaded images; files that cannot be decoded are skipped.
        order: Comma-separated zero-based indices into ``files``. Indices
            outside the list are dropped; an unparsable value keeps the
            upload order.
        output_name: Download filename (``.pdf`` is appended if missing).
        page_size: ``a4``, ``letter``, ``a3`` (sizes in points) or ``fit``
            to make every page the size of its image. Unknown values fall
            back to A4.
        margin: Border in points around the image on fixed-size pages.

    Returns:
        FileResponse streaming the generated PDF.

    Raises:
        HTTPException: 400 when no usable image is supplied or the margin
            leaves no drawable area; 500 on any other failure.
    """
    if not files:
        raise HTTPException(status_code=400, detail="No images provided")

    output_name = sanitize_filename(output_name, "images.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    # Parse order if provided (comma-separated indices)
    ordered_files = files
    if order.strip():
        try:
            indices = [int(i.strip()) for i in order.split(",")]
            ordered_files = [files[i] for i in indices if 0 <= i < len(files)]
        except ValueError:
            ordered_files = files

    # Fixed page sizes in points ("fit" is handled separately)
    page_sizes = {
        "a4": (595, 842),
        "letter": (612, 792),
        "a3": (842, 1191),
    }

    fit_to_image = page_size == "fit"
    if not fit_to_image:
        page_w, page_h = page_sizes.get(page_size, page_sizes["a4"])
        available_w = page_w - 2 * margin
        available_h = page_h - 2 * margin
        # A non-positive drawing area would yield a zero/negative scale and
        # an invalid rectangle further down; reject it as a client error.
        if available_w <= 0 or available_h <= 0:
            raise HTTPException(
                status_code=400,
                detail="Margin too large for the selected page size",
            )

    try:
        pil_images = []
        for f in ordered_files:
            data = await f.read()
            try:
                img = Image.open(io.BytesIO(data))
                # Image.open is lazy: force decoding here so corrupt files
                # are skipped instead of failing the whole request later.
                img.load()
                # Keep only modes both writers below can encode; anything
                # else (RGBA, P, LA, I, F, ...) is flattened to RGB.
                if img.mode not in ("1", "L", "RGB", "CMYK"):
                    img = img.convert("RGB")
                pil_images.append(img)
            except Exception as e:
                logger.warning(f"Skipping invalid image {f.filename}: {e}")
                continue

        if not pil_images:
            raise HTTPException(status_code=400, detail="No valid images found")

        # Create PDF
        output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"

        if fit_to_image:
            # Each page takes the size of its image
            first, *rest = pil_images
            first.save(output_path, "PDF", save_all=True, append_images=rest)
        else:
            doc = fitz.open()
            try:
                for img in pil_images:
                    # Embed the image as JPEG
                    img_buffer = io.BytesIO()
                    img.save(img_buffer, format='JPEG', quality=90)

                    page = doc.new_page(width=page_w, height=page_h)

                    # Scale to fit inside the margins, keeping aspect ratio
                    img_w, img_h = img.size
                    scale = min(available_w / img_w, available_h / img_h)
                    new_w = img_w * scale
                    new_h = img_h * scale

                    # Center on page
                    x = (page_w - new_w) / 2
                    y = (page_h - new_h) / 2

                    rect = fitz.Rect(x, y, x + new_w, y + new_h)
                    page.insert_image(rect, stream=img_buffer.getvalue())

                doc.save(str(output_path))
            finally:
                doc.close()

        logger.info(f"Created PDF from {len(pil_images)} images")

        return FileResponse(
            path=str(output_path),
            media_type="application/pdf",
            filename=output_name
        )

    except HTTPException:
        # Deliberate client errors must not be rewrapped as 500
        raise
    except Exception as e:
        logger.exception("Images to PDF failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Merge PDFs ===============

@app.post("/api/merge-pdf")
async def api_merge_pdf(
    files: List[UploadFile] = File(...),
    order: str = Form(""),
    output_name: str = Form("merged.pdf"),
):
    """Merge multiple PDFs into one.

    Args:
        files: At least two uploaded files. Uploads whose content does not
            start with the ``%PDF-`` signature are skipped with a warning.
        order: Comma-separated zero-based indices into ``files``. Indices
            outside the list are dropped; an unparsable value keeps the
            upload order.
        output_name: Download filename (``.pdf`` is appended if missing).

    Returns:
        FileResponse streaming the merged PDF.

    Raises:
        HTTPException: 400 when fewer than two files are uploaded or none
            of them contributes a page; 500 on any other failure.
    """
    if not files or len(files) < 2:
        raise HTTPException(status_code=400, detail="At least 2 PDF files required")

    output_name = sanitize_filename(output_name, "merged.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    # Parse order if provided
    ordered_files = files
    if order.strip():
        try:
            indices = [int(i.strip()) for i in order.split(",")]
            ordered_files = [files[i] for i in indices if 0 <= i < len(files)]
        except ValueError:
            ordered_files = files

    try:
        output_doc = fitz.open()
        try:
            total_pages = 0
            merged_files = 0

            for f in ordered_files:
                data = await f.read()
                if not data.startswith(b"%PDF-"):
                    logger.warning(f"Skipping non-PDF file: {f.filename}")
                    continue

                src_doc = fitz.open(stream=data, filetype="pdf")
                try:
                    output_doc.insert_pdf(src_doc)
                    total_pages += len(src_doc)
                finally:
                    src_doc.close()
                merged_files += 1

            if total_pages == 0:
                raise HTTPException(status_code=400, detail="No valid PDF files found")

            output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"
            output_doc.save(str(output_path), deflate=True)
        finally:
            output_doc.close()

        # Report the files actually merged, not the ones merely uploaded
        logger.info(f"Merged {merged_files} PDFs, {total_pages} total pages")

        return FileResponse(
            path=str(output_path),
            media_type="application/pdf",
            filename=output_name
        )

    except HTTPException:
        # Deliberate client errors must not be rewrapped as 500
        raise
    except Exception as e:
        logger.exception("PDF merge failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Split PDF ===============

@app.post("/api/split-pdf")
async def api_split_pdf(
    file: UploadFile = File(...),
    mode: str = Form("all"),
    pages: str = Form(""),
    output_name: str = Form("split"),
):
    """
    Split an uploaded PDF into several files, or extract a subset of pages.

    Modes:
        'all'    - one single-page PDF per page, returned as a ZIP archive.
        'range'  - the pages selected by ``pages`` (interpreted by
                   ``parse_page_spec``), in ascending order, as one PDF.
        'chunks' - consecutive groups of N pages, returned as a ZIP archive.
                   N is ``int(pages)``; empty, unparsable or values below 1
                   are treated as 1.

    Raises:
        HTTPException: 400 for an unknown mode or a 'range' request that
            selects no pages; 500 on any other failure.
    """
    data = await file.read()
    validate_pdf_upload(data)

    output_name = sanitize_filename(output_name, "split")

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        # The finally below releases the source document on every exit
        # path, including the 400 responses raised inside the branches.
        try:
            total_pages = len(src_doc)

            if mode == "all":
                # Split into individual pages
                zip_path = OUT_DIR / f"{generate_job_id()}_{output_name}.zip"

                with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zf:
                    for i in range(total_pages):
                        page_doc = fitz.open()
                        try:
                            page_doc.insert_pdf(src_doc, from_page=i, to_page=i)
                            zf.writestr(
                                f"{output_name}_page_{i+1}.pdf",
                                page_doc.tobytes(),
                            )
                        finally:
                            page_doc.close()

                logger.info(f"Split PDF into {total_pages} individual pages")

                return FileResponse(
                    path=str(zip_path),
                    media_type="application/zip",
                    filename=f"{output_name}_pages.zip"
                )

            if mode == "range":
                # Extract specific pages
                page_set = parse_page_spec(pages, total_pages)
                if not page_set:
                    raise HTTPException(status_code=400, detail="No valid pages specified")

                output_path = OUT_DIR / f"{generate_job_id()}_{output_name}.pdf"
                output_doc = fitz.open()
                try:
                    for i in sorted(page_set):
                        output_doc.insert_pdf(src_doc, from_page=i, to_page=i)
                    output_doc.save(str(output_path))
                finally:
                    output_doc.close()

                logger.info(f"Extracted {len(page_set)} pages from PDF")

                return FileResponse(
                    path=str(output_path),
                    media_type="application/pdf",
                    filename=f"{output_name}.pdf"
                )

            if mode == "chunks":
                # Split into chunks of N pages
                try:
                    chunk_size = max(1, int(pages)) if pages else 1
                except ValueError:
                    chunk_size = 1

                zip_path = OUT_DIR / f"{generate_job_id()}_{output_name}.zip"

                chunk_count = 0
                with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zf:
                    starts = range(0, total_pages, chunk_size)
                    for chunk_count, start in enumerate(starts, start=1):
                        # Last chunk may be shorter than chunk_size
                        end = min(start + chunk_size - 1, total_pages - 1)

                        chunk_doc = fitz.open()
                        try:
                            chunk_doc.insert_pdf(src_doc, from_page=start, to_page=end)
                            zf.writestr(
                                f"{output_name}_part_{chunk_count}.pdf",
                                chunk_doc.tobytes(),
                            )
                        finally:
                            chunk_doc.close()

                logger.info(f"Split PDF into {chunk_count} chunks of {chunk_size} pages")

                return FileResponse(
                    path=str(zip_path),
                    media_type="application/zip",
                    filename=f"{output_name}_parts.zip"
                )

            raise HTTPException(status_code=400, detail="Invalid split mode")
        finally:
            src_doc.close()

    except HTTPException:
        raise
    except Exception as e:
        logger.exception("PDF split failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== PDF to Images ===============

@app.post("/api/pdf-to-images")
async def api_pdf_to_images(
    file: UploadFile = File(...),
    format: str = Form("png"),
    dpi: int = Form(200),
    pages: str = Form(""),
    output_name: str = Form("pages"),
):
    """Convert PDF pages to high-quality images (PNG or JPG) inside a ZIP.

    DPI Guide:
    - 150: Fast, small files (web preview)
    - 200: Good quality (default)
    - 300: Print quality
    - 400: Ultra sharp (presentations)
    - 600: Maximum quality (OCR/archive)

    Args:
        file: Uploaded PDF.
        format: ``png``, ``jpg`` or ``jpeg`` (case-insensitive); anything
            else falls back to ``png``.
        dpi: Render resolution, clamped to 72-600.
        pages: Page selection interpreted by ``parse_page_spec``; empty
            means every page.
        output_name: Base name for the archive and the files inside it.

    Raises:
        HTTPException: 400 when the selection contains no pages; 500 on
            any other failure.
    """
    data = await file.read()
    validate_pdf_upload(data)

    output_name = sanitize_filename(output_name, "pages")

    format = format.lower()
    if format == "jpeg":
        format = "jpg"
    elif format not in ("png", "jpg"):
        format = "png"

    # Allow higher DPI for ultra-sharp output (up to 600)
    dpi = max(72, min(600, dpi))

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        # Release the document on every exit path, including the 400 below
        try:
            total_pages = len(src_doc)

            # Parse page selection
            if pages.strip():
                page_set = parse_page_spec(pages, total_pages)
            else:
                page_set = set(range(total_pages))

            if not page_set:
                raise HTTPException(status_code=400, detail="No valid pages specified")

            zip_path = OUT_DIR / f"{generate_job_id()}_{output_name}.zip"

            # PDF user space is 72 units per inch, so dpi/72 is the zoom
            zoom = dpi / 72.0
            matrix = fitz.Matrix(zoom, zoom)

            with zipfile.ZipFile(zip_path, 'w', zipfile.ZIP_DEFLATED) as zf:
                for i in sorted(page_set):
                    page = src_doc.load_page(i)
                    # alpha=False renders without a transparency channel
                    pix = page.get_pixmap(matrix=matrix, alpha=False)

                    if format == "png":
                        img_bytes = pix.tobytes("png")
                    else:
                        # Convert to JPG via PIL
                        img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
                        buffer = io.BytesIO()
                        img.save(buffer, format="JPEG", quality=95, optimize=True)
                        img_bytes = buffer.getvalue()

                    zf.writestr(f"{output_name}_page_{i+1}.{format}", img_bytes)
        finally:
            src_doc.close()

        logger.info(f"Converted {len(page_set)} pages to {format.upper()} at {dpi} DPI")

        return FileResponse(
            path=str(zip_path),
            media_type="application/zip",
            filename=f"{output_name}_images.zip"
        )

    except HTTPException:
        raise
    except Exception as e:
        logger.exception("PDF to images failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Compress PDF ===============

def _recompress_image_as_jpeg(image_bytes: bytes, jpeg_quality: int, max_dim: int) -> bytes:
    """Re-encode raw image bytes as a JPEG no larger than ``max_dim`` per side."""
    img = Image.open(io.BytesIO(image_bytes))

    # JPEG has no alpha channel: flatten transparency onto white
    if img.mode == 'P':
        img = img.convert('RGBA')
    if img.mode == 'RGBA':
        background = Image.new('RGB', img.size, (255, 255, 255))
        background.paste(img, mask=img.split()[3])
        img = background
    elif img.mode != 'RGB':
        img = img.convert('RGB')

    # Resize if larger than max_dim (never let a side collapse to 0 px)
    longest = max(img.size)
    if longest > max_dim:
        ratio = max_dim / longest
        new_size = (
            max(1, int(img.size[0] * ratio)),
            max(1, int(img.size[1] * ratio)),
        )
        img = img.resize(new_size, Image.Resampling.LANCZOS)

    buffer = io.BytesIO()
    img.save(buffer, format="JPEG", quality=jpeg_quality, optimize=True)
    return buffer.getvalue()


@app.post("/api/compress-pdf")
async def api_compress_pdf(
    file: UploadFile = File(...),
    quality: int = Form(60),
    output_name: str = Form("compressed.pdf"),
):
    """Compress a PDF by re-encoding embedded images and cleaning the file.

    Embedded images of at least 5000 bytes are re-encoded as JPEG and
    downscaled to a quality-dependent maximum dimension, then the document
    is written with garbage collection, stream deflation and content
    cleaning. If that saves less than 5%, a clean-only pass over the
    untouched original is tried as well and the smaller result wins. The
    original bytes are returned unchanged if nothing is smaller.

    Args:
        file: Uploaded PDF.
        quality: JPEG quality, clamped to 10-100.
        output_name: Download filename (``.pdf`` is appended if missing).

    Returns:
        FileResponse with ``X-Original-Size``, ``X-Compressed-Size`` and
        ``X-Reduction-Percent`` headers.

    Raises:
        HTTPException: 500 on failure.
    """
    data = await file.read()
    validate_pdf_upload(data)

    output_name = sanitize_filename(output_name, "compressed.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    # Use quality directly (10-100 scale, same as image compression)
    jpeg_quality = max(10, min(100, quality))

    # Lower quality = smaller max dimension for more compression. Derived
    # from the clamped value so out-of-range input cannot produce a
    # negative or absurdly large limit. Range: 1200-3000
    max_dim = int(1000 + (jpeg_quality / 100) * 2000)

    logger.info(f"Compressing PDF with quality={jpeg_quality}, max_dim={max_dim}")

    save_options = {
        "garbage": 4,     # Remove unused objects
        "deflate": True,  # Compress streams
        "clean": True,    # Clean content streams
    }

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            images_processed = 0
            # replace_image swaps the image object for the whole document,
            # so an image shared by several pages must only be handled
            # once; otherwise it would be re-encoded (and degraded) on
            # every page that shows it.
            seen_xrefs = set()

            for page_num in range(len(src_doc)):
                page = src_doc.load_page(page_num)

                for img_info in page.get_images(full=True):
                    xref = img_info[0]
                    if xref in seen_xrefs:
                        continue
                    seen_xrefs.add(xref)

                    try:
                        base_image = src_doc.extract_image(xref)
                        if not base_image:
                            continue

                        image_bytes = base_image["image"]

                        # Skip very small images
                        if len(image_bytes) < 5000:
                            continue

                        compressed_bytes = _recompress_image_as_jpeg(
                            image_bytes, jpeg_quality, max_dim
                        )

                        # Always replace to apply quality setting (even if
                        # slightly larger) so the quality slider actually
                        # affects output
                        page.replace_image(xref, stream=compressed_bytes)
                        images_processed += 1

                    except Exception as e:
                        # Best effort: an image that cannot be processed is
                        # left as it is
                        logger.debug(f"Could not compress image {xref}: {e}")
                        continue

            logger.info(f"Processed {images_processed} images")

            best = src_doc.tobytes(**save_options)
        finally:
            src_doc.close()

        original_size = len(data)

        # If compression didn't help much, also try cleaning the untouched
        # original and keep whichever result is smaller
        if len(best) >= original_size * 0.95:
            plain_doc = fitz.open(stream=data, filetype="pdf")
            try:
                plain = plain_doc.tobytes(**save_options)
            finally:
                plain_doc.close()
            if len(plain) < len(best):
                best = plain

        # If still larger, just return the original bytes
        if len(best) > original_size:
            best = data

        compressed_size = len(best)
        reduction = ((original_size - compressed_size) / original_size) * 100

        output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"
        output_path.write_bytes(best)

        logger.info(f"Compressed PDF: {original_size} -> {compressed_size} bytes ({reduction:.1f}% reduction)")

        return FileResponse(
            path=str(output_path),
            media_type="application/pdf",
            filename=output_name,
            headers={
                "X-Original-Size": str(original_size),
                "X-Compressed-Size": str(compressed_size),
                "X-Reduction-Percent": f"{reduction:.1f}"
            }
        )

    except Exception as e:
        logger.exception("PDF compression failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Rotate PDF ===============

@app.post("/api/rotate-pdf")
async def api_rotate_pdf(
    file: UploadFile = File(...),
    rotation: int = Form(90),
    pages: str = Form(""),
    output_name: str = Form("rotated.pdf"),
):
    """Rotate PDF pages by 90, 180 or 270 degrees.

    Args:
        file: Uploaded PDF.
        rotation: Angle added to each selected page's current rotation. It
            is reduced modulo 360; any result other than 90, 180 or 270
            (including 0) is replaced by 90.
        pages: Page selection interpreted by ``parse_page_spec``; empty
            means every page.
        output_name: Download filename (``.pdf`` is appended if missing).

    Returns:
        FileResponse streaming the rotated PDF.

    Raises:
        HTTPException: 400 when the selection contains no pages; 500 on
            any other failure.
    """
    data = await file.read()
    validate_pdf_upload(data)

    output_name = sanitize_filename(output_name, "rotated.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    # Normalize rotation to 90, 180, or 270
    rotation = int(rotation) % 360
    if rotation not in (90, 180, 270):
        rotation = 90

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            total_pages = len(src_doc)

            # Parse page selection (empty = all pages)
            if pages.strip():
                page_set = parse_page_spec(pages, total_pages)
            else:
                page_set = set(range(total_pages))

            # Same contract as the other page-selecting endpoints: do not
            # hand back an untouched file as if the rotation had happened.
            if not page_set:
                raise HTTPException(status_code=400, detail="No valid pages specified")

            # Rotate selected pages relative to their current orientation
            for i in page_set:
                page = src_doc.load_page(i)
                page.set_rotation((page.rotation + rotation) % 360)

            output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"
            src_doc.save(str(output_path))
        finally:
            src_doc.close()

        logger.info(f"Rotated {len(page_set)} pages by {rotation}°")

        return FileResponse(
            path=str(output_path),
            media_type="application/pdf",
            filename=output_name
        )

    except HTTPException:
        raise
    except Exception as e:
        logger.exception("PDF rotation failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Add Page Numbers ===============

@app.post("/api/add-page-numbers")
async def api_add_page_numbers(
    file: UploadFile = File(...),
    position: str = Form("bottom-center"),
    format: str = Form("Page {n} of {total}"),
    start_number: int = Form(1),
    font_size: int = Form(11),
    margin: int = Form(30),
    output_name: str = Form("numbered.pdf"),
):
    """Stamp a page-number label on every page of a PDF.

    Args:
        file: Uploaded PDF.
        position: ``top-left``, ``top-center``, ``top-right``,
            ``bottom-left``, ``bottom-center`` or ``bottom-right``;
            unknown values fall back to ``bottom-center``.
        format: Label template. ``{n}`` is replaced by the page's number
            and ``{total}`` by the document's page count.
        start_number: Number given to the first page.
        font_size: Font size passed to PyMuPDF.
        margin: Distance in points from the page edge.
        output_name: Download filename (``.pdf`` is appended if missing).

    Returns:
        FileResponse streaming the numbered PDF.

    Raises:
        HTTPException: 500 on failure.
    """
    data = await file.read()
    validate_pdf_upload(data)

    output_name = sanitize_filename(output_name, "numbered.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    # Position mapping: name -> (horizontal, vertical) alignment
    positions = {
        "top-left": ("left", "top"),
        "top-center": ("center", "top"),
        "top-right": ("right", "top"),
        "bottom-left": ("left", "bottom"),
        "bottom-center": ("center", "bottom"),
        "bottom-right": ("right", "bottom"),
    }
    h_align, v_align = positions.get(position, ("center", "bottom"))

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            total_pages = len(src_doc)

            for i in range(total_pages):
                page = src_doc.load_page(i)
                rect = page.rect

                # Format page number text
                page_num = start_number + i
                text = format.replace("{n}", str(page_num)).replace("{total}", str(total_pages))

                # Text width is needed to right-align or center the label
                text_width = fitz.get_text_length(text, fontsize=font_size)

                if h_align == "left":
                    x = margin
                elif h_align == "right":
                    x = rect.width - margin - text_width
                else:  # center
                    x = (rect.width - text_width) / 2

                # (x, y) is the insertion point handed to insert_text, so
                # the top position is offset by one font size
                if v_align == "top":
                    y = margin + font_size
                else:  # bottom
                    y = rect.height - margin

                # NOTE(review): the point is computed from page.rect; pages
                # with a non-zero rotation may need the point derotated -
                # confirm against PyMuPDF's rotated-page handling.
                page.insert_text(
                    (x, y),
                    text,
                    fontsize=font_size,
                    color=(0.3, 0.3, 0.3),
                )

            output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"
            src_doc.save(str(output_path))
        finally:
            # Release the document even when stamping or saving fails
            src_doc.close()

        logger.info(f"Added page numbers to {total_pages} pages")

        return FileResponse(
            path=str(output_path),
            media_type="application/pdf",
            filename=output_name
        )

    except Exception as e:
        logger.exception("Add page numbers failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== PDF OCR (Text Extraction) ===============

# Probe once, at import time, whether pytesseract and the Tesseract binary
# it drives are usable; the OCR endpoint consults the resulting flag.
try:
    import pytesseract
    # Asking for the version fails when the tesseract executable is missing
    pytesseract.get_tesseract_version()
except Exception:
    TESSERACT_AVAILABLE = False
    logger.warning("Tesseract not available. OCR will use basic text extraction only.")
else:
    TESSERACT_AVAILABLE = True


@app.post("/api/pdf-ocr")
async def api_pdf_ocr(
    file: UploadFile = File(...),
    language: str = Form("eng"),
    pages: str = Form(""),
    output_format: str = Form("txt"),
    dpi: int = Form(200),
):
    """Extract text from a PDF using native extraction, with OCR as fallback.

    A page whose embedded text is longer than 50 characters is used as-is.
    Otherwise the page is rendered and passed to Tesseract when it is
    available; without Tesseract the (possibly empty) embedded text is
    returned with a placeholder for empty pages.

    Args:
        file: Uploaded PDF.
        language: Language code forwarded to Tesseract.
        pages: Page selection interpreted by ``parse_page_spec``; empty
            means every page.
        output_format: ``json`` returns the text inline; any other value
            returns a UTF-8 text file.
        dpi: Render resolution for OCR, clamped to 100-400.

    Raises:
        HTTPException: 400 when the selection contains no pages; 500 on
            any other failure.
    """
    data = await file.read()
    validate_pdf_upload(data)

    dpi = max(100, min(400, dpi))

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        # Release the document on every exit path, including the 400 below
        try:
            total_pages = len(src_doc)

            # Parse page selection
            if pages.strip():
                page_set = parse_page_spec(pages, total_pages)
            else:
                page_set = set(range(total_pages))

            if not page_set:
                raise HTTPException(status_code=400, detail="No valid pages specified")

            all_text = []

            for page_num in sorted(page_set):
                page = src_doc.load_page(page_num)

                # First try native text extraction
                native_text = page.get_text("text").strip()

                # If native text is substantial, use it
                if len(native_text) > 50:
                    all_text.append(f"--- Page {page_num + 1} ---\n{native_text}")
                elif TESSERACT_AVAILABLE:
                    # Use OCR for scanned pages
                    import pytesseract

                    zoom = dpi / 72.0
                    mat = fitz.Matrix(zoom, zoom)
                    pix = page.get_pixmap(matrix=mat)

                    # Convert to PIL Image
                    img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)

                    # Run OCR
                    ocr_text = pytesseract.image_to_string(img, lang=language)
                    all_text.append(f"--- Page {page_num + 1} (OCR) ---\n{ocr_text.strip()}")
                else:
                    # No OCR available, use whatever native text we got
                    all_text.append(f"--- Page {page_num + 1} ---\n{native_text if native_text else '[No text detected - Tesseract not installed]'}")
        finally:
            src_doc.close()

        combined_text = "\n\n".join(all_text)

        if output_format == "json":
            # Return as JSON. "ocr_used" mirrors Tesseract availability.
            return JSONResponse({
                "pages": len(page_set),
                "text": combined_text,
                "ocr_used": TESSERACT_AVAILABLE,
            })

        # Return as text file
        output_path = OUT_DIR / f"{generate_job_id()}_extracted.txt"
        output_path.write_text(combined_text, encoding="utf-8")

        logger.info(f"Extracted text from {len(page_set)} pages")

        return FileResponse(
            path=str(output_path),
            media_type="text/plain",
            filename="extracted_text.txt"
        )

    except HTTPException:
        raise
    except Exception as e:
        logger.exception("PDF OCR failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.get("/api/ocr-status")
async def api_ocr_status():
    """Report the module-level Tesseract availability flag to the client."""
    status = {"available": TESSERACT_AVAILABLE}
    return status


# =============== Enhance Quality ===============

def enhance_image(img: Image.Image, level: str = "medium") -> Image.Image:
    """Sharpen an image and gently boost contrast, saturation and brightness.

    Args:
        img: Source image in any mode.
        level: ``light``, ``medium`` or ``strong``; unknown values fall
            back to ``medium``.

    Returns:
        A new RGB image, or RGBA when the source carried transparency
        (an alpha band, or a ``transparency`` entry in ``img.info``). The
        alpha channel is carried over unmodified.
    """
    from PIL import ImageEnhance, ImageFilter

    # Level presets: (sharpness, contrast, color, brightness)
    presets = {
        "light": (1.2, 1.05, 1.05, 1.02),
        "medium": (1.4, 1.1, 1.1, 1.03),
        "strong": (1.6, 1.15, 1.15, 1.05),
    }
    sharpness, contrast, color, brightness = presets.get(level, presets["medium"])

    # The filters below work on RGB. Set the alpha channel aside first so
    # transparency survives for every mode that has it, not only RGBA.
    alpha = None
    if img.mode in ("RGBA", "LA", "PA") or "transparency" in img.info:
        rgba = img.convert("RGBA")
        alpha = rgba.getchannel("A")
        img = rgba.convert("RGB")
    else:
        img = img.convert("RGB")

    # Apply slight unsharp mask for detail enhancement
    img = img.filter(ImageFilter.UnsharpMask(radius=1.5, percent=50, threshold=3))

    # Apply the preset factors in a fixed order; each step feeds the next
    adjustments = (
        (ImageEnhance.Sharpness, sharpness),
        (ImageEnhance.Contrast, contrast),
        (ImageEnhance.Color, color),
        (ImageEnhance.Brightness, brightness),
    )
    for enhancer_cls, factor in adjustments:
        img = enhancer_cls(img).enhance(factor)

    # Restore alpha channel if it existed
    if alpha is not None:
        img = img.convert('RGBA')
        img.putalpha(alpha)

    return img


@app.post("/api/enhance-image")
async def api_enhance_image(
    file: UploadFile = File(...),
    level: str = Form("medium"),
    upscale: float = Form(1.0),
    output_name: str = Form("enhanced"),
):
    """Enhance an uploaded image, optionally upscaling it first.

    The output format follows the upload's filename extension: ``jpg`` /
    ``jpeg`` produce JPEG, ``webp`` produces WEBP, anything else PNG (a
    missing filename is treated as ``jpg``).

    Args:
        file: Uploaded image.
        level: ``light``, ``medium`` or ``strong``; unknown values fall
            back to ``medium``.
        upscale: Resize factor, clamped to 1.0-2.0.
        output_name: Base name of the download (extension is appended).

    Returns:
        FileResponse with ``X-Original-Size`` and ``X-Enhanced-Size``
        headers.

    Raises:
        HTTPException: 400 when the upload exceeds the configured size
            limit or cannot be decoded as an image; 500 on other failures.
    """
    data = await file.read()
    original_size = len(data)

    if original_size > settings.max_image_size_mb * 1024 * 1024:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    output_name = sanitize_filename(output_name, "enhanced")
    level = level if level in ["light", "medium", "strong"] else "medium"
    upscale = max(1.0, min(2.0, upscale))  # Limit upscale to 2x max

    try:
        try:
            img = Image.open(io.BytesIO(data))
            # Image.open is lazy; decode now so a corrupt or non-image
            # upload is reported as a client error rather than a 500 later.
            img.load()
        except (OSError, ValueError) as e:
            # Pillow's "cannot identify image file" error is an OSError
            raise HTTPException(
                status_code=400,
                detail="Invalid or unsupported image file",
            ) from e

        original_format = file.filename.rsplit('.', 1)[-1].lower() if file.filename else 'jpg'

        # Upscale if requested (using LANCZOS for quality)
        if upscale > 1.0:
            new_size = (int(img.size[0] * upscale), int(img.size[1] * upscale))
            img = img.resize(new_size, Image.Resampling.LANCZOS)

        # Apply enhancement
        img = enhance_image(img, level)

        # Determine output format and quality
        if original_format in ['jpg', 'jpeg']:
            output_format = 'JPEG'
            ext = 'jpg'
            mime = 'image/jpeg'
            # JPEG cannot store an alpha channel
            if img.mode == 'RGBA':
                img = img.convert('RGB')
            # Use quality that keeps file size reasonable
            quality = 88
        elif original_format == 'webp':
            output_format = 'WEBP'
            ext = 'webp'
            mime = 'image/webp'
            quality = 88
        else:
            output_format = 'PNG'
            ext = 'png'
            mime = 'image/png'
            quality = None

        output_path = OUT_DIR / f"{generate_job_id()}_{output_name}.{ext}"

        save_kwargs = {'optimize': True}
        if quality:
            save_kwargs['quality'] = quality

        img.save(str(output_path), output_format, **save_kwargs)

        enhanced_size = output_path.stat().st_size

        # If file got too large (more than 3x original), reduce quality
        if enhanced_size > original_size * 3 and output_format in ['JPEG', 'WEBP']:
            quality = 75
            img.save(str(output_path), output_format, quality=quality, optimize=True)
            enhanced_size = output_path.stat().st_size

        logger.info(f"Enhanced image: {original_size} -> {enhanced_size} bytes")

        return FileResponse(
            path=str(output_path),
            media_type=mime,
            filename=f"{output_name}.{ext}",
            headers={
                "X-Original-Size": str(original_size),
                "X-Enhanced-Size": str(enhanced_size),
            }
        )

    except HTTPException:
        # Deliberate client errors must not be rewrapped as 500
        raise
    except Exception as e:
        logger.exception("Image enhancement failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/enhance-pdf")
async def api_enhance_pdf(
    file: UploadFile = File(...),
    level: str = Form("medium"),
    dpi: int = Form(150),
    output_name: str = Form("enhanced.pdf"),
):
    """Enhance PDF quality by improving embedded images.

    Every embedded image whose data is at least 5000 bytes and whose longest
    side is at least 100 px is passed through ``enhance_image`` and re-encoded
    as an optimized JPEG. A replacement is only written back when it is at
    most 1.5x the size of the original image data. If the saved PDF ends up
    more than 4x the upload size, the original bytes are returned instead.

    Args:
        file: Uploaded PDF.
        level: "light", "medium" or "strong"; any other value falls back to
            "medium". Selects the JPEG quality (82 / 85 / 88) and is forwarded
            to ``enhance_image``.
        dpi: Clamped to 100-200. NOTE(review): the clamped value is not used
            anywhere in the image pipeline below.
        output_name: Download filename; ".pdf" is appended when missing.

    Returns:
        FileResponse with the resulting PDF plus X-Original-Size,
        X-Enhanced-Size and X-Images-Enhanced headers.

    Raises:
        HTTPException: 500 carrying the error text when processing fails.
    """
    data = await file.read()
    original_size = len(data)
    validate_pdf_upload(data)

    output_name = sanitize_filename(output_name, "enhanced.pdf")
    if not output_name.lower().endswith(".pdf"):
        output_name += ".pdf"

    level = level if level in ["light", "medium", "strong"] else "medium"
    dpi = max(100, min(200, dpi))  # Limit DPI to prevent bloat

    # Quality settings based on level
    jpeg_quality = {"light": 82, "medium": 85, "strong": 88}.get(level, 85)

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            images_enhanced = 0
            # replace_image() keeps the xref, so an image shared by several
            # pages would otherwise be extracted and enhanced again on every
            # page that references it.
            seen_xrefs = set()

            for page_num in range(len(src_doc)):
                page = src_doc.load_page(page_num)

                for img_info in page.get_images(full=True):
                    xref = img_info[0]
                    if xref in seen_xrefs:
                        continue
                    seen_xrefs.add(xref)

                    try:
                        base_image = src_doc.extract_image(xref)
                        if not base_image:
                            continue

                        image_bytes = base_image["image"]

                        # Skip small images (icons, etc.)
                        if len(image_bytes) < 5000:
                            continue

                        # Open and enhance image
                        img = Image.open(io.BytesIO(image_bytes))

                        # Skip if already small dimensions
                        if max(img.size) < 100:
                            continue

                        # JPEG output needs RGB
                        if img.mode != 'RGB':
                            img = img.convert('RGB')

                        # Apply enhancement
                        img = enhance_image(img, level)

                        # Save as optimized JPEG
                        buffer = io.BytesIO()
                        img.save(buffer, format="JPEG", quality=jpeg_quality, optimize=True)
                        enhanced_bytes = buffer.getvalue()

                        # Only replace if not significantly larger
                        if len(enhanced_bytes) <= len(image_bytes) * 1.5:
                            page.replace_image(xref, stream=enhanced_bytes)
                            images_enhanced += 1

                    except Exception as e:
                        # Best effort: one bad image must not abort the whole PDF
                        logger.debug(f"Could not enhance image {xref}: {e}")
                        continue

            output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"

            # Save with optimization
            src_doc.save(
                str(output_path),
                garbage=3,
                deflate=True,
                clean=True,
            )
        finally:
            # Release the document even when enhancement or saving fails
            src_doc.close()

        enhanced_size = output_path.stat().st_size

        # Safety check: if file is way too large, just return original
        if enhanced_size > original_size * 4:
            output_path.write_bytes(data)
            enhanced_size = original_size
            images_enhanced = 0  # the returned file contains none of the replacements
            logger.warning("Enhanced PDF was too large, returning original")

        size_change = ((enhanced_size - original_size) / original_size) * 100 if original_size else 0.0

        logger.info(f"Enhanced PDF: {images_enhanced} images, {original_size} -> {enhanced_size} bytes ({size_change:+.1f}%)")

        return FileResponse(
            path=str(output_path),
            media_type="application/pdf",
            filename=output_name,
            headers={
                "X-Original-Size": str(original_size),
                "X-Enhanced-Size": str(enhanced_size),
                "X-Images-Enhanced": str(images_enhanced),
            }
        )

    except Exception as e:
        logger.exception("PDF enhancement failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Image Tools ===============

# Module-level state for the optional rembg dependency.
# Both names start out "not loaded" and are filled in on first use.
rembg_remove = None       # bound to rembg's `remove` once it has been imported
REMBG_AVAILABLE = False   # set to True after a successful import

def _check_rembg():
    """Try to import rembg and record the outcome in the module globals.

    On success ``rembg_remove`` is bound to ``rembg.remove`` and
    ``REMBG_AVAILABLE`` becomes True. On any failure ``REMBG_AVAILABLE`` is set
    to False and the reason is logged at INFO level. Anything written to
    ``sys.stderr`` during the import is discarded.
    """
    global REMBG_AVAILABLE, rembg_remove
    from contextlib import redirect_stderr

    try:
        # Suppress warnings rembg prints while importing; redirect_stderr
        # restores the real stream even if the import raises.
        with redirect_stderr(io.StringIO()):
            from rembg import remove
        rembg_remove = remove
        REMBG_AVAILABLE = True
    except Exception as e:  # ImportError is already covered by Exception
        REMBG_AVAILABLE = False
        logger.info(f"rembg not available: {e}")

# Don't check at import time - check lazily on first use
# _check_rembg()


@app.post("/api/remove-background")
async def api_remove_background(
    file: UploadFile = File(...),
    output_name: str = Form("no-bg.png"),
):
    """Remove background from image using AI (rembg).

    rembg is imported lazily on the first request. The result is written to
    OUT_DIR as a PNG and returned as a download.

    Args:
        file: Uploaded image.
        output_name: Download filename; ".png" is appended when missing.

    Returns:
        FileResponse with media type image/png.

    Raises:
        HTTPException: 500 when rembg cannot be imported or processing fails;
            400 when the upload is empty or exceeds the configured size limit.
    """
    global REMBG_AVAILABLE, rembg_remove

    # Lazy load rembg on first use
    if rembg_remove is None and not REMBG_AVAILABLE:
        try:
            from rembg import remove
            rembg_remove = remove
            REMBG_AVAILABLE = True
        except Exception as e:
            logger.warning(f"rembg not available: {e}")
            REMBG_AVAILABLE = False

    if not REMBG_AVAILABLE or rembg_remove is None:
        raise HTTPException(
            status_code=500,
            detail="rembg not installed. Run: pip install rembg[gpu] or pip install rembg"
        )

    data = await file.read()
    if not data:
        # Reject up-front instead of surfacing a decoder error as a 500
        raise HTTPException(status_code=400, detail="Uploaded image is empty")
    if len(data) > settings.max_image_size_mb * 1024 * 1024:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    output_name = sanitize_filename(output_name, "no-bg.png")
    if not output_name.lower().endswith(".png"):
        output_name += ".png"

    try:
        # Run the inference in the default thread pool so this coroutine does
        # not block the event loop while the image is processed.
        loop = asyncio.get_running_loop()
        result = await loop.run_in_executor(None, rembg_remove, data)

        output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"
        output_path.write_bytes(result)

        logger.info(f"Background removed: {output_name}")

        return FileResponse(
            path=str(output_path),
            media_type="image/png",
            filename=output_name
        )

    except Exception as e:
        logger.exception("Background removal failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/add-image-watermark")
async def api_add_image_watermark(
    file: UploadFile = File(...),
    text: str = Form(""),
    position: str = Form("center"),
    opacity: int = Form(50),
    font_size: int = Form(36),
    color: str = Form("#000000"),
    rotation: int = Form(0),
    output_name: str = Form("watermarked"),
):
    """Add text watermark to image.

    The text is drawn on a transparent layer the size of the image,
    optionally rotated around the image centre, and alpha-composited onto
    the image.

    Args:
        file: Uploaded image.
        text: Watermark text; must not be blank.
        position: One of top-left, top-center, top-right, center, bottom-left,
            bottom-center, bottom-right or tile. Unknown values use center.
        opacity: Percentage, clamped to 0-100.
        font_size: Font size, at least 1.
        color: Hex colour, "#RRGGBB" or shorthand "#RGB" (leading "#" optional).
        rotation: Rotation of the watermark layer in degrees.
        output_name: Base download name; ".jpg" or ".png" is appended.

    Returns:
        FileResponse with a JPEG when the upload's extension is jpg/jpeg,
        otherwise a PNG.

    Raises:
        HTTPException: 400 for an oversized upload, blank text or an invalid
            colour; 500 when image processing fails.
    """
    data = await file.read()
    if len(data) > settings.max_image_size_mb * 1024 * 1024:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    if not text.strip():
        raise HTTPException(status_code=400, detail="Watermark text is required")

    # Validate the colour before entering the try block below: an
    # HTTPException raised inside it would be caught and turned into a 500.
    color_hex = color.strip().lstrip('#')
    if len(color_hex) == 3:
        # Expand shorthand "abc" -> "aabbcc"
        color_hex = ''.join(ch * 2 for ch in color_hex)
    if not re.match(r"[0-9a-fA-F]{6}", color_hex):
        raise HTTPException(status_code=400, detail="Invalid color. Use hex format like #RRGGBB")
    r, g, b = (int(color_hex[i:i + 2], 16) for i in (0, 2, 4))

    # Keep alpha within 0-255 and the font size usable
    opacity = max(0, min(100, opacity))
    alpha = int(255 * opacity / 100)
    font_size = max(1, font_size)

    output_name = sanitize_filename(output_name, "watermarked")

    try:
        from PIL import ImageDraw, ImageFont

        img = Image.open(io.BytesIO(data))
        if img.mode != 'RGBA':
            img = img.convert('RGBA')

        # Create watermark layer
        watermark = Image.new('RGBA', img.size, (0, 0, 0, 0))
        draw = ImageDraw.Draw(watermark)

        # Try to use a font, fallback to default
        try:
            font = ImageFont.truetype("arial.ttf", font_size)
        except (OSError, ImportError):
            # arial.ttf is unavailable. Newer Pillow can scale its built-in
            # font; older releases only offer the fixed-size bitmap font.
            try:
                font = ImageFont.load_default(size=font_size)
            except (TypeError, OSError, ImportError):
                font = ImageFont.load_default()

        # Get text size
        bbox = draw.textbbox((0, 0), text, font=font)
        text_width = bbox[2] - bbox[0]
        text_height = bbox[3] - bbox[1]

        # Calculate position
        positions = {
            "top-left": (20, 20),
            "top-center": ((img.width - text_width) // 2, 20),
            "top-right": (img.width - text_width - 20, 20),
            "center": ((img.width - text_width) // 2, (img.height - text_height) // 2),
            "bottom-left": (20, img.height - text_height - 20),
            "bottom-center": ((img.width - text_width) // 2, img.height - text_height - 20),
            "bottom-right": (img.width - text_width - 20, img.height - text_height - 20),
            "tile": None,
        }

        fill = (r, g, b, alpha)
        if position == "tile":
            # Tile watermark across image
            for y in range(0, img.height, text_height + 100):
                for x in range(0, img.width, text_width + 100):
                    draw.text((x, y), text, font=font, fill=fill)
        else:
            pos = positions.get(position, positions["center"])
            draw.text(pos, text, font=font, fill=fill)

        # Rotate watermark if needed
        if rotation != 0:
            watermark = watermark.rotate(rotation, expand=False, center=(img.width//2, img.height//2))

        # Composite
        result = Image.alpha_composite(img, watermark)

        # Determine output format
        original_format = file.filename.split('.')[-1].lower() if file.filename else 'png'
        if original_format in ['jpg', 'jpeg']:
            result = result.convert('RGB')
            output_format = 'JPEG'
            output_name += '.jpg'
            mime = 'image/jpeg'
        else:
            output_format = 'PNG'
            output_name += '.png'
            mime = 'image/png'

        output_path = OUT_DIR / f"{generate_job_id()}_{output_name}"
        result.save(str(output_path), output_format, quality=95)

        logger.info(f"Watermark added: {output_name}")

        return FileResponse(path=str(output_path), media_type=mime, filename=output_name)

    except Exception as e:
        logger.exception("Add watermark failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/resize-image")
async def api_resize_image(
    file: UploadFile = File(...),
    preset: str = Form("custom"),
    width: int = Form(0),
    height: int = Form(0),
    maintain_aspect: bool = Form(True),
    output_name: str = Form("resized"),
):
    """Resize image with presets or custom dimensions.

    Args:
        file: Uploaded image.
        preset: Name of a preset size (thumbnail, small, medium, hd, fullhd,
            4k, square-sm, square-lg) or "custom". Unknown names behave like
            "custom".
        width: Custom target width; values <= 0 keep the original width.
        height: Custom target height; values <= 0 keep the original height.
        maintain_aspect: When true, the image is scaled to fit inside the
            target box while keeping its aspect ratio.
        output_name: Base download name; the extension is derived from the
            upload's filename (png when unknown).

    Returns:
        FileResponse with X-Original-Size / X-New-Size headers ("WxH").

    Raises:
        HTTPException: 400 for an oversized upload; 500 when processing fails.
    """
    data = await file.read()
    if len(data) > settings.max_image_size_mb * 1024 * 1024:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    output_name = sanitize_filename(output_name, "resized")

    # Presets
    presets = {
        "thumbnail": (150, 150),
        "small": (320, 240),
        "medium": (640, 480),
        "hd": (1280, 720),
        "fullhd": (1920, 1080),
        "4k": (3840, 2160),
        "square-sm": (500, 500),
        "square-lg": (1000, 1000),
    }

    try:
        img = Image.open(io.BytesIO(data))
        original_width, original_height = img.size

        # Determine target size
        if preset != "custom" and preset in presets:
            target_width, target_height = presets[preset]
        else:
            target_width = width if width > 0 else original_width
            target_height = height if height > 0 else original_height

        # Maintain aspect ratio
        if maintain_aspect:
            ratio = min(target_width / original_width, target_height / original_height)
            target_width = int(original_width * ratio)
            target_height = int(original_height * ratio)

        # Truncation can collapse a side to 0 for extreme aspect ratios
        # (e.g. 4000x10 into 150x150), which resize() rejects.
        target_width = max(1, target_width)
        target_height = max(1, target_height)

        # Resize
        resized = img.resize((target_width, target_height), Image.Resampling.LANCZOS)

        # Determine output format
        original_format = file.filename.split('.')[-1].lower() if file.filename else 'png'
        format_map = {'jpg': 'JPEG', 'jpeg': 'JPEG', 'png': 'PNG', 'webp': 'WEBP', 'gif': 'GIF'}
        output_format = format_map.get(original_format, 'PNG')
        ext = original_format if original_format in format_map else 'png'

        # JPEG cannot store alpha or palette modes; the mode comes from the
        # file content, which need not match the extension.
        if output_format == 'JPEG' and resized.mode not in ('RGB', 'L', 'CMYK'):
            resized = resized.convert('RGB')

        output_path = OUT_DIR / f"{generate_job_id()}_{output_name}.{ext}"
        resized.save(str(output_path), output_format, quality=95)

        mime_map = {'JPEG': 'image/jpeg', 'PNG': 'image/png', 'WEBP': 'image/webp', 'GIF': 'image/gif'}

        logger.info(f"Resized image: {original_width}x{original_height} -> {target_width}x{target_height}")

        return FileResponse(
            path=str(output_path),
            media_type=mime_map.get(output_format, 'image/png'),
            filename=f"{output_name}.{ext}",
            headers={
                "X-Original-Size": f"{original_width}x{original_height}",
                "X-New-Size": f"{target_width}x{target_height}"
            }
        )

    except Exception as e:
        logger.exception("Resize image failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/convert-image")
async def api_convert_image(
    file: UploadFile = File(...),
    target_format: str = Form("png"),
    quality: int = Form(90),
    output_name: str = Form("converted"),
):
    """Convert image between formats (JPG, PNG, WebP, GIF).

    Args:
        file: Uploaded image.
        target_format: jpg, jpeg, png, webp or gif (case-insensitive).
        quality: Encoder quality for JPEG/WebP, clamped to 1-100; ignored for
            PNG and GIF.
        output_name: Base download name; the target extension is appended.

    Returns:
        FileResponse with the converted image.

    Raises:
        HTTPException: 400 for an oversized upload or unsupported format;
            500 when processing fails.
    """
    data = await file.read()
    if len(data) > settings.max_image_size_mb * 1024 * 1024:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    output_name = sanitize_filename(output_name, "converted")
    target_format = target_format.lower()
    # Keep the value inside the range the encoders accept
    quality = max(1, min(100, quality))

    format_map = {
        'jpg': ('JPEG', 'image/jpeg', 'jpg'),
        'jpeg': ('JPEG', 'image/jpeg', 'jpg'),
        'png': ('PNG', 'image/png', 'png'),
        'webp': ('WEBP', 'image/webp', 'webp'),
        'gif': ('GIF', 'image/gif', 'gif'),
    }

    if target_format not in format_map:
        raise HTTPException(status_code=400, detail="Unsupported format. Use: jpg, png, webp, gif")

    pil_format, mime, ext = format_map[target_format]

    try:
        img = Image.open(io.BytesIO(data))

        if pil_format == 'JPEG':
            if img.mode in ('RGBA', 'P'):
                # Handle transparency for JPEG: flatten onto white
                if img.mode == 'P':
                    img = img.convert('RGBA')
                background = Image.new('RGB', img.size, (255, 255, 255))
                background.paste(img, mask=img.split()[3])
                img = background
            elif img.mode != 'RGB':
                img = img.convert('RGB')
        elif img.mode == 'CMYK':
            # PNG cannot store CMYK; convert so CMYK JPEG sources still work
            img = img.convert('RGB')

        output_path = OUT_DIR / f"{generate_job_id()}_{output_name}.{ext}"

        save_kwargs = {}
        if pil_format in ['JPEG', 'WEBP']:
            save_kwargs['quality'] = quality
        if pil_format == 'PNG':
            save_kwargs['optimize'] = True

        img.save(str(output_path), pil_format, **save_kwargs)

        logger.info(f"Converted image to {target_format.upper()}")

        return FileResponse(
            path=str(output_path),
            media_type=mime,
            filename=f"{output_name}.{ext}"
        )

    except Exception as e:
        logger.exception("Convert image failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/compress-image")
async def api_compress_image(
    file: UploadFile = File(...),
    quality: int = Form(70),
    output_name: str = Form("compressed"),
):
    """Compress image to reduce file size.

    The upload is always re-encoded as an optimized JPEG. RGBA and palette
    images are flattened onto a white background first; other non-RGB modes
    are converted to RGB.

    Args:
        file: Uploaded image.
        quality: JPEG quality, clamped to 10-100.
        output_name: Base download name; ".jpg" is appended.

    Returns:
        FileResponse with X-Original-Size, X-Compressed-Size and
        X-Reduction-Percent headers.

    Raises:
        HTTPException: 400 for an oversized upload; 500 when processing fails.
    """
    payload = await file.read()
    original_size = len(payload)

    byte_limit = settings.max_image_size_mb * 1024 * 1024
    if original_size > byte_limit:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    output_name = sanitize_filename(output_name, "compressed")
    quality = min(100, max(10, quality))

    try:
        img = Image.open(io.BytesIO(payload))

        # JPEG gives real quality control (PNG's optimize flag ignores it), so
        # everything is normalized to RGB before encoding.
        if img.mode == 'P':
            img = img.convert('RGBA')
        if img.mode == 'RGBA':
            # Flatten transparency onto white using the alpha band as mask
            canvas = Image.new('RGB', img.size, (255, 255, 255))
            canvas.paste(img, mask=img.split()[3])
            img = canvas
        elif img.mode != 'RGB':
            img = img.convert('RGB')

        ext = 'jpg'
        download_name = f"{output_name}.{ext}"
        output_path = OUT_DIR / f"{generate_job_id()}_{download_name}"
        img.save(str(output_path), 'JPEG', quality=quality, optimize=True)

        compressed_size = output_path.stat().st_size
        saved_bytes = original_size - compressed_size
        reduction = (saved_bytes / original_size) * 100

        logger.info(f"Compressed image: {original_size} -> {compressed_size} bytes ({reduction:.1f}% reduction)")

        size_headers = {
            "X-Original-Size": str(original_size),
            "X-Compressed-Size": str(compressed_size),
            "X-Reduction-Percent": f"{reduction:.1f}"
        }
        return FileResponse(
            path=str(output_path),
            media_type='image/jpeg',
            filename=download_name,
            headers=size_headers,
        )

    except Exception as e:
        logger.exception("Compress image failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Estimate File Size Endpoints ===============

@app.post("/api/estimate/compress-image")
async def api_estimate_compress_image(
    file: UploadFile = File(...),
    quality: int = Form(70),
):
    """Estimate the size of a compressed image by encoding it in memory.

    The image is flattened/converted to RGB and encoded as an optimized JPEG
    into a buffer; nothing is written to disk.

    Args:
        file: Uploaded image.
        quality: JPEG quality, clamped to 10-100.

    Returns:
        JSONResponse with original_size, estimated_size and reduction_percent
        (never below 0, rounded to one decimal).

    Raises:
        HTTPException: 400 for an oversized upload; 500 when processing fails.
    """
    payload = await file.read()
    original_size = len(payload)

    byte_limit = settings.max_image_size_mb * 1024 * 1024
    if original_size > byte_limit:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    quality = min(100, max(10, quality))

    try:
        img = Image.open(io.BytesIO(payload))

        # Same normalization as the real compression endpoint: palette -> RGBA,
        # RGBA flattened onto white, anything else converted to RGB.
        if img.mode == 'P':
            img = img.convert('RGBA')
        if img.mode == 'RGBA':
            canvas = Image.new('RGB', img.size, (255, 255, 255))
            canvas.paste(img, mask=img.split()[3])
            img = canvas
        elif img.mode != 'RGB':
            img = img.convert('RGB')

        encoded = io.BytesIO()
        img.save(encoded, format="JPEG", quality=quality, optimize=True)
        estimated_size = len(encoded.getvalue())

        if original_size > 0:
            reduction = ((original_size - estimated_size) / original_size) * 100
        else:
            reduction = 0

        summary = {
            "original_size": original_size,
            "estimated_size": estimated_size,
            "reduction_percent": round(max(0, reduction), 1)
        }
        return JSONResponse(summary)

    except Exception as e:
        logger.exception("Estimate compress image failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/estimate/convert-image")
async def api_estimate_convert_image(
    file: UploadFile = File(...),
    target_format: str = Form("png"),
    quality: int = Form(90),
):
    """Estimate converted image file size by encoding it in memory.

    Args:
        file: Uploaded image.
        target_format: jpg, jpeg, png, webp or gif (case-insensitive).
        quality: Encoder quality for JPEG/WebP, clamped to 1-100; ignored for
            PNG and GIF.

    Returns:
        JSONResponse with original_size, estimated_size and target_format
        (upper-cased).

    Raises:
        HTTPException: 400 for an oversized upload or unsupported format;
            500 when processing fails.
    """
    data = await file.read()
    original_size = len(data)

    if original_size > settings.max_image_size_mb * 1024 * 1024:
        raise HTTPException(status_code=400, detail=f"Image too large. Max: {settings.max_image_size_mb}MB")

    target_format = target_format.lower()
    # Keep the value inside the range the encoders accept
    quality = max(1, min(100, quality))

    format_map = {
        'jpg': ('JPEG', 'jpg'),
        'jpeg': ('JPEG', 'jpg'),
        'png': ('PNG', 'png'),
        'webp': ('WEBP', 'webp'),
        'gif': ('GIF', 'gif'),
    }

    if target_format not in format_map:
        raise HTTPException(status_code=400, detail="Unsupported format")

    pil_format, _ = format_map[target_format]

    try:
        img = Image.open(io.BytesIO(data))

        if pil_format == 'JPEG':
            if img.mode in ('RGBA', 'P'):
                # Handle transparency for JPEG: flatten onto white
                if img.mode == 'P':
                    img = img.convert('RGBA')
                background = Image.new('RGB', img.size, (255, 255, 255))
                background.paste(img, mask=img.split()[3])
                img = background
            elif img.mode != 'RGB':
                img = img.convert('RGB')
        elif img.mode == 'CMYK':
            # PNG cannot store CMYK; convert so CMYK JPEG sources still work
            img = img.convert('RGB')

        buffer = io.BytesIO()
        save_kwargs = {}
        if pil_format in ['JPEG', 'WEBP']:
            save_kwargs['quality'] = quality
        if pil_format == 'PNG':
            save_kwargs['optimize'] = True

        img.save(buffer, pil_format, **save_kwargs)
        estimated_size = len(buffer.getvalue())

        return JSONResponse({
            "original_size": original_size,
            "estimated_size": estimated_size,
            "target_format": target_format.upper()
        })

    except Exception as e:
        logger.exception("Estimate convert image failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/estimate/compress-pdf")
async def api_estimate_compress_pdf(
    file: UploadFile = File(...),
    quality: int = Form(60),
):
    """Estimate compressed PDF file size by actually compressing it in memory.

    Every embedded image of at least 5000 bytes is flattened to RGB,
    downscaled when its longest side exceeds a quality-dependent limit, and
    re-encoded as JPEG. The document is then serialized to bytes and measured.

    Args:
        file: Uploaded PDF.
        quality: 10-100 scale; out-of-range values are clamped for both the
            JPEG quality and the downscale limit.

    Returns:
        JSONResponse with original_size, estimated_size, reduction_percent
        (never below 0) and the quality value as received.

    Raises:
        HTTPException: 500 carrying the error text when processing fails.
    """
    data = await file.read()
    original_size = len(data)
    validate_pdf_upload(data)

    # Use quality directly (10-100 scale)
    jpeg_quality = max(10, min(100, quality))
    # Derive the limit from the clamped value so an out-of-range quality
    # cannot yield a negative or huge dimension. Range: 1200-3000
    max_dim = int(1000 + (jpeg_quality / 100) * 2000)

    try:
        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            # replace_image() keeps the xref, so an image shared by several
            # pages only needs to be recompressed once.
            seen_xrefs = set()

            # Process ALL pages for accurate estimation
            for page_num in range(len(src_doc)):
                page = src_doc.load_page(page_num)

                for img_info in page.get_images(full=True):
                    xref = img_info[0]
                    if xref in seen_xrefs:
                        continue
                    seen_xrefs.add(xref)

                    try:
                        base_image = src_doc.extract_image(xref)
                        if not base_image or len(base_image["image"]) < 5000:
                            continue

                        img = Image.open(io.BytesIO(base_image["image"]))
                        if img.mode == 'P':
                            img = img.convert('RGBA')
                        if img.mode == 'RGBA':
                            # Flatten transparency onto white
                            background = Image.new('RGB', img.size, (255, 255, 255))
                            background.paste(img, mask=img.split()[3])
                            img = background
                        elif img.mode != 'RGB':
                            img = img.convert('RGB')

                        # Resize if larger than max_dim
                        if max(img.size) > max_dim:
                            ratio = max_dim / max(img.size)
                            new_size = (int(img.size[0] * ratio), int(img.size[1] * ratio))
                            img = img.resize(new_size, Image.Resampling.LANCZOS)

                        buffer = io.BytesIO()
                        img.save(buffer, format="JPEG", quality=jpeg_quality, optimize=True)

                        # Always replace to apply quality setting
                        page.replace_image(xref, stream=buffer.getvalue())

                    except Exception:
                        # Best effort: skip images that cannot be processed
                        continue

            # Get actual compressed size
            compressed_bytes = src_doc.tobytes(garbage=4, deflate=True, clean=True)
        finally:
            # Release the document even when processing fails
            src_doc.close()

        estimated_size = len(compressed_bytes)

        reduction = ((original_size - estimated_size) / original_size) * 100 if original_size > 0 else 0

        return JSONResponse({
            "original_size": original_size,
            "estimated_size": estimated_size,
            "reduction_percent": round(max(0, reduction), 1),
            "quality": quality
        })

    except Exception as e:
        logger.exception("Estimate compress PDF failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.get("/api/rembg-status")
async def api_rembg_status():
    """Report whether rembg can be used.

    If rembg has not been loaded yet, an import is attempted and its outcome
    stored in the module globals before answering.

    Returns:
        Dict of the form {"available": bool}.
    """
    global REMBG_AVAILABLE, rembg_remove

    needs_probe = rembg_remove is None and not REMBG_AVAILABLE
    if needs_probe:
        try:
            from rembg import remove as _loaded_remove
        except Exception:
            REMBG_AVAILABLE = False
        else:
            rembg_remove = _loaded_remove
            REMBG_AVAILABLE = True

    return {"available": REMBG_AVAILABLE}


# =============== Preview Endpoints ===============

def image_to_base64(img: Image.Image, format: str = "PNG", quality: int = 95) -> str:
    """Convert PIL Image to base64 string.

    Args:
        img: Image to encode.
        format: Pillow format name, e.g. "PNG", "JPEG" or "WEBP".
        quality: Encoder quality; applied to JPEG and WEBP only.

    Returns:
        The encoded image bytes as a base64 ASCII string (no data-URI prefix).
    """
    import base64
    buffer = io.BytesIO()
    save_kwargs = {}
    if format == "JPEG":
        # JPEG has no alpha/palette support; flatten such modes to RGB
        if img.mode not in ('RGB', 'L', 'CMYK'):
            img = img.convert('RGB')
        save_kwargs['quality'] = quality
    elif format == "WEBP":
        save_kwargs['quality'] = quality
    # Only pass `quality` to encoders that use it; an explicit quality=None
    # is not a valid value for lossy encoders.
    img.save(buffer, format=format, **save_kwargs)
    return base64.b64encode(buffer.getvalue()).decode()


def prepare_preview_image(img: Image.Image, max_size: int = 1920) -> Image.Image:
    """Shrink an image for preview when its longest side exceeds ``max_size``.

    Images already within the limit are returned untouched. Larger ones are
    reduced with ``thumbnail`` (LANCZOS) to fit a ``max_size`` square; the
    same image object that was passed in is returned in both cases.
    """
    longest_side = max(img.size)
    if longest_side <= max_size:
        return img

    bounding_box = (max_size, max_size)
    img.thumbnail(bounding_box, Image.Resampling.LANCZOS)
    return img


def pdf_page_to_base64(pdf_bytes: bytes, page_num: int = 0, dpi: int = 200) -> str:
    """Convert PDF page to base64 PNG at high quality.

    Args:
        pdf_bytes: Raw PDF document.
        page_num: Zero-based index of the page to render.
        dpi: Render resolution; the page is scaled by ``dpi / 72``.

    Returns:
        The rendered page as a base64-encoded PNG string.
    """
    import base64
    doc = fitz.open(stream=pdf_bytes, filetype="pdf")
    try:
        page = doc.load_page(page_num)
        zoom = dpi / 72.0
        pix = page.get_pixmap(matrix=fitz.Matrix(zoom, zoom))
        png_bytes = pix.tobytes("png")
    finally:
        # Close the document even if the page index is invalid or rendering fails
        doc.close()
    return base64.b64encode(png_bytes).decode()


@app.post("/api/preview/compress-pdf")
async def api_preview_compress_pdf(
    file: UploadFile = File(...),
    quality: int = Form(60),
):
    """Preview PDF compression - returns original and compressed first page.

    Only the images on the first page are recompressed; the whole document is
    then serialized so its size can be reported.

    Args:
        file: Uploaded PDF.
        quality: 10-100 scale; out-of-range values are clamped for both the
            JPEG quality and the downscale limit.

    Returns:
        JSONResponse with base64 PNG renderings ("original", "processed") of
        the first page at 150 DPI plus original_size and processed_size.

    Raises:
        HTTPException: 500 carrying the error text when processing fails.
    """
    data = await file.read()
    validate_pdf_upload(data)

    jpeg_quality = max(10, min(100, quality))
    # Derive the limit from the clamped value so an out-of-range quality
    # cannot yield a negative or huge dimension. Range: 1200-3000
    max_dim = int(1000 + (jpeg_quality / 100) * 2000)

    try:
        # Get original first page (higher DPI for better quality)
        original_b64 = pdf_page_to_base64(data, 0, 150)

        # Compress PDF
        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            for page_num in range(min(1, len(src_doc))):  # Only process first page for preview
                page = src_doc.load_page(page_num)

                for img_info in page.get_images(full=True):
                    xref = img_info[0]
                    try:
                        base_image = src_doc.extract_image(xref)
                        if not base_image or len(base_image["image"]) < 5000:
                            continue

                        img = Image.open(io.BytesIO(base_image["image"]))
                        if img.mode == 'P':
                            img = img.convert('RGBA')
                        if img.mode == 'RGBA':
                            # Flatten transparency onto white
                            background = Image.new('RGB', img.size, (255, 255, 255))
                            background.paste(img, mask=img.split()[3])
                            img = background
                        elif img.mode != 'RGB':
                            img = img.convert('RGB')

                        # Resize if larger than max_dim
                        if max(img.size) > max_dim:
                            ratio = max_dim / max(img.size)
                            new_size = (int(img.size[0] * ratio), int(img.size[1] * ratio))
                            img = img.resize(new_size, Image.Resampling.LANCZOS)

                        buffer = io.BytesIO()
                        img.save(buffer, format="JPEG", quality=jpeg_quality, optimize=True)
                        # Always replace to apply quality setting
                        page.replace_image(xref, stream=buffer.getvalue())
                    except Exception:
                        # Best effort: skip images that cannot be processed
                        continue

            compressed_bytes = src_doc.tobytes(garbage=4, deflate=True, clean=True)
        finally:
            # Release the document even when processing fails
            src_doc.close()

        processed_b64 = pdf_page_to_base64(compressed_bytes, 0, 150)

        return JSONResponse({
            "original": original_b64,
            "processed": processed_b64,
            "original_size": len(data),
            "processed_size": len(compressed_bytes)
        })

    except Exception as e:
        logger.exception("Compress preview failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/preview/rotate-pdf")
async def api_preview_rotate_pdf(
    file: UploadFile = File(...),
    rotation: int = Form(90),
):
    """Preview PDF rotation - returns original and rotated first page.

    Args:
        file: Uploaded PDF.
        rotation: Degrees to add to the first page's current rotation. The
            value is reduced modulo 360; anything other than 90, 180 or 270
            falls back to 90.

    Returns:
        JSONResponse with base64 PNG renderings ("original", "processed") of
        the first page at 150 DPI.

    Raises:
        HTTPException: 500 carrying the error text when processing fails.
    """
    data = await file.read()
    validate_pdf_upload(data)

    rotation = int(rotation) % 360
    if rotation not in [90, 180, 270]:
        rotation = 90

    try:
        original_b64 = pdf_page_to_base64(data, 0, 150)

        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            page = src_doc.load_page(0)
            page.set_rotation(page.rotation + rotation)
            rotated_bytes = src_doc.tobytes()
        finally:
            # Release the document even when rotation or serialization fails
            src_doc.close()

        processed_b64 = pdf_page_to_base64(rotated_bytes, 0, 150)

        return JSONResponse({
            "original": original_b64,
            "processed": processed_b64
        })

    except Exception as e:
        logger.exception("Rotate preview failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/preview/page-numbers")
async def api_preview_page_numbers(
    file: UploadFile = File(...),
    position: str = Form("bottom-center"),
    format: str = Form("Page {n} of {total}"),
    start_number: int = Form(1),
    font_size: int = Form(11),
):
    """Preview page numbers - returns original and numbered first page.

    Args:
        file: Uploaded PDF.
        position: top-left, top-center, top-right, bottom-left, bottom-center
            or bottom-right; unknown values use bottom-center.
        format: Label template; "{n}" is replaced by ``start_number`` and
            "{total}" by the document's page count.
        start_number: Number shown on the first page.
        font_size: Font size of the label.

    Returns:
        JSONResponse with base64 PNG renderings ("original", "processed") of
        the first page at 150 DPI.

    Raises:
        HTTPException: 500 carrying the error text when processing fails.
    """
    data = await file.read()
    validate_pdf_upload(data)

    positions = {
        "top-left": ("left", "top"),
        "top-center": ("center", "top"),
        "top-right": ("right", "top"),
        "bottom-left": ("left", "bottom"),
        "bottom-center": ("center", "bottom"),
        "bottom-right": ("right", "bottom"),
    }
    h_align, v_align = positions.get(position, ("center", "bottom"))
    margin = 30  # distance from the page edge, in page units

    try:
        original_b64 = pdf_page_to_base64(data, 0, 150)

        src_doc = fitz.open(stream=data, filetype="pdf")
        try:
            total_pages = len(src_doc)
            page = src_doc.load_page(0)
            rect = page.rect

            text = format.replace("{n}", str(start_number)).replace("{total}", str(total_pages))
            text_width = fitz.get_text_length(text, fontsize=font_size)

            if h_align == "left":
                x = margin
            elif h_align == "right":
                x = rect.width - margin - text_width
            else:
                x = (rect.width - text_width) / 2

            # For "top" the insertion point is moved down by the font size
            if v_align == "top":
                y = margin + font_size
            else:
                y = rect.height - margin

            page.insert_text((x, y), text, fontsize=font_size, color=(0.3, 0.3, 0.3))

            numbered_bytes = src_doc.tobytes()
        finally:
            # Release the document even when drawing or serialization fails
            src_doc.close()

        processed_b64 = pdf_page_to_base64(numbered_bytes, 0, 150)

        return JSONResponse({
            "original": original_b64,
            "processed": processed_b64
        })

    except Exception as e:
        logger.exception("Page numbers preview failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/preview/remove-background")
async def api_preview_remove_background(
    file: UploadFile = File(...),
):
    """Preview background removal - returns original and processed image in HD quality.

    The ``rembg`` import is attempted lazily on the first request that finds
    neither the cached callable nor the availability flag set. The result is
    stored in the module-level ``rembg_remove`` / ``REMBG_AVAILABLE`` globals.

    Returns:
        JSONResponse with ``original`` and ``processed`` entries, both
        produced by ``image_to_base64`` with the PNG format.

    Raises:
        HTTPException: 500 when rembg cannot be used, or when opening or
            processing the image fails.
    """
    global REMBG_AVAILABLE, rembg_remove

    needs_lazy_import = rembg_remove is None and not REMBG_AVAILABLE
    if needs_lazy_import:
        try:
            from rembg import remove as _remove
            rembg_remove = _remove
            REMBG_AVAILABLE = True
        except Exception:
            REMBG_AVAILABLE = False

    if rembg_remove is None or not REMBG_AVAILABLE:
        raise HTTPException(status_code=500, detail="rembg not installed")

    data = await file.read()

    try:
        source = prepare_preview_image(Image.open(io.BytesIO(data)))
        original_b64 = image_to_base64(source, "PNG")

        # rembg is handed PNG-encoded bytes of an RGB version of the image.
        if source.mode == 'RGB':
            rgb_source = source
        else:
            rgb_source = source.convert('RGB')
        png_buffer = io.BytesIO()
        rgb_source.save(png_buffer, format='PNG')
        cutout_bytes = rembg_remove(png_buffer.getvalue())

        cutout = Image.open(io.BytesIO(cutout_bytes))
        processed_b64 = image_to_base64(cutout, "PNG")

        payload = {
            "original": original_b64,
            "processed": processed_b64
        }
        return JSONResponse(payload)

    except Exception as e:
        logger.exception("Remove background preview failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/preview/enhance-image")
async def api_preview_enhance_image(
    file: UploadFile = File(...),
    level: str = Form("medium"),
    upscale: float = Form(1.0),
):
    """Preview image enhancement - returns original and enhanced image in HD quality.

    Args:
        file: Uploaded image.
        level: Enhancement level, forwarded unchanged to ``enhance_image``.
        upscale: Scale factor applied before enhancement. Only values above
            1.0 trigger a resize, and the factor is capped at 2.0.

    Returns:
        JSONResponse with ``original`` and ``processed`` entries, both
        encoded via ``image_to_base64`` as JPEG at quality 95.

    Raises:
        HTTPException: 500 carrying the error text if any step fails.
    """
    data = await file.read()

    try:
        preview = prepare_preview_image(Image.open(io.BytesIO(data)))
        original_b64 = image_to_base64(preview.convert('RGB'), "JPEG", 95)

        # Work on a copy so the image used for the "original" stays untouched.
        candidate = preview.copy()
        if upscale > 1.0:
            factor = min(upscale, 2.0)
            src_w, src_h = candidate.size
            candidate = candidate.resize(
                (int(src_w * factor), int(src_h * factor)),
                Image.Resampling.LANCZOS,
            )

        result = prepare_preview_image(enhance_image(candidate, level))
        processed_b64 = image_to_base64(result.convert('RGB'), "JPEG", 95)

        payload = {
            "original": original_b64,
            "processed": processed_b64
        }
        return JSONResponse(payload)

    except Exception as e:
        logger.exception("Enhance preview failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/preview/image-watermark")
async def api_preview_image_watermark(
    file: UploadFile = File(...),
    text: str = Form(""),
    position: str = Form("center"),
    opacity: int = Form(50),
    font_size: int = Form(36),
    color: str = Form("#000000"),
):
    """Preview image watermark - returns original and watermarked image in HD quality.

    Args:
        file: Uploaded image.
        text: Watermark text; must contain at least one non-whitespace
            character.
        position: One of ``top-left``, ``top-center``, ``top-right``,
            ``center``, ``bottom-left``, ``bottom-center``, ``bottom-right``.
            Unknown values fall back to ``center``.
        opacity: Watermark opacity as a percentage; the resulting alpha is
            clamped to the 0..255 range.
        font_size: Size requested for the ``arial.ttf`` font. If that font
            cannot be loaded, Pillow's default font is used instead.
        color: Hex color such as ``#RRGGBB``; the 3-digit ``#RGB`` shorthand
            is also accepted.

    Returns:
        JSONResponse with ``original`` and ``processed`` entries, both
        encoded via ``image_to_base64`` as JPEG at quality 95.

    Raises:
        HTTPException: 400 when the text is empty or the color cannot be
            parsed; 500 carrying the error text if image processing fails.
    """
    from PIL import ImageDraw, ImageFont

    data = await file.read()

    if not text.strip():
        raise HTTPException(status_code=400, detail="Watermark text required")

    # Parse the color before the broad try block below, so a malformed value
    # is reported as a client error instead of being rewrapped as a 500.
    color_hex = color.lstrip('#')
    if len(color_hex) == 3:
        # Expand CSS-style shorthand: "abc" -> "aabbcc".
        color_hex = "".join(ch * 2 for ch in color_hex)
    try:
        r, g, b = (int(color_hex[i:i + 2], 16) for i in (0, 2, 4))
    except ValueError:
        raise HTTPException(
            status_code=400,
            detail="Invalid color; expected a hex value like #RRGGBB",
        ) from None

    # Keep alpha inside the valid 8-bit range for out-of-range opacity values.
    alpha = max(0, min(255, int(255 * opacity / 100)))

    try:
        img = Image.open(io.BytesIO(data))
        img = prepare_preview_image(img)
        original_b64 = image_to_base64(img.convert('RGB'), "JPEG", 95)

        if img.mode != 'RGBA':
            img = img.convert('RGBA')

        # Draw onto a transparent overlay, then composite it over the image.
        watermark = Image.new('RGBA', img.size, (0, 0, 0, 0))
        draw = ImageDraw.Draw(watermark)

        try:
            font = ImageFont.truetype("arial.ttf", font_size)
        except Exception:
            # Best-effort fallback (font missing, bad size, no FreeType),
            # without swallowing BaseException as a bare except would.
            font = ImageFont.load_default()

        bbox = draw.textbbox((0, 0), text, font=font)
        text_width = bbox[2] - bbox[0]
        text_height = bbox[3] - bbox[1]

        # Top-left drawing origin for each named anchor, with a 20px inset.
        positions = {
            "top-left": (20, 20),
            "top-center": ((img.width - text_width) // 2, 20),
            "top-right": (img.width - text_width - 20, 20),
            "center": ((img.width - text_width) // 2, (img.height - text_height) // 2),
            "bottom-left": (20, img.height - text_height - 20),
            "bottom-center": ((img.width - text_width) // 2, img.height - text_height - 20),
            "bottom-right": (img.width - text_width - 20, img.height - text_height - 20),
        }

        pos = positions.get(position, positions["center"])
        draw.text(pos, text, font=font, fill=(r, g, b, alpha))

        result = Image.alpha_composite(img, watermark)
        processed_b64 = image_to_base64(result.convert('RGB'), "JPEG", 95)

        return JSONResponse({
            "original": original_b64,
            "processed": processed_b64
        })

    except Exception as e:
        logger.exception("Watermark preview failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/preview/resize-image")
async def api_preview_resize_image(
    file: UploadFile = File(...),
    preset: str = Form("custom"),
    width: int = Form(0),
    height: int = Form(0),
    maintain_aspect: bool = Form(True),
):
    """Preview image resize - returns original and resized image in HD quality.

    Args:
        file: Uploaded image.
        preset: Named target size (``thumbnail``, ``small``, ``medium``,
            ``hd``, ``fullhd``, ``4k``, ``square-sm``, ``square-lg``). Any
            other value, including ``custom``, uses ``width``/``height``.
        width: Custom target width; values <= 0 keep the original width.
        height: Custom target height; values <= 0 keep the original height.
        maintain_aspect: When true, the image is scaled uniformly to fit
            inside the target box instead of being stretched to it.

    Returns:
        JSONResponse with ``original`` and ``processed`` previews (JPEG at
        quality 95 via ``image_to_base64``), plus ``original_size`` and
        ``new_size`` as ``"WxH"`` strings.

    Raises:
        HTTPException: 500 carrying the error text if any step fails.
    """
    data = await file.read()

    presets = {
        "thumbnail": (150, 150),
        "small": (320, 240),
        "medium": (640, 480),
        "hd": (1280, 720),
        "fullhd": (1920, 1080),
        "4k": (3840, 2160),
        "square-sm": (500, 500),
        "square-lg": (1000, 1000),
    }

    try:
        img = Image.open(io.BytesIO(data))
        original_width, original_height = img.size

        # Original preview (HD quality)
        original_preview = prepare_preview_image(img.copy())
        original_b64 = image_to_base64(original_preview.convert('RGB'), "JPEG", 95)

        # Determine target size ("custom" is not a preset key, so it falls
        # through to the explicit width/height branch).
        if preset in presets:
            target_width, target_height = presets[preset]
        else:
            target_width = width if width > 0 else original_width
            target_height = height if height > 0 else original_height

        if maintain_aspect:
            ratio = min(target_width / original_width, target_height / original_height)
            # Floor at 1px: for extreme aspect ratios int() can truncate a
            # dimension to 0, which Image.resize rejects.
            target_width = max(1, int(original_width * ratio))
            target_height = max(1, int(original_height * ratio))

        # Resized preview (HD quality)
        resized = img.resize((target_width, target_height), Image.Resampling.LANCZOS)
        resized_preview = prepare_preview_image(resized)
        processed_b64 = image_to_base64(resized_preview.convert('RGB'), "JPEG", 95)

        return JSONResponse({
            "original": original_b64,
            "processed": processed_b64,
            "original_size": f"{original_width}x{original_height}",
            "new_size": f"{target_width}x{target_height}"
        })

    except Exception as e:
        logger.exception("Resize preview failed")
        raise HTTPException(status_code=500, detail=str(e))


@app.post("/api/preview/compress-image")
async def api_preview_compress_image(
    file: UploadFile = File(...),
    quality: int = Form(70),
):
    """Preview image compression - returns original and compressed image in HD quality.

    Args:
        file: Uploaded image.
        quality: JPEG quality passed to Pillow when re-encoding the preview.

    Returns:
        JSONResponse with ``original`` and ``processed`` previews (JPEG at
        quality 98 via ``image_to_base64``), ``original_size`` (byte length
        of the upload) and ``compressed_size`` (byte length of the
        re-encoded JPEG).

    Raises:
        HTTPException: 500 carrying the error text if any step fails.
    """
    data = await file.read()
    original_size = len(data)

    try:
        preview = prepare_preview_image(Image.open(io.BytesIO(data)))
        original_b64 = image_to_base64(preview.convert('RGB'), "JPEG", 98)

        # Re-encode at the requested quality; the source is converted to RGB first.
        rgb_preview = preview if preview.mode == 'RGB' else preview.convert('RGB')
        encoded = io.BytesIO()
        rgb_preview.save(encoded, format="JPEG", quality=quality, optimize=True)
        jpeg_bytes = encoded.getvalue()
        compressed_size = len(jpeg_bytes)

        # Decode the compressed bytes again for the "processed" preview.
        reloaded = Image.open(io.BytesIO(jpeg_bytes))
        processed_b64 = image_to_base64(reloaded, "JPEG", 98)

        payload = {
            "original": original_b64,
            "processed": processed_b64,
            "original_size": original_size,
            "compressed_size": compressed_size
        }
        return JSONResponse(payload)

    except Exception as e:
        logger.exception("Compress preview failed")
        raise HTTPException(status_code=500, detail=str(e))


# =============== Run Server ===============

if __name__ == "__main__":
    # uvicorn is imported only when this file is launched directly.
    import uvicorn

    # Listen on loopback port 8000; auto-reload follows the debug setting.
    server_options = {
        "host": "127.0.0.1",
        "port": 8000,
        "reload": settings.debug,
    }
    uvicorn.run("server:app", **server_options)