tw/image/perspective_fix.py

"""
透视矫正三步流程：
  Step1: Gemini 去背景 → 纯白背景
  Step2: OpenCV 在白背景图上检测四角 → warpPerspective 展平
  Step3: Gemini 对展平结果做高清增强

用法：
  python perspective_fix.py <图片路径或URL> [--debug] [--skip-step1] [--skip-step3]
"""
import sys, io
sys.stdout = io.TextIOWrapper(sys.stdout.buffer, encoding="utf-8", errors="replace")
sys.stderr = io.TextIOWrapper(sys.stderr.buffer, encoding="utf-8", errors="replace")

import os, asyncio, uuid, tempfile
import numpy as np
import cv2
from dotenv import load_dotenv

load_dotenv()

_OUTPUT_DIR = os.getenv("RESULT_IMAGE_DIR", "results")
os.makedirs(_OUTPUT_DIR, exist_ok=True)

# ═══════════════════════════════════════════════════════════════
# Gemini 辅助函数
# ═══════════════════════════════════════════════════════════════

async def _gemini_call(input_path: str, output_path: str, prompt: str,
                       aspect_ratio: str = "1:1", label: str = "") -> bool:
    from services.service_gemini import GeminiExtractV2Service
    service = GeminiExtractV2Service()
    try:
        ok, msg, _ = await service.extract_pattern(
            input_path=input_path,
            output_path=output_path,
            custom_prompt=prompt,
            aspect_ratio=aspect_ratio,
        )
        status = "成功" if ok else "失败"
        print(f"  [{label}] Gemini {status}: {msg[:80]}")
        return ok and os.path.exists(output_path)
    except Exception as e:
        print(f"  [{label}] Gemini 异常: {e}")
        return False
    finally:
        await service.cleanup()


PROMPT_WHITE_BG = (
    "请处理这张图片：\n"
    "1. 识别图中的地毯/地垫/印花布料/产品本体作为主体\n"
    "2. 去掉主体上面放置的所有物品（杯子、碗、餐具、装饰品等），只保留地垫本身\n"
    "3. 把所有背景（桌面、地板、墙壁、阴影）全部替换为纯白色(#FFFFFF)\n"
    "4. 保持地垫/产品的颜色、图案、边缘完全不变\n"
    "输出：只有主体产品、纯白背景、无杂物的干净产品图。"
)

# 当第一次去背景效果不好时（白色覆盖率过低），用更强硬的提示词重试
PROMPT_WHITE_BG_STRONG = (
    "严格执行：将这张图的背景彻底替换为纯白色 RGB(255,255,255)。\n"
    "只保留图片中央的产品/地毯/布料主体，其他所有区域（桌面/地板/墙/阴影/物品）"
    "一律改为纯白色。产品边缘要干净锐利，不留任何半透明或灰色区域。\n"
    "重要：不论主体上摆放了什么东西，统统去掉，只输出产品本身+白色背景。"
)

PROMPT_ENHANCE = (
    "请对这张已展平的图案进行高清增强：提升整体清晰度和色彩饱和度，"
    "修复边缘锯齿，补全缺失细节，输出印刷级高质量平面图，背景保持纯白。"
)

# Step3 增强失败时的兜底提示词（更简单，成功率更高）
PROMPT_ENHANCE_SIMPLE = (
    "请提升这张图片的清晰度和画质，输出高清版本，背景保持纯白。"
)


def _measure_white_coverage(image: np.ndarray) -> float:
    """返回图片中白色像素的百分比，用于判断去背景效果"""
    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)
    _, mask = cv2.threshold(gray, 245, 255, cv2.THRESH_BINARY)
    return float(np.sum(mask == 255)) / mask.size


def _color_match(source: np.ndarray, target: np.ndarray,
                 strength: float = 0.75, exclude_white: bool = True) -> np.ndarray:
    """
    将 target 的色调匹配到 source（类 PS「匹配颜色」）。
    使用 LAB 色彩空间 Reinhard 均值/标准差迁移。

    Args:
        source:        原图（色彩参考来源）
        target:        待调整图（处理后结果）
        strength:      迁移强度 0.0-1.0，推荐 0.6-0.85
        exclude_white: 统计时排除白色像素，避免背景影响肤色/图案计算
    Returns:
        调色后的 BGR 图像
    """
    src_f = source.astype(np.float32) / 255.0
    tgt_f = target.astype(np.float32) / 255.0

    src_lab = cv2.cvtColor(src_f, cv2.COLOR_BGR2Lab)
    tgt_lab = cv2.cvtColor(tgt_f, cv2.COLOR_BGR2Lab)
    result  = tgt_lab.copy()

    for ch in range(3):
        if exclude_white:
            # 排除极亮像素（L > 95）统计，只看图案区域
            src_mask = src_lab[:, :, 0] < 95
            tgt_mask = tgt_lab[:, :, 0] < 95
            src_vals = src_lab[:, :, ch][src_mask]
            tgt_vals = tgt_lab[:, :, ch][tgt_mask]
        else:
            src_vals = src_lab[:, :, ch].ravel()
            tgt_vals = tgt_lab[:, :, ch].ravel()

        if src_vals.size == 0 or tgt_vals.size == 0:
            continue

        src_mean, src_std = float(src_vals.mean()), float(src_vals.std())
        tgt_mean, tgt_std = float(tgt_vals.mean()), float(tgt_vals.std())

        if tgt_std < 1e-6:
            continue

        # Reinhard 迁移：先归一化到目标，再重映射到源分布
        shifted = (tgt_lab[:, :, ch] - tgt_mean) / tgt_std * src_std + src_mean
        # 按 strength 混合：strength=1 完全迁移，0 保持不变
        result[:, :, ch] = shifted * strength + tgt_lab[:, :, ch] * (1.0 - strength)

    result_bgr = cv2.cvtColor(result, cv2.COLOR_Lab2BGR)
    result_bgr = np.clip(result_bgr * 255, 0, 255).astype(np.uint8)

    print(f"  [颜色匹配] 强度={strength:.0%} | "
          f"源均值L={src_lab[:,:,0].mean():.1f} → 目标均值L={tgt_lab[:,:,0].mean():.1f}")
    return result_bgr


# ═══════════════════════════════════════════════════════════════
# OpenCV 透视矫正
# ═══════════════════════════════════════════════════════════════

def order_points(pts: np.ndarray) -> np.ndarray:
    """
    把四个点排列为 [左上, 右上, 右下, 左下]。
    使用质心角度排序，对矩形、菱形、平行四边形等各种透视形状均适用。
    """
    cx, cy = pts[:, 0].mean(), pts[:, 1].mean()
    # 计算每个点相对质心的角度（从正上方顺时针）
    angles = np.arctan2(pts[:, 1] - cy, pts[:, 0] - cx)
    # 顺时针排序：从右上开始（角度最小的）
    order = np.argsort(angles)
    sorted_pts = pts[order]
    # 找到最左上角作为起点（x+y 最小）
    s = sorted_pts.sum(axis=1)
    start = np.argmin(s)
    # 从左上角开始顺时针排列 → [左上, 右上, 右下, 左下]
    indices = [(start + i) % 4 for i in range(4)]
    rect = sorted_pts[indices].astype("float32")
    return rect


def four_point_transform(image: np.ndarray, pts: np.ndarray) -> np.ndarray:
    rect = order_points(pts)
    tl, tr, br, bl = rect

    w1 = np.linalg.norm(br - bl)
    w2 = np.linalg.norm(tr - tl)
    h1 = np.linalg.norm(tr - br)
    h2 = np.linalg.norm(tl - bl)
    W = int(max(w1, w2))
    H = int(max(h1, h2))

    print(f"  [CV] 角点: TL={tl.astype(int)} TR={tr.astype(int)} BR={br.astype(int)} BL={bl.astype(int)}")
    print(f"  [CV] 矫正后目标尺寸: {W}x{H}")

    dst = np.array([
        [0,     0    ],
        [W - 1, 0    ],
        [W - 1, H - 1],
        [0,     H - 1],
    ], dtype="float32")

    M = cv2.getPerspectiveTransform(rect, dst)
    warped = cv2.warpPerspective(
        image, M, (W, H),
        flags=cv2.INTER_LANCZOS4,
        borderMode=cv2.BORDER_CONSTANT,
        borderValue=(255, 255, 255),
    )
    return warped


def _detect_bg_color(image: np.ndarray, corner_size: int = 24) -> np.ndarray:
    """
    从图片四个角落采样，估计背景颜色（BGR）。
    适用于白色、米色、黄色、灰色等各种背景。
    """
    H, W = image.shape[:2]
    cs = min(corner_size, H // 5, W // 5)
    corners = [
        image[:cs, :cs],        # 左上
        image[:cs, W-cs:],      # 右上
        image[H-cs:, :cs],      # 左下
        image[H-cs:, W-cs:],    # 右下
    ]
    pixels = np.concatenate([c.reshape(-1, 3) for c in corners], axis=0)
    bg = np.median(pixels, axis=0).astype(np.uint8)
    return bg  # BGR


def tool_trim_white_border(image: np.ndarray,
                           tolerance: int = 18,
                           bg_ratio: float = 0.90,
                           padding: int = 4) -> tuple[np.ndarray, bool, dict]:
    """
    【Tool】智能背景边裁切（支持任意背景色：白/黄/米/灰等）。

    算法：
    1. 从四角采样估计背景色
    2. 逐行/列扫描：若该行/列中 bg_ratio 以上的像素与背景色差异 <= tolerance，则为背景行/列
    3. 找到内容区域边界后裁切

    Returns:
        (裁切后图片, 是否裁切, 详情dict)
    """
    H, W = image.shape[:2]
    bg_color = _detect_bg_color(image)
    img_f = image.astype(np.int32)

    # 每个像素与背景色的最大通道差异
    diff = np.abs(img_f - bg_color.astype(np.int32)).max(axis=2)  # H x W
    is_bg = diff <= tolerance  # True = 接近背景色

    row_bg_ratio = is_bg.mean(axis=1)   # 每行的背景像素占比
    col_bg_ratio = is_bg.mean(axis=0)   # 每列的背景像素占比

    top    = next((i for i in range(H)        if row_bg_ratio[i] < bg_ratio), H)
    bottom = next((i for i in range(H-1,-1,-1) if row_bg_ratio[i] < bg_ratio), -1) + 1
    left   = next((i for i in range(W)        if col_bg_ratio[i] < bg_ratio), W)
    right  = next((i for i in range(W-1,-1,-1) if col_bg_ratio[i] < bg_ratio), -1) + 1

    border_top    = top
    border_bottom = H - bottom
    border_left   = left
    border_right  = W - right
    max_border    = max(border_top, border_bottom, border_left, border_right)

    bg_hex = "#{:02X}{:02X}{:02X}".format(int(bg_color[2]), int(bg_color[1]), int(bg_color[0]))
    info   = {"top": border_top, "bottom": border_bottom,
              "left": border_left, "right": border_right, "bg_color": bg_hex}

    if max_border < 5:
        print(f"  [裁边] 背景色{bg_hex} | 上{border_top} 下{border_bottom} 左{border_left} 右{border_right}px → 无需裁切")
        return image, False, info

    y1 = max(0, top    - padding)
    y2 = min(H, bottom + padding)
    x1 = max(0, left   - padding)
    x2 = min(W, right  + padding)
    cropped = image[y1:y2, x1:x2]
    ch, cw = cropped.shape[:2]
    print(f"  [裁边] 背景色{bg_hex} | 上{border_top} 下{border_bottom} 左{border_left} 右{border_right}px → 裁切 {W}x{H}→{cw}x{ch}")
    return cropped, True, info


async def tool_color_match(orig_img: np.ndarray, result_img: np.ndarray,
                           strength: float = 0.75) -> np.ndarray:
    """【Tool】颜色匹配（封装版，供 AI 决策层调用）"""
    return _color_match(orig_img, result_img, strength=strength)


async def ai_decide_postprocess(orig_img: np.ndarray, result_img: np.ndarray) -> dict:
    """
    【AI 决策层】用视觉模型分析出图效果，决定是否需要颜色匹配和白边裁切。

    Returns:
        {
            "need_color_match": bool,
            "color_strength":   float,   # 0.5-0.9
            "need_trim":        bool,
            "reason":           str,
        }
    """
    import base64
    from dotenv import load_dotenv
    load_dotenv()
    api_key  = os.getenv("OPENAI_API_KEY")
    base_url = os.getenv("OPENAI_BASE_URL")
    model    = os.getenv("VISION_MODEL", "glm-4v-flash")

    # 无 API 时默认两个都做
    if not api_key:
        return {"need_color_match": True, "color_strength": 0.75,
                "need_trim": True, "reason": "无API Key，默认执行"}

    def _encode(img: np.ndarray) -> str:
        resized = cv2.resize(img, (512, 512))
        _, buf = cv2.imencode(".jpg", resized, [cv2.IMWRITE_JPEG_QUALITY, 80])
        return base64.b64encode(buf).decode()

    orig_b64   = _encode(orig_img)
    result_b64 = _encode(result_img)

    prompt = (
        "你是图片后处理决策助手。图一是原图，图二是AI处理后的结果图。请判断：\n\n"
        "【问题1】颜色差异：处理后图片的整体色调与原图相比，差异是否明显？\n"
        "（明显=色调/饱和度/冷暖差异很大；轻微=有轻微偏差；无=颜色基本一致）\n\n"
        "【问题2】多余边框：处理后图片四周是否有不属于图案内容的多余空白边框？\n"
        "注意：边框颜色不一定是白色，也可能是黄色、米色、灰色等任何纯色。\n"
        "判断标准：图案内容的外围是否有一圈明显的纯色空白带。\n\n"
        "严格按格式回答（每行一个字段，不要多余内容）：\n"
        "颜色差异: <明显|轻微|无>\n"
        "多余边框: <有|无>\n"
        "边框位置: <有边框的方向如「上下」，没有则填无>"
    )

    try:
        from openai import AsyncOpenAI
        client = AsyncOpenAI(base_url=base_url, api_key=api_key)
        response = await client.chat.completions.create(
            model=model,
            messages=[{
                "role": "user",
                "content": [
                    {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{orig_b64}"}},
                    {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{result_b64}"}},
                    {"type": "text", "text": prompt},
                ],
            }],
        )
        text = response.choices[0].message.content or ""
        print(f"  [AI决策] 原始回答: {text.strip()[:120]}")

        def _get(key):
            for line in text.splitlines():
                line = line.strip()
                if line.startswith(key):
                    return line.split(":", 1)[-1].strip()
            return ""

        color_level = _get("颜色差异")
        has_border  = "有" in _get("多余边框")
        border_pos  = _get("边框位置")

        strength_map = {"明显": 0.80, "轻微": 0.55, "无": 0.0}
        color_strength = strength_map.get(color_level, 0.75)
        need_color = color_strength > 0

        reason = f"颜色差异={color_level or '?'}, 边框={'有('+border_pos+')' if has_border else '无'}"
        print(f"  [AI决策] {reason} → 颜色匹配={'✓' if need_color else '✗'}(强度{color_strength:.0%}), 裁边={'✓' if has_border else '✗'}")

        return {
            "need_color_match": need_color,
            "color_strength":   color_strength,
            "need_trim":        has_border,
            "reason":           reason,
        }

    except Exception as e:
        print(f"  [AI决策] 调用失败({e})，默认执行颜色匹配+裁边")
        return {"need_color_match": True, "color_strength": 0.75,
                "need_trim": True, "reason": f"AI决策失败: {e}"}


def _points_are_unique(pts: np.ndarray, min_dist: float = 20.0) -> bool:
    """检查4个角点两两之间距离都大于 min_dist，防止重复点导致退化变换"""
    for i in range(len(pts)):
        for j in range(i + 1, len(pts)):
            if np.linalg.norm(pts[i] - pts[j]) < min_dist:
                return False
    return True


def find_quad(image: np.ndarray):
    """
    在白背景图上检测主体四边形角点。
    策略（按优先级）：
      1. 二值化 + approxPolyDP（epsilon 从小到大尝试）
      2. 凸包取极值四点（最左/最右/最上/最下）
      3. minAreaRect 四角
    """
    h, w = image.shape[:2]
    img_area = h * w
    gray = cv2.cvtColor(image, cv2.COLOR_BGR2GRAY)

    # ── 获取主体轮廓 ──────────────────────────────────────────
    _, thresh = cv2.threshold(gray, 245, 255, cv2.THRESH_BINARY_INV)
    kernel = cv2.getStructuringElement(cv2.MORPH_RECT, (20, 20))
    closed = cv2.morphologyEx(thresh, cv2.MORPH_CLOSE, kernel)

    cnts, _ = cv2.findContours(closed, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)
    if not cnts:
        edges = cv2.Canny(gray, 30, 100)
        k2 = cv2.getStructuringElement(cv2.MORPH_RECT, (10, 10))
        closed = cv2.morphologyEx(edges, cv2.MORPH_CLOSE, k2)
        cnts, _ = cv2.findContours(closed, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE)

    if not cnts:
        print("  [CV] 无法检测轮廓")
        return None

    c = max(cnts, key=cv2.contourArea)
    area = cv2.contourArea(c)
    print(f"  [CV] 主体轮廓面积: {area:.0f} / {img_area} ({area/img_area*100:.1f}%)")
    if area < img_area * 0.05:
        print("  [CV] 面积太小，背景可能去除不完全")
        return None

    peri = cv2.arcLength(c, True)

    # ── 策略1：approxPolyDP，epsilon 逐步放大直到得到4个唯一角点 ──
    for eps_ratio in [0.02, 0.03, 0.04, 0.05, 0.06]:
        approx = cv2.approxPolyDP(c, eps_ratio * peri, True)
        pts = approx.reshape(-1, 2).astype("float32")
        if len(pts) == 4 and _points_are_unique(pts):
            print(f"  [CV] approxPolyDP 成功 (eps={eps_ratio}), 4个唯一角点")
            return pts
        print(f"  [CV] approxPolyDP eps={eps_ratio}: {len(pts)} 顶点，唯一={_points_are_unique(pts) if len(pts)==4 else 'N/A'}")

    # ── 策略2：凸包极值四点（最左/最上/最右/最下）─────────────
    hull = cv2.convexHull(c).reshape(-1, 2).astype("float32")
    if len(hull) >= 4:
        # 取4个极值方向的点
        left   = hull[np.argmin(hull[:, 0])]    # 最左
        right  = hull[np.argmax(hull[:, 0])]    # 最右
        top    = hull[np.argmin(hull[:, 1])]    # 最上
        bottom = hull[np.argmax(hull[:, 1])]    # 最下
        pts = np.array([left, top, right, bottom], dtype="float32")
        if _points_are_unique(pts):
            print(f"  [CV] 使用凸包极值四点: L={left.astype(int)} T={top.astype(int)} R={right.astype(int)} B={bottom.astype(int)}")
            return pts

    # ── 策略3：minAreaRect 四角（兜底）─────────────────────────
    print(f"  [CV] 兜底：使用 minAreaRect")
    rect = cv2.minAreaRect(c)
    box = cv2.boxPoints(rect).astype("float32")
    return box


def save_debug_img(image: np.ndarray, pts, path: str):
    """保存带角点标注的调试图"""
    dbg = image.copy()
    if pts is not None:
        rect = order_points(pts)
        labels = ["TL", "TR", "BR", "BL"]
        colors = [(0,0,255), (0,255,0), (255,0,0), (0,165,255)]
        for i, (px, py) in enumerate(rect):
            cv2.circle(dbg, (int(px), int(py)), 12, colors[i], -1)
            cv2.putText(dbg, labels[i], (int(px)+15, int(py)),
                        cv2.FONT_HERSHEY_SIMPLEX, 1.2, colors[i], 3)
        box = rect.reshape((-1,1,2)).astype(np.int32)
        cv2.polylines(dbg, [box], True, (0,0,255), 3)
    cv2.imwrite(path, dbg, [cv2.IMWRITE_JPEG_QUALITY, 90])
    print(f"  [Debug] 调试图: {path}")


# ═══════════════════════════════════════════════════════════════
# 主流程
# ═══════════════════════════════════════════════════════════════

async def process(src: str, debug: bool = False,
                  skip_step1: bool = False, skip_step3: bool = False) -> str | None:
    uid = uuid.uuid4().hex
    tmp = []  # 临时文件列表，最后统一清理

    # ── 下载（URL 情况）──────────────────────────────────────
    if src.startswith("http"):
        import aiohttp
        dl = os.path.join(tempfile.gettempdir(), f"pfix_dl_{uid}.jpg")
        tmp.append(dl)
        print("[下载] 原图中...")
        async with aiohttp.ClientSession(headers={
            "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64)",
            "Referer": "https://www.taobao.com/",
        }) as sess:
            async with sess.get(src, timeout=aiohttp.ClientTimeout(total=30)) as r:
                if r.status != 200:
                    print(f"[下载] 失败: HTTP {r.status}")
                    return None
                with open(dl, "wb") as f:
                    f.write(await r.read())
        local_src = dl
    else:
        local_src = src

    current  = local_src  # 当前处理中的文件
    orig_img = cv2.imread(local_src)  # 保留原图用于颜色匹配
    # 记录原图宽高比，用于检测 Gemini 旋转问题
    orig_ratio = (orig_img.shape[1] / orig_img.shape[0]) if orig_img is not None else 1.0

    try:
        # ── Step 1: Gemini 去背景 → 白背景 ──────────────────
        if not skip_step1:
            print("\n" + "─"*50)
            print("Step 1 / 3  |  Gemini 去背景 → 白色背景")
            print("─"*50)
            s1_out = os.path.join(tempfile.gettempdir(), f"pfix_s1_{uid}.jpg")
            tmp.append(s1_out)
            ok = await _gemini_call(current, s1_out, PROMPT_WHITE_BG,
                                    aspect_ratio="auto", label="去背景")
            if ok:
                # 检查白色覆盖率，判断背景去除是否充分
                s1_img = cv2.imread(s1_out)
                white_pct = _measure_white_coverage(s1_img) if s1_img is not None else 0.0
                print(f"  [去背景] 白色覆盖率: {white_pct:.1%}", end="")
                if white_pct < 0.20:
                    # 背景去除太差，用强化提示词重试
                    print(" → 太低，强化提示词重试...")
                    s1_retry = os.path.join(tempfile.gettempdir(), f"pfix_s1r_{uid}.jpg")
                    tmp.append(s1_retry)
                    ok2 = await _gemini_call(current, s1_retry, PROMPT_WHITE_BG_STRONG,
                                            aspect_ratio="auto", label="去背景(强化)")
                    if ok2:
                        r_img = cv2.imread(s1_retry)
                        retry_pct = _measure_white_coverage(r_img) if r_img is not None else 0.0
                        print(f"  [去背景] 重试白色覆盖率: {retry_pct:.1%}", end="")
                        if retry_pct >= white_pct:
                            print(" → 效果更好，采用重试结果")
                            current = s1_retry
                        else:
                            print(" → 效果未提升，保留首次结果")
                            current = s1_out
                    else:
                        print("  [去背景] 重试失败，保留首次结果")
                        current = s1_out
                else:
                    print(" → 合格")
                    current = s1_out
            else:
                print("  Step1 失败，用原图继续")
        else:
            print("\n[跳过 Step1] 直接用原图")

        # ── Step 2: OpenCV 在白背景图上检测+透视矫正 ─────────
        print("\n" + "─"*50)
        print("Step 2 / 3  |  OpenCV 轮廓检测 + 透视矫正")
        print("─"*50)
        img = cv2.imread(current)
        if img is None:
            print(f"  无法读取: {current}")
            return None

        h, w = img.shape[:2]
        print(f"  输入尺寸: {w}x{h}")
        pts = find_quad(img)

        if debug:
            dbg_path = os.path.join(_OUTPUT_DIR, f"debug_{uid}.jpg")
            save_debug_img(img, pts, dbg_path)

        if pts is not None:
            warped = four_point_transform(img, pts)

            # ── 方向校正：Gemini 可能把图旋转 90°，需要纠正 ──
            wh2, ww2 = warped.shape[:2]
            warped_ratio = ww2 / wh2  # 宽/高
            # 若原图横竖方向与矫正结果相反（比例差异超过 1.5 倍），旋转 90°
            if orig_ratio > 1.0 and warped_ratio < 1.0 / 1.5:
                # 原图横，结果竖 → 顺时针转 90°
                warped = cv2.rotate(warped, cv2.ROTATE_90_CLOCKWISE)
                print(f"  [方向校正] 原图横({orig_ratio:.2f}) vs 矫正竖({warped_ratio:.2f}) → 旋转90°")
            elif orig_ratio < 1.0 and warped_ratio > 1.5:
                # 原图竖，结果横 → 逆时针转 90°
                warped = cv2.rotate(warped, cv2.ROTATE_90_COUNTERCLOCKWISE)
                print(f"  [方向校正] 原图竖({orig_ratio:.2f}) vs 矫正横({warped_ratio:.2f}) → 旋转-90°")
            else:
                print(f"  [方向校正] 方向一致，无需旋转 (原图比例={orig_ratio:.2f}, 矫正比例={warped_ratio:.2f})")

            s2_out = os.path.join(tempfile.gettempdir(), f"pfix_s2_{uid}.jpg")
            tmp.append(s2_out)
            cv2.imwrite(s2_out, warped, [cv2.IMWRITE_JPEG_QUALITY, 95])
            current = s2_out
            wh2, ww2 = warped.shape[:2]
            print(f"  透视矫正完成 → {ww2}x{wh2}")
        else:
            print("  角点检测失败，跳过透视矫正，继续用白背景图")

        # ── Step 3: Qwen 高清增强 ─────────────────────────────
        if not skip_step3:
            print("\n" + "─"*50)
            print("Step 3 / 5  |  Qwen 高清增强（RunningHub）")
            print("─"*50)
            final_out = os.path.join(_OUTPUT_DIR, f"pfix_final_{uid}.jpg")
            from services.service_qwen import 清晰化_api
            ok = await 清晰化_api(img_path=current, save_path=final_out)
            if ok:
                print(f"  [高清增强] Qwen 成功")
            else:
                # Qwen 失败，用 Gemini 简化提示词兜底
                print("  Qwen 失败，Gemini 兜底重试...")
                ok = await _gemini_call(current, final_out, PROMPT_ENHANCE_SIMPLE,
                                        aspect_ratio="auto", label="高清增强(Gemini兜底)")
            if not ok:
                print("  Step3 全部失败，直接保存矫正结果")
                import shutil
                shutil.copy2(current, final_out)
        else:
            final_out = os.path.join(_OUTPUT_DIR, f"pfix_final_{uid}.jpg")
            import shutil
            shutil.copy2(current, final_out)
            print("\n[跳过 Step3] 直接保存矫正结果")

        # ── Step 4: AI 决策 + 后处理（颜色匹配 & 白边裁切）────
        print("\n" + "─"*50)
        print("Step 4 / 4  |  AI 决策后处理（颜色匹配 / 白边裁切）")
        print("─"*50)
        final_img = cv2.imread(final_out)
        if final_img is not None and orig_img is not None:
            decision = await ai_decide_postprocess(orig_img, final_img)

            # Tool 1: 颜色匹配
            if decision["need_color_match"]:
                final_img = await tool_color_match(orig_img, final_img,
                                                   strength=decision["color_strength"])
                cv2.imwrite(final_out, final_img, [cv2.IMWRITE_JPEG_QUALITY, 95])
            else:
                print("  [颜色匹配] AI 判断无需调色，跳过")

            # Tool 2: 白边裁切
            if decision["need_trim"]:
                trimmed, did_trim, _ = tool_trim_white_border(final_img)
                if did_trim:
                    cv2.imwrite(final_out, trimmed, [cv2.IMWRITE_JPEG_QUALITY, 95])
            else:
                print("  [裁边] AI 判断无白边，跳过")
        else:
            print("  [Step4] 图片读取失败，跳过后处理")

        size_kb = os.path.getsize(final_out) / 1024
        print(f"\n{'='*50}")
        print(f"  完成！输出文件: {final_out}")
        print(f"  文件大小: {size_kb:.0f} KB")
        print(f"{'='*50}")
        return final_out

    finally:
        for f in tmp:
            if os.path.exists(f):
                os.remove(f)


if __name__ == "__main__":
    if len(sys.argv) < 2:
        print("用法: python perspective_fix.py <图片路径或URL> [--debug] [--skip-step1] [--skip-step3]")
        sys.exit(1)

    src_arg      = sys.argv[1]
    debug_arg    = "--debug"      in sys.argv
    skip1_arg    = "--skip-step1" in sys.argv
    skip3_arg    = "--skip-step3" in sys.argv
    asyncio.run(process(src_arg, debug=debug_arg, skip_step1=skip1_arg, skip_step3=skip3_arg))