import os
import io
import json
import time
import uuid
import random
import tempfile
import zipfile
from dataclasses import dataclass, asdict
from typing import Any, Dict, List, Optional, Tuple

import numpy as np
import torch
import gradio as gr
import spaces

from PIL import Image
from pptx import Presentation
from diffusers import QwenImageLayeredPipeline

from huggingface_hub import HfApi, login
from huggingface_hub.utils import HfHubHTTPError


# Scratch directory path. NOTE(review): not referenced in the visible part of
# this file — confirm it is still needed.
LOG_DIR = "/tmp/local"
# Largest signed 32-bit integer; used as the upper bound when a random seed is drawn.
MAX_SEED = np.iinfo(np.int32).max


# -------------------------
# HF auth (Spaces secrets)
# -------------------------
def _get_hf_token() -> Optional[str]:
    """Return the Hugging Face token found in the environment, if any.

    Variables are consulted in priority order: ``HF_TOKEN``, ``hf``,
    ``HUGGINGFACEHUB_API_TOKEN``. The first non-empty value wins; when none
    is non-empty the value of the last variable looked up is returned as-is.
    """
    found = None
    for variable in ("HF_TOKEN", "hf", "HUGGINGFACEHUB_API_TOKEN"):
        found = os.environ.get(variable)
        if found:
            break
    return found


def _get_dataset_repo() -> Optional[str]:
    """Return the dataset repo id from the environment, if configured.

    ``DATASET_REPO`` takes priority over ``HF_DATASET_REPO``; an empty
    ``DATASET_REPO`` falls through to the second variable.
    """
    primary = os.environ.get("DATASET_REPO")
    if primary:
        return primary
    return os.environ.get("HF_DATASET_REPO")


# Snapshot of the credentials/config taken once at import time. The ds_* helpers
# below re-read the environment on every call instead of using these values.
HF_TOKEN = _get_hf_token()
DATASET_REPO = _get_dataset_repo()

# Best-effort login at import time: a failure is only printed so the app can
# still start without hub access.
if HF_TOKEN:
    try:
        login(token=HF_TOKEN)
    except Exception as e:
        print("HF login failed:", repr(e))


# -------------------------
# Helpers
# -------------------------
def ensure_dirname(path: str):
    """Create directory *path* (with parents) unless something already exists there.

    An empty/``None`` path is ignored, and an existing path of any kind
    (directory or file) is left untouched.
    """
    if not path:
        return
    if os.path.exists(path):
        return
    os.makedirs(path, exist_ok=True)


def px_to_emu(px, dpi=96):
    """Convert a pixel length to EMU, using 914400 EMU per inch.

    Args:
        px: Length in pixels.
        dpi: Pixels per inch used for the conversion.

    Returns:
        The length in EMU, truncated to an ``int``.
    """
    emu_per_inch = 914400
    return int((px / dpi) * emu_per_inch)


def imagelist_to_pptx_from_pils(images: List[Image.Image]) -> str:
    """Write all images onto a single slide of a new PPTX and return its path.

    The slide takes the pixel size of the first image; every image is placed
    at the top-left corner and stretched to that size, so later images are
    stacked on top of earlier ones.

    Args:
        images: Layers to export, bottom-most first.

    Returns:
        Path of the generated ``.pptx`` file in the system temp directory.
        The caller owns the file; it is not deleted automatically.

    Raises:
        ValueError: If ``images`` is empty.
    """
    if not images:
        raise ValueError("No images to export")

    w, h = images[0].size
    slide_w = px_to_emu(w)
    slide_h = px_to_emu(h)

    prs = Presentation()
    prs.slide_width = slide_w
    prs.slide_height = slide_h

    # Layout index 6 of the default template (presumably the blank layout).
    slide = prs.slides.add_slide(prs.slide_layouts[6])

    for img in images:
        # Encode in memory instead of writing one never-deleted temp PNG per
        # layer; add_picture accepts a file-like object as well as a path.
        buf = io.BytesIO()
        img.save(buf, format="PNG")
        buf.seek(0)
        slide.shapes.add_picture(buf, 0, 0, width=slide_w, height=slide_h)

    # mkstemp hands back an OS-level descriptor; close it right away so no
    # handle stays open while python-pptx writes to the path.
    fd, out_path = tempfile.mkstemp(suffix=".pptx")
    os.close(fd)
    prs.save(out_path)
    return out_path


def imagelist_to_zip_from_pils(images: List[Image.Image], prefix: str = "layer") -> str:
    """Pack the images as PNG files into a new ZIP archive and return its path.

    Args:
        images: Images to store; entry names are ``{prefix}_{1-based index}.png``.
        prefix: Name prefix for the archive entries.

    Returns:
        Path of the generated ``.zip`` file in the system temp directory.
        The caller owns the file; it is not deleted automatically.
    """
    # Reserve the output path and close the descriptor immediately, so the
    # only open handle on the file is the ZipFile below.
    fd, zip_path = tempfile.mkstemp(suffix=".zip")
    os.close(fd)

    with zipfile.ZipFile(zip_path, "w", zipfile.ZIP_DEFLATED) as zipf:
        for number, img in enumerate(images, start=1):
            buf = io.BytesIO()
            img.save(buf, format="PNG")
            zipf.writestr(f"{prefix}_{number}.png", buf.getvalue())
    return zip_path


def _clamp_int(x, default: int, lo: int, hi: int) -> int:
    """Coerce *x* to ``int`` and clamp it into ``[lo, hi]``.

    When ``int(x)`` fails for any reason, *default* is used instead (and is
    clamped as well).
    """
    try:
        value = int(x)
    except Exception:
        value = default

    if value >= hi:
        value = hi
    if value <= lo:
        value = lo
    return value


def _normalize_resolution(resolution: Any) -> int:
    """Map any input onto one of the two supported resolutions, 640 or 1024.

    The value is first clamped into ``[640, 1024]`` (falling back to 640 when
    it is not int-convertible); anything that is not exactly 640 or 1024
    afterwards becomes 640.
    """
    supported = (640, 1024)
    clamped = _clamp_int(resolution, default=640, lo=640, hi=1024)
    return clamped if clamped in supported else 640


def _normalize_input_image(input_image: Any) -> Image.Image:
    """Turn the UI's image input into an RGBA ``PIL.Image``.

    Accepted inputs are a file path, a PIL image, a NumPy array, or a list
    whose first element is one of those. The image is converted to RGB first
    and then to RGBA, so any alpha channel in the input is discarded.

    Args:
        input_image: Raw value received from the image component.

    Returns:
        A new RGBA image.

    Raises:
        ValueError: If the list is empty or the value has an unsupported type.
    """
    if isinstance(input_image, list):
        if not input_image:
            # Previously surfaced as a bare IndexError.
            raise ValueError("No input image provided (empty list)")
        input_image = input_image[0]

    if isinstance(input_image, str):
        # convert() produces an independent in-memory copy, so the file handle
        # can be closed as soon as the conversion is done.
        with Image.open(input_image) as opened:
            rgb = opened.convert("RGB")
    elif isinstance(input_image, Image.Image):
        rgb = input_image.convert("RGB")
    elif isinstance(input_image, np.ndarray):
        rgb = Image.fromarray(input_image).convert("RGB")
    else:
        raise ValueError(f"Unsupported input_image type: {type(input_image)}")

    return rgb.convert("RGBA")


# -------------------------
# Dataset persistence helpers
# -------------------------
def ds_enabled() -> bool:
    """Return True when both an HF token and a dataset repo are configured."""
    if not _get_hf_token():
        return False
    return bool(_get_dataset_repo())


def ds_api() -> HfApi:
    """Build an ``HfApi`` client authenticated with the configured token.

    Raises:
        RuntimeError: If no token is available in the environment.
    """
    token = _get_hf_token()
    if token:
        return HfApi(token=token)
    raise RuntimeError("HF token missing")


def ds_repo_id() -> str:
    """Return the configured dataset repo id.

    Raises:
        RuntimeError: If neither repo environment variable is set.
    """
    repo = _get_dataset_repo()
    if repo:
        return repo
    raise RuntimeError("DATASET_REPO/HF_DATASET_REPO missing")


def ds_ensure_repo() -> Tuple[bool, str]:
    """Create the private dataset repo if needed.

    Returns:
        ``(ok, message)``; errors are reported through the message rather
        than raised.
    """
    if not ds_enabled():
        return False, "Dataset persistence disabled: missing HF token and/or dataset repo env."

    api = ds_api()
    repo_id = ds_repo_id()
    try:
        api.create_repo(repo_id=repo_id, repo_type="dataset", exist_ok=True, private=True)
    except HfHubHTTPError as e:
        return False, f"Failed to create/ensure dataset repo: {e}"
    except Exception as e:
        return False, f"Failed to create/ensure dataset repo: {e!r}"
    else:
        return True, f"Dataset repo ready: {repo_id}"


def ds_upload_bytes(path_in_repo: str, data: bytes, commit_message: str) -> Tuple[bool, str]:
    """Upload an in-memory payload to the dataset repo as one commit.

    Args:
        path_in_repo: Destination path inside the dataset repo.
        data: File content.
        commit_message: Commit message for the upload.

    Returns:
        ``(ok, message)``; failures are reported through the message rather
        than raised.
    """
    if not ds_enabled():
        return False, "Dataset persistence disabled: missing HF token and/or dataset repo env."

    api = ds_api()
    repo_id = ds_repo_id()
    try:
        # upload_file accepts raw bytes, so no temp file is needed (the old
        # delete=False temp file was left behind on every upload).
        api.upload_file(
            path_or_fileobj=bytes(data),
            path_in_repo=path_in_repo,
            repo_id=repo_id,
            repo_type="dataset",
            commit_message=commit_message,
        )
    except HfHubHTTPError as e:
        # 403 "must use a write token" errors end up here.
        return False, f"Upload failed (HTTP): {e}"
    except Exception as e:
        return False, f"Upload failed: {repr(e)}"
    return True, f"Uploaded: {path_in_repo}"


def ds_download_bytes(path_in_repo: str) -> Tuple[Optional[bytes], str]:
    """Download one file from the dataset repo and return its content.

    Args:
        path_in_repo: Path of the file inside the dataset repo.

    Returns:
        ``(data, message)``. ``data`` is ``None`` when persistence is
        disabled or the download failed; the message then carries the reason.
    """
    if not ds_enabled():
        return None, "Dataset persistence disabled"

    api = ds_api()
    repo_id = ds_repo_id()
    try:
        # The download directory is only a staging area: read the bytes and
        # let the context manager remove it (mkdtemp used to leak one
        # directory per call).
        with tempfile.TemporaryDirectory() as tmpdir:
            local_path = api.hf_hub_download(
                repo_id=repo_id,
                repo_type="dataset",
                filename=path_in_repo,
                local_dir=tmpdir,
            )
            with open(local_path, "rb") as f:
                return f.read(), "OK"
    except HfHubHTTPError as e:
        return None, f"Download failed (HTTP): {e}"
    except Exception as e:
        return None, f"Download failed: {repr(e)}"


def _root_index_path() -> str:
    """Return the repo-relative path of the root index file."""
    filename = "index.json"
    return filename


def ds_read_root_index() -> Dict[str, Any]:
    """Load the root ``index.json`` and normalise it.

    Expected shape (``id`` mirrors ``last_session_id`` for backward
    compatibility)::

        {
          "id": "<last_session_id>",
          "last_session_id": "<last_session_id>",
          "sessions": ["sess_...", ...],
          "updated_at": 123.0
        }

    A fresh empty index is returned when the file cannot be downloaded or
    cannot be parsed/normalised.
    """

    def _blank_index() -> Dict[str, Any]:
        return {"id": None, "last_session_id": None, "sessions": [], "updated_at": time.time()}

    raw, _status = ds_download_bytes(_root_index_path())
    if raw is None:
        return _blank_index()

    try:
        index = json.loads(raw.decode("utf-8"))
        # Fill in whichever of the two mirrored keys is missing.
        if "last_session_id" not in index and "id" in index:
            index["last_session_id"] = index.get("id")
        index.setdefault("id", index.get("last_session_id"))
        # A missing or non-list "sessions" entry is reset to an empty list.
        if not isinstance(index.get("sessions"), list):
            index["sessions"] = []
    except Exception:
        return _blank_index()
    return index


def ds_write_root_index(last_session_id: Optional[str]) -> Tuple[bool, str]:
    """Record *last_session_id* in the root index and upload it.

    Both ``last_session_id`` and its mirror key ``id`` are written. A
    non-empty session id is also moved to the front of ``sessions``.

    Returns:
        The ``(ok, message)`` result of the upload.
    """
    index = ds_read_root_index()
    index["last_session_id"] = last_session_id
    index["id"] = last_session_id  # mirror key; avoids KeyError('id') for readers
    index["updated_at"] = time.time()

    if last_session_id:
        remaining = [sid for sid in index.get("sessions", []) if sid != last_session_id]
        index["sessions"] = [last_session_id, *remaining]

    payload = json.dumps(index, ensure_ascii=False, indent=2).encode("utf-8")
    message = f"update root index last_session_id={last_session_id}"
    return ds_upload_bytes(_root_index_path(), payload, message)


def ds_list_sessions(max_sessions: int = 50) -> Tuple[List[str], str]:
    """List known session ids, at most *max_sessions* of them.

    The root index is consulted first; when it lists no sessions the repo
    file listing is scanned for ``sessions/<id>/.../index.json`` or
    ``.../session.json`` paths and the ids are sorted in descending order.

    Returns:
        ``(session_ids, message)``; failures yield an empty list and an
        explanatory message.
    """
    if not ds_enabled():
        return [], "Dataset persistence disabled"

    api = ds_api()
    repo_id = ds_repo_id()
    try:
        # Fast path: ids recorded in the root index.
        try:
            index = ds_read_root_index()
            session_ids = [sid for sid in index.get("sessions", []) if isinstance(sid, str)]
        except Exception:
            session_ids = []

        # Slow path: derive ids from the repo's file listing.
        if not session_ids:
            discovered = set()
            for repo_path in api.list_repo_files(repo_id=repo_id, repo_type="dataset"):
                if not repo_path.startswith("sessions/"):
                    continue
                if not repo_path.endswith(("/index.json", "/session.json")):
                    continue
                segments = repo_path.split("/")
                if len(segments) >= 3:
                    discovered.add(segments[1])
            session_ids = sorted(discovered, reverse=True)

        limited = session_ids[:max_sessions]
        return limited, f"Found {len(limited)} session(s)"
    except Exception as e:
        return [], f"List sessions failed: {repr(e)}"


# -------------------------
# Node / History model
# -------------------------
@dataclass
class NodeMeta:
    """Metadata of one history node; stored in state as a plain dict via ``asdict``."""

    # Unique id of this node.
    node_id: str
    # Human-readable label; can be changed by the rename action.
    name: str
    # Id of the parent node, or None for a node without a parent.
    parent_id: Optional[str]
    # Ids of the nodes created with this node as their parent.
    children: List[str]
    op: str  # "decompose" | "refine" | "duplicate"
    # Creation timestamp (time.time()); used to order the history list.
    created_at: float

    # For refine nodes: the node and the layer index the refinement started from.
    source_node_id: Optional[str] = None
    source_layer_idx: Optional[int] = None
    # For refine nodes: number of sub-layers requested.
    sub_layers: Optional[int] = None
    # Snapshot of the generation settings used to produce this node.
    settings: Optional[Dict[str, Any]] = None


def _new_id(prefix: str) -> str:
    """Return ``<prefix>_`` followed by the first 10 hex digits of a random UUID4."""
    suffix = uuid.uuid4().hex[:10]
    return "{}_{}".format(prefix, suffix)


def _make_chips(state: Dict[str, Any]) -> str:
    """Build the one-line ``[root:..] [parent:..] [children:N]`` summary for the selected node.

    A fixed placeholder string is returned when nothing (or an unknown node)
    is selected.
    """
    selected = state.get("selected_node_id")
    registry: Dict[str, Any] = state.get("nodes", {})

    if selected and selected in registry:
        meta = registry[selected]["meta"]
        parent_label = meta.get("parent_id") or "-"
        child_count = len(meta.get("children") or [])
        root_label = state.get("root_node_id") or "-"
        return f"[root:{root_label}] [parent:{parent_label}] [children:{child_count}]"

    return "[root] [parent:-] [children:0]"


def _history_choices(state: Dict[str, Any]) -> List[Tuple[str, str]]:
    """Return ``(label, node_id)`` pairs for all nodes, oldest first.

    Nodes are ordered by ``created_at`` (missing values count as 0.0); the
    label is ``"<name> — <node_id>"`` with the id standing in for a missing
    name.
    """
    registry: Dict[str, Any] = state.get("nodes", {})
    rows = [
        (entry["meta"].get("created_at", 0.0), node_id, entry["meta"].get("name", node_id))
        for node_id, entry in registry.items()
    ]
    ordered = sorted(rows, key=lambda row: row[0])
    return [(f"{label} — {node_id}", node_id) for _created, node_id, label in ordered]


def _get_node_images(state: Dict[str, Any], node_id: str) -> List[Image.Image]:
    """Return the image list stored for *node_id*, or ``[]`` when unknown or empty."""
    registry: Dict[str, Any] = state.get("nodes", {})
    if node_id in registry:
        return registry[node_id].get("images", []) or []
    return []


def _add_node(
    state: Dict[str, Any],
    *,
    name: str,
    parent_id: Optional[str],
    op: str,
    images: List[Image.Image],
    settings: Optional[Dict[str, Any]] = None,
    source_node_id: Optional[str] = None,
    source_layer_idx: Optional[int] = None,
    sub_layers: Optional[int] = None,
) -> str:
    """Register a new node in ``state["nodes"]`` and link it to its parent.

    The node gets a fresh id and the current time as ``created_at``. Its
    metadata is stored as a plain dict next to the given image list. When
    *parent_id* names an existing node, the new id is appended to that
    node's ``children``.

    Returns:
        The id of the newly created node.
    """
    node_id = _new_id("node")
    record = asdict(
        NodeMeta(
            node_id=node_id,
            name=name,
            parent_id=parent_id,
            children=[],
            op=op,
            created_at=time.time(),
            source_node_id=source_node_id,
            source_layer_idx=source_layer_idx,
            sub_layers=sub_layers,
            settings=settings or {},
        )
    )

    registry = state.setdefault("nodes", {})
    registry[node_id] = {"meta": record, "images": images}

    if parent_id and parent_id in registry:
        registry[parent_id]["meta"].setdefault("children", []).append(node_id)
    return node_id


def _rename_node(state: Dict[str, Any], node_id: str, new_name: str):
    """Set the display name of *node_id*; an empty name or unknown node is a no-op."""
    if not new_name:
        return
    registry = state.get("nodes", {})
    if node_id not in registry:
        return
    registry[node_id]["meta"]["name"] = new_name


def _duplicate_node(state: Dict[str, Any], node_id: str) -> Optional[str]:
    """Add a sibling copy of *node_id* and return the new id.

    The copy keeps the source's parent, images and settings, is named
    ``"<name> (copy)"`` and carries the op ``"duplicate"``.

    Returns:
        The new node id, or ``None`` when *node_id* is unknown.
    """
    registry = state.get("nodes", {})
    if node_id not in registry:
        return None

    original = state["nodes"][node_id]
    original_meta = original["meta"]
    return _add_node(
        state,
        name=f"{original_meta.get('name','node')} (copy)",
        parent_id=original_meta.get("parent_id"),
        op="duplicate",
        images=original.get("images", []),
        settings=original_meta.get("settings") or {},
    )


# -------------------------
# GPU duration + GPU-only pipeline runner
#   IMPORTANT: pipeline init is INSIDE GPU worker (ZeroGPU friendly)
# -------------------------
def get_duration(*args, **kwargs):
    """Return the GPU duration for a call, clamped to ``[20, 1500]``.

    Only the ``gpu_duration`` keyword is inspected (default 1000); all other
    positional and keyword arguments are ignored.
    """
    requested = kwargs["gpu_duration"] if "gpu_duration" in kwargs else 1000
    return _clamp_int(requested, default=1000, lo=20, hi=1500)


# Process-wide cache for the loaded pipeline; filled lazily by _gpu_get_pipe().
_GPU_PIPE: Optional[QwenImageLayeredPipeline] = None


def _gpu_get_pipe() -> QwenImageLayeredPipeline:
    """Return the cached pipeline, loading it onto CUDA on first use.

    Intended to be called from within the ``@spaces.GPU``-decorated caller.

    Raises:
        RuntimeError: If the pipeline is not loaded yet and CUDA is unavailable.
    """
    global _GPU_PIPE

    if _GPU_PIPE is None:
        if not torch.cuda.is_available():
            raise RuntimeError(
                "CUDA is not available inside GPU worker. "
                "Check Space hardware: it must be ZeroGPU/GPU, not CPU."
            )
        loaded = QwenImageLayeredPipeline.from_pretrained(
            "Qwen/Qwen-Image-Layered",
            torch_dtype=torch.bfloat16,
        )
        _GPU_PIPE = loaded.to("cuda")

    return _GPU_PIPE


@spaces.GPU(duration=get_duration)
def gpu_run_pipeline(
    pil_image_rgba: Image.Image,
    seed=777,
    randomize_seed=False,
    prompt=None,
    neg_prompt=" ",
    true_guidance_scale=4.0,
    num_inference_steps=50,
    layer=4,
    cfg_norm=True,
    use_en_prompt=True,
    resolution=640,
    gpu_duration=1000,
):
    """Run the layered pipeline on one image.

    ``gpu_duration`` is not used in the body; it is read by ``get_duration``
    through the decorator.

    Returns:
        ``(layers, seed, inputs)``: the first entry of the pipeline's
        ``images`` output, the seed actually used, and the keyword arguments
        passed to the pipeline.

    Raises:
        RuntimeError: If CUDA is not available.
    """
    if randomize_seed:
        seed = random.randint(0, MAX_SEED)

    resolution = _normalize_resolution(resolution)

    if not torch.cuda.is_available():
        raise RuntimeError("No CUDA GPUs are available (GPU worker not running).")

    rng = torch.Generator(device="cuda").manual_seed(int(seed))

    inputs = dict(
        image=pil_image_rgba,
        generator=rng,
        true_cfg_scale=float(true_guidance_scale),
        prompt=prompt,
        negative_prompt=neg_prompt,
        num_inference_steps=int(num_inference_steps),
        num_images_per_prompt=1,
        layers=int(layer),
        resolution=int(resolution),
        cfg_normalize=bool(cfg_norm),
        use_en_prompt=bool(use_en_prompt),
    )

    # Best-effort cache flush before the run; a failure here is not fatal.
    try:
        torch.cuda.empty_cache()
    except Exception:
        pass

    pipeline = _gpu_get_pipe()

    with torch.inference_mode():
        result = pipeline(**inputs)
        layers = result.images[0]  # list of PIL layers

    return layers, int(seed), inputs


# -------------------------
# Dataset persistence: save/load nodes + session
# -------------------------
def _pil_to_png_bytes(img: Image.Image) -> bytes:
    """Encode *img* as PNG and return the raw bytes."""
    with io.BytesIO() as sink:
        img.save(sink, format="PNG")
        return sink.getvalue()


def _png_bytes_to_pil(b: bytes) -> Image.Image:
    """Decode image bytes and return the picture converted to RGBA."""
    stream = io.BytesIO(b)
    decoded = Image.open(stream)
    return decoded.convert("RGBA")


def _session_base(session_id: str) -> str:
    """Return the repo folder that holds everything for *session_id*."""
    return "sessions/{}".format(session_id)


def _node_base(session_id: str, node_id: str) -> str:
    """Return the repo folder that holds the files of one node of a session."""
    session_dir = _session_base(session_id)
    return f"{session_dir}/nodes/{node_id}"


def _persist_node_to_dataset(state: Dict[str, Any], node_id: str) -> Tuple[bool, str]:
    """Upload one node (``node.json`` plus ``layer_<n>.png`` files) to the dataset.

    Uploads stop at the first failure.

    Returns:
        ``(ok, message)``; on failure the message is the reason reported by
        the step that failed.
    """
    if not ds_enabled():
        return False, "Dataset persistence disabled. Set DATASET_REPO and HF_TOKEN/hf."

    repo_ok, repo_msg = ds_ensure_repo()
    if not repo_ok:
        return False, repo_msg

    session_id = state.get("session_id")
    if not session_id:
        return False, "No session_id in state (run Decompose first)"

    registry = state.get("nodes", {})
    if node_id not in registry:
        return False, "Unknown node_id"

    entry = registry[node_id]
    layers: List[Image.Image] = entry.get("images", []) or []
    folder = _node_base(session_id, node_id)

    # Metadata first, then one PNG per layer.
    meta_payload = json.dumps(entry["meta"], ensure_ascii=False, indent=2).encode("utf-8")
    meta_ok, meta_msg = ds_upload_bytes(f"{folder}/node.json", meta_payload, f"save node {node_id}")
    if not meta_ok:
        return False, meta_msg

    for number, layer_img in enumerate(layers, start=1):
        layer_ok, layer_msg = ds_upload_bytes(
            f"{folder}/layer_{number}.png",
            _pil_to_png_bytes(layer_img),
            f"save node {node_id} layer {number}",
        )
        if not layer_ok:
            return False, layer_msg

    return True, f"Saved node {node_id} to dataset"


def _persist_session_manifest(state: Dict[str, Any]) -> Tuple[bool, str]:
    """Upload the session manifest and refresh the root index.

    The manifest lists every node's metadata and layer count (no image
    data). It is written twice, as ``index.json`` and ``session.json`` in
    the session folder, before the root index is updated. Processing stops
    at the first failing step.

    Returns:
        ``(ok, message)``.
    """
    if not ds_enabled():
        return False, "Dataset persistence disabled"

    repo_ok, repo_msg = ds_ensure_repo()
    if not repo_ok:
        return False, repo_msg

    session_id = state.get("session_id")
    if not session_id:
        return False, "No session_id"

    node_summaries = {}
    for nid, entry in (state.get("nodes", {}) or {}).items():
        node_summaries[nid] = {
            "meta": entry["meta"],
            "num_layers": len(entry.get("images", []) or []),
        }

    manifest = {
        "session_id": session_id,
        "created_at": state.get("created_at"),
        "root_node_id": state.get("root_node_id"),
        "selected_node_id": state.get("selected_node_id"),
        "nodes": node_summaries,
    }
    payload = json.dumps(manifest, ensure_ascii=False, indent=2).encode("utf-8")
    folder = _session_base(session_id)

    # Primary location: sessions/<id>/index.json (the layout the existing dataset uses).
    index_ok, index_msg = ds_upload_bytes(f"{folder}/index.json", payload, f"save session index {session_id}")
    if not index_ok:
        return False, index_msg

    # Same content under a second name, kept for compatibility.
    copy_ok, copy_msg = ds_upload_bytes(f"{folder}/session.json", payload, f"save session manifest {session_id}")
    if not copy_ok:
        return False, copy_msg

    # Root index.json: records this session as the most recent one.
    root_ok, root_msg = ds_write_root_index(session_id)
    if not root_ok:
        return False, root_msg

    return True, "Saved session manifest + root index"


def _load_session_manifest(session_id: str) -> Tuple[Optional[Dict[str, Any]], str]:
    """Fetch and parse the manifest of *session_id*.

    ``index.json`` is tried first, then ``session.json``. The first file that
    downloads decides the outcome: a parse error is reported immediately
    instead of falling back to the other file.

    Returns:
        ``(manifest, message)``; ``manifest`` is ``None`` on failure.
    """
    folder = _session_base(session_id)
    for filename in ("index.json", "session.json"):
        payload, _status = ds_download_bytes(f"{folder}/{filename}")
        if payload is not None:
            try:
                return json.loads(payload.decode("utf-8")), "OK"
            except Exception as e:
                return None, f"Failed to parse manifest: {repr(e)}"
    return None, f"Manifest not found for session {session_id}"


def _load_node_images(session_id: str, node_id: str, num_layers: int) -> Tuple[List[Image.Image], str]:
    """Download ``layer_1.png`` .. ``layer_<num_layers>.png`` of a node.

    Returns:
        ``(images, "OK")`` on success. If any layer fails to download, an
        empty list is returned together with that download's message.
    """
    folder = _node_base(session_id, node_id)
    loaded: List[Image.Image] = []
    for number in range(1, num_layers + 1):
        payload, status = ds_download_bytes(f"{folder}/layer_{number}.png")
        if payload is None:
            return [], status
        loaded.append(_png_bytes_to_pil(payload))
    return loaded, "OK"


# -------------------------
# UI callbacks
# -------------------------
def _init_state() -> Dict[str, Any]:
    """Return a fresh, empty application state dict."""
    return dict(
        session_id=None,
        created_at=None,
        root_node_id=None,
        selected_node_id=None,
        nodes={},
        last_refined_node_id=None,
    )


def _persistence_status_text() -> str:
    """Describe, for display in the UI, whether dataset persistence is configured."""
    tok = _get_hf_token()
    repo = _get_dataset_repo()

    if tok and repo:
        return f"✅ Dataset persistence enabled: `{repo}`"
    if repo:
        # Repo configured, token missing.
        return "⚠️ Dataset repo set, but HF_TOKEN/hf missing"
    if tok:
        # Token configured, repo missing.
        return "⚠️ HF_TOKEN/hf set, but DATASET_REPO missing"
    return "⚠️ Dataset persistence disabled (set HF_TOKEN + DATASET_REPO secrets to enable)"


def on_refresh_sessions():
    """Reload the session list; returns a choices update (first entry preselected) and a status message."""
    sessions, msg = ds_list_sessions()
    preselected = sessions[0] if sessions else None
    return gr.update(choices=sessions, value=preselected), msg


def on_init_dataset():
    """Ensure the dataset repo exists and return the resulting status message."""
    _ok, message = ds_ensure_repo()
    return message


def _current_node_export(state: Dict[str, Any], node_id: str) -> Tuple[Optional[str], Optional[str], str]:
    """Export a node's layers to a PPTX and a ZIP file.

    Returns:
        ``(pptx_path, zip_path, "OK")``, or ``(None, None, reason)`` when the
        node has no images.
    """
    layers = _get_node_images(state, node_id)
    if layers:
        pptx_path = imagelist_to_pptx_from_pils(layers)
        zip_path = imagelist_to_zip_from_pils(layers, prefix=f"{node_id}_layer")
        return pptx_path, zip_path, "OK"
    return None, None, "No images to export"


def _build_layer_dropdown(n: int) -> Tuple[List[str], Optional[str]]:
    """Return the labels ``"Layer 1".."Layer n"`` and the default selection.

    For ``n <= 0`` the result is ``([], None)``.
    """
    if n <= 0:
        return [], None
    labels = []
    for number in range(1, n + 1):
        labels.append(f"Layer {number}")
    return labels, labels[0]


def _layer_label(idx: int, n: int) -> str:
    """Return the ``"Selected: Layer i / n"`` caption for a 0-based index.

    The index is clamped into ``[0, n - 1]``; with no layers the caption is
    ``"Selected: -"``.
    """
    if n > 0:
        bounded = max(0, min(n - 1, idx))
        return f"Selected: Layer {bounded + 1} / {n}"
    return "Selected: -"


def on_decompose_click(
    state: Dict[str, Any],
    input_image,
    seed,
    randomize_seed,
    prompt,
    neg_prompt,
    true_guidance_scale,
    num_inference_steps,
    layer,
    cfg_norm,
    use_en_prompt,
    resolution,
    gpu_duration,
):
    """Decompose the input image into layers and start a new node tree.

    A session id is created if the state has none. All existing nodes are
    discarded and replaced by a single root node holding the new layers and
    a snapshot of the settings used. Export files for the root node are
    generated as part of the call.

    Returns:
        A 14-item tuple: state, layers (twice), layer dropdown update, layer
        index update, selection label, history update, chips text,
        refined-panel visibility update, refined gallery value, PPTX path,
        ZIP path, status text, and the used seed as a string.
    """
    if not isinstance(state, dict):
        state = _init_state()

    source_image = _normalize_input_image(input_image)

    if not state.get("session_id"):
        state["session_id"] = _new_id("sess")
        state["created_at"] = time.time()

    layers_out, used_seed, _pipeline_inputs = gpu_run_pipeline(
        pil_image_rgba=source_image,
        seed=seed,
        randomize_seed=randomize_seed,
        prompt=prompt,
        neg_prompt=neg_prompt,
        true_guidance_scale=true_guidance_scale,
        num_inference_steps=num_inference_steps,
        layer=layer,
        cfg_norm=cfg_norm,
        use_en_prompt=use_en_prompt,
        resolution=resolution,
        gpu_duration=gpu_duration,
    )

    settings_snapshot = dict(
        seed=used_seed,
        randomize_seed=bool(randomize_seed),
        prompt=prompt,
        neg_prompt=neg_prompt,
        true_guidance_scale=float(true_guidance_scale),
        num_inference_steps=int(num_inference_steps),
        layers=int(layer),
        resolution=int(_normalize_resolution(resolution)),
        cfg_norm=bool(cfg_norm),
        use_en_prompt=bool(use_en_prompt),
        gpu_duration=int(_clamp_int(gpu_duration, 1000, 20, 1500)),
    )

    # A new decomposition replaces the whole tree.
    state["nodes"] = {}
    state["last_refined_node_id"] = None

    root_id = _add_node(
        state,
        name="root (decompose)",
        parent_id=None,
        op="decompose",
        images=layers_out,
        settings=settings_snapshot,
    )
    state["root_node_id"] = state["selected_node_id"] = root_id

    layer_count = len(layers_out)
    dropdown_choices, dropdown_value = _build_layer_dropdown(layer_count)
    history_ids = [value for _label, value in _history_choices(state)]
    chips = _make_chips(state)
    selection_caption = _layer_label(0, layer_count)

    pptx_path, zip_path, export_msg = _current_node_export(state, root_id)
    status = f"Decomposed into {layer_count} layer(s). Seed={used_seed}. {export_msg}"

    return (
        state,
        layers_out,
        layers_out,
        gr.update(choices=dropdown_choices, value=dropdown_value),
        gr.update(value=0),
        selection_caption,
        gr.update(choices=history_ids, value=root_id),
        chips,
        gr.update(visible=False),
        [],
        pptx_path,
        zip_path,
        status,
        str(used_seed),
    )


def on_layer_pick_from_dropdown(state: Dict[str, Any], layer_name: str):
    """Translate a ``"Layer N"`` dropdown value into a 0-based layer index.

    Unparseable or missing names select index 0; the index is clamped to the
    selected node's layer count.

    Returns:
        ``(index update, selection label)``.
    """
    selected = state.get("selected_node_id")
    layers = _get_node_images(state, selected) if selected else []
    total = len(layers)

    idx = 0
    if layer_name and layer_name.startswith("Layer "):
        try:
            idx = int(layer_name.replace("Layer ", "").strip()) - 1
        except Exception:
            idx = 0

    if total > 0:
        idx = max(0, min(total - 1, idx))
    else:
        idx = 0
    return gr.update(value=idx), _layer_label(idx, total)


def on_layer_pick_from_gallery(state: Dict[str, Any], evt: gr.SelectData):
    """Sync the layer index, dropdown and label with a gallery selection.

    Returns:
        ``(index update, dropdown update, selection label)``.
    """
    selected = state.get("selected_node_id")
    layers = _get_node_images(state, selected) if selected else []
    total = len(layers)

    if evt and evt.index is not None:
        idx = int(evt.index)
    else:
        idx = 0

    if total > 0:
        idx = max(0, min(total - 1, idx))
        dropdown_value = f"Layer {idx+1}"
    else:
        idx = 0
        dropdown_value = None
    return gr.update(value=idx), gr.update(value=dropdown_value), _layer_label(idx, total)


def _refine_from_source(
    state: Dict[str, Any],
    source_node_id: str,
    source_layer_idx: int,
    sub_layers: int,
    prompt,
    neg_prompt,
    true_guidance_scale,
    num_inference_steps,
    cfg_norm,
    use_en_prompt,
    resolution,
    gpu_duration,
    seed,
    randomize_seed,
):
    """Run the pipeline on one layer of an existing node.

    Returns:
        ``(layers, used_seed, settings_snapshot)``; the snapshot also records
        which node and layer the refinement came from.

    Raises:
        ValueError: If the source node has no images or the index is out of range.
    """
    source_layers = _get_node_images(state, source_node_id)
    if not source_layers:
        raise ValueError("Source node has no images")
    if not (0 <= source_layer_idx < len(source_layers)):
        raise ValueError("Invalid layer index")

    layers_out, used_seed, _pipeline_inputs = gpu_run_pipeline(
        pil_image_rgba=source_layers[source_layer_idx],
        seed=seed,
        randomize_seed=randomize_seed,
        prompt=prompt,
        neg_prompt=neg_prompt,
        true_guidance_scale=true_guidance_scale,
        num_inference_steps=num_inference_steps,
        layer=sub_layers,
        cfg_norm=cfg_norm,
        use_en_prompt=use_en_prompt,
        resolution=resolution,
        gpu_duration=gpu_duration,
    )

    settings_snapshot = dict(
        seed=used_seed,
        randomize_seed=bool(randomize_seed),
        prompt=prompt,
        neg_prompt=neg_prompt,
        true_guidance_scale=float(true_guidance_scale),
        num_inference_steps=int(num_inference_steps),
        layers=int(sub_layers),
        resolution=int(_normalize_resolution(resolution)),
        cfg_norm=bool(cfg_norm),
        use_en_prompt=bool(use_en_prompt),
        gpu_duration=int(_clamp_int(gpu_duration, 1000, 20, 1500)),
        refined_from={"source_node_id": source_node_id, "source_layer_idx": int(source_layer_idx)},
    )
    return layers_out, used_seed, settings_snapshot


def on_refine_click(
    state: Dict[str, Any],
    selected_layer_idx: int,
    sub_layers: int,
    prompt,
    neg_prompt,
    true_guidance_scale,
    num_inference_steps,
    cfg_norm,
    use_en_prompt,
    resolution,
    gpu_duration,
    seed,
    randomize_seed,
):
    """Refine the chosen layer of the selected node into sub-layers.

    The result becomes a new child node, which is then selected. The layer
    index is clamped to the node's layer count and ``sub_layers`` to
    ``[2, 10]`` (default 3).

    Returns:
        A 14-item tuple. When nothing can be refined, most entries are no-op
        updates and the status entry explains why.
    """

    def _abort(message: str):
        # Leaves most outputs untouched; hides the refined panel, clears its
        # gallery and resets both export file slots.
        return (
            state, gr.update(), gr.update(), gr.update(), gr.update(), gr.update(), gr.update(), gr.update(),
            gr.update(visible=False), [], None, None, message, gr.update()
        )

    if not state.get("selected_node_id"):
        return _abort("No selected node. Run Decompose first.")

    source_node_id = state["selected_node_id"]
    source_layers = _get_node_images(state, source_node_id)
    if not source_layers:
        return _abort("Selected node has no images.")

    idx = 0 if selected_layer_idx is None else int(selected_layer_idx)
    idx = max(0, min(len(source_layers) - 1, idx))
    sub_layers = _clamp_int(sub_layers, default=3, lo=2, hi=10)

    layers_out, used_seed, settings_snapshot = _refine_from_source(
        state,
        source_node_id=source_node_id,
        source_layer_idx=idx,
        sub_layers=sub_layers,
        prompt=prompt,
        neg_prompt=neg_prompt,
        true_guidance_scale=true_guidance_scale,
        num_inference_steps=num_inference_steps,
        cfg_norm=cfg_norm,
        use_en_prompt=use_en_prompt,
        resolution=resolution,
        gpu_duration=gpu_duration,
        seed=seed,
        randomize_seed=randomize_seed,
    )

    parent_name = state["nodes"][source_node_id]["meta"]["name"]
    child_id = _add_node(
        state,
        name=f"refine ({parent_name}) L{idx+1}",
        parent_id=source_node_id,
        op="refine",
        images=layers_out,
        settings=settings_snapshot,
        source_node_id=source_node_id,
        source_layer_idx=idx,
        sub_layers=sub_layers,
    )
    state["selected_node_id"] = child_id
    state["last_refined_node_id"] = child_id

    layer_count = len(layers_out)
    dropdown_choices, dropdown_value = _build_layer_dropdown(layer_count)
    history_ids = [value for _label, value in _history_choices(state)]
    chips = _make_chips(state)
    selection_caption = _layer_label(0, layer_count)

    pptx_path, zip_path, export_msg = _current_node_export(state, child_id)
    status = f"Refined into {layer_count} sub-layer(s). Seed={used_seed}. {export_msg}"

    return (
        state,
        layers_out,
        layers_out,
        gr.update(choices=dropdown_choices, value=dropdown_value),
        gr.update(value=0),
        selection_caption,
        gr.update(choices=history_ids, value=child_id),
        chips,
        gr.update(visible=True),
        layers_out,
        pptx_path,
        zip_path,
        status,
        gr.update(),
    )


def on_history_select(state: Dict[str, Any], node_id: str):
    """Make *node_id* the selected node and refresh the views for it.

    Export files for the node are regenerated as part of the call.

    Returns:
        A 13-item tuple: state, images (twice), layer dropdown update, layer
        index update, selection label, history update, chips text,
        refined-panel visibility update, refined gallery value, PPTX path,
        ZIP path and status text. For an unknown node most entries are no-op
        updates.
    """
    known = bool(node_id) and node_id in state.get("nodes", {})
    if not known:
        return (
            state, gr.update(), gr.update(), gr.update(), gr.update(), gr.update(), gr.update(), gr.update(),
            gr.update(visible=False), [], None, None, "Unknown node."
        )

    state["selected_node_id"] = node_id
    layers = _get_node_images(state, node_id)
    layer_count = len(layers)

    dropdown_choices, dropdown_value = _build_layer_dropdown(layer_count)
    history_ids = [value for _label, value in _history_choices(state)]
    chips = _make_chips(state)
    selection_caption = _layer_label(0, layer_count)

    pptx_path, zip_path, export_msg = _current_node_export(state, node_id)

    return (
        state,
        layers,
        layers,
        gr.update(choices=dropdown_choices, value=dropdown_value),
        gr.update(value=0),
        selection_caption,
        gr.update(choices=history_ids, value=node_id),
        chips,
        gr.update(visible=False),
        [],
        pptx_path,
        zip_path,
        f"Selected node: {node_id}. {export_msg}",
    )


def on_back_to_parent(state: Dict[str, Any]):
    """Select the parent of the currently selected node.

    On success this delegates to ``on_history_select`` and returns its
    13-item tuple. The early exits now return a tuple of the same length
    (state, eleven no-op updates, status message); they used to return only
    three values, which cannot match the same output list as the success path.

    NOTE(review): the event wiring is outside the visible source — confirm
    this callback is bound to the same 13 outputs as ``on_history_select``.
    """

    def _unchanged(message: str):
        # state + 11 untouched outputs + status == 13 values.
        return (state, *(gr.update() for _ in range(11)), message)

    node_id = state.get("selected_node_id")
    if not node_id or node_id not in state.get("nodes", {}):
        return _unchanged("No selected node.")

    parent = state["nodes"][node_id]["meta"].get("parent_id")
    if not parent:
        return _unchanged("Already at root.")

    return on_history_select(state, parent)


def on_duplicate_node(state: Dict[str, Any]):
    """Duplicate the selected node and select the copy.

    On success this delegates to ``on_history_select`` and returns its
    13-item tuple. The early exits now return a tuple of the same length
    (state, eleven no-op updates, status message); they used to return only
    three values, which cannot match the same output list as the success path.

    NOTE(review): the event wiring is outside the visible source — confirm
    this callback is bound to the same 13 outputs as ``on_history_select``.
    """

    def _unchanged(message: str):
        # state + 11 untouched outputs + status == 13 values.
        return (state, *(gr.update() for _ in range(11)), message)

    node_id = state.get("selected_node_id")
    if not node_id:
        return _unchanged("No selected node.")

    new_id = _duplicate_node(state, node_id)
    if not new_id:
        return _unchanged("Duplicate failed.")

    return on_history_select(state, new_id)


def on_rename_node(state: Dict[str, Any], new_name: str):
    """Rename the selected node.

    Returns:
        Always four values: state, history dropdown update, chips text (or a
        no-op update) and a status message. The "no selection" exit used to
        return three values, one fewer than the success path.

    NOTE(review): the event wiring is outside the visible source — confirm
    this callback is bound to four outputs.
    """
    node_id = state.get("selected_node_id")
    if not node_id:
        return state, gr.update(), gr.update(), "No selected node."

    _rename_node(state, node_id, new_name)
    hist_choices = _history_choices(state)
    chips = _make_chips(state)
    # _rename_node ignores an empty name, so do not claim success in that case.
    status = "Renamed." if new_name else "Name is empty; nothing renamed."
    return state, gr.update(choices=[c[1] for c in hist_choices], value=node_id), chips, status


def on_export_selected(state: Dict[str, Any]):
    """Export the selected node; returns ``(pptx_path, zip_path, message)``."""
    node_id = state.get("selected_node_id")
    if node_id:
        return _current_node_export(state, node_id)
    return None, None, "No selected node."


def on_save_current(state: Dict[str, Any]):
    """Persist the selected node and then the session manifest.

    Returns:
        A status message: the failure reason of the first step that failed,
        or a success message.
    """
    node_id = state.get("selected_node_id")
    if not node_id:
        return "Nothing to save."

    node_ok, node_msg = _persist_node_to_dataset(state, node_id)
    if not node_ok:
        return node_msg

    manifest_ok, manifest_msg = _persist_session_manifest(state)
    if not manifest_ok:
        return manifest_msg

    return f"✅ Saved node + session manifest. {node_msg}"


def on_load_session(state: Dict[str, Any], session_id: str):
    """Rebuild the session state from a stored manifest and refresh the UI.

    Every return path yields 13 values, one per output component this handler
    is bound to: state, gallery, layer picker, layer dropdown, layer index,
    layer label, history dropdown, chips, refined block, refined gallery,
    PPTX file, ZIP file and status text.

    Only the selected node's images (and the root node's, when it is a
    different node) are loaded here; all other nodes start with an empty
    image list.
    """

    def _bail(current_state, message):
        # Leave the first seven widgets untouched, hide the refined block,
        # and clear the refined gallery and both export files.
        untouched = [gr.update() for _ in range(7)]
        return (current_state, *untouched, gr.update(visible=False), [], None, None, message)

    if not session_id:
        return _bail(state, "Pick a session id.")

    manifest, msg = _load_session_manifest(session_id)
    if manifest is None:
        return _bail(state, msg)

    # Fresh state populated from the manifest header fields.
    new_state = _init_state()
    root_from_manifest = manifest.get("root_node_id")
    new_state["session_id"] = manifest.get("session_id") or session_id
    new_state["created_at"] = manifest.get("created_at")
    new_state["root_node_id"] = root_from_manifest
    new_state["selected_node_id"] = manifest.get("selected_node_id") or manifest.get("root_node_id")

    # Register every node with its metadata; images are filled in below.
    nodes_meta = manifest.get("nodes", {}) or {}
    for key, entry in nodes_meta.items():
        new_state["nodes"][key] = {"meta": entry.get("meta") or {}, "images": []}

    # Fall back to the root when the stored selection is missing or unknown.
    sel = new_state["selected_node_id"]
    if not (sel and sel in nodes_meta):
        sel = new_state["root_node_id"]
        new_state["selected_node_id"] = sel

    if sel and sel in nodes_meta:
        layer_count = int(nodes_meta[sel].get("num_layers", 0))
        sel_images, load_msg = _load_node_images(session_id, sel, layer_count)
        if not sel_images:
            return _bail(new_state, f"Loaded manifest but failed to load images: {load_msg}")
        new_state["nodes"][sel]["images"] = sel_images

        # Also try the root's images; a failure here is ignored.
        root = new_state.get("root_node_id")
        if root and root != sel and root in nodes_meta and not new_state["nodes"][root]["images"]:
            root_layer_count = int(nodes_meta[root].get("num_layers", 0))
            root_images, _ = _load_node_images(session_id, root, root_layer_count)
            if root_images:
                new_state["nodes"][root]["images"] = root_images

    if sel:
        imgs = _get_node_images(new_state, sel)
    else:
        imgs = []
    total_layers = len(imgs)
    dropdown_choices, dropdown_value = _build_layer_dropdown(total_layers)
    history_entries = _history_choices(new_state)
    chips = _make_chips(new_state)
    label_text = _layer_label(0, total_layers)

    if sel:
        pptx_path, zip_path, exp_msg = _current_node_export(new_state, sel)
    else:
        pptx_path, zip_path, exp_msg = (None, None, "No node")

    history_update = gr.update(choices=[entry[1] for entry in history_entries], value=sel)
    return (
        new_state,
        imgs,
        imgs,
        gr.update(choices=dropdown_choices, value=dropdown_value),
        gr.update(value=0),
        label_text,
        history_update,
        chips,
        gr.update(visible=False),
        [],
        pptx_path,
        zip_path,
        f"Loaded session {session_id}. {exp_msg}",
    )


def on_history_need_images(state: Dict[str, Any], node_id: str):
    """Make sure ``node_id`` has its images in ``state``, loading if needed.

    Returns ``(state, message)``. If the node already holds images nothing is
    fetched. Otherwise the session manifest is read to find the node's
    ``num_layers`` and ``_load_node_images`` is asked for that many layers;
    on success the images are stored under ``state["nodes"][node_id]``.
    """
    known_nodes = state.get("nodes", {})
    if not node_id or node_id not in known_nodes:
        return state, "Unknown node."

    # Nothing to do when the node already carries images.
    if state["nodes"][node_id].get("images", []):
        return state, "OK"

    sid = state.get("session_id")
    if not sid:
        return state, "No session_id."

    manifest, manifest_msg = _load_session_manifest(sid)
    if not manifest:
        return state, f"Cannot load manifest: {manifest_msg}"

    manifest_nodes = manifest.get("nodes", {}) or {}
    layer_count = int(manifest_nodes.get(node_id, {}).get("num_layers", 0))
    if layer_count <= 0:
        return state, "No layers in manifest for this node."

    loaded, load_msg = _load_node_images(sid, node_id, layer_count)
    if not loaded:
        return state, f"Failed to load images: {load_msg}"

    state["nodes"][node_id]["images"] = loaded
    return state, "Loaded images."


# -------------------------
# Build UI
# -------------------------
# Create LOG_DIR at import time if it does not exist yet.
ensure_dirname(LOG_DIR)

# Sample inputs offered in the UI: assets/test_images/1.png through 13.png.
examples = [f"assets/test_images/{idx}.png" for idx in range(1, 14)]

# Assemble the Gradio UI: component layout first, then the event wiring.
with gr.Blocks() as demo:
    # State component seeded from _init_state(); most handlers below take it
    # as their first input and return the updated value as their first output.
    state = gr.State(_init_state())

    gr.HTML(
        '<img src="https://qianwen-res.oss-cn-beijing.aliyuncs.com/Qwen-Image/layered/qwen-image-layered-logo.png" '
        'alt="Qwen-Image-Layered Logo" width="600" style="display: block; margin: 0 auto;">'
    )

    persistence_banner = gr.Markdown(_persistence_status_text())

    # Dataset controls: repo initialisation and session listing.
    with gr.Row():
        btn_init_ds = gr.Button("Init dataset repo", variant="secondary")
        btn_refresh_sessions = gr.Button("Refresh sessions", variant="secondary")
        ds_status = gr.Markdown("")

    # Session loader; allow_custom_value lets a session id be typed by hand.
    with gr.Row():
        load_session_dd = gr.Dropdown(
            label="Load session (from dataset)",
            choices=[],
            value=None,
            allow_custom_value=True,
        )
        btn_load_session = gr.Button("Load session", variant="primary")

    gr.Markdown(
        """
The text prompt describes the overall content of the input image.
It is not designed to control the semantic content of individual layers explicitly.
        """
    )

    with gr.Row():
        # Left column: input image, generation settings, decompose/refine actions.
        with gr.Column(scale=1):
            input_image = gr.Image(label="Input Image", image_mode="RGBA")

            with gr.Accordion("Advanced Settings", open=False):
                prompt = gr.Textbox(
                    label="Prompt (Optional)",
                    placeholder="Describe the image (optional)",
                    value="",
                    lines=2,
                )
                # NOTE(review): the default is a single space, not an empty
                # string — presumably deliberate; confirm before changing.
                neg_prompt = gr.Textbox(
                    label="Negative Prompt (Optional)",
                    placeholder="Negative prompt",
                    value=" ",
                    lines=2,
                )

                seed = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0)
                randomize_seed = gr.Checkbox(label="Randomize seed", value=True)

                true_guidance_scale = gr.Slider(
                    label="True guidance scale", minimum=1.0, maximum=10.0, step=0.1, value=4.0
                )

                num_inference_steps = gr.Slider(
                    label="Number of inference steps", minimum=1, maximum=100, step=1, value=50  # DO NOT CHANGE
                )

                layer = gr.Slider(label="Layers", minimum=2, maximum=10, step=1, value=7)  # DO NOT CHANGE

                resolution = gr.Radio(label="Processing resolution", choices=[640, 1024], value=640)  # DO NOT CHANGE

                cfg_norm = gr.Checkbox(label="Enable CFG normalization", value=True)
                use_en_prompt = gr.Checkbox(label="Auto caption language: True=EN, False=ZH", value=True)

                # Free-text field; the value is passed to the decompose and
                # refine handlers as a string.
                gpu_duration = gr.Textbox(
                    label="GPU duration override (seconds, 20..1500)",
                    value="1000",
                    lines=1,
                    placeholder="e.g. 120, 300, 1000, 1500",
                )

            btn_decompose = gr.Button("Decompose!", variant="primary")

            with gr.Group():
                gr.Markdown("### Refine (Recursive Decomposition)")
                sub_layers = gr.Slider(label="Sub-layers (Refine)", minimum=2, maximum=10, step=1, value=3)
                btn_refine = gr.Button("Refine selected layer", variant="primary")

        # Right column: layer galleries, layer selection, history and export.
        with gr.Column(scale=2):
            gr.Markdown("### Current node layers")
            gallery = gr.Gallery(label="Layers", columns=4, rows=1, format="png")

            gr.Markdown("### Layer picker (Photoshop-style)")
            layer_picker = gr.Gallery(label="Pick a layer", columns=8, rows=1, format="png")

            with gr.Row():
                layer_dropdown = gr.Dropdown(label="Refine layer", choices=[], value=None)
                # Read-only display of the index; it is written by handlers only.
                selected_layer_idx = gr.Number(label="Selected layer index (0-based)", value=0, precision=0, interactive=False)
                selected_layer_label = gr.Markdown("Selected: -")

            # Hidden by default; handlers toggle it through the refined_block output.
            with gr.Accordion("Refined layers (last refine)", open=True, visible=False) as refined_block:
                refined_gallery = gr.Gallery(label="Refined layers", columns=4, rows=1, format="png")

            gr.Markdown("### History (nodes)")
            with gr.Row():
                history_dd = gr.Dropdown(label="Node id", choices=[], value=None)
                chips_md = gr.Markdown("[root] [parent:-] [children:0]")

            with gr.Row():
                btn_back_parent = gr.Button("← back to parent", variant="secondary")
                btn_duplicate = gr.Button("Duplicate node (branch)", variant="secondary")

            with gr.Row():
                rename_text = gr.Textbox(label="Branch name", value="", lines=1, placeholder="Type new name and click Rename")
                btn_rename = gr.Button("Rename", variant="secondary")

            with gr.Row():
                btn_export = gr.Button("Export selected node (ZIP/PPTX)", variant="primary")
                btn_save = gr.Button("Save selected node to dataset", variant="primary")

            with gr.Row():
                export_pptx = gr.File(label="Download PPTX")
                export_zip = gr.File(label="Download ZIP")

            status = gr.Markdown("")
            seed_used = gr.Textbox(label="Seed used", value="", interactive=False)

    # Example images feed input_image. Caching and run-on-click are both
    # disabled; the placeholder fn returns an empty gallery and no files.
    gr.Examples(
        examples=examples,
        inputs=[input_image],
        outputs=[gallery, export_pptx, export_zip],
        fn=lambda img: ([], None, None),
        cache_examples=False,
        run_on_click=False,
    )

    # ---- Event wiring ----
    # Each handler must return one value per component listed in `outputs`.
    btn_init_ds.click(fn=on_init_dataset, outputs=[ds_status])
    btn_refresh_sessions.click(fn=on_refresh_sessions, outputs=[load_session_dd, ds_status])

    # 13 outputs: the full "node view" refresh.
    btn_load_session.click(
        fn=on_load_session,
        inputs=[state, load_session_dd],
        outputs=[
            state, gallery, layer_picker, layer_dropdown, selected_layer_idx, selected_layer_label,
            history_dd, chips_md, refined_block, refined_gallery, export_pptx, export_zip, status
        ],
    )

    # 14 outputs: the same node view plus seed_used.
    btn_decompose.click(
        fn=on_decompose_click,
        inputs=[
            state, input_image, seed, randomize_seed, prompt, neg_prompt, true_guidance_scale,
            num_inference_steps, layer, cfg_norm, use_en_prompt, resolution, gpu_duration
        ],
        outputs=[
            state, gallery, layer_picker, layer_dropdown, selected_layer_idx, selected_layer_label,
            history_dd, chips_md, refined_block, refined_gallery, export_pptx, export_zip, status, seed_used
        ],
    )

    # Layer selection from either the thumbnail gallery or the dropdown.
    layer_picker.select(
        fn=on_layer_pick_from_gallery,
        inputs=[state],
        outputs=[selected_layer_idx, layer_dropdown, selected_layer_label],
    )

    layer_dropdown.change(
        fn=on_layer_pick_from_dropdown,
        inputs=[state, layer_dropdown],
        outputs=[selected_layer_idx, selected_layer_label],
    )

    # Refine reuses the main generation settings; sub_layers supplies the layer count.
    btn_refine.click(
        fn=on_refine_click,
        inputs=[
            state, selected_layer_idx, sub_layers, prompt, neg_prompt, true_guidance_scale,
            num_inference_steps, cfg_norm, use_en_prompt, resolution, gpu_duration, seed, randomize_seed
        ],
        outputs=[
            state, gallery, layer_picker, layer_dropdown, selected_layer_idx, selected_layer_label,
            history_dd, chips_md, refined_block, refined_gallery, export_pptx, export_zip, status, seed_used
        ],
    )

    def _history_select_with_lazy(state_, node_id_):
        """Ensure the node's images are loaded, then run the history selection.

        The status message returned by ``on_history_need_images`` is
        discarded; only the (possibly updated) state is forwarded to
        ``on_history_select``.
        """
        state_, _ = on_history_need_images(state_, node_id_)
        return on_history_select(state_, node_id_)

    # history_dd is both the trigger and one of the outputs of this handler.
    history_dd.change(
        fn=_history_select_with_lazy,
        inputs=[state, history_dd],
        outputs=[
            state, gallery, layer_picker, layer_dropdown, selected_layer_idx, selected_layer_label,
            history_dd, chips_md, refined_block, refined_gallery, export_pptx, export_zip, status
        ],
    )

    # Parent navigation and duplication refresh the same 13 node-view outputs.
    btn_back_parent.click(
        fn=on_back_to_parent,
        inputs=[state],
        outputs=[
            state, gallery, layer_picker, layer_dropdown, selected_layer_idx, selected_layer_label,
            history_dd, chips_md, refined_block, refined_gallery, export_pptx, export_zip, status
        ],
    )

    btn_duplicate.click(
        fn=on_duplicate_node,
        inputs=[state],
        outputs=[
            state, gallery, layer_picker, layer_dropdown, selected_layer_idx, selected_layer_label,
            history_dd, chips_md, refined_block, refined_gallery, export_pptx, export_zip, status
        ],
    )

    # Rename: 4 outputs. Export: 3 outputs. Save: status only.
    btn_rename.click(fn=on_rename_node, inputs=[state, rename_text], outputs=[state, history_dd, chips_md, status])
    btn_export.click(fn=on_export_selected, inputs=[state], outputs=[export_pptx, export_zip, status])
    btn_save.click(fn=on_save_current, inputs=[state], outputs=[status])

    # Enable Gradio's request queue for this app.
    demo.queue()

# Start the Gradio server only when this file is executed as a script.
if __name__ == "__main__":
    demo.launch()