Spaces:

ghostai1
/

GhostPack

Running

File size: 39,307 Bytes

2fde0c7

#!/usr/bin/env python3
# ==========================================================
# FILE: ghostpack_gradio_f1.py
# ==========================================================
import os, sys, time, json, argparse, importlib.util, subprocess, traceback
import torch, einops, numpy as np
from PIL import Image
import io
import gradio as gr
import asyncio
from queue import Queue
from threading import Thread, Event
import re
import logging
from diffusers import AutoencoderKLHunyuanVideo
from transformers import (
    LlamaModel, CLIPTextModel, LlamaTokenizerFast, CLIPTokenizer,
    SiglipImageProcessor, SiglipVisionModel
)
from diffusers_helper.hf_login import login
from diffusers_helper.hunyuan import (
    encode_prompt_conds, vae_decode, vae_encode, vae_decode_fake
)
from diffusers_helper.utils import (
    save_bcthw_as_mp4, crop_or_pad_yield_mask, soft_append_bcthw,
    resize_and_center_crop, generate_timestamp
)
from diffusers_helper.models.hunyuan_video_packed import HunyuanVideoTransformer3DModelPacked
from diffusers_helper.pipelines.k_diffusion_hunyuan import sample_hunyuan
from diffusers_helper.memory import (
    gpu, get_cuda_free_memory_gb, move_model_to_device_with_memory_preservation,
    offload_model_from_device_for_memory_preservation, fake_diffusers_current_device,
    DynamicSwapInstaller, unload_complete_models, load_model_as_complete
)
from diffusers_helper.clip_vision import hf_clip_vision_encode
from diffusers_helper.bucket_tools import find_nearest_bucket

# Set up logging
# logging.basicConfig opens the log file right away, so its directory has to
# exist first. The output-directory setup further down would also create it,
# but that runs too late for a first start on a fresh machine.
os.makedirs('/home/ubuntu/ghostpack', exist_ok=True)
logging.basicConfig(filename='/home/ubuntu/ghostpack/ghostpack.log', level=logging.ERROR, format='%(asctime)s %(levelname)s:%(message)s')

# MODIFIED: Added version number
VERSION = "1.0.0"

# ------------------------- CLI ----------------------------
# Options are registered from a table of (flag, add_argument keyword arguments),
# in the same order as before so the generated --help text is unchanged.
parser = argparse.ArgumentParser()
for _flag, _kwargs in (
    ('--share', {'action': 'store_true'}),
    ('--server', {'type': str, 'default': '0.0.0.0'}),
    ('--port', {'type': int}),
    ('--inbrowser', {'action': 'store_true'}),
    ('--cli', {'action': 'store_true'}),
):
    parser.add_argument(_flag, **_kwargs)
args = parser.parse_args()

# MODIFIED: Global state variables
# Shared render state; worker() rebinds these through `global`.
render_progress, render_status = 0.0, "idle"
render_times = []
stream = None
start_render_time = None

# Keep Hugging Face downloads next to this script.
# NOTE(review): this is assigned after transformers/diffusers were imported —
# confirm the libraries still honour HF_HOME when it is set this late.
BASE = os.path.abspath(os.path.dirname(__file__))
os.environ['HF_HOME'] = os.path.join(BASE, 'hf_download')

# --cli only prints a short usage text and exits before any model is loaded.
if args.cli:
    for _usage_line in (
        "👻 GhostPack F1 Pro CLI\n",
        "python ghostpack_gradio_f1.py           # launch UI",
        "python ghostpack_gradio_f1.py --cli     # show help\n",
    ):
        print(_usage_line)
    sys.exit(0)

# ---------------------- Paths -----------------------------
# Every output location hangs off OUT_BASE: four sub-directories, plus the
# bookkeeping files that live inside the data directory.
OUT_BASE = os.path.join('/home/ubuntu/ghostpack', 'outputs')
OUT_IMG, OUT_TEMP, OUT_VID, OUT_DATA = (
    os.path.join(OUT_BASE, _sub) for _sub in ('img', 'tmp', 'vid', 'data')
)
PROMPT_LOG, SAVED_PROMPTS, INSTALL_LOG, LAST_CLEANUP_FILE, VIDEO_INFO_JSON = (
    os.path.join(OUT_DATA, _name)
    for _name in (
        'prompts.txt',
        'saved_prompts.json',
        'install_logs.txt',
        'last_cleanup.txt',
        'video_info.json',
    )
)

# MODIFIED: Create directories and initialize files with permissions
def _ensure_file(path, initial_text):
    """Create *path* with ``initial_text()`` as content when it does not exist yet.

    The new file is chmod-ed to 0o664. Any failure is logged and swallowed so
    that start-up continues.
    """
    if os.path.exists(path):
        return
    try:
        with open(path, 'w') as handle:
            handle.write(initial_text())
        os.chmod(path, 0o664)
    except Exception as e:
        logging.error(f"Failed to create/chmod {path}: {e}")


for _out_dir in (OUT_BASE, OUT_IMG, OUT_TEMP, OUT_VID, OUT_DATA):
    try:
        os.makedirs(_out_dir, exist_ok=True)
        os.chmod(_out_dir, 0o775)
    except Exception as e:
        logging.error(f"Failed to create/chmod directory {_out_dir}: {e}")

# The JSON stores start as an empty list, the logs start empty, and the
# cleanup stamp starts at "now".
_ensure_file(SAVED_PROMPTS, lambda: json.dumps([]))
_ensure_file(INSTALL_LOG, lambda: "")
_ensure_file(PROMPT_LOG, lambda: "")
_ensure_file(LAST_CLEANUP_FILE, lambda: str(time.time()))
_ensure_file(VIDEO_INFO_JSON, lambda: json.dumps([]))

# ---------------- Prompt utils ---------------------------
def get_last_prompts():
    """Return up to the five most recently saved prompt entries, newest first.

    Reads the JSON list stored at SAVED_PROMPTS. Any failure (missing file,
    invalid JSON, ...) is logged and an empty list is returned instead.
    """
    try:
        # Context manager so the handle is closed deterministically instead of
        # being left to the garbage collector.
        with open(SAVED_PROMPTS) as f:
            saved = json.load(f)
        return saved[-5:][::-1]
    except Exception as e:
        logging.error(f"Failed to load prompts from {SAVED_PROMPTS}: {e}")
        return []

def save_prompt_fn(prompt, n_p):
    """Store a prompt / negative-prompt pair in SAVED_PROMPTS unless already present.

    Args:
        prompt: Prompt text; a falsy value is rejected without touching the file.
        n_p: Negative prompt stored alongside it.

    Returns:
        A status string: "❌ No prompt", "✅ Saved" (also when the pair was
        already stored) or "❌ Save failed" (the error is logged).
    """
    if not prompt:
        return "❌ No prompt"
    try:
        # Read through a context manager so the handle is closed before the
        # same file is reopened for writing below.
        with open(SAVED_PROMPTS) as f:
            data = json.load(f)
        entry = {'prompt': prompt, 'negative': n_p}
        if entry not in data:
            data.append(entry)
            with open(SAVED_PROMPTS, 'w') as f:
                json.dump(data, f)
            os.chmod(SAVED_PROMPTS, 0o664)
        return "✅ Saved"
    except Exception as e:
        logging.error(f"Failed to save prompt to {SAVED_PROMPTS}: {e}")
        return "❌ Save failed"

def load_prompt_fn(idx):
    """Return the prompt text at position *idx* of the recent-prompt list.

    Position 0 is the most recent entry. An empty string is returned when the
    list has no entry at that position.
    """
    recent = get_last_prompts()
    if idx < len(recent):
        return recent[idx]['prompt']
    return ""

# ---------------- Cleanup utils --------------------------
def clear_temp_videos():
    """Remove every entry of OUT_TEMP and report the outcome as a status string."""
    try:
        entries = os.listdir(OUT_TEMP)
        for entry in entries:
            os.remove(os.path.join(OUT_TEMP, entry))
    except Exception as e:
        # The first failure aborts the sweep; entries removed so far stay removed.
        logging.error(f"Failed to clear temp videos in {OUT_TEMP}: {e}")
        return "❌ Clear failed"
    return "✅ Temp cleared"

def clear_old_files():
    """Delete regular files older than seven days from the output directories.

    Scans OUT_TEMP, OUT_IMG, OUT_VID and OUT_DATA (so stale bookkeeping files
    in the data directory are removed as well), then rewrites the timestamp in
    LAST_CLEANUP_FILE.

    Returns:
        "✅ <n> old files removed" on success, "❌ Clear failed" when any step
        raised (the error is logged).
    """
    threshold = time.time() - 7 * 24 * 3600
    removed = 0
    try:
        for folder in (OUT_TEMP, OUT_IMG, OUT_VID, OUT_DATA):
            for name in os.listdir(folder):
                path = os.path.join(folder, name)
                if not os.path.isfile(path):
                    continue
                if os.path.getmtime(path) >= threshold:
                    continue
                os.remove(path)
                removed += 1
        with open(LAST_CLEANUP_FILE, 'w') as stamp:
            stamp.write(str(time.time()))
        os.chmod(LAST_CLEANUP_FILE, 0o664)
    except Exception as e:
        logging.error(f"Failed to clear old files: {e}")
        return "❌ Clear failed"
    return f"✅ {removed} old files removed"

def clear_images():
    """Remove every entry of OUT_IMG and report the outcome as a status string."""
    try:
        for name in os.listdir(OUT_IMG):
            image_path = os.path.join(OUT_IMG, name)
            os.remove(image_path)
    except Exception as e:
        logging.error(f"Failed to clear images in {OUT_IMG}: {e}")
        return "❌ Clear failed"
    else:
        return "✅ Images cleared"

def clear_videos():
    """Remove every entry of OUT_VID and report the outcome as a status string."""
    status = "✅ Videos cleared"
    try:
        for name in os.listdir(OUT_VID):
            os.remove(os.path.join(OUT_VID, name))
    except Exception as e:
        logging.error(f"Failed to clear videos in {OUT_VID}: {e}")
        status = "❌ Clear failed"
    return status

def check_and_run_weekly_cleanup():
    """Run clear_old_files() when the last recorded cleanup is over a week old.

    Returns:
        The status string from clear_old_files() when a cleanup ran, otherwise
        an empty string.
    """
    one_week = 7 * 24 * 3600
    try:
        with open(LAST_CLEANUP_FILE, 'r') as stamp:
            previous = float(stamp.read().strip())
    except (FileNotFoundError, ValueError):
        # No usable timestamp: treat the cleanup as overdue.
        previous = 0
    overdue = time.time() - previous > one_week
    return clear_old_files() if overdue else ""

# ---------------- Gallery helpers ------------------------
def list_images():
    """Return the paths of the .png/.jpg files in OUT_IMG, oldest modification first."""
    found = []
    for name in os.listdir(OUT_IMG):
        if name.lower().endswith(('.png', '.jpg')):
            found.append(os.path.join(OUT_IMG, name))
    found.sort(key=os.path.getmtime)
    return found

def list_videos():
    """Return the paths of the .mp4 files in OUT_VID, oldest modification first."""
    mp4_names = (name for name in os.listdir(OUT_VID) if name.lower().endswith('.mp4'))
    paths = [os.path.join(OUT_VID, name) for name in mp4_names]
    return sorted(paths, key=os.path.getmtime)

def load_image(sel):
    """Build viewer/dropdown updates for the image whose file name equals *sel*.

    Returns a pair of ``gr.update`` objects: (path, file name) for the first
    match, or two no-op updates when no image has that name.
    """
    for path in list_images():
        name = os.path.basename(path)
        if name == sel:
            return gr.update(value=path), gr.update(value=name)
    return gr.update(), gr.update()

def load_video(sel):
    """Build viewer/dropdown updates for the video whose file name equals *sel*.

    Returns a pair of ``gr.update`` objects: (path, file name) for the first
    match, or two no-op updates when no video has that name.
    """
    match = next((path for path in list_videos() if os.path.basename(path) == sel), None)
    if match is None:
        return gr.update(), gr.update()
    return gr.update(value=match), gr.update(value=os.path.basename(match))

def next_image_and_load(sel):
    """Advance the image viewer to the entry after *sel*, wrapping at the end.

    When *sel* is not a known file name the first image is chosen. With no
    images at all, two no-op updates are returned.
    """
    images = list_images()
    if images:
        basenames = [os.path.basename(path) for path in images]
        try:
            position = (basenames.index(sel) + 1) % len(basenames)
        except ValueError:
            # sel is not among the current file names: start from the first image.
            position = 0
        chosen = images[position]
        return gr.update(value=chosen), gr.update(value=os.path.basename(chosen))
    return gr.update(), gr.update()

def next_video_and_load(sel):
    """Advance the video viewer to the entry after *sel*, wrapping at the end.

    When *sel* is not a known file name the first video is chosen. With no
    videos at all, two no-op updates are returned.
    """
    videos = list_videos()
    if not videos:
        return gr.update(), gr.update()
    position = 0
    for i, path in enumerate(videos):
        if os.path.basename(path) == sel:
            position = (i + 1) % len(videos)
            break
    following = videos[position]
    return gr.update(value=following), gr.update(value=os.path.basename(following))

def gallery_image_select(evt: gr.SelectData):
    """Show the image at the gallery position carried by the select event.

    Returns (path, file name) updates for the viewer and dropdown, or two no-op
    updates when the event has no index or it is past the end of list_images().
    """
    images = list_images()
    if evt.index is None or evt.index >= len(images):
        return gr.update(), gr.update()
    picked = images[evt.index]
    return gr.update(value=picked), gr.update(value=os.path.basename(picked))

def gallery_video_select(evt: gr.SelectData):
    """Show the video at the gallery position carried by the select event.

    Returns (path, file name) updates for the viewer and dropdown, or two no-op
    updates when the event has no index or it is past the end of list_videos().
    """
    videos = list_videos()
    in_range = evt.index is not None and evt.index < len(videos)
    if not in_range:
        return gr.update(), gr.update()
    picked = videos[evt.index]
    return gr.update(value=picked), gr.update(value=os.path.basename(picked))

# ---------------- Install status -------------------------
def check_mod(n):
    """Return True when the import system can locate a module named *n*."""
    spec = importlib.util.find_spec(n)
    return spec is not None


def status_xformers():
    """Return a status label telling whether the xformers module is available."""
    if check_mod("xformers"):
        return "✅ xformers"
    return "❌ xformers"


def status_sage():
    """Return a status label telling whether the sageattention module is available."""
    if check_mod("sageattention"):
        return "✅ sage-attn"
    return "❌ sage-attn"


def status_flash():
    """Return a status label for flash_attn; a missing module is a warning only."""
    if check_mod("flash_attn"):
        return "✅ flash-attn"
    return "⚠️ flash-attn"

def install_pkg(pkg, warn=None):
    """Run ``pip install <pkg>`` with the current interpreter and log the result.

    Args:
        pkg: Requirement string handed to pip.
        warn: Optional message printed, followed by a one second pause, before
            the install starts.

    Returns:
        The result text ("✅ ..." or "❌ ..." followed by pip's combined
        stdout/stderr), which is also appended to INSTALL_LOG.
    """
    if warn:
        print(warn)
        time.sleep(1)
    command = [sys.executable, "-m", "pip", "install", pkg]
    try:
        output = subprocess.check_output(command, stderr=subprocess.STDOUT, text=True)
    except subprocess.CalledProcessError as e:
        res = f"❌ {pkg}\n{e.output}\n"
    else:
        res = f"✅ {pkg}\n{output}\n"
    with open(INSTALL_LOG, 'a') as log_file:
        log_file.write(f"[{pkg}] {res}")
    return res

def install_xformers():
    """Install xformers via install_pkg and return its result text."""
    return install_pkg("xformers")


def install_sage_attn():
    """Install sage-attn via install_pkg and return its result text."""
    # NOTE(review): status_sage() probes for the module "sageattention";
    # confirm that the "sage-attn" distribution is the one that provides it.
    return install_pkg("sage-attn")


def install_flash_attn():
    """Install flash-attn via install_pkg, warning first about the long compile."""
    return install_pkg("flash-attn", "⚠️ long compile")


def refresh_logs():
    """Return the full text of the install log."""
    # Context manager instead of open(...).read() so the handle is closed.
    with open(INSTALL_LOG) as f:
        return f.read()


def clear_logs():
    """Truncate the install log and return a status string."""
    with open(INSTALL_LOG, 'w'):
        pass
    return "✅ Logs cleared"

# ---------------- Model load -----------------------------
# Free CUDA memory measured once at start-up (presumably in GB, going by the
# helper's name); it selects the memory strategy used below and in worker().
free_mem = get_cuda_free_memory_gb(gpu)
# "High VRAM" mode when more than 60 is reported free.
hv = free_mem > 60

# Every model is loaded onto the CPU in eval mode. A failure is logged and then
# re-raised, so the module does not continue without its models.
try:
    text_encoder = LlamaModel.from_pretrained(
        "hunyuanvideo-community/HunyuanVideo",
        subfolder='text_encoder', torch_dtype=torch.float16
    ).cpu().eval()
    text_encoder_2 = CLIPTextModel.from_pretrained(
        "hunyuanvideo-community/HunyuanVideo",
        subfolder='text_encoder_2', torch_dtype=torch.float16
    ).cpu().eval()
    tokenizer = LlamaTokenizerFast.from_pretrained(
        "hunyuanvideo-community/HunyuanVideo",
        subfolder='tokenizer'
    )
    tokenizer_2 = CLIPTokenizer.from_pretrained(
        "hunyuanvideo-community/HunyuanVideo",
        subfolder='tokenizer_2'
    )
    vae = AutoencoderKLHunyuanVideo.from_pretrained(
        "hunyuanvideo-community/HunyuanVideo",
        subfolder='vae', torch_dtype=torch.float16
    ).cpu().eval()
    feature_extractor = SiglipImageProcessor.from_pretrained(
        "lllyasviel/flux_redux_bfl", subfolder='feature_extractor'
    )
    image_encoder = SiglipVisionModel.from_pretrained(
        "lllyasviel/flux_redux_bfl",
        subfolder='image_encoder', torch_dtype=torch.float16
    ).cpu().eval()
    transformer = HunyuanVideoTransformer3DModelPacked.from_pretrained(
        "lllyasviel/FramePack_F1_I2V_HY_20250503",
        torch_dtype=torch.bfloat16
    ).cpu().eval()
except Exception as e:
    logging.error(f"Failed to load models: {e}")
    raise

# Outside high-VRAM mode the VAE works in slices and tiles.
if not hv:
    vae.enable_slicing()
    vae.enable_tiling()

transformer.high_quality_fp32_output_for_inference = True
transformer.to(dtype=torch.bfloat16)

# The dtypes requested at load time are applied again explicitly, and gradients
# are switched off for every model (inference only).
for m in (vae, image_encoder, text_encoder, text_encoder_2):
    m.to(dtype=torch.float16)
for m in (vae, image_encoder, text_encoder, text_encoder_2, transformer):
    m.requires_grad_(False)

# Outside high-VRAM mode only the transformer and the first text encoder get a
# DynamicSwapInstaller hook; worker() loads the other models on demand.
# In high-VRAM mode everything is moved to the GPU once, here.
if not hv:
    DynamicSwapInstaller.install_model(transformer, device=gpu)
    DynamicSwapInstaller.install_model(text_encoder, device=gpu)
else:
    for m in (text_encoder, text_encoder_2, image_encoder, vae, transformer):
        m.to(gpu)

class AsyncStream:
    """Small thread-safe channel between a render job and its consumer.

    Messages for the consumer travel through ``output_queue`` (see put/get);
    a stop request is signalled through ``stop_event`` and an "end" marker on
    ``input_queue``.
    """

    def __init__(self):
        self.stop_event = Event()
        self.input_queue = Queue()
        self.output_queue = Queue()

    def is_stopped(self):
        """Return True once stop() has been called."""
        return self.stop_event.is_set()

    def stop(self):
        """Request a stop: set the event and enqueue "end" on the input queue."""
        self.stop_event.set()
        self.input_queue.put("end")

    def put(self, item):
        """Enqueue *item* for the consumer."""
        self.output_queue.put(item)

    def get(self):
        """Block until a message is available on the output queue and return it."""
        return self.output_queue.get()

# ---------------- Worker -------------------------------
@torch.no_grad()
def worker(img, prompt, n_p, seed, secs, win, stp, cfg, gsc, rsc, keep, tea, crf, camera_action="Static Camera"):
    """Render one image-to-video job and report progress through the global stream.

    The job runs section by section: each section is sampled with
    sample_hunyuan, decoded with the VAE, appended to the pixels rendered so
    far and written to an MP4 in OUT_TEMP. After the last section the file is
    moved to OUT_VID.

    Args:
        img: Input image array; unpacked as (H, W, channels).
        prompt: Prompt text; extended below before it is encoded.
        n_p: Negative prompt; only encoded when cfg != 1.
        seed: Seed for the CPU torch.Generator.
        secs: Requested video length in seconds (30 frames per second).
        win: Latent window size; each section samples win * 4 - 3 frames.
        stp: Number of inference steps per section.
        cfg: Real guidance scale.
        gsc: Distilled guidance scale.
        rsc: Guidance rescale.
        keep: Passed to move_model_to_device_with_memory_preservation
            (the UI labels it "GPU Keep (GB)").
        tea: Passed to transformer.initialize_teacache.
        crf: CRF value passed to save_bcthw_as_mp4.
        camera_action: Passed to update_prompt together with the prompt.

    Returns:
        Path of the finished video in OUT_VID, or None when the job was stopped
        or failed inside the main try block.

    Raises:
        Exception: when less than 2 free CUDA memory is reported up front.
    """
    global render_progress, render_status, render_times, start_render_time, stream
    # Reset the shared render state and open a fresh message stream for this job.
    start_render_time = time.time()
    render_status = "rendering"
    render_progress = 0.0
    stream = AsyncStream()

    # Validate prompt for smoothness, stop, and silence, and append camera action
    if "stop" not in prompt.lower() and secs > 5:
        prompt += " The subject stops moving after 5 seconds."
    if "smooth" not in prompt.lower():
        prompt = f"Smooth animation: {prompt}"
    if "silent" not in prompt.lower():
        prompt += ", silent"
    # update_prompt is not defined in the visible part of this file.
    prompt = update_prompt(prompt, camera_action)
    if len(prompt.split()) > 50:
        print("Warning: Complex prompt may slow rendering or cause instability.")

    # Check VRAM availability
    # NOTE(review): this raise sits outside the try block below, so no terminal
    # message is put on the stream and the `finally` reset does not run for it.
    if get_cuda_free_memory_gb(gpu) < 2:
        render_status = "error"
        logging.error("Low VRAM (<2GB). Lower 'kee' or 'win'.")
        raise Exception("Low VRAM (<2GB). Lower 'kee' or 'win'.")

    # Section count: secs * 30 frames divided into chunks of win * 4, at least one.
    sections = max(round((secs * 30) / (win * 4)), 1)
    # Job id used in every file name written for this job.
    jid = generate_timestamp()
    # Prompt logging is best effort: a failure is logged and the job continues.
    try:
        with open(PROMPT_LOG, 'a') as f:
            f.write(f"{jid}\t{prompt}\t{n_p}\n")
        os.chmod(PROMPT_LOG, 0o664)
    except Exception as e:
        logging.error(f"Failed to write to {PROMPT_LOG}: {e}")
    # ProgressBar is not defined in the visible part of this file.
    stream.put(('progress', (None, "", ProgressBar().make_progress_bar_html(0, "Start"))))
    try:
        # --- Text conditioning ---
        if not hv:
            unload_complete_models(text_encoder, text_encoder_2, image_encoder, vae, transformer)
            fake_diffusers_current_device(text_encoder, gpu)
            load_model_as_complete(text_encoder_2, gpu)
        lv, cp = encode_prompt_conds(prompt, text_encoder, text_encoder_2, tokenizer, tokenizer_2)
        if cfg == 1:
            # With cfg == 1 the negative prompt is not encoded; zeros stand in for it.
            lv_n = torch.zeros_like(lv)
            cp_n = torch.zeros_like(cp)
        else:
            lv_n, cp_n = encode_prompt_conds(n_p, text_encoder, text_encoder_2, tokenizer, tokenizer_2)
        lv, m = crop_or_pad_yield_mask(lv, 512)
        lv_n, m_n = crop_or_pad_yield_mask(lv_n, 512)
        lv, cp, lv_n, cp_n = [x.to(torch.bfloat16) for x in (lv, cp, lv_n, cp_n)]
        # --- Input image: resize to the nearest bucket and keep a copy in OUT_IMG ---
        H, W, _ = img.shape
        h, w = find_nearest_bucket(H, W, 640)
        img_np = resize_and_center_crop(img, w, h)
        img_filename = f"{jid}.png"
        try:
            Image.fromarray(img_np).save(os.path.join(OUT_IMG, img_filename))
            os.chmod(os.path.join(OUT_IMG, img_filename), 0o664)
        except Exception as e:
            logging.error(f"Failed to save image {img_filename}: {e}")
            raise
        # Scale pixel values to [-1, 1], move channels first and add two singleton axes.
        img_pt = (torch.from_numpy(img_np).float() / 127.5 - 1).permute(2, 0, 1)[None, :, None]
        if not hv:
            load_model_as_complete(vae, gpu)
        start_lat = vae_encode(img_pt, vae)
        if not hv:
            load_model_as_complete(image_encoder, gpu)
        img_emb = hf_clip_vision_encode(img_np, feature_extractor, image_encoder).last_hidden_state.to(torch.bfloat16)
        gen = torch.Generator("cpu").manual_seed(seed)
        # Latent history starts as zeros with 1 + 2 + 16 entries on the time axis.
        hist_lat = torch.zeros((1, 16, 1 + 2 + 16, h // 8, w // 8), dtype=torch.float32).cpu()
        hist_px = None
        total = 0
        # Padding schedule, one entry per section; the section with pad 0 is the last.
        pad_seq = [3] + [2] * (sections - 3) + [1, 0] if sections > 4 else list(reversed(range(sections)))
        # section_index is incremented below but never read in the visible code.
        section_index = 0
        for pad in pad_seq:
            # Honour a stop request between sections.
            if stream.is_stopped():
                render_status = "stopped"
                stream.put(("stopped", None))
                return None
            last = pad == 0
            pad_sz = pad * win
            # Split one index range into the six segments handed to the sampler.
            idx = torch.arange(0, sum([1, pad_sz, win, 1, 2, 16]))[None]
            a, b, c, d, e, f = idx.split([1, pad_sz, win, 1, 2, 16], 1)
            clean_idx = torch.cat([a, d], 1)
            pre = start_lat.to(hist_lat)
            post, two, four = hist_lat[:, :, :1 + 2 + 16].split([1, 2, 16], 2)
            clean = torch.cat([pre, post], 2)
            if not hv:
                unload_complete_models()
                move_model_to_device_with_memory_preservation(transformer, gpu, keep)
            transformer.initialize_teacache(tea, stp)
            def cb(d):
                # Sampler callback: publish a preview image and the step progress.
                global render_progress
                pv = vae_decode_fake(d["denoised"])
                pv = (pv * 255).cpu().numpy().clip(0, 255).astype(np.uint8)
                pv = einops.rearrange(pv, "b c t h w->(b h)(t w)c")
                cur = d["i"] + 1
                render_progress = (cur / stp) * 100
                stream.put(('progress', (pv, f"{cur}/{stp}", ProgressBar().make_progress_bar_html(int(100 * cur / stp), f"{cur}/{stp}"))))
                if stream.is_stopped():
                    stream.put(("stopped", None))
                    # NOTE(review): KeyboardInterrupt is not an Exception subclass, so the
                    # `except Exception` at the end of worker() will not catch it; unless
                    # sample_hunyuan handles it, it leaves worker() with render_status
                    # still "rendering".
                    raise KeyboardInterrupt
            new_lat = sample_hunyuan(
                transformer=transformer, sampler="unipc", width=w, height=h, frames=win * 4 - 3,
                real_guidance_scale=cfg, distilled_guidance_scale=gsc, guidance_rescale=rsc,
                num_inference_steps=stp, generator=gen,
                prompt_embeds=lv, prompt_embeds_mask=m, prompt_poolers=cp,
                negative_prompt_embeds=lv_n, negative_prompt_embeds_mask=m_n, negative_prompt_poolers=cp_n,
                device=gpu, dtype=torch.bfloat16, image_embeddings=img_emb,
                latent_indices=c, clean_latents=clean, clean_latent_indices=clean_idx,
                clean_latents_2x=two, clean_latent_2x_indices=e,
                clean_latents_4x=four, clean_latent_4x_indices=f, callback=cb
            )
            if last:
                # The final section gets the start-image latent prepended.
                new_lat = torch.cat([start_lat.to(new_lat), new_lat], 2)
            total += new_lat.shape[2]
            # New latents are prepended to the history.
            hist_lat = torch.cat([new_lat.to(hist_lat), hist_lat], 2)
            if not hv:
                offload_model_from_device_for_memory_preservation(transformer, gpu, 8)
                load_model_as_complete(vae, gpu)
            real = hist_lat[:, :, :total]
            if hist_px is None:
                hist_px = vae_decode(real, vae).cpu()
            else:
                # Later sections decode only the leading win * 2 latents and blend
                # them into the existing pixels via soft_append_bcthw.
                overlap = win * 4 - 3
                curr = vae_decode(real[:, :, :win * 2], vae).cpu()
                hist_px = soft_append_bcthw(curr, hist_px, overlap)
            if not hv:
                unload_complete_models()
            # Write the video rendered so far to OUT_TEMP and announce it.
            tmp_filename = f"{jid}_{total}.mp4"
            tmp = os.path.join(OUT_TEMP, tmp_filename)
            try:
                save_bcthw_as_mp4(hist_px, tmp, fps=30, crf=crf)
                os.chmod(tmp, 0o664)
            except Exception as e:
                logging.error(f"Failed to save video {tmp}: {e}")
                raise
            stream.put(('file', tmp))
            section_index += 1
            if last:
                # Move the finished file from OUT_TEMP to OUT_VID under the same name.
                # NOTE(review): the ('file', tmp) message above still carries the
                # OUT_TEMP path, which no longer exists after os.replace.
                fin_filename = f"{jid}_{total}.mp4"
                fin = os.path.join(OUT_VID, fin_filename)
                try:
                    os.replace(tmp, fin)
                    os.chmod(fin, 0o664)
                    # save_video_info is not defined in the visible part of this file.
                    save_video_info(prompt, n_p, fin_filename, seed, secs, None)
                    stream.put(('complete', fin))
                    render_status = "complete"
                    end_time = time.time()
                    render_time = end_time - start_render_time
                    # Only the three most recent render times are kept.
                    render_times.append(render_time)
                    if len(render_times) > 3:
                        render_times.pop(0)
                    return fin
                except Exception as e:
                    logging.error(f"Failed to finalize video {fin}: {e}")
                    raise
    except Exception as e:
        # Any failure inside the job is reported to the consumer as "stopped"
        # carrying the error text.
        traceback.print_exc()
        render_status = "error"
        stream.put(("stopped", str(e)))
        logging.error(f"Worker failed: {e}")
        return None
    finally:
        render_progress = 0.0
        start_render_time = None

@torch.no_grad()
def process(img, prm, npr, sd, sec, win, stp, cfg, gsc, rsc, kee, tea, crf):
    """Gradio generator: run worker() in the background and relay its messages.

    Each yielded 6-tuple updates, in order, the finished video, the latent
    preview, the log text, the progress bar HTML, the Generate button and the
    Stop button.

    Args:
        img: Uploaded image array, or None when nothing was uploaded.
        prm, npr: Prompt and negative prompt.
        sd, sec, win, stp, cfg, gsc, rsc, kee, tea, crf: Generation settings,
            forwarded unchanged to worker().
    """
    global stream
    if img is None:
        # Nothing was started, so Generate stays usable and Stop stays disabled.
        yield None, None, "Please upload an image to proceed.", "", gr.update(interactive=True), gr.update(interactive=False)
        return
    yield None, None, "", "", gr.update(interactive=False), gr.update(interactive=True)

    # Drop the stream of any previous job so leftover messages are never read
    # before worker() has installed a fresh one.
    stream = None
    worker_done = Event()

    def run_worker():
        # Flag completion even when worker() raises, so the relay loop below
        # cannot wait forever for a terminal message that will never arrive.
        try:
            return worker(img, prm, npr, sd, sec, win, stp, cfg, gsc, rsc, kee, tea, crf)
        finally:
            worker_done.set()

    loop = asyncio.new_event_loop()
    asyncio.set_event_loop(loop)
    try:
        loop.run_in_executor(None, run_worker)
        out, log = None, ""
        while True:
            try:
                # Read the flag before looking at the queue: once it is set, every
                # message the worker will ever send is already enqueued.
                finished = worker_done.is_set()
                current = stream
                if current is not None and not current.output_queue.empty():
                    flag, data = current.get()
                    if flag == "file":
                        out = data
                        yield out, gr.update(), gr.update(), log, gr.update(interactive=False), gr.update(interactive=True)
                    elif flag == "progress":
                        pv, desc, html = data
                        log = desc
                        yield gr.update(), gr.update(visible=True, value=pv), desc, html, gr.update(interactive=False), gr.update(interactive=True)
                    elif flag in ("complete", "stopped", "end"):
                        yield out, gr.update(visible=False), gr.update(), "", gr.update(interactive=True), gr.update(interactive=False)
                        break
                elif finished:
                    # The worker ended without sending a terminal message.
                    yield out, gr.update(visible=False), "Error occurred during processing.", "", gr.update(interactive=True), gr.update(interactive=False)
                    break
                else:
                    # Idle: sleep briefly instead of spinning a CPU core.
                    time.sleep(0.05)
            except Exception as e:
                logging.error(f"Error in process queue: {e}")
                yield None, gr.update(visible=False), "Error occurred during processing.", "", gr.update(interactive=True), gr.update(interactive=False)
                break
    finally:
        loop.close()

def end_process():
    """Ask the current render stream, if there is one, to stop."""
    if not stream:
        return
    stream.stop()

# ------------------- UI ------------------------------
quick_prompts = [
    ["Smooth animation: A character waves for 3 seconds, then stands still for 2 seconds, static camera, silent."],
    ["Smooth animation: A character moves for 5 seconds, static camera, silent."]
]
css = """
.orange-button{background:#ff6200;color:#fff;border-color:#ff6200;}
.load-button{background:#4CAF50;color:#fff;border-color:#4CAF50;margin-left:10px;}
.big-setting-button{background:#0066cc;color:#fff;border:none;padding:14px 24px;font-size:18px;width:100%;border-radius:6px;margin:8px 0;}
.styled-dropdown{width:250px;padding:5px;border-radius:4px;}
.viewer-column{width:100%;max-width:900px;margin:0 auto;}
.media-preview img,.media-preview video{max-width:100%;height:380px;object-fit:contain;border:1px solid #444;border-radius:6px;}
.media-container{display:flex;gap:20px;align-items:flex-start;}
.control-box{min-width:220px;}
.control-grid{display:grid;grid-template-columns:1fr 1fr;gap:10px;}
.image-gallery{display:grid!important;grid-template-columns:repeat(auto-fit,minmax(300px,1fr))!important;gap:10px;padding:10px!important;overflow-y:auto!important;max-height:360px!important;}
.image-gallery .gallery-item{padding:10px;height:360px!important;width:300px!important;}
.image-gallery img{object-fit:contain;height:360px!important;width:300px!important;}
.video-gallery{display:grid!important;grid-template-columns:repeat(auto-fit,minmax(300px,1fr))!important;gap:10px;padding:10px!important;overflow-y:auto!important;max-height:360px!important;}
.video-gallery .gallery-item{padding:10px;height:360px!important;width:300px!important;}
.video-gallery video{object-fit:contain;height:360px!important;width:300px!important;}
.stop-button {background-color: #ff4d4d !important; color: white !important;}
.progress-bar {
    width: 100%;
    height: 20px;
    background-color: #444;
    border-radius: 10px;
    overflow: hidden;
}
.progress-bar-fill {
    height: 100%;
    background-color: #ff6200;
    border-radius: 10px;
    transition: width 0.3s ease-in-out;
}
"""

blk = gr.Blocks(css=css, title="GhostPack F1 Pro").queue()
with blk:
    gr.Markdown("# 👻 GhostPack F1 Pro")
    with gr.Tabs():

        with gr.TabItem("👻 Generate"):
            with gr.Row():
                with gr.Column():
                    img_in = gr.Image(sources="upload", type="numpy", label="Image", height=320)
                    generate_button = gr.Button("Generate Video", elem_id="generate_button")
                    stop_button = gr.Button("Stop Generation", elem_id="stop_button", elem_classes="stop-button")
                    prm = gr.Textbox(
                        label="Prompt",
                        value="Smooth animation: A female stands with subtle, sensual micro-movements, breathing gently, slight head tilt, static camera, silent",
                        elem_id="prompt_input"
                    )
                    npr = gr.Textbox(
                        label="Negative Prompt",
                        value="low quality, blurry, speaking, talking, moaning, vocalizing, lip movement, mouth animation, sound, dialogue, speech, whispering, shouting, lip sync, facial animation, expressive face, verbal expression, animated mouth",
                        elem_id="negative_prompt_input"
                    )
                    save_msg = gr.Markdown("")
                    btn_save = gr.Button("Save Prompt")
                    btn1, btn2, btn3 = gr.Button("Load Most Recent"), gr.Button("Load 2nd Recent"), gr.Button("Load 3rd Recent")
                    ds = gr.Dataset(samples=quick_prompts, label="Quick List", components=[prm])
                    ds.click(lambda x: x[0], [ds], [prm])
                    btn_save.click(save_prompt_fn, [prm, npr], [save_msg])
                    btn1.click(lambda: load_prompt_fn(0), [], [prm])
                    btn2.click(lambda: load_prompt_fn(1), [], [prm])
                    btn3.click(lambda: load_prompt_fn(2), [], [prm])
                with gr.Column():
                    pv = gr.Image(label="Next Latents", height=200, visible=False)
                    vid = gr.Video(label="Finished", autoplay=True, height=500, loop=True, show_share_button=False)
                    log_md = gr.Markdown("")
                    bar = gr.HTML("")
            with gr.Column():
                se = gr.Number(label="Seed", value=31337, precision=0, elem_id="seed_input")
                sec = gr.Slider(label="Video Length (s)", minimum=1, maximum=120, value=5, step=0.1, elem_id="video_length_input")
                win = gr.Slider(label="Latent Window", minimum=1, maximum=33, value=5, step=1, elem_id="latent_window_input")
                stp = gr.Slider(label="Steps", minimum=1, maximum=100, value=12, step=1, elem_id="steps_input")
                cfg = gr.Slider(label="CFG", minimum=1, maximum=32, value=1, step=0.01, elem_id="cfg_input", visible=False)
                gsc = gr.Slider(label="Distilled CFG", minimum=1, maximum=32, value=7, step=0.1, elem_id="distilled_cfg_input")
                rsc = gr.Slider(label="CFG Re-Scale", minimum=0, maximum=1, value=0.7, step=0.01, elem_id="cfg_rescale_input")
                kee = gr.Slider(label="GPU Keep (GB)", minimum=4, maximum=free_mem, value=6, step=0.1, elem_id="gpu_keep_input")
                crf = gr.Slider(label="MP4 CRF", minimum=0, maximum=100, value=20, step=1, elem_id="mp4_crf_input")
                tea = gr.Checkbox(label="Use TeaCache", value=True, elem_id="use_teacache_input")
            generate_button.click(
                fn=process,
                inputs=[img_in, prm, npr, se, sec, win, stp, cfg, gsc, rsc, kee, tea, crf],
                outputs=[vid, pv, log_md, bar, generate_button, stop_button]
            )
            stop_button.click(fn=end_process)
            gr.Button("Update Progress").click(
                fn=get_progress,
                outputs=[log_md, bar]
            )

        with gr.TabItem("🖼️ Image Gallery"):
            with gr.Row(elem_classes="media-container"):
                with gr.Column(scale=3):
                    image_preview = gr.Image(
                        label="Viewer",
                        value=(list_images()[0] if list_images() else None),
                        interactive=False, elem_classes="media-preview"
                    )
                with gr.Column(elem_classes="control-box"):
                    image_dropdown = gr.Dropdown(
                        choices=[os.path.basename(i) for i in list_images()],
                        value=(os.path.basename(list_images()[0]) if list_images() else None),
                        label="Select", elem_classes="styled-dropdown"
                    )
                    with gr.Row(elem_classes="control-grid"):
                        load_btn = gr.Button("Load", elem_classes="load-button")
                        next_btn = gr.Button("Next", elem_classes="load-button")
                    with gr.Row(elem_classes="control-grid"):
                        refresh_btn = gr.Button("Refresh")
                        delete_btn = gr.Button("Delete", elem_classes="orange-button")
            image_gallery = gr.Gallery(
                value=list_images(), label="Thumbnails", columns=6, height=360,
                allow_preview=False, type="filepath", elem_classes="image-gallery"
            )
            load_btn.click(load_image, [image_dropdown], [image_preview, image_dropdown])
            next_btn.click(next_image_and_load, [image_dropdown], [image_preview, image_dropdown])
            refresh_btn.click(
                lambda: (
                    gr.update(choices=[os.path.basename(i) for i in list_images()],
                              value=os.path.basename(list_images()[0]) if list_images() else None),
                    gr.update(value=list_images()[0] if list_images() else None),
                    gr.update(value=list_images())
                ),
                [],
                [image_dropdown, image_preview, image_gallery]
            )
            delete_btn.click(
                lambda sel: (os.remove(os.path.join(OUT_IMG, sel)) if sel else None) or load_image(""),
                [image_dropdown],
                [image_preview, image_dropdown]
            )
            image_gallery.select(gallery_image_select, [], [image_preview, image_dropdown])

        # Video Gallery tab: a viewer with picker controls, followed by a thumbnail grid.
        with gr.TabItem("🎬 Video Gallery"):
            with gr.Row(elem_classes="media-container"):
                with gr.Column(scale=3):
                    # Viewer starts on the first entry of list_videos(), or empty when there is none.
                    video_preview = gr.Video(
                        label="Viewer",
                        value=(list_videos()[0] if list_videos() else None),
                        autoplay=True, loop=True, interactive=False, elem_classes="media-preview"
                    )
                with gr.Column(elem_classes="control-box"):
                    # The dropdown lists basenames only; the viewer above receives the
                    # unmodified list_videos() entry.
                    video_dropdown = gr.Dropdown(
                        choices=[os.path.basename(v) for v in list_videos()],
                        value=(os.path.basename(list_videos()[0]) if list_videos() else None),
                        label="Select", elem_classes="styled-dropdown"
                    )
                    with gr.Row(elem_classes="control-grid"):
                        load_vbtn = gr.Button("Load", elem_classes="load-button")
                        next_vbtn = gr.Button("Next", elem_classes="load-button")
                    with gr.Row(elem_classes="control-grid"):
                        refresh_v = gr.Button("Refresh")
                        delete_v = gr.Button("Delete", elem_classes="orange-button")
            video_gallery = gr.Gallery(
                value=list_videos(), label="Thumbnails", columns=6, height=360,
                allow_preview=False, type="filepath", elem_classes="video-gallery"
            )
            # Load / Next: both handlers take the current dropdown value and update
            # the viewer and the dropdown.
            load_vbtn.click(load_video, [video_dropdown], [video_preview, video_dropdown])
            next_vbtn.click(next_video_and_load, [video_dropdown], [video_preview, video_dropdown])
            # Refresh: re-reads list_videos() and returns one update per output, in the
            # order (dropdown, viewer, gallery). list_videos() is called several times
            # within this single lambda.
            refresh_v.click(
                lambda: (
                    gr.update(choices=[os.path.basename(v) for v in list_videos()],
                              value=os.path.basename(list_videos()[0]) if list_videos() else None),
                    gr.update(value=list_videos()[0] if list_videos() else None),
                    gr.update(value=list_videos())
                ),
                [],
                [video_dropdown, video_preview, video_gallery]
            )
            # Delete: removes OUT_VID/<selection> when something is selected. os.remove
            # returns None, so the `or` always falls through to load_video(""), whose
            # result feeds the viewer and dropdown.
            delete_v.click(
                lambda sel: (os.remove(os.path.join(OUT_VID, sel)) if sel else None) or load_video(""),
                [video_dropdown],
                [video_preview, video_dropdown]
            )
            # Thumbnail click: no component inputs are passed; gallery_video_select
            # presumably reads the selection from the event data (verify in its definition).
            video_gallery.select(gallery_video_select, [], [video_preview, video_dropdown])

        # About tab: static project information laid out as four side-by-side columns.
        with gr.TabItem("👻 About"):
            gr.Markdown("## GhostPack F1 Pro")
            with gr.Row():
                with gr.Column():
                    gr.Markdown("**🛠️ Description**\nImage-to-Video toolkit powered by HunyuanVideo & FramePack-F1")
                with gr.Column():
                    # Version text comes from the module-level VERSION constant.
                    gr.Markdown(f"**📦 Version**\n{VERSION}")
                with gr.Column():
                    gr.Markdown("**✍️ Author**\nGhostAI")
                with gr.Column():
                    gr.Markdown("**🔗 Repo**\nhttps://huggingface.co/spaces/ghostai1/GhostPack")

        # Settings tab: four clean-up buttons, each followed by an initially empty
        # Markdown element that serves as the output of its click handler.
        with gr.TabItem("⚙️ Settings"):
            ct = gr.Button("Clear Temp", elem_classes="big-setting-button")
            ctmsg = gr.Markdown("")
            co = gr.Button("Clear Old", elem_classes="big-setting-button")
            comsg = gr.Markdown("")
            ci = gr.Button("Clear Images", elem_classes="big-setting-button")
            cimg = gr.Markdown("")
            cv = gr.Button("Clear Videos", elem_classes="big-setting-button")
            cvid = gr.Markdown("")
            # Handlers take no inputs; each one's result goes to the Markdown created
            # right after its button.
            ct.click(clear_temp_videos, [], ctmsg)
            co.click(clear_old_files, [], comsg)
            ci.click(clear_images, [], cimg)
            cv.click(clear_videos, [], cvid)

        # Install tab: one read-only status box plus an install button for each
        # optional attention backend (xformers, sage-attn, flash-attn).
        with gr.TabItem("🛠️ Install"):
            # Each status box is filled by calling its status_*() helper once, while the UI is built.
            xs = gr.Textbox(value=status_xformers(), interactive=False, label="xformers")
            bx = gr.Button("Install xformers", elem_classes="big-setting-button")
            ss = gr.Textbox(value=status_sage(), interactive=False, label="sage-attn")
            bs = gr.Button("Install sage-attn", elem_classes="big-setting-button")
            fs = gr.Textbox(value=status_flash(), interactive=False, label="flash-attn")
            bf = gr.Button("Install flash-attn", elem_classes="big-setting-button")
            # Each install handler takes no inputs and writes its result into the
            # matching status box.
            bx.click(install_xformers, [], xs)
            bs.click(install_sage_attn, [], ss)
            bf.click(install_flash_attn, [], fs)

        # Logs tab: a read-only 20-line text area with Refresh and Clear buttons.
        with gr.TabItem("📜 Logs"):
            logs = gr.Textbox(lines=20, interactive=False, label="Install Logs")
            rl = gr.Button("Refresh", elem_classes="big-setting-button")
            cl = gr.Button("Clear", elem_classes="big-setting-button")
            # Both handlers take no inputs and write their result into the text area.
            rl.click(refresh_logs, [], logs)
            cl.click(clear_logs, [], logs)

    # Force video previews to seek to 2s
    # The embedded script registers a `loadedmetadata` listener on every <video>
    # under `.video-gallery` and jumps to t=2s when the clip is longer than 2s.
    # NOTE(review): querySelectorAll runs once, when the script itself runs, so
    # <video> elements created afterwards would not get the listener.
    # NOTE(review): confirm that <script> tags passed through gr.HTML are actually
    # executed by the Gradio version in use; if not, this block has no effect.
    gr.HTML("""
<script>
document.querySelectorAll('.video-gallery video').forEach(v => {
  v.addEventListener('loadedmetadata', () => {
    if (v.duration > 2) v.currentTime = 2;
  });
});
</script>
""")

    # Camera action update
    # Dropdown of camera movements; the chosen label is handed to update_prompt
    # together with the current prompt text.
    camera_action_input = gr.Dropdown(
        choices=[
            "Static Camera",
            "Slight Orbit Left",
            "Slight Orbit Right",
            "Slight Orbit Up",
            "Slight Orbit Down",
            "Top-Down View",
            "Slight Zoom In",
            "Slight Zoom Out"
        ],
        label="Camera Action",
        value="Static Camera",
        elem_id="camera_action_input",
        info="Select a camera movement to append to the prompt."
    )
    # update_prompt is defined after this Blocks context, so it is not yet bound
    # while the UI is being built; wrapping the call in a lambda defers the name
    # lookup until the change event fires. The handler's result replaces the
    # contents of `prm`.
    camera_action_input.change(
        fn=lambda prompt, camera_action: update_prompt(prompt, camera_action),
        inputs=[prm, camera_action_input],
        outputs=prm
    )

def update_prompt(prompt, camera_action):
    """Replace any camera-action suffix in *prompt* with *camera_action*.

    Every known ", <camera phrase>" fragment is stripped from the prompt
    (case-insensitively), then the lower-cased *camera_action* is appended as
    ", <action>" provided the result stays within the 50-word budget.

    Args:
        prompt: Current prompt text. ``None`` is treated as an empty prompt.
        camera_action: Label chosen in the camera dropdown. A falsy value or
            the literal string ``"None"`` only strips existing phrases.

    Returns:
        The updated prompt. When appending would exceed the budget, the
        stripped prompt is returned without a camera phrase and a warning
        is logged.
    """
    # The appended phrase is the lower-cased dropdown label (e.g.
    # "slight orbit left"), so those spellings must be removable; otherwise
    # every dropdown change stacks another phrase onto the prompt. The
    # "slight camera ..." spellings are kept so prompts written in that form
    # are still cleaned.
    known_phrases = [
        "static camera", "top-down view",
        "slight orbit left", "slight orbit right",
        "slight orbit up", "slight orbit down",
        "slight zoom in", "slight zoom out",
        "slight camera orbit left", "slight camera orbit right",
        "slight camera orbit up", "slight camera orbit down",
        "slight camera zoom in", "slight camera zoom out",
    ]
    # Longest alternatives first so a shorter phrase can never shadow a longer one.
    alternation = "|".join(
        re.escape(phrase) for phrase in sorted(known_phrases, key=len, reverse=True)
    )
    prompt = re.sub(
        rf",\s*(?:{alternation})\b", "", prompt or "", flags=re.IGNORECASE
    ).strip()

    # Append selected camera action
    if camera_action and camera_action != "None":
        camera_phrase = f", {camera_action.lower()}"
        # The budget check splits the phrase on whitespace, so its leading
        # comma counts as one word.
        if len(prompt.split()) + len(camera_phrase.split()) <= 50:
            return prompt + camera_phrase
        logging.warning(
            "Prompt exceeds 50 words after adding camera action: %s", prompt
        )
    return prompt

def get_progress():
    """Return the current render state as ``(markdown_summary, progress_bar_html)``.

    Reads the module-level ``render_status``, ``render_progress`` and
    ``render_times`` values; the last render time is reported as 0 when no
    render has been recorded yet.
    """
    last_render_time = render_times[-1] if render_times else 0
    summary = (
        f"Status: {render_status}\n"
        f"Progress: {render_progress:.1f}%\n"
        f"Last Render Time: {last_render_time:.1f}s"
    )
    # The bar shows whole percentages only, both as its width and as its label.
    whole_percent = int(render_progress)
    bar_html = ProgressBar().make_progress_bar_html(whole_percent, f"{whole_percent}%")
    return summary, bar_html

class ProgressBar:
    """Builds a self-contained HTML snippet (inline CSS plus markup) for a progress bar."""

    # Rules for the bar track (.progress-bar, #444) and its fill
    # (.progress-bar-fill, #ff6200); the fill animates width changes.
    _STYLESHEET = """
        .progress-bar {
            width: 100%;
            height: 20px;
            background-color: #444;
            border-radius: 10px;
            overflow: hidden;
        }
        .progress-bar-fill {
            height: 100%;
            background-color: #ff6200;
            border-radius: 10px;
            transition: width 0.3s ease-in-out;
        }
        """

    def make_progress_bar_css(self):
        """Return the CSS rules used by the progress bar markup."""
        return self._STYLESHEET

    def make_progress_bar_html(self, percentage, label):
        """Return the bar markup with the fill set to *percentage* percent wide.

        Args:
            percentage: Value interpolated as the fill width, followed by ``%``.
            label: Text rendered inside the fill.
        """
        return f"""
        <style>{self.make_progress_bar_css()}</style>
        <div class="progress-bar">
            <div class="progress-bar-fill" style="width: {percentage}%;">
                <span style="color: white; position: absolute; margin-left: 10px;">{label}</span>
            </div>
        </div>
        """

# Start serving the UI, forwarding the server, port, share and inbrowser values held on `args`.
blk.launch(server_name=args.server, server_port=args.port,
           share=args.share, inbrowser=args.inbrowser)