import torch
import numpy as np
from diffusers import WanImageToVideoPipeline
from diffusers.utils import export_to_video, load_image

model_id = "/workspace/Wan2.2-I2V-A14B-Diffusers-bf16"
dtype = torch.bfloat16

pipe = WanImageToVideoPipeline.from_pretrained(
    model_id,
    torch_dtype=dtype,
)

pipe.enable_attention_slicing()
pipe.vae.enable_slicing()
pipe.vae.enable_tiling()
pipe.enable_model_cpu_offload()

print("WAN I2V loaded with balanced CPU offload")


# ---------- RUN ----------
image = load_image(
    "https://huggingface.co/datasets/YiYiXu/testing-images/resolve/main/wan_i2v_input.JPG"
)

target_height = 480

# Сохраняем соотношение сторон
aspect_ratio = image.width / image.height
target_width = int(target_height * aspect_ratio)

# Учитываем модификаторы (patch_size и vae_scale_factor)
mod_value = pipe.vae_scale_factor_spatial * pipe.transformer.config.patch_size[1]
mod_value = 64
print(mod_value)
height = target_height // mod_value * mod_value
width = target_width // mod_value * mod_value

image = image.resize((width, height))

print((width, height))
prompt = "Summer beach vacation style, a white cat wearing sunglasses sits on a surfboard. The fluffy-furred feline gazes directly at the camera with a relaxed expression. Blurred beach scenery forms the background featuring crystal-clear waters, distant green hills, and a blue sky dotted with white clouds. The cat assumes a naturally relaxed posture, as if savoring the sea breeze and warm sunlight. A close-up shot highlights the feline's intricate details and the refreshing atmosphere of the seaside."

negative_prompt = "色调艳丽，过曝，静态，细节模糊不清，字幕，风格，作品，画作，画面，静止，整体发灰，最差质量，低质量，JPEG压缩残留，丑陋的，残缺的，多余的手指，画得不好的手部，画得不好的脸部，畸形的，毁容的，形态畸形的肢体，手指融合，静止不动的画面，杂乱的背景，三条腿，背景人很多，倒着走"
generator = torch.Generator("cuda").manual_seed(0)
output = pipe(
    image=image,
    prompt=prompt,
    negative_prompt=negative_prompt,
    height=height,
    width=width,
    num_frames=81,
    guidance_scale=3.5,
    num_inference_steps=25,
    generator=generator,
).frames[0]
export_to_video(output, "i2v_output.mp4", fps=16)
print('ok')