# Wan2.2-Animate / app.py
# kelseye's picture
# Update app.py
# 7b7aba3 verified
# app.py
import os
import oss2
import sys
import uuid
import shutil
import time
import gradio as gr
import requests
import dashscope
from dashscope.utils.oss_utils import check_and_upload_local
# DashScope API key, read from the DASHSCOPE_API_KEY environment variable
# (None when the variable is not set).
DASHSCOPE_API_KEY = os.getenv("DASHSCOPE_API_KEY")
# Give the dashscope SDK the same key through its module-level attribute.
dashscope.api_key = DASHSCOPE_API_KEY
class WanAnimateApp:
    """Submit Wan2.2-Animate jobs to an asynchronous HTTP API and wait for them.

    A job is created with a POST to ``url``; its state is then polled with
    GET requests to ``<get_url>/<task_id>`` until it reaches a final state.
    """

    # Final states that mean no video will be produced. Polling on any of
    # these would otherwise loop forever.
    # NOTE(review): state names taken from the DashScope async-task API docs.
    _TERMINAL_FAILURES = ("FAILED", "CANCELED", "UNKNOWN")

    def __init__(self, url, get_url, poll_interval=5, request_timeout=60):
        """Store the endpoints and polling settings.

        Args:
            url: Endpoint that accepts the job-creation POST request.
            get_url: Base endpoint for task status queries; the task id is
                appended as the last path segment.
            poll_interval: Seconds to sleep between two status queries.
            request_timeout: Timeout in seconds passed to every HTTP request
                so a stalled connection cannot block the caller forever.
        """
        self.url = url
        self.get_url = get_url
        self.poll_interval = poll_interval
        self.request_timeout = request_timeout

    def _task_url(self, task_id):
        """Return the status URL for *task_id* without doubling the slash."""
        return f"{self.get_url.rstrip('/')}/{task_id}"

    def predict(
        self,
        ref_img,
        video,
        model_id,
        model,
    ):
        """Run one animation job and block until it finishes.

        Args:
            ref_img: Path of the reference image.
            video: Path of the template video.
            model_id: Value sent as the request's ``model`` field.
            model: Value sent as the ``mode`` request parameter.

        Returns:
            A ``(video_url, status)`` pair. ``video_url`` is ``None`` whenever
            no video was produced, in which case ``status`` explains why.

        Raises:
            Exception: If the submit or status request does not answer with
                HTTP 200, or if the submit response carries no task id.
        """
        # Without both inputs the upload helper would fail with an opaque
        # error, so report the problem through the status output instead.
        if not ref_img or not video:
            return None, "Please provide both a reference image and a template video."

        # Upload files to OSS if needed and get URLs
        _, image_url = check_and_upload_local(model_id, ref_img, DASHSCOPE_API_KEY)
        _, video_url = check_and_upload_local(model_id, video, DASHSCOPE_API_KEY)

        payload = {
            "model": model_id,
            "input": {
                "image_url": image_url,
                "video_url": video_url,
            },
            "parameters": {
                "check_image": True,
                "mode": model,
            },
        }

        # Headers shared by the submit request and the status queries.
        auth_headers = {
            "Authorization": f"Bearer {DASHSCOPE_API_KEY}",
            "Content-Type": "application/json",
        }
        submit_headers = {
            "X-DashScope-Async": "enable",
            "X-DashScope-OssResourceResolve": "enable",
            **auth_headers,
        }

        # Create the task.
        response = requests.post(
            self.url,
            json=payload,
            headers=submit_headers,
            timeout=self.request_timeout,
        )
        if response.status_code != 200:
            raise Exception(f"Initial request failed with status code {response.status_code}: {response.text}")

        task_id = response.json().get("output", {}).get("task_id")
        if not task_id:
            raise Exception("Failed to get task ID from response")

        # Poll until the task reaches a final state.
        status_url = self._task_url(task_id)
        while True:
            response = requests.get(
                status_url,
                headers=auth_headers,
                timeout=self.request_timeout,
            )
            if response.status_code != 200:
                raise Exception(f"Failed to get task status: {response.status_code}: {response.text}")

            result = response.json()
            print(result)
            output = result.get("output", {})
            task_status = output.get("task_status")

            if task_status == "SUCCEEDED":
                result_url = (output.get("results") or {}).get("video_url")
                if not result_url:
                    # A success report without a URL is still a failure for
                    # the caller; say so instead of raising KeyError.
                    return None, f"Task succeeded but no video URL was returned. TaskId: {task_id}"
                return result_url, "SUCCEEDED"

            if task_status in self._TERMINAL_FAILURES:
                error_msg = output.get("message", "Unknown error")
                code_msg = output.get("code", "Unknown code")
                if task_status == "FAILED":
                    prefix = "Task failed"
                else:
                    prefix = f"Task ended with status {task_status}"
                status_text = f"{prefix}: {error_msg} Code: {code_msg} TaskId: {task_id}"
                print(f"\n\n{status_text}\n\n")
                return None, status_text

            # Task is still pending or running: wait before asking again.
            time.sleep(self.poll_interval)
def start_app():
    """Build the Gradio interface for Wan2.2-Animate and serve it.

    Command-line arguments are parsed first (no options are defined, so only
    ``-h/--help`` is accepted), then a ``WanAnimateApp`` is created for the
    DashScope endpoints and wired to the UI, and finally the demo is queued
    and launched on ``0.0.0.0:7860``.
    """
    import argparse

    argparse.ArgumentParser(description="Wan2.2-Animate 视频生成工具").parse_args()

    # Production endpoints. An earlier revision kept commented-out
    # alternatives pointing at the same paths on poc-dashscope.aliyuncs.com.
    submit_endpoint = "https://dashscope.aliyuncs.com/api/v1/services/aigc/image2video/video-synthesis/"
    task_endpoint = "https://dashscope.aliyuncs.com/api/v1/tasks/"
    animator = WanAnimateApp(url=submit_endpoint, get_url=task_endpoint)

    # Page banner: title, affiliation and link buttons.
    banner_html = """
<div style="padding: 2rem; text-align: center; max-width: 1200px; margin: 0 auto; font-family: Arial, sans-serif;">
<h1 style="font-size: 2.5rem; font-weight: bold; margin-bottom: 0.5rem; color: #333;">
Wan2.2-Animate: Unified Character Animation and Replacement with Holistic Replication
</h1>
<h3 style="font-size: 2.5rem; font-weight: bold; margin-bottom: 0.5rem; color: #333;">
Wan2.2-Animate: 统一的角色动画和视频人物替换模型
</h3>
<div style="font-size: 1.25rem; margin-bottom: 1.5rem; color: #555;">
Tongyi Lab, Alibaba
</div>
<div style="display: flex; flex-wrap: wrap; justify-content: center; gap: 1rem; margin-bottom: 1rem;">
<!-- 第一行按钮 -->
<a href="https://arxiv.org/abs/2509.14055" target="_blank"
style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; /* 浅灰色背景 */ color: #333; /* 深色文字 */ text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
<span style="margin-right: 0.5rem;">📄</span> <!-- 使用文档图标 -->
<span>Paper</span>
</a>
<a href="https://github.com/Wan-Video/Wan2.2" target="_blank"
style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
<span style="margin-right: 0.5rem;">💻</span> <!-- 使用电脑图标 -->
<span>GitHub</span>
</a>
<a href="https://huggingface.co/Wan-AI/Wan2.2-Animate-14B" target="_blank"
style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
<span style="margin-right: 0.5rem;">🤗</span>
<span>HF Model</span>
</a>
<a href="https://www.modelscope.cn/models/Wan-AI/Wan2.2-Animate-14B" target="_blank"
style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
<span style="margin-right: 0.5rem;">🤖</span>
<span>MS Model</span>
</a>
</div>
<div style="display: flex; flex-wrap: wrap; justify-content: center; gap: 1rem;">
<!-- 第二行按钮 -->
<a href="https://huggingface.co/spaces/Wan-AI/Wan2.2-Animate" target="_blank"
style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
<span style="margin-right: 0.5rem;">🤗</span>
<span>HF Space</span>
</a>
<a href="https://www.modelscope.cn/studios/Wan-AI/Wan2.2-Animate" target="_blank"
style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
<span style="margin-right: 0.5rem;">🤖</span>
<span>MS Studio</span>
</a>
</div>
</div>
"""

    # Collapsible usage notes shown under the banner.
    usage_html = """
<details>
<summary>‼️Usage (使用说明)</summary>
Wan-Animate supports two mode:
<ul>
<li>Move Mode: animate the character in input image with movements from the input video</li>
<li>Mix Mode: replace the character in input video with the character in input image</li>
</ul>
Wan-Animate 支持两种模式:
<ul>
<li>Move模式: 用输入视频中提取的动作,驱动输入图片中的角色</li>
<li>Mix模式: 用输入图片中的角色,替换输入视频中的角色</li>
</ul>
Currently, the following restrictions apply to inputs:
<ul> <li>Video file size: Less than 200MB</li>
<li>Video resolution: The shorter side must be greater than 200, and the longer side must be less than 2048</li>
<li>Video duration: 2s to 30s</li>
<li>Video aspect ratio: 1:3 to 3:1</li>
<li>Video formats: mp4, avi, mov</li>
<li>Image file size: Less than 5MB</li>
<li>Image resolution: The shorter side must be greater than 200, and the longer side must be less than 4096</li>
<li>Image formats: jpg, png, jpeg, webp, bmp</li> </ul>
当前,对于输入有以下的限制
<ul>
<li>视频文件大小: 小于 200MB</li>
<li>视频分辨率: 最小边大于 200, 最大边小于2048</li>
<li>视频时长: 2s ~ 30s </li>
<li>视频比例:1:3 ~ 3:1 </li>
<li>视频格式: mp4, avi, mov </li>
<li>图片文件大小: 小于5MB </li>
<li>图片分辨率:最小边大于200,最大边小于4096 </li>
<li>图片格式: jpg, png, jpeg, webp, bmp </li>
</ul>
<p> Currently, the inference quality has two variants. You can use our open-source code for more flexible configuration. </p>
<p>当前,推理质量有两个变种。 您可以使用我们的开源代码,来进行更灵活的设置。</p>
<ul>
<li> wan-pro: 25fps, 720p </li>
<li> wan-std: 15fps, 720p </li>
</ul>
</details>
"""

    # One example row per bundled sample: image, video, mode, quality.
    sample_rows = [
        ['./examples/mov/1/1.jpeg', './examples/mov/1/1.mp4', 'wan2.2-animate-move', 'wan-pro'],
        ['./examples/mov/2/2.jpeg', './examples/mov/2/2.mp4', 'wan2.2-animate-move', 'wan-pro'],
        ['./examples/mix/1/1.jpeg', './examples/mix/1/1.mp4', 'wan2.2-animate-mix', 'wan-pro'],
        ['./examples/mix/2/2.jpeg', './examples/mix/2/2.mp4', 'wan2.2-animate-mix', 'wan-pro'],
    ]

    with gr.Blocks(title="Wan2.2-Animate 视频生成") as ui:
        gr.HTML(banner_html)
        gr.HTML(usage_html)

        with gr.Row():
            # Left column: inputs and the trigger button.
            with gr.Column():
                image_input = gr.Image(
                    label="Reference Image(参考图像)",
                    type="filepath",
                    sources=["upload"],
                )
                video_input = gr.Video(
                    label="Template Video(模版视频)",
                    sources=["upload"],
                )
                with gr.Row():
                    mode_choice = gr.Dropdown(
                        label="Mode(模式)",
                        choices=["wan2.2-animate-move", "wan2.2-animate-mix"],
                        value="wan2.2-animate-move",
                        info="",
                    )
                    quality_choice = gr.Dropdown(
                        label="推理质量(Inference Quality)",
                        choices=["wan-pro", "wan-std"],
                        value="wan-pro",
                    )
                generate_btn = gr.Button("Generate Video(生成视频)")

            # Right column: generated video and status text.
            with gr.Column():
                result_video = gr.Video(label="Output Video(输出视频)")
                status_box = gr.Textbox(label="Status(状态)")

        # The button and the examples drive the same function with the same
        # components, so the component lists are defined once.
        predict_inputs = [image_input, video_input, mode_choice, quality_choice]
        predict_outputs = [result_video, status_box]

        generate_btn.click(
            fn=animator.predict,
            inputs=predict_inputs,
            outputs=predict_outputs,
        )

        gr.Examples(
            examples=sample_rows,
            inputs=predict_inputs,
            outputs=predict_outputs,
            fn=animator.predict,
            cache_examples="lazy",
        )

    ui.queue(default_concurrency_limit=100)
    ui.launch(
        server_name="0.0.0.0",
        server_port=7860,
    )
# Build and launch the demo only when this file is run as a script,
# not when it is imported.
if __name__ == "__main__":
    start_app()