Spaces:

Wan-AI
/

Wan2.2-Animate

Running

App Files Files Community

Wan2.2-Animate / app.py

kelseye

Update app.py

7b7aba3 verified 3 days ago

raw

history blame contribute delete

13.3 kB

	# app.py
	import os
	import oss2
	import sys
	import uuid
	import shutil
	import time
	import gradio as gr
	import requests

	import dashscope
	from dashscope.utils.oss_utils import check_and_upload_local

	# Read the DashScope credential from the environment once, at import time.
	# The value is None when the variable is unset; it is handed to the SDK here
	# and reused by the raw HTTP calls made elsewhere in this file.
	DASHSCOPE_API_KEY = os.environ.get("DASHSCOPE_API_KEY")
	dashscope.api_key = DASHSCOPE_API_KEY


	class WanAnimateApp:
	    """HTTP client for an asynchronous DashScope video-synthesis task.

	    ``url`` is the endpoint a task is submitted to and ``get_url`` is the
	    base endpoint the task status is polled from. ``predict`` submits a
	    task and blocks until the task reaches a terminal status.
	    """

	    # Per-request network timeout (seconds) so a stalled connection cannot
	    # block the calling worker forever.
	    REQUEST_TIMEOUT = 60
	    # Pause (seconds) between two consecutive status polls.
	    POLL_INTERVAL = 5
	    # Statuses after which the task will make no further progress. Anything
	    # not listed here (and not "SUCCEEDED") is treated as "still running".
	    # NOTE(review): CANCELED/UNKNOWN are taken from the DashScope task API
	    # documentation - confirm against the current API reference.
	    TERMINAL_FAILURE_STATUSES = ("FAILED", "CANCELED", "UNKNOWN")

	    def __init__(self, url, get_url):
	        """Store the submission endpoint and the task-status base endpoint."""
	        self.url = url
	        self.get_url = get_url

	    def predict(
	        self,
	        ref_img,
	        video,
	        model_id,
	        model,
	    ):
	        """Submit an animation task and wait for its result.

	        Args:
	            ref_img: Reference image location, passed to
	                ``check_and_upload_local`` to obtain a URL.
	            video: Template video location, handled like ``ref_img``.
	            model_id: Sent as ``model`` in the request payload.
	            model: Sent as ``parameters.mode`` in the request payload.

	        Returns:
	            ``(video_url, "SUCCEEDED")`` when the task succeeds, or
	            ``(None, message)`` when an input is missing or the task ends
	            in a terminal failure status.

	        Raises:
	            Exception: If an HTTP call returns a non-200 status, the
	                submission response carries no task id, or a succeeded
	                task carries no video URL.
	        """
	        # Fail early with a readable status instead of an obscure error from
	        # the upload helper when the user has not provided both inputs.
	        if not ref_img or not video:
	            return None, (
	                "Please upload both a reference image and a template video. "
	                "(请上传参考图像和模版视频)"
	            )

	        task_id = self._submit_task(ref_img, video, model_id, model)
	        return self._wait_for_task(task_id)

	    def _submit_task(self, ref_img, video, model_id, model):
	        """Upload the inputs if needed, create the task and return its id."""
	        # NOTE(review): indexed rather than unpacked so the call also works
	        # if the helper returns more than two elements - confirm against the
	        # pinned dashscope version.
	        image_url = check_and_upload_local(model_id, ref_img, DASHSCOPE_API_KEY)[1]
	        video_url = check_and_upload_local(model_id, video, DASHSCOPE_API_KEY)[1]

	        payload = {
	            "model": model_id,
	            "input": {
	                "image_url": image_url,
	                "video_url": video_url,
	            },
	            "parameters": {
	                "check_image": True,
	                "mode": model,
	            },
	        }
	        headers = {
	            "X-DashScope-Async": "enable",
	            "X-DashScope-OssResourceResolve": "enable",
	            "Authorization": f"Bearer {DASHSCOPE_API_KEY}",
	            "Content-Type": "application/json",
	        }

	        response = requests.post(
	            self.url,
	            json=payload,
	            headers=headers,
	            timeout=self.REQUEST_TIMEOUT,
	        )
	        if response.status_code != 200:
	            raise Exception(
	                f"Initial request failed with status code {response.status_code}: {response.text}"
	            )

	        # "output" may be absent or null; normalise both to an empty dict.
	        output = response.json().get("output") or {}
	        task_id = output.get("task_id")
	        if not task_id:
	            raise Exception("Failed to get task ID from response")
	        return task_id

	    def _wait_for_task(self, task_id):
	        """Poll the task until it reaches a terminal status and report it."""
	        # Strip a trailing slash so a base such as ".../tasks/" does not
	        # yield ".../tasks//<id>".
	        status_url = f"{self.get_url.rstrip('/')}/{task_id}"
	        headers = {
	            "Authorization": f"Bearer {DASHSCOPE_API_KEY}",
	            "Content-Type": "application/json",
	        }

	        while True:
	            response = requests.get(
	                status_url,
	                headers=headers,
	                timeout=self.REQUEST_TIMEOUT,
	            )
	            if response.status_code != 200:
	                raise Exception(
	                    f"Failed to get task status: {response.status_code}: {response.text}"
	                )

	            result = response.json()
	            print(result)
	            output = result.get("output") or {}
	            task_status = output.get("task_status")

	            if task_status == "SUCCEEDED":
	                video_url = (output.get("results") or {}).get("video_url")
	                if not video_url:
	                    raise Exception(
	                        f"Task succeeded but the response contains no video URL. TaskId: {task_id}"
	                    )
	                return video_url, "SUCCEEDED"

	            if task_status in self.TERMINAL_FAILURE_STATUSES:
	                # Report the failure through the status output instead of
	                # raising, so the message reaches the caller as text.
	                error_msg = output.get("message", "Unknown error")
	                code_msg = output.get("code", "Unknown code")
	                if task_status == "FAILED":
	                    prefix = "Task failed"
	                else:
	                    prefix = f"Task ended with status {task_status}"
	                status_msg = f"{prefix}: {error_msg} Code: {code_msg} TaskId: {task_id}"
	                print(f"\n\n{status_msg}\n\n")
	                return None, status_msg

	            # Task is still pending/running: wait before polling again.
	            time.sleep(self.POLL_INTERVAL)

	def start_app():
	    """Build the Gradio UI for Wan2.2-Animate and launch the web server.

	    Parses the command line (no options are defined, so this only provides
	    ``--help`` and rejects unknown arguments), creates a ``WanAnimateApp``
	    bound to the DashScope endpoints, assembles the page (header, usage
	    notes, inputs, outputs, examples) and serves it on ``0.0.0.0:7860``.
	    The call blocks inside ``demo.launch``.
	    """
	    import argparse

	    parser = argparse.ArgumentParser(description="Wan2.2-Animate 视频生成工具")
	    parser.parse_args()

	    url = "https://dashscope.aliyuncs.com/api/v1/services/aigc/image2video/video-synthesis/"
	    # PoC alternative: "https://poc-dashscope.aliyuncs.com/api/v1/services/aigc/image2video/video-synthesis"

	    # No trailing slash: the task id is appended as "/<task_id>" by the
	    # client, so a trailing slash here would produce ".../tasks//<task_id>".
	    get_url = "https://dashscope.aliyuncs.com/api/v1/tasks"
	    # PoC alternative: "https://poc-dashscope.aliyuncs.com/api/v1/tasks"
	    app = WanAnimateApp(url=url, get_url=get_url)

	    with gr.Blocks(title="Wan2.2-Animate 视频生成") as demo:
	        # Page header: title, affiliation and link buttons.
	        gr.HTML("""


	<div style="padding: 2rem; text-align: center; max-width: 1200px; margin: 0 auto; font-family: Arial, sans-serif;">

	<h1 style="font-size: 2.5rem; font-weight: bold; margin-bottom: 0.5rem; color: #333;">
	Wan2.2-Animate: Unified Character Animation and Replacement with Holistic Replication
	</h1>

	<h3 style="font-size: 2.5rem; font-weight: bold; margin-bottom: 0.5rem; color: #333;">
	Wan2.2-Animate: 统一的角色动画和视频人物替换模型
	</h3>

	<div style="font-size: 1.25rem; margin-bottom: 1.5rem; color: #555;">
	Tongyi Lab, Alibaba
	</div>

	<div style="display: flex; flex-wrap: wrap; justify-content: center; gap: 1rem; margin-bottom: 1rem;">
	<!-- 第一行按钮 -->
	<a href="https://arxiv.org/abs/2509.14055" target="_blank"
	style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
	<span style="margin-right: 0.5rem;">📄</span> <!-- 使用文档图标 -->
	<span>Paper</span>
	</a>

	<a href="https://github.com/Wan-Video/Wan2.2" target="_blank"
	style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
	<span style="margin-right: 0.5rem;">💻</span> <!-- 使用电脑图标 -->
	<span>GitHub</span>
	</a>

	<a href="https://huggingface.co/Wan-AI/Wan2.2-Animate-14B" target="_blank"
	style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
	<span style="margin-right: 0.5rem;">🤗</span>
	<span>HF Model</span>
	</a>

	<a href="https://www.modelscope.cn/models/Wan-AI/Wan2.2-Animate-14B" target="_blank"
	style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
	<span style="margin-right: 0.5rem;">🤖</span>
	<span>MS Model</span>
	</a>
	</div>

	<div style="display: flex; flex-wrap: wrap; justify-content: center; gap: 1rem;">
	<!-- 第二行按钮 -->
	<a href="https://huggingface.co/spaces/Wan-AI/Wan2.2-Animate" target="_blank"
	style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
	<span style="margin-right: 0.5rem;">🤗</span>
	<span>HF Space</span>
	</a>

	<a href="https://www.modelscope.cn/studios/Wan-AI/Wan2.2-Animate" target="_blank"
	style="display: inline-flex; align-items: center; padding: 0.5rem 1rem; background-color: #f0f0f0; color: #333; text-decoration: none; border-radius: 9999px; font-weight: 500; transition: background-color 0.3s;">
	<span style="margin-right: 0.5rem;">🤖</span>
	<span>MS Studio</span>
	</a>
	</div>

	</div>

	""")

	        # Collapsible usage notes and input restrictions (English + Chinese).
	        gr.HTML("""
	<details>
	<summary>‼️Usage (使用说明)</summary>

	Wan-Animate supports two mode:
	<ul>
	<li>Move Mode: animate the character in input image with movements from the input video</li>
	<li>Mix Mode: replace the character in input video with the character in input image</li>
	</ul>

	Wan-Animate 支持两种模式:
	<ul>
	<li>Move模式: 用输入视频中提取的动作，驱动输入图片中的角色</li>
	<li>Mix模式: 用输入图片中的角色，替换输入视频中的角色</li>
	</ul>

	Currently, the following restrictions apply to inputs:

	<ul> <li>Video file size: Less than 200MB</li>
	<li>Video resolution: The shorter side must be greater than 200, and the longer side must be less than 2048</li>
	<li>Video duration: 2s to 30s</li>
	<li>Video aspect ratio: 1:3 to 3:1</li>
	<li>Video formats: mp4, avi, mov</li>
	<li>Image file size: Less than 5MB</li>
	<li>Image resolution: The shorter side must be greater than 200, and the longer side must be less than 4096</li>
	<li>Image formats: jpg, png, jpeg, webp, bmp</li> </ul>


	当前，对于输入有以下的限制

	<ul>
	<li>视频文件大小: 小于 200MB</li>
	<li>视频分辨率：最小边大于 200, 最大边小于2048</li>
	<li>视频时长: 2s ~ 30s </li>
	<li>视频比例：1:3 ~ 3:1 </li>
	<li>视频格式: mp4, avi, mov </li>
	<li>图片文件大小: 小于5MB </li>
	<li>图片分辨率：最小边大于200，最大边小于4096 </li>
	<li>图片格式: jpg, png, jpeg, webp, bmp </li>
	</ul>

	<p> Currently, the inference quality has two variants. You can use our open-source code for more flexible configuration. </p>

	<p>当前，推理质量有两个变种。您可以使用我们的开源代码，来进行更灵活的设置。</p>

	<ul>
	<li> wan-pro: 25fps, 720p </li>
	<li> wan-std: 15fps, 720p </li>
	</ul>


	</details>
	""")

	        # NOTE(review): the nesting of the layout containers below was
	        # reconstructed (inputs on the left, outputs on the right) - confirm
	        # against the deployed layout.
	        with gr.Row():
	            with gr.Column():
	                ref_img = gr.Image(
	                    label="Reference Image(参考图像)",
	                    type="filepath",
	                    sources=["upload"],
	                )

	                video = gr.Video(
	                    label="Template Video(模版视频)",
	                    sources=["upload"],
	                )

	                with gr.Row():
	                    model_id = gr.Dropdown(
	                        label="Mode(模式)",
	                        choices=["wan2.2-animate-move", "wan2.2-animate-mix"],
	                        value="wan2.2-animate-move",
	                        info="",
	                    )

	                    model = gr.Dropdown(
	                        label="推理质量(Inference Quality)",
	                        choices=["wan-pro", "wan-std"],
	                        value="wan-pro",
	                    )

	                run_button = gr.Button("Generate Video(生成视频)")

	            with gr.Column():
	                output_video = gr.Video(label="Output Video(输出视频)")
	                output_status = gr.Textbox(label="Status(状态)")

	        # The same four inputs, in the order predict() expects them, feed
	        # both the button and the examples.
	        run_button.click(
	            fn=app.predict,
	            inputs=[
	                ref_img,
	                video,
	                model_id,
	                model,
	            ],
	            outputs=[output_video, output_status],
	        )

	        example_data = [
	            ['./examples/mov/1/1.jpeg', './examples/mov/1/1.mp4', 'wan2.2-animate-move', 'wan-pro'],
	            ['./examples/mov/2/2.jpeg', './examples/mov/2/2.mp4', 'wan2.2-animate-move', 'wan-pro'],
	            ['./examples/mix/1/1.jpeg', './examples/mix/1/1.mp4', 'wan2.2-animate-mix', 'wan-pro'],
	            ['./examples/mix/2/2.jpeg', './examples/mix/2/2.mp4', 'wan2.2-animate-mix', 'wan-pro'],
	        ]

	        if example_data:
	            gr.Examples(
	                examples=example_data,
	                inputs=[ref_img, video, model_id, model],
	                outputs=[output_video, output_status],
	                fn=app.predict,
	                cache_examples="lazy",
	            )

	    demo.queue(default_concurrency_limit=100)

	    demo.launch(
	        server_name="0.0.0.0",
	        server_port=7860,
	    )


	# Script entry point: build and serve the UI only when this file is executed
	# directly, not when it is imported as a module.
	if __name__ == "__main__":
	    start_app()