"""
Gradio Web Interface for ACMDM Motion Generation
Milestone 3: User-friendly web interface for text-to-motion generation
"""
import os
import sys
from os.path import join as pjoin, dirname, abspath
# Add current directory to Python path for HuggingFace Spaces
# This ensures models/ and utils/ can be imported
current_dir = dirname(abspath(__file__))
if current_dir not in sys.path:
sys.path.insert(0, current_dir)
import torch
import numpy as np
import gradio as gr
from typing import Optional, Tuple, List
import tempfile
import random
# Import from models and utils
from models.AE_2D_Causal import AE_models
from models.ACMDM import ACMDM_models
from models.LengthEstimator import LengthEstimator
from utils.back_process import back_process
from utils.motion_process import plot_3d_motion, t2m_kinematic_chain
# Global variables for model caching
_models_cache = {
'ae': None,
'acmdm': None,
'length_estimator': None,
'stats': None,
'device': None,
'loaded': False
}
def set_seed(seed):
"""Set random seed for reproducibility"""
random.seed(seed)
np.random.seed(seed)
torch.manual_seed(seed)
torch.backends.cudnn.benchmark = False
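# Note on reproducibility: torch.manual_seed covers the default generators and
# cudnn.benchmark is disabled above. If fully deterministic GPU runs are needed,
# the following (a sketch, not part of the original function) could be added as well:
#   torch.cuda.manual_seed_all(seed)
#   torch.backends.cudnn.deterministic = True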
def load_models_cached(
gpu_id: int = 0,
model_name: str = 'ACMDM_Flow_S_PatchSize22',
ae_name: str = 'AE_2D_Causal',
ae_model: str = 'AE_Model',
model_type: str = 'ACMDM-Flow-S-PatchSize22',
dataset_name: str = 't2m',
checkpoints_dir: str = './checkpoints',
use_length_estimator: bool = False
) -> Tuple[dict, str]:
"""
Load models with caching to avoid reloading on every request.
Returns (models_dict, status_message)
"""
global _models_cache
# Check if models are already loaded
if _models_cache['loaded']:
return _models_cache, "Models already loaded (using cache)"
try:
# Determine device
if gpu_id >= 0 and torch.cuda.is_available():
device = torch.device(f"cuda:{gpu_id}")
else:
device = torch.device("cpu")
_models_cache['device'] = device
status_messages = [f"Using device: {device}"]
# Load AE
status_messages.append("Loading AE model...")
ae = AE_models[ae_model](input_width=3)
ae_ckpt_path = pjoin(checkpoints_dir, dataset_name, ae_name, 'model', 'latest.tar')
if not os.path.exists(ae_ckpt_path):
return None, f"Error: AE checkpoint not found at {ae_ckpt_path}"
ae_ckpt = torch.load(ae_ckpt_path, map_location='cpu')
ae.load_state_dict(ae_ckpt['ae'])
ae.eval()
ae.to(device)
_models_cache['ae'] = ae
status_messages.append(f"✓ Loaded AE from {ae_ckpt_path}")
# Load ACMDM
status_messages.append("Loading ACMDM model...")
acmdm = ACMDM_models[model_type](input_dim=ae.output_emb_width, cond_mode='text')
acmdm_ckpt_path = pjoin(checkpoints_dir, dataset_name, model_name, 'model', 'latest.tar')
if not os.path.exists(acmdm_ckpt_path):
return None, f"Error: ACMDM checkpoint not found at {acmdm_ckpt_path}"
acmdm_ckpt = torch.load(acmdm_ckpt_path, map_location='cpu')
missing_keys, unexpected_keys = acmdm.load_state_dict(acmdm_ckpt['ema_acmdm'], strict=False)
assert len(unexpected_keys) == 0
assert all([k.startswith('clip_model.') for k in missing_keys])
acmdm.eval()
acmdm.to(device)
_models_cache['acmdm'] = acmdm
status_messages.append(f"✓ Loaded ACMDM from {acmdm_ckpt_path}")
# Load LengthEstimator if needed
length_estimator = None
if use_length_estimator:
status_messages.append("Loading LengthEstimator...")
length_estimator = LengthEstimator(input_size=512, output_size=1)
length_estimator_path = pjoin(checkpoints_dir, dataset_name, 'length_estimator', 'model', 'latest.tar')
if os.path.exists(length_estimator_path):
length_ckpt = torch.load(length_estimator_path, map_location='cpu')
length_estimator.load_state_dict(length_ckpt['model'])
length_estimator.eval()
length_estimator.to(device)
_models_cache['length_estimator'] = length_estimator
status_messages.append(f"✓ Loaded LengthEstimator")
else:
status_messages.append(f"⚠ LengthEstimator not found, will use default length")
# Load normalization stats
status_messages.append("Loading normalization statistics...")
after_mean = np.load(pjoin(checkpoints_dir, dataset_name, ae_name, 'AE_2D_Causal_Post_Mean.npy'))
after_std = np.load(pjoin(checkpoints_dir, dataset_name, ae_name, 'AE_2D_Causal_Post_Std.npy'))
joint_mean = np.load(f'utils/22x3_mean_std/{dataset_name}/22x3_mean.npy')
joint_std = np.load(f'utils/22x3_mean_std/{dataset_name}/22x3_std.npy')
eval_mean = np.load(f'utils/eval_mean_std/{dataset_name}/eval_mean.npy')
eval_std = np.load(f'utils/eval_mean_std/{dataset_name}/eval_std.npy')
_models_cache['stats'] = {
'after_mean': after_mean,
'after_std': after_std,
'joint_mean': joint_mean,
'joint_std': joint_std,
'eval_mean': eval_mean,
'eval_std': eval_std
}
_models_cache['loaded'] = True
status_message = "\n".join(status_messages)
return _models_cache, status_message
except Exception as e:
error_msg = f"Error loading models: {str(e)}"
import traceback
error_msg += f"\n\nTraceback:\n{traceback.format_exc()}"
return None, error_msg
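# Example usage (hypothetical values; gpu_id=-1 forces CPU). On failure the first
# return value is None and the message contains the traceback:
#   models, msg = load_models_cached(gpu_id=-1, use_length_estimator=True)
#   if models is None:
#       print(msg)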
def estimate_motion_length(text: str, models_cache: dict) -> int:
"""Estimate motion length from text using LengthEstimator"""
if models_cache['length_estimator'] is None:
return None
device = models_cache['device']
acmdm = models_cache['acmdm']
length_estimator = models_cache['length_estimator']
with torch.no_grad():
text_emb = acmdm.encode_text([text])
pred_length = length_estimator(text_emb)
pred_length = int(pred_length.item() * 4)
pred_length = ((pred_length + 2) // 4) * 4
pred_length = max(40, min(196, pred_length))
return pred_length
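# Worked example of the length post-processing above (illustrative numbers):
#   pred_length.item() = 27.3  ->  int(27.3 * 4) = 109
#   ((109 + 2) // 4) * 4 = 108            # round to the nearest multiple of 4
#   max(40, min(196, 108)) = 108          # clamp to the supported frame range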
def generate_motion_single(
text: str,
motion_length: Optional[int],
cfg_scale: float,
use_auto_length: bool,
gpu_id: int,
seed: int
) -> Tuple[Optional[str], str]:
"""
Generate a single motion from text.
Returns (video_path, status_message)
"""
global _models_cache
try:
set_seed(seed)
# Load models if not cached
if not _models_cache['loaded']:
models_cache, load_msg = load_models_cached(
gpu_id=gpu_id,
use_length_estimator=use_auto_length
)
if models_cache is None:
return None, f"Failed to load models:\n{load_msg}"
else:
models_cache = _models_cache
device = models_cache['device']
ae = models_cache['ae']
acmdm = models_cache['acmdm']
stats = models_cache['stats']
# Estimate length if needed
if use_auto_length or motion_length is None or motion_length == 0:
if use_auto_length and models_cache['length_estimator'] is not None:
motion_length = estimate_motion_length(text, models_cache)
status_msg = f"Estimated motion length: {motion_length} frames\n"
else:
motion_length = 120 # Default
status_msg = f"Using default motion length: {motion_length} frames\n"
else:
# Round to multiple of 4
motion_length = ((motion_length + 2) // 4) * 4
status_msg = f"Using specified motion length: {motion_length} frames\n"
status_msg += f"Generating motion for: '{text}'...\n"
# Generate motion
with torch.no_grad():
latent_length = motion_length // 4
m_lens = torch.tensor([latent_length], device=device)
pred_latents = acmdm.generate([text], m_lens, cfg_scale)
# Denormalize latents
pred_latents_np = pred_latents.permute(0, 2, 3, 1).detach().cpu().numpy()
pred_latents_np = pred_latents_np * stats['after_std'] + stats['after_mean']
pred_latents_tensor = torch.from_numpy(pred_latents_np).to(device)
# Decode through AE
pred_motions = ae.decode(pred_latents_tensor.permute(0, 3, 1, 2))
# Denormalize motions
pred_motions_np = pred_motions.permute(0, 2, 3, 1).detach().cpu().numpy()
if stats['joint_mean'].ndim == 1:
pred_motions_np = pred_motions_np * stats['joint_std'][np.newaxis, np.newaxis, :, np.newaxis] + stats['joint_mean'][np.newaxis, np.newaxis, :, np.newaxis]
else:
pred_motions_np = pred_motions_np * stats['joint_std'][np.newaxis, ..., np.newaxis] + stats['joint_mean'][np.newaxis, ..., np.newaxis]
# Back process to get RIC format, then recover joint positions
from utils.motion_process import recover_from_ric
motion = pred_motions_np[0] # (22, 3, seq_len)
motion = motion[:, :, :motion_length].transpose(2, 0, 1) # (seq_len, 22, 3)
ric_data = back_process(motion, is_mesh=False)
ric_tensor = torch.from_numpy(ric_data).float()
joints = recover_from_ric(ric_tensor, joints_num=22).numpy() # (seq_len, 22, 3)
# Create temporary file for video
temp_dir = tempfile.mkdtemp()
os.makedirs(temp_dir, exist_ok=True)
video_path = pjoin(temp_dir, 'motion.mp4')
# Generate video - plot_3d_motion returns the actual path (may be .mp4 or .gif)
try:
actual_video_path = plot_3d_motion(
video_path,
t2m_kinematic_chain,
joints,
title=text,
fps=20,
radius=4
)
except Exception as e:
status_msg += f"\nโš  Error in plot_3d_motion: {str(e)}"
raise
# Verify file exists - check both the returned path and original path
if not os.path.exists(actual_video_path):
# Check if file exists with original path
if os.path.exists(video_path):
actual_video_path = video_path
# Check if it was saved as GIF instead
elif os.path.exists(video_path.replace('.mp4', '.gif')):
actual_video_path = video_path.replace('.mp4', '.gif')
else:
# List files in temp directory for debugging
files_in_dir = os.listdir(temp_dir) if os.path.exists(temp_dir) else []
error_msg = f"Video file not found. Expected: {actual_video_path}\n"
error_msg += f"Files in temp directory: {files_in_dir}"
status_msg += f"\nโŒ {error_msg}"
raise FileNotFoundError(error_msg)
status_msg += f"\nโœ“ Motion generated successfully! Video saved."
return actual_video_path, status_msg
except Exception as e:
error_msg = f"Error generating motion: {str(e)}"
import traceback
error_msg += f"\n\nTraceback:\n{traceback.format_exc()}"
return None, error_msg
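# Example usage outside the UI (hypothetical prompt; gpu_id=-1 runs on CPU):
#   video_path, status = generate_motion_single(
#       "A person walks forward and then turns around.",
#       motion_length=120, cfg_scale=3.0, use_auto_length=False, gpu_id=-1, seed=3407)
#   print(status)        # progress / error log
#   print(video_path)    # path to the rendered .mp4 (or .gif), or None on failure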
# Batch generation feature commented out
# def generate_motion_batch(
# text_file_content: str,
# cfg_scale: float,
# use_auto_length: bool,
# gpu_id: int,
# seed: int
# ) -> Tuple[List[Optional[str]], str]:
# """
# Generate motions from a batch of text prompts.
# Returns (list_of_video_paths, status_message)
# """
# # Parse text file
# text_prompts = []
# for line in text_file_content.strip().split('\n'):
# line = line.strip()
# if not line:
# continue
# if '#' in line:
# parts = line.split('#')
# text = parts[0].strip()
# length_str = parts[1].strip() if len(parts) > 1 else 'NA'
# else:
# text = line
# length_str = 'NA'
#
# if length_str.upper() == 'NA':
# motion_length = None if use_auto_length else 120
# else:
# try:
# motion_length = int(length_str)
# motion_length = ((motion_length + 2) // 4) * 4
# except:
# motion_length = None if use_auto_length else 120
#
# text_prompts.append((text, motion_length))
#
# if not text_prompts:
# return [], "No valid prompts found in file"
#
# status_msg = f"Processing {len(text_prompts)} prompts...\n"
# video_paths = []
#
# # Create a persistent directory for batch videos (not temp, so Gradio can access them)
# # Use a directory that Gradio can serve from
# batch_output_dir = pjoin('generation', 'batch_temp')
# os.makedirs(batch_output_dir, exist_ok=True)
#
# # Also ensure the parent directory exists
# os.makedirs('generation', exist_ok=True)
#
# for idx, (text, motion_length) in enumerate(text_prompts):
# try:
# video_path, gen_msg = generate_motion_single(
# text, motion_length, cfg_scale, use_auto_length, gpu_id, seed + idx
# )
#
# # If video was created, copy it to persistent location for batch gallery
# if video_path and os.path.exists(video_path):
# # Create a unique filename for this batch item
# # Get file extension from original path
# file_ext = os.path.splitext(video_path)[1] or '.mp4'
# batch_video_path = pjoin(batch_output_dir, f'motion_{idx:04d}{file_ext}')
#
# # Copy file to persistent location
# import shutil
# try:
# shutil.copy2(video_path, batch_video_path)
#
# # Verify the copied file exists
# if os.path.exists(batch_video_path):
# # Use relative path for Gradio (works better in HuggingFace Spaces)
# # Gradio can serve files from relative paths within the app directory
# video_paths.append(batch_video_path)
# file_size = os.path.getsize(batch_video_path)
# status_msg += f"\n[{idx+1}/{len(text_prompts)}] โœ“ {text[:50]}... - Video saved ({file_size/1024:.1f} KB)"
# else:
# status_msg += f"\n[{idx+1}/{len(text_prompts)}] โš  {text[:50]}... - Video copy failed (file not found after copy)"
# video_paths.append(None)
# except Exception as copy_error:
# status_msg += f"\n[{idx+1}/{len(text_prompts)}] โš  {text[:50]}... - Copy error: {str(copy_error)}"
# video_paths.append(None)
# else:
# status_msg += f"\n[{idx+1}/{len(text_prompts)}] โŒ {text[:50]}... - Generation failed (no video path returned)"
# video_paths.append(None)
#
# except Exception as e:
# status_msg += f"\n[{idx+1}/{len(text_prompts)}] โŒ Error: {str(e)}"
# import traceback
# status_msg += f"\n Traceback: {traceback.format_exc()[:200]}"
# video_paths.append(None)
#
# # Filter out None values and verify files exist - Gradio Gallery needs valid paths
# valid_video_paths = []
# for path in video_paths:
# if path is not None:
# # Use relative path (Gradio handles these better in cloud environments)
# # Verify file exists
# if os.path.exists(path):
# # Verify it's a video file
# if path.lower().endswith(('.mp4', '.gif', '.mov', '.avi')):
# # Get file size for debugging
# file_size = os.path.getsize(path)
# if file_size > 0: # Ensure file is not empty
# valid_video_paths.append(path) # Keep relative path
# status_msg += f"\n โœ“ Verified: {os.path.basename(path)} ({file_size/1024:.1f} KB)"
# else:
# status_msg += f"\n โš  Empty file: {path}"
# else:
# status_msg += f"\n โš  Skipping non-video file: {path}"
# else:
# # Try absolute path as fallback
# abs_path = os.path.abspath(path)
# if os.path.exists(abs_path):
# valid_video_paths.append(abs_path)
# status_msg += f"\n โœ“ Found via absolute path: {abs_path}"
# else:
# status_msg += f"\n โš  File not found (relative: {path}, absolute: {abs_path})"
#
# if len(valid_video_paths) == 0:
# status_msg += "\n\nโŒ No videos were successfully generated for the gallery."
# status_msg += "\n๐Ÿ’ก Check the error messages above for each prompt."
# # Return empty list explicitly
# return [], status_msg
# else:
# status_msg += f"\n\nโœ… Successfully generated {len(valid_video_paths)}/{len(text_prompts)} motions."
# status_msg += f"\n๐Ÿ“ Videos saved in: {batch_output_dir}"
# status_msg += f"\n๐Ÿ“‹ Gallery will display {len(valid_video_paths)} video(s)."
#
# # Debug: Show first few paths
# status_msg += f"\n\n๐ŸŽฌ First few video paths:\n"
# for i, p in enumerate(valid_video_paths[:3]):
# abs_p = os.path.abspath(p) if not os.path.isabs(p) else p
# exists = "โœ“" if os.path.exists(p) else "โœ—"
# status_msg += f" {exists} [{i+1}] {p} (exists: {os.path.exists(p)})\n"
# if len(valid_video_paths) > 3:
# status_msg += f" ... and {len(valid_video_paths) - 3} more\n"
#
# # Return list of file paths (Gradio Gallery expects list of strings)
# # Ensure all paths are valid and accessible
# final_paths = []
# for p in valid_video_paths:
# if os.path.exists(p):
# # Normalize path (use forward slashes for cross-platform compatibility)
# normalized_path = p.replace('\\', '/')
# final_paths.append(normalized_path)
# else:
# status_msg += f"\nโš  Warning: Path not found when returning: {p}"
#
# if len(final_paths) != len(valid_video_paths):
# status_msg += f"\nโš  Some paths were filtered out. Returning {len(final_paths)}/{len(valid_video_paths)} videos."
#
# return final_paths, status_msg
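# Example input for the disabled batch function above, one prompt per line
# ('#NA' asks for an auto-estimated length, mirroring the placeholder used in the UI):
#   A person is running on a treadmill.#120
#   Someone is doing jumping jacks.#NA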
# Gradio Interface
def create_interface():
"""Create and configure the Gradio interface"""
with gr.Blocks(title="ACMDM Motion Generation", theme=gr.themes.Soft()) as app:
gr.Markdown("""
# 🎭 ACMDM Motion Generation
Generate human motion from text descriptions using the ACMDM (Absolute Coordinates Make Motion Generation Easy) model.
**How to use:**
1. Enter a text description of the motion you want to generate
2. Adjust motion length (or use auto-estimate)
3. Click "Generate Motion" to create the animation
4. View and download the generated video
**Example prompts:**
- "A person is running on a treadmill."
- "Someone is doing jumping jacks."
- "A person walks forward and then turns around."
""")
with gr.Tabs():
# Single Generation Tab
with gr.Tab("Single Motion Generation"):
with gr.Row():
with gr.Column(scale=1):
text_input = gr.Textbox(
label="Motion Description",
placeholder="A person is running on a treadmill.",
lines=3,
value="A person is running on a treadmill."
)
with gr.Row():
motion_length = gr.Slider(
label="Motion Length (frames)",
minimum=40,
maximum=196,
value=120,
step=4,
info="Will be rounded to nearest multiple of 4"
)
use_auto_length = gr.Checkbox(
label="Auto-estimate length",
value=False,
info="Use length estimator (ignores manual length if checked)"
)
cfg_scale = gr.Slider(
label="CFG Scale",
minimum=1.0,
maximum=10.0,
value=3.0,
step=0.5,
info="Classifier-free guidance scale (higher = more aligned with text)"
)
with gr.Row():
gpu_id = gr.Number(
label="GPU ID",
value=0,
precision=0,
info="Use -1 for CPU"
)
seed = gr.Number(
label="Random Seed",
value=3407,
precision=0
)
generate_btn = gr.Button("Generate Motion", variant="primary", size="lg")
with gr.Column(scale=1):
video_output = gr.Video(
label="Generated Motion",
format="mp4"
)
status_output = gr.Textbox(
label="Status",
lines=10,
interactive=False
)
# Update model status after generation
def generate_and_update_status(text, motion_length, cfg_scale, use_auto_length, gpu_id, seed):
video_path, status_msg = generate_motion_single(
text, motion_length, cfg_scale, use_auto_length, gpu_id, seed
)
# Return video path and status message
return video_path, status_msg
generate_btn.click(
fn=generate_and_update_status,
inputs=[text_input, motion_length, cfg_scale, use_auto_length, gpu_id, seed],
outputs=[video_output, status_output]
)
# Batch Generation Tab - COMMENTED OUT
# with gr.Tab("Batch Generation"):
# with gr.Row():
# with gr.Column(scale=1):
# batch_text_input = gr.Textbox(
# label="Text Prompts (one per line, format: text#length or text#NA)",
# placeholder="A person is running on a treadmill.#120\nSomeone is doing jumping jacks.#NA",
# lines=10,
# info="Each line: 'text#length' or 'text#NA' for auto-estimate"
# )
#
# batch_cfg_scale = gr.Slider(
# label="CFG Scale",
# minimum=1.0,
# maximum=10.0,
# value=3.0,
# step=0.5
# )
#
# batch_use_auto_length = gr.Checkbox(
# label="Auto-estimate length for NA",
# value=True
# )
#
# batch_gpu_id = gr.Number(
# label="GPU ID",
# value=0,
# precision=0
# )
#
# batch_seed = gr.Number(
# label="Random Seed",
# value=3407,
# precision=0
# )
#
# batch_generate_btn = gr.Button("Generate Batch", variant="primary", size="lg")
#
# with gr.Column(scale=1):
# batch_status_output = gr.Textbox(
# label="Batch Status",
# lines=15,
# interactive=False
# )
# batch_video_gallery = gr.Gallery(
# label="Generated Motions",
# show_label=True,
# elem_id="gallery",
# columns=2,
# rows=2,
# height="auto",
# type="filepath" # Explicitly specify filepath type
# )
#
# batch_generate_btn.click(
# fn=generate_motion_batch,
# inputs=[batch_text_input, batch_cfg_scale, batch_use_auto_length, batch_gpu_id, batch_seed],
# outputs=[batch_video_gallery, batch_status_output]
# )
# Model Management Tab
with gr.Tab("Model Management"):
with gr.Row():
with gr.Column():
model_status = gr.Textbox(
label="Model Status",
lines=15,
interactive=False,
value="โณ Models not loaded yet. They will be loaded automatically on first generation."
)
with gr.Row():
refresh_status_btn = gr.Button("🔄 Refresh Status", variant="primary")
reload_models_btn = gr.Button("🗑️ Clear Cache", variant="secondary")
gr.Markdown("""
**Model Configuration:**
- Model Name: `ACMDM_Flow_S_PatchSize22`
- AE Name: `AE_2D_Causal`
- Dataset: `t2m`
- Checkpoints Directory: `./checkpoints`
""")
def check_model_status():
"""Check and display current model status"""
global _models_cache
if _models_cache['loaded']:
device = _models_cache['device']
status_lines = [
"โœ“ MODELS LOADED AND READY",
"=" * 50,
f"๐Ÿ“ฑ Device: {device}",
f"๐Ÿ’พ CUDA Available: {torch.cuda.is_available()}",
]
if device.type == 'cuda':
status_lines.append(f"๐ŸŽฎ GPU: {torch.cuda.get_device_name(device.index if device.index is not None else 0)}")
status_lines.append(f"๐Ÿ’พ GPU Memory: {torch.cuda.get_device_properties(device.index if device.index is not None else 0).total_memory / 1e9:.2f} GB")
status_lines.extend([
"",
"๐Ÿ“ฆ Loaded Models:",
" โœ“ Autoencoder (AE_2D_Causal)",
" โœ“ ACMDM Diffusion Model",
])
if _models_cache['length_estimator'] is not None:
status_lines.append(" โœ“ Length Estimator")
else:
status_lines.append(" โš  Length Estimator (not loaded)")
status_lines.extend([
"",
"๐Ÿ“Š Statistics Loaded:",
" โœ“ Post-AE Mean/Std",
" โœ“ Joint Mean/Std",
" โœ“ Eval Mean/Std",
"",
"โœจ Models are cached and ready for generation!",
"๐Ÿ’ก Tip: Use 'Clear Cache' to force reload on next generation."
])
return "\n".join(status_lines)
else:
return (
"โณ Models not loaded yet. They will be loaded automatically on first generation.\n"
"๐Ÿ“ To load models now, go to 'Single Motion Generation' tab and click 'Generate Motion'.\n"
"โฑ๏ธ First generation will take 30-60 seconds (model loading time).\n"
"โšก Subsequent generations will be much faster (5-15 seconds)."
)
def reload_models():
"""Clear model cache"""
global _models_cache
_models_cache['loaded'] = False
_models_cache['ae'] = None
_models_cache['acmdm'] = None
_models_cache['length_estimator'] = None
_models_cache['stats'] = None
_models_cache['device'] = None
return (
"๐Ÿ—‘๏ธ Model cache cleared. Models will be automatically reloaded on your next generation request.\n"
"๐Ÿ’ก Click 'Refresh Status' after generating to see updated status."
)
# Button callbacks
refresh_status_btn.click(
fn=check_model_status,
outputs=model_status
)
reload_models_btn.click(
fn=reload_models,
outputs=model_status
)
# Update status on tab load
app.load(
fn=check_model_status,
outputs=model_status
)
gr.Markdown("""
---
**Note:** First generation may take longer as models need to be loaded. Subsequent generations will be faster.
**Tips:**
- Use descriptive text prompts for better results
- Adjust CFG scale: higher values (3-5) for more text alignment, lower values (1-2) for more diversity
- Motion length should be a multiple of 4 (automatically rounded)
- Batch generation is currently disabled; when enabled, prompts use the format: `text description#length` or `text description#NA`
""")
return app
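# Example: build the interface without launching it here (e.g. for tests or a custom
# launch). queue() is optional; the suggestion that it serializes requests so the
# global model cache is not hit concurrently is an assumption about typical
# single-GPU deployments, not part of the original script:
#   demo = create_interface()
#   demo.queue().launch(share=True)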
if __name__ == "__main__":
# Create and launch the interface
app = create_interface()
# Launch with sharing option
app.launch(
server_name="0.0.0.0", # Allow external connections
server_port=7860, # Default Gradio port
share=False, # Set to True for public link (requires ngrok)
show_error=True
)