# -*- coding: utf-8 -*-
"""
Hugging Face Spaces Script for Basic Stable Diffusion 1.5 Gradio App
Adapted from user's local script and HF Spaces template.
Supports Hub models and CPU/GPU selection based on available hardware.
Includes Attention Slicing optimization toggle.
Corrected progress callback format.
"""
import gradio as gr
import numpy as np
import random
import torch
from diffusers import StableDiffusionPipeline
# Import commonly used schedulers
from diffusers import DDPMScheduler, EulerDiscreteScheduler, DPMSolverMultistepScheduler, LMSDiscreteScheduler
import os  # Kept for potential checks, though local paths are less common on Spaces
# import spaces  # Uncomment to use ZeroGPU if needed; not required for standard GPU usage
from PIL import Image
import time  # Optional: for timing generation
# huggingface_hub is used implicitly by from_pretrained
# --- Configuration ---
# MODELS_DIR is less relevant on Spaces unless models are placed in the repo itself.
# On Spaces, models are primarily loaded via their Hugging Face Hub IDs.
SUPPORTED_SD15_SIZES = ["512x512", "768x512", "512x768", "768x768", "1024x768", "768x1024", "1024x1024", "hire.fix"]

# Mapping of friendly scheduler names to their diffusers classes
SCHEDULER_MAP = {
    "Euler": EulerDiscreteScheduler,
    "DPM++ 2M": DPMSolverMultistepScheduler,
    "DDPM": DDPMScheduler,
    "LMS": LMSDiscreteScheduler,
    # Add more as needed from diffusers.schedulers (make sure they are imported)
}
DEFAULT_SCHEDULER = "Euler"  # Default scheduler on startup
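# Sketch of how another sampler could be registered (illustrative; "Euler a" is not in the default UI):
#     from diffusers import EulerAncestralDiscreteScheduler
#     SCHEDULER_MAP["Euler a"] = EulerAncestralDiscreteScheduler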
# Popular Stable Diffusion 1.5 models on the Hugging Face Hub.
# For Spaces, this list is the primary source of models.
DEFAULT_HUB_MODELS = [
    "Raxephion/Typhoon-SD1.5-V1",
    "Yntec/RevAnimatedV2Rebirth",
    "stablediffusionapi/realcartoon-anime-v11",
    # "CompVis/stable-diffusion-v1-4",  # Example SD 1.4 model (may behave slightly differently)
    # Add other diffusers-compatible SD1.5 models here
]

# --- Constants for Gradio UI / Generation ---
MAX_SEED = np.iinfo(np.int32).max  # Maximum seed value
# MAX_IMAGE_SIZE_SLIDER = 1024  # Used only for a slider max; kept for consistency if needed elsewhere
# --- Determine available devices and set up options ---
# This logic carries over from the local script and works well on Spaces.
AVAILABLE_DEVICES = ["CPU"]
if torch.cuda.is_available():
    AVAILABLE_DEVICES.append("GPU")
    print(f"CUDA available. Found {torch.cuda.device_count()} GPU(s).")
    if torch.cuda.device_count() > 0:
        print(f"Using GPU 0: {torch.cuda.get_device_name(0)}")
else:
    print("CUDA not available. Running on CPU.")

# Default device preference: GPU if available, else CPU
DEFAULT_DEVICE = "GPU" if "GPU" in AVAILABLE_DEVICES else "CPU"

# Initial PyTorch device string based on detection
initial_device_to_use = "cuda" if DEFAULT_DEVICE == "GPU" else "cpu"
print(f"Initial pipeline will load on device: {initial_device_to_use}")

# Determine the initial dtype.
# Note: fp16 is generally faster and uses less VRAM on compatible GPUs.
initial_dtype_to_use = torch.float32  # Default
if initial_device_to_use == "cuda":
    # Check compute capability (7.0+ has good fp16 support)
    if torch.cuda.get_device_capability(0)[0] >= 7:
        initial_dtype_to_use = torch.float16
        print("Detected GPU supports FP16; will attempt torch.float16.")
    else:
        print("Detected GPU might not fully support FP16 (or the capability check failed); using torch.float32.")
else:
    initial_dtype_to_use = torch.float32  # CPU requires float32
print(f"Initial dtype: {initial_dtype_to_use}")
# --- Global state for the loaded pipeline ---
# The *initial* pipeline is loaded once on startup and kept in memory.
# Subsequent model/device changes reload the pipeline inside the infer function.
current_pipeline = None
current_model_id = None       # Identifier of the currently loaded model
current_device_loaded = None  # Device the pipeline is currently on

# Initial model to load on startup
INITIAL_MODEL_ID = DEFAULT_HUB_MODELS[0] if DEFAULT_HUB_MODELS else None

if INITIAL_MODEL_ID:
    print(f"\nLoading initial model '{INITIAL_MODEL_ID}' on startup...")
    try:
        # Load the pipeline with the initial device's dtype
        pipeline = StableDiffusionPipeline.from_pretrained(
            INITIAL_MODEL_ID,
            torch_dtype=initial_dtype_to_use,
            safety_checker=None,  # <<< SAFETY CHECKER DISABLED <<<
        )
        # --- Apply optimizations during the initial load ---
        # Enable attention slicing by default on GPU for memory efficiency on Spaces
        if initial_device_to_use == "cuda":
            try:
                pipeline.enable_attention_slicing()
                print("Attention Slicing enabled during initial load.")
            except Exception as e:
                print(f"Warning: Failed to enable Attention Slicing during initial load: {e}")
                # Don't raise a Gradio error here; just print a warning

        pipeline = pipeline.to(initial_device_to_use)  # Move to the initial device
        current_pipeline = pipeline
        current_model_id = INITIAL_MODEL_ID
        current_device_loaded = torch.device(initial_device_to_use)
        print(f"Initial model loaded successfully on {current_device_loaded}.")

        # Basic check for SD 1.x architecture
        unet = getattr(current_pipeline, "unet", None)
        if unet is not None and hasattr(unet, "config") and hasattr(unet.config, "cross_attention_dim"):
            cross_attn_dim = unet.config.cross_attention_dim
            if cross_attn_dim != 768:
                warning_msg = (f"Warning: Loaded model '{INITIAL_MODEL_ID}' might not be a standard SD 1.x model "
                               f"(expected UNet cross_attention_dim 768, found {cross_attn_dim}). "
                               "Results may be unexpected.")
                print(warning_msg)
                # gr.Warning(warning_msg)  # Cannot raise Gradio warnings during startup load
            else:
                print("UNet cross_attention_dim is 768, consistent with SD 1.x.")
        else:
            print("Could not check UNet cross_attention_dim for the initial model.")
    except Exception as e:
        current_pipeline = None
        current_model_id = None
        current_device_loaded = None
        print(f"Error loading initial model '{INITIAL_MODEL_ID}': {e}")
        print("The application will start, but image generation may fail if the initial model cannot be loaded.")
        # Cannot raise gr.Error here because Gradio is not fully initialized yet
else:
    print("\nNo default Hub models defined. The application will start without a loaded model.")
    print("Please select a model from the dropdown to enable generation.")
# --- Image generation function (adapted to the Hugging Face Spaces 'infer' signature) ---
# @spaces.GPU  # Uncomment if using ZeroGPU; otherwise standard torch device handling is sufficient
def infer(
    model_identifier,          # From model_dropdown
    selected_device_str,       # From device_dropdown
    prompt,                    # From prompt_input
    negative_prompt,           # From negative_prompt_input
    steps,                     # From steps_slider
    cfg_scale,                 # From cfg_slider
    scheduler_name,            # From scheduler_dropdown
    size,                      # From size_dropdown
    seed,                      # From seed_input (a Slider)
    randomize_seed,            # From randomize_seed_checkbox
    enable_attention_slicing,  # Optimization toggle
    progress=gr.Progress(),    # Corrected Progress initialization (track_tqdm=True removed)
):
    """Generates an image using the selected model and parameters on the chosen device."""
    global current_pipeline, current_model_id, current_device_loaded

    # Determine the target device and dtype up front so the model can be (re)loaded correctly.
    temp_device_to_use = "cuda" if selected_device_str == "GPU" and "GPU" in AVAILABLE_DEVICES else "cpu"
    temp_dtype_to_use = torch.float32
    if temp_device_to_use == "cuda" and torch.cuda.get_device_capability(0)[0] >= 7:
        temp_dtype_to_use = torch.float16
    # 1. Load/switch the model if necessary.
    # Reload when the requested model identifier OR the requested device has changed.
    if (current_pipeline is None
            or current_model_id != model_identifier
            or (current_device_loaded is not None and current_device_loaded.type != temp_device_to_use)):
        print(f"Loading model: {model_identifier} onto {temp_device_to_use} with dtype {temp_dtype_to_use}...")

        # Clear the previous pipeline to free memory *before* loading the new one
        if current_pipeline is not None:
            print(f"Unloading previous model '{current_model_id}' from {current_device_loaded}...")
            previous_was_cuda = current_device_loaded is not None and current_device_loaded.type == "cuda"
            if previous_was_cuda:
                try:
                    current_pipeline.to("cpu")
                    print("Moved previous pipeline to CPU.")
                except Exception as move_e:
                    print(f"Warning: Failed to move previous pipeline to CPU: {move_e}")
            del current_pipeline
            current_pipeline = None  # Set to None immediately
            # Attempt to clear the CUDA cache if the previous pipeline was on GPU
            if previous_was_cuda:
                try:
                    torch.cuda.empty_cache()
                    print("Cleared CUDA cache.")
                except Exception as cache_e:
                    print(f"Warning: Error clearing CUDA cache: {cache_e}")

        # Ensure the requested device is actually available (redundant with the earlier check, but safe)
        if temp_device_to_use == "cuda" and not torch.cuda.is_available():
            raise gr.Error("GPU selected but CUDA is not available to PyTorch on this Space. "
                           "Select CPU, or ensure the Space has GPU hardware and the CUDA build of PyTorch is installed.")

        try:
            pipeline = StableDiffusionPipeline.from_pretrained(
                model_identifier,
                torch_dtype=temp_dtype_to_use,  # Use the determined dtype for loading
                safety_checker=None,  # DISABLED
            )

            # Apply optimizations based on the UI toggle during load
            if enable_attention_slicing and temp_device_to_use == "cuda":  # Only apply on GPU
                try:
                    pipeline.enable_attention_slicing()
                    print("Attention Slicing enabled during model load.")
                except Exception as e:
                    print(f"Warning: Failed to enable Attention Slicing: {e}")
                    gr.Warning(f"Failed to enable Attention Slicing. Error: {e}")
            else:
                try:
                    pipeline.disable_attention_slicing()  # Ensure it's off if the toggle is off or we're on CPU
                except Exception:
                    pass  # May fail if it was never enabled; ignore

            pipeline = pipeline.to(temp_device_to_use)  # Move to the determined device
            current_pipeline = pipeline
            current_model_id = model_identifier
            current_device_loaded = torch.device(temp_device_to_use)  # Store the actual device object

            # Basic check for SD 1.x architecture
            unet = getattr(pipeline, "unet", None)
            if unet is not None and hasattr(unet, "config") and hasattr(unet.config, "cross_attention_dim"):
                cross_attn_dim = unet.config.cross_attention_dim
                if cross_attn_dim != 768:
                    warning_msg = (f"Warning: Loaded model '{model_identifier}' might not be a standard SD 1.x model "
                                   f"(expected UNet cross_attention_dim 768, found {cross_attn_dim}). "
                                   "Results may be unexpected or generation might fail.")
                    print(warning_msg)
                    gr.Warning(warning_msg)
                else:
                    print("UNet cross_attention_dim is 768, consistent with SD 1.x.")
            else:
                print("Could not check UNet cross_attention_dim.")
            print(f"Model '{model_identifier}' loaded successfully on {current_device_loaded} with dtype {temp_dtype_to_use}.")
        except Exception as e:
            current_pipeline = None
            current_model_id = None
            current_device_loaded = None
            print(f"Error loading model '{model_identifier}': {e}")
            error_message_lower = str(e).lower()
            if ("cannot find requested files" in error_message_lower
                    or "404 client error" in error_message_lower
                    or "no such file or directory" in error_message_lower):
                raise gr.Error(f"Model '{model_identifier}' not found on the Hugging Face Hub or in the repo files. Check the ID/path and internet connection. Error: {e}")
            elif "checkpointsnotfounderror" in error_message_lower or "could not find a valid model structure" in error_message_lower:
                raise gr.Error(f"No valid diffusers model found at '{model_identifier}'. Ensure it is a diffusers-format ID/path. Error: {e}")
            elif "out of memory" in error_message_lower:
                raise gr.Error(f"Out of Memory (OOM) while loading the model. This Space might not have enough RAM/VRAM for it. Try a lighter model or select CPU (if available). Error: {e}")
            elif "cusolver64" in error_message_lower or "cuda driver version" in error_message_lower or "cuda error" in error_message_lower:
                raise gr.Error(f"CUDA/GPU driver or installation error on this Space: {e}. Check the Space hardware or select CPU.")
            elif "safetensors_rust.safetensorserror" in error_message_lower or "oserror: cannot load" in error_message_lower or "filenotfounderror" in error_message_lower:
                raise gr.Error(f"Model file error for '{model_identifier}': {e}. The files might be corrupt or incomplete on the Hub/in the repo.")
            elif "could not import" in error_message_lower or "module not found" in error_message_lower:
                raise gr.Error(f"Dependency error: {e}. Ensure the required libraries are listed in requirements.txt.")
            else:
                raise gr.Error(f"Failed to load model '{model_identifier}': {e}")
    # Ensure a pipeline is loaded before proceeding with generation
    if current_pipeline is None:
        raise gr.Error("Model failed to load during setup or switching. Cannot generate image.")

    # Re-read device and dtype *after* the (re)load: the pipeline itself is the definitive source.
    device_to_use = current_pipeline.device.type  # "cuda" or "cpu"
    dtype_to_use = current_pipeline.dtype

    # --- Apply optimizations *before* generation ---
    # If the model did not need reloading, the attention-slicing toggle is applied/removed here.
    if device_to_use == "cuda":  # Only attempt on GPU
        if enable_attention_slicing:
            try:
                current_pipeline.enable_attention_slicing()
            except Exception as e:
                print(f"Warning: Failed to enable Attention Slicing before generation: {e}")
                gr.Warning(f"Failed to enable Attention Slicing. Error: {e}")
        else:
            try:
                current_pipeline.disable_attention_slicing()
            except Exception:
                pass  # May fail if it was never enabled; ignore
    else:  # Ensure slicing is off on CPU
        try:
            current_pipeline.disable_attention_slicing()
        except Exception:
            pass  # Ignore
    # 2. Configure the scheduler
    selected_scheduler_class = SCHEDULER_MAP.get(scheduler_name)
    if selected_scheduler_class is None:
        print(f"Warning: Unknown scheduler '{scheduler_name}'. Using default: {DEFAULT_SCHEDULER}.")
        gr.Warning(f"Unknown scheduler '{scheduler_name}'. Using default: {DEFAULT_SCHEDULER}.")
        selected_scheduler_class = SCHEDULER_MAP[DEFAULT_SCHEDULER]

    # Recreate the scheduler from the pipeline's config to ensure compatibility
    scheduler_config = current_pipeline.scheduler.config
    try:
        current_pipeline.scheduler = selected_scheduler_class.from_config(scheduler_config)
        print(f"Scheduler set to: {scheduler_name}")
    except Exception as e:
        print(f"Error setting scheduler '{scheduler_name}': {e}")
        # Fall back to the default scheduler if setting the requested one fails
        try:
            print(f"Attempting to fall back to default scheduler: {DEFAULT_SCHEDULER}")
            current_pipeline.scheduler = SCHEDULER_MAP[DEFAULT_SCHEDULER].from_config(scheduler_config)
            gr.Warning(f"Failed to set scheduler to '{scheduler_name}', fell back to {DEFAULT_SCHEDULER}. Error: {e}")
        except Exception as fallback_e:
            print(f"Fallback scheduler failed too: {fallback_e}")
            raise gr.Error(f"Failed to configure scheduler '{scheduler_name}', and the fallback failed as well. Error: {e}")
    # 3. Parse the image size
    width, height = 512, 512  # Default size
    if size.lower() == "hire.fix":
        width, height = 1024, 1024
        print(f"Interpreting 'hire.fix' size as {width}x{height}")
    else:
        try:
            w_str, h_str = size.split("x")
            width = int(w_str)
            height = int(h_str)
        except ValueError:
            raise gr.Error(f"Invalid size format: '{size}'. Use 'WidthxHeight' (e.g., 512x512) or 'hire.fix'.")
        except Exception as e:
            raise gr.Error(f"Error parsing size '{size}': {e}")

    # Size multiple check (SD 1.5 works best with multiples of 64, or at least 8)
    multiple_check = 64  # Use 64 as the standard check
    if width % multiple_check != 0 or height % multiple_check != 0:
        warning_msg_size = (f"Warning: Image size {width}x{height} is not a multiple of {multiple_check}. "
                            f"Stable Diffusion 1.5 models are typically trained on sizes like 512x512. "
                            "Non-standard sizes may cause tiling, distortions, or other artifacts.")
        print(warning_msg_size)
        gr.Warning(warning_msg_size)
    # Sizes are deliberately not rounded to the nearest multiple of 64, to preserve the user's exact choice
    # (a sketch of what rounding would look like follows).
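    # Minimal rounding sketch, if automatic snapping were ever wanted:
    #     width = max(multiple_check, (width // multiple_check) * multiple_check)
    #     height = max(multiple_check, (height // multiple_check) * multiple_check)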
    # 4. Set up the seed generator
    # The generator device must match the pipeline device
    generator_device = current_pipeline.device
    seed_int = 0  # Default if something goes wrong
    if randomize_seed:
        seed_int = random.randint(0, MAX_SEED)
        print(f"Randomizing seed to: {seed_int}")
    else:
        # Use the seed provided by the slider input
        try:
            seed_int = int(seed)
            print(f"Using provided seed: {seed_int}")
        except (TypeError, ValueError):
            print(f"Warning: Invalid seed input '{seed}'. Using a random seed instead.")
            gr.Warning(f"Invalid seed input '{seed}'. Using a random seed instead.")
            seed_int = random.randint(0, MAX_SEED)  # Fall back to a random seed

    generator = None
    try:
        # Explicitly create the generator on the target device
        generator = torch.Generator(device=generator_device).manual_seed(seed_int)
        print(f"Generator set with seed {seed_int} on device: {generator_device}")
    except Exception as e:
        print(f"Warning: Error creating seed generator with seed {seed_int} on device {generator_device}: {e}. "
              "Falling back to the pipeline's default (system-random) seeding.")
        gr.Warning(f"Failed to set seed generator with seed {seed_int}. Using a system-random seed. Error: {e}")
        generator = None  # Let the pipeline seed itself if generator creation fails
        # In that case the actual seed used by the pipeline is unknown, so -1 is reported below.
    # 5. Generate the image
    num_inference_steps_int = int(steps)
    guidance_scale_float = float(cfg_scale)

    # Basic parameter validation
    if num_inference_steps_int <= 0 or guidance_scale_float <= 0:
        raise ValueError("Steps and CFG Scale must be positive values.")
    if width <= 0 or height <= 0:
        raise ValueError("Image width and height must be positive.")

    print(f"Generating: Prompt='{prompt[:80]}{'...' if len(prompt) > 80 else ''}', "
          f"NegPrompt='{negative_prompt[:80]}{'...' if len(negative_prompt) > 80 else ''}', "
          f"Steps={num_inference_steps_int}, CFG={guidance_scale_float}, Size={width}x{height}, "
          f"Scheduler={scheduler_name}, Seed={seed_int if generator else 'System Random'}, "
          f"Device={device_to_use}, Dtype={dtype_to_use}, "
          f"Slicing Enabled={enable_attention_slicing and device_to_use == 'cuda'}")
    start_time = time.time()

    # Note: pipeline.enable_xformers_memory_efficient_attention() could be used as a further
    # memory optimization, but it needs xformers installed and a compatible GPU.
    try:
        output = current_pipeline(
            prompt=prompt,
            negative_prompt=negative_prompt if negative_prompt else None,
            num_inference_steps=num_inference_steps_int,
            guidance_scale=guidance_scale_float,
            width=width,
            height=height,
            generator=generator,  # May be None, in which case the pipeline seeds itself
            # Update the Gradio progress bar periodically via the diffusers step callback
            callback_steps=max(1, num_inference_steps_int // 20),
            callback=lambda step, timestep, latents: progress(
                (step, num_inference_steps_int), desc=f"Step {step}/{num_inference_steps_int}"
            ),
            # A custom VAE could be wired in here for models that require one
            # vae=...
        )
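        # Note (hedged): newer diffusers releases deprecate `callback`/`callback_steps` in favour of
        # `callback_on_step_end`. A minimal sketch of the replacement, assuming a recent diffusers version:
        #     def _on_step_end(pipe, step, timestep, callback_kwargs):
        #         progress((step, num_inference_steps_int), desc=f"Step {step}/{num_inference_steps_int}")
        #         return callback_kwargs
        #     output = current_pipeline(..., callback_on_step_end=_on_step_end)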
        end_time = time.time()
        print(f"Generation finished in {end_time - start_time:.2f} seconds.")
        generated_image = output.images[0]

        # Seed to report: the one we attempted to use, or -1 if generator creation failed
        actual_seed_used = seed_int if generator else -1
        return generated_image, actual_seed_used
    except gr.Error:
        # Re-raise Gradio errors directly
        raise
    except ValueError as ve:
        # Handle specific value errors such as invalid parameters
        print(f"Parameter Error: {ve}")
        raise gr.Error(f"Invalid Parameter: {ve}")
    except Exception as e:
        # Catch any other unexpected errors during generation
        print(f"An error occurred during image generation: {e}")
        error_message_lower = str(e).lower()
        if "size must be a multiple of" in error_message_lower or "invalid dimensions" in error_message_lower or "shape mismatch" in error_message_lower:
            raise gr.Error(f"Image generation failed: size '{width}x{height}' is invalid for this model: {e}. Try a multiple of 64 or 8.")
        elif "out of memory" in error_message_lower or "cuda out of memory" in error_message_lower:
            print("Hint: Try a smaller image size, fewer steps, or a model that uses less VRAM.")
            raise gr.Error(f"Out of Memory (OOM) during generation. This Space might not have enough VRAM. Try a smaller size/fewer steps or select CPU (if available). Error: {e}")
        elif "runtimeerror" in error_message_lower:
            raise gr.Error(f"Runtime error during generation: {e}. This could be a model/scheduler incompatibility or another issue.")
        elif "device-side assert" in error_message_lower or "cuda error" in error_message_lower:
            raise gr.Error(f"CUDA/GPU error during generation: {e}. Ensure the Space is configured with a GPU and a compatible PyTorch build.")
        elif "expected all tensors to be on the same device" in error_message_lower:
            raise gr.Error(f"Device mismatch error during generation: {e}. This is an internal error; please report it.")
        else:
            raise gr.Error(f"Image generation failed with an unexpected error: {e}")
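# (Sketch) For a quick smoke test outside the UI, infer() can also be called directly, e.g.:
#     image, used_seed = infer(DEFAULT_HUB_MODELS[0], "CPU", "a red apple on a table", "",
#                              10, 7.5, "Euler", "512x512", 0, True, False)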
# --- Gradio Interface ---
# On Spaces, the model dropdown primarily lists Hub models
model_choices = DEFAULT_HUB_MODELS
if not model_choices:
    initial_model_choices = ["No models found"]
    initial_default_model = "No models found"
    model_dropdown_interactive = False
    print("\n!!! WARNING: No default Hub models listed in the script. The model dropdown will be empty. !!!")
else:
    initial_model_choices = model_choices
    # Pick a reasonable default if one is available
    initial_default_model = (INITIAL_MODEL_ID
                             if INITIAL_MODEL_ID and INITIAL_MODEL_ID in initial_model_choices
                             else initial_model_choices[0])
    model_dropdown_interactive = initial_default_model != "No models found"

scheduler_choices = list(SCHEDULER_MAP.keys())

# Use the template's CSS
css = """
#col-container {
    margin: 0 auto;
    max-width: 640px;
}
"""
with gr.Blocks(css=css, theme=gr.themes.Soft()) as demo:  # Soft theme carried over from the user's script
    gr.Markdown(
        """
        # CipherCore Stable Diffusion 1.5 Gradio WebUI
        Create images with Stable Diffusion 1.5 using models from the Hugging Face Hub.
        Choose a model, set your prompts and parameters, and generate!
        _Note: the 'hire.fix' size option currently generates at 1024x1024._
        """
    )
    # Note about model loading time
    if initial_default_model != "No models found":
        gr.Markdown(f"*(Note: Model '{initial_default_model}' will load on first generation or model switch. This might take some time.)*")
    else:
        gr.Markdown("*(Note: No models available. Add Hub IDs to DEFAULT_HUB_MODELS in the script.)*")

    with gr.Row():
        with gr.Column(scale=2):  # Give more space to the controls
            model_dropdown = gr.Dropdown(
                choices=initial_model_choices,
                value=initial_default_model,
                label="Select Model (Hugging Face Hub ID)",
                interactive=model_dropdown_interactive,
            )
            device_dropdown = gr.Dropdown(
                choices=AVAILABLE_DEVICES,
                value=DEFAULT_DEVICE,
                label="Processing Device",
                interactive=len(AVAILABLE_DEVICES) > 1,  # Only interactive if both CPU and GPU are options
            )
            prompt_input = gr.Textbox(label="Positive Prompt", placeholder="e.g., a majestic lion in a vibrant jungle, photorealistic", lines=3, autofocus=True)
            negative_prompt_input = gr.Textbox(label="Negative Prompt (Optional)", placeholder="e.g., blurry, low quality, deformed, watermark", lines=2)

            with gr.Accordion("Advanced Settings", open=False):  # Advanced settings start collapsed
                with gr.Row():
                    steps_slider = gr.Slider(minimum=5, maximum=150, value=30, label="Inference Steps", step=1)
                    cfg_slider = gr.Slider(minimum=1.0, maximum=30.0, value=7.5, label="CFG Scale", step=0.1)
                with gr.Row():
                    scheduler_dropdown = gr.Dropdown(
                        choices=scheduler_choices,
                        value=DEFAULT_SCHEDULER,
                        label="Scheduler",
                    )
                    size_dropdown = gr.Dropdown(
                        choices=SUPPORTED_SD15_SIZES,
                        value="512x512",  # SD1.5 default
                        label="Image Size",
                    )
                # Seed input combined with a randomize checkbox
                with gr.Row():
                    # Note: gr.Slider takes no precision argument (passing precision=0 raised a TypeError); step=1 keeps the value integral
                    seed_input = gr.Slider(label="Seed", minimum=0, maximum=MAX_SEED, step=1, value=0, interactive=True)
                    randomize_seed_checkbox = gr.Checkbox(label="Randomize seed", value=True)

                # --- Memory optimization toggle ---
                with gr.Row():
                    # Default to enabled if a GPU is available, otherwise off
                    default_slicing = "GPU" in AVAILABLE_DEVICES
                    enable_attention_slicing_checkbox = gr.Checkbox(
                        label="Enable Attention Slicing (Memory Optimization - GPU only)",
                        value=default_slicing,
                        interactive="GPU" in AVAILABLE_DEVICES,  # Only interactive if GPU is an option
                    )
                    gr.Markdown("*(Helps reduce VRAM usage; may slightly affect speed/quality)*")

            generate_button = gr.Button("✨ Generate Image ✨", variant="primary", scale=1)

        with gr.Column(scale=3):  # Give more space to the image
            output_image = gr.Image(
                label="Generated Image",
                type="pil",
                height=768,  # Slightly larger preview if possible
                width=768,   # Match height for a square preview
                show_share_button=True,
                show_download_button=True,
                interactive=False,  # Output image is not interactive
            )
            # Display the seed that was actually used
            actual_seed_output = gr.Number(label="Actual Seed Used", precision=0, interactive=False)
    # Wire the button click (and prompt submit) to the generation function
    gr.on(
        triggers=[generate_button.click, prompt_input.submit],
        fn=infer,
        inputs=[
            model_dropdown,
            device_dropdown,
            prompt_input,
            negative_prompt_input,
            steps_slider,
            cfg_slider,
            scheduler_dropdown,
            size_dropdown,
            seed_input,
            randomize_seed_checkbox,
            enable_attention_slicing_checkbox,
        ],
        outputs=[output_image, actual_seed_output],  # Image plus the seed that was actually used
        api_name="generate",  # Optional: for API access
    )
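    # (Sketch) With api_name="generate", the endpoint can also be called programmatically with
    # gradio_client, assuming the Space is published at <user>/<space-name> and the input order above:
    #     from gradio_client import Client
    #     client = Client("<user>/<space-name>")
    #     result = client.predict(
    #         "Raxephion/Typhoon-SD1.5-V1", "CPU", "a majestic lion", "blurry",
    #         30, 7.5, "Euler", "512x512", 0, True, False,
    #         api_name="/generate",
    #     )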
    # Examples from the template.
    # A plain list of strings populates only the first listed input (prompt_input).
    template_examples = [
        "Astronaut in a jungle, cold color palette, muted colors, detailed, 8k",
        "An astronaut riding a green horse",
        "A delicious ceviche cheesecake slice",
    ]
    gr.Examples(examples=template_examples, inputs=[prompt_input])
    # Usage notes / footer from the user's script, adapted for Spaces
    gr.Markdown(
        """
        ---
        **Usage Notes:**
        1. Select a model from the dropdown (Hugging Face Hub ID). Models are downloaded and cached on the Space.
        2. Choose your processing device (GPU recommended if available).
        3. Enter your positive and optional negative prompts.
        4. Adjust advanced settings (Steps, CFG Scale, Scheduler, Size, Seed) if needed. The "Randomize seed" checkbox overrides the seed value in the input box.
        5. Click "Generate Image".
        The first generation with a new model/device may take a while as the model loads.
        """
    )
# --- Launch the App ---
if __name__ == "__main__":
    print("\n--- Starting CipherCore Stable Diffusion 1.5 Generator (Hugging Face Spaces) ---")
    cuda_status = "CUDA available" if torch.cuda.is_available() else "CUDA not available"
    gpu_count_str = f"Found {torch.cuda.device_count()} GPU(s)." if torch.cuda.is_available() else ""
    print(f"{cuda_status} {gpu_count_str}")
    print(f"Available devices detected by PyTorch: {', '.join(AVAILABLE_DEVICES)}")
    print(f"Default device selected by app: {DEFAULT_DEVICE}")
    if current_pipeline:
        print(f"Initial model '{current_model_id}' loaded successfully on {current_device_loaded}.")
    else:
        print("No initial model loaded, or the initial load failed. Check the model list and network connectivity.")
    print("Launching Gradio interface...")
    # On Spaces the app is usually launched without extra launch() parameters;
    # Spaces handles server_name, server_port, share, etc.
    # demo.launch(show_error=True, inbrowser=True)  # Uncomment for local testing
    demo.launch()  # Standard launch for Hugging Face Spaces
    print("Gradio interface closing.")