Spaces:

Lasya18
/

Interior-Images-From-Inspiration

Running

App Files Files Community

Interior-Images-From-Inspiration / utils.py

Lasya18

Update utils.py

3b3c48f verified 4 months ago

raw

history blame

15.1 kB

	"""
	Utility functions for the Interior Style Transfer Pipeline
	"""
	import json
	import os
	from pathlib import Path
	from typing import Callable, List, Optional, Tuple, Union

	import cv2
	import numpy as np
	from PIL import Image

	def load_image_safe(image_path: str, target_size: Optional[Tuple[int, int]] = None) -> np.ndarray:
	    """
	    Safely load an image with error handling

	    OpenCV is tried first. If it cannot decode the file, Pillow is used as a
	    fallback and the result is converted to a 3-channel BGR array so both
	    paths hand back the same layout.

	    Args:
	        image_path: Path to the image file
	        target_size: Optional target size (width, height)

	    Returns:
	        Loaded image as numpy array

	    Raises:
	        ValueError: If the file does not exist or cannot be loaded
	    """
	    if not os.path.exists(image_path):
	        raise ValueError(f"Image file not found: {image_path}")

	    # Try to load with OpenCV first; imread reports failure by returning None
	    image = cv2.imread(image_path)
	    if image is None:
	        # Fallback to PIL
	        try:
	            # The context manager closes the file handle Pillow keeps open
	            with Image.open(image_path) as pil_image:
	                # Normalise every mode (palette, grayscale, RGBA, ...) to RGB;
	                # converting the raw array of a palette image would yield
	                # palette indices rather than colours
	                rgb = np.array(pil_image.convert("RGB"))
	            image = cv2.cvtColor(rgb, cv2.COLOR_RGB2BGR)
	        except Exception as e:
	            # Chain the cause so the original traceback is preserved
	            raise ValueError(f"Could not load image {image_path}: {e}") from e

	    if target_size:
	        image = cv2.resize(image, target_size)

	    return image

	def save_image_safe(image: np.ndarray, output_path: str,
	                    quality: int = 95) -> bool:
	    """
	    Safely save an image with error handling

	    The image is written with OpenCV; if OpenCV reports failure, Pillow is
	    tried as a fallback. Any exception is caught, reported on stdout and
	    turned into a False return value.

	    Args:
	        image: Image to save as numpy array (BGR / BGRA channel order for
	            colour images, as used by OpenCV)
	        output_path: Output file path
	        quality: JPEG quality (1-100); values outside the range are clamped

	    Returns:
	        True if successful, False otherwise
	    """
	    try:
	        # Ensure output directory exists. dirname is "" for a bare filename
	        # and os.makedirs("") raises, so only create it when there is one.
	        output_dir = os.path.dirname(output_path)
	        if output_dir:
	            os.makedirs(output_dir, exist_ok=True)

	        jpeg_quality = int(min(max(quality, 1), 100))

	        # Forward the requested quality to OpenCV for JPEG targets; without
	        # explicit params the quality argument would be ignored here
	        extension = os.path.splitext(output_path)[1].lower()
	        params = []
	        if extension in (".jpg", ".jpeg"):
	            params = [cv2.IMWRITE_JPEG_QUALITY, jpeg_quality]

	        # Save with OpenCV
	        success = cv2.imwrite(output_path, image, params)

	        if not success:
	            # Fallback to PIL, which expects RGB(A) rather than BGR(A)
	            if image.ndim == 3 and image.shape[2] == 3:
	                pil_image = Image.fromarray(cv2.cvtColor(image, cv2.COLOR_BGR2RGB))
	            elif image.ndim == 3 and image.shape[2] == 4:
	                pil_image = Image.fromarray(cv2.cvtColor(image, cv2.COLOR_BGRA2RGBA))
	            else:
	                pil_image = Image.fromarray(image)

	            pil_image.save(output_path, quality=jpeg_quality)
	            success = True

	        return bool(success)
	    except Exception as e:
	        # Deliberate best-effort boundary: report and signal failure
	        print(f"Error saving image to {output_path}: {e}")
	        return False

	def validate_image_pair(user_room: np.ndarray, inspiration_room: np.ndarray) -> Tuple[bool, str]:
	    """
	    Validate that two images are suitable for style transfer

	    Checks are applied in order and the first failure is reported: both
	    images present, identical shapes, minimum size, aspect ratio, colour
	    layout, and finally mean brightness of each image.

	    Args:
	        user_room: User room image
	        inspiration_room: Inspiration room image

	    Returns:
	        Tuple of (is_valid, error_message)
	    """
	    # A validator should report unusable input instead of raising on it
	    if user_room is None or inspiration_room is None:
	        return False, "Both a user room image and an inspiration room image are required"

	    # Check image dimensions
	    if user_room.shape != inspiration_room.shape:
	        return False, f"Image dimensions don't match: {user_room.shape} vs {inspiration_room.shape}"

	    # Shapes are equal from here on, so inspecting one image covers both
	    if user_room.ndim < 2:
	        return False, f"Expected image arrays with height and width, got shape {user_room.shape}"

	    # Check minimum size
	    min_size = 256
	    if user_room.shape[0] < min_size or user_room.shape[1] < min_size:
	        return False, f"Images too small. Minimum size: {min_size}x{min_size}"

	    # Check aspect ratio (should be roughly square for best results)
	    aspect_ratio = user_room.shape[1] / user_room.shape[0]
	    if aspect_ratio < 0.5 or aspect_ratio > 2.0:
	        return False, f"Extreme aspect ratio: {aspect_ratio:.2f}. Square images work best."

	    # The brightness check converts BGR(A) -> gray, which needs 3 or 4
	    # channels; reject anything else here rather than letting OpenCV raise
	    if user_room.ndim != 3 or user_room.shape[2] not in (3, 4):
	        return False, f"Expected color images with 3 or 4 channels, got shape {user_room.shape}"

	    # Check if images are too dark or too bright
	    min_brightness, max_brightness = 30, 225
	    for label, room in (("User", user_room), ("Inspiration", inspiration_room)):
	        brightness = np.mean(cv2.cvtColor(room, cv2.COLOR_BGR2GRAY))
	        if brightness < min_brightness or brightness > max_brightness:
	            verdict = 'dark' if brightness < min_brightness else 'bright'
	            return False, f"{label} room too {verdict}: {brightness:.1f}"

	    return True, "Images are valid for style transfer"

	def create_comparison_image(original: np.ndarray, result: np.ndarray,
	                            title: str = "Style Transfer Comparison") -> np.ndarray:
	    """
	    Build a side-by-side "before / after" image

	    The result is resized to the original's width and height when their
	    shapes differ, both are stacked horizontally, and a centred title plus
	    "Original" / "Result" captions are drawn onto the stacked copy.

	    Args:
	        original: Original user room image
	        result: Style transfer result
	        title: Title for the comparison

	    Returns:
	        Comparison image
	    """
	    left_height, left_width = original.shape[0], original.shape[1]

	    # Bring the result to the original's size when the shapes disagree
	    if result.shape != original.shape:
	        result = cv2.resize(result, (left_width, left_height))

	    # hstack allocates a new array, so the drawing below leaves inputs alone
	    canvas = np.hstack([original, result])
	    canvas_height, canvas_width = canvas.shape[0], canvas.shape[1]

	    typeface = cv2.FONT_HERSHEY_SIMPLEX
	    title_scale = 1.0
	    title_weight = 2
	    white = (255, 255, 255)
	    black = (0, 0, 0)

	    # Centre the title horizontally on a fixed baseline
	    (title_width, _title_height), _baseline = cv2.getTextSize(
	        title, typeface, title_scale, title_weight)
	    title_left = (canvas_width - title_width) // 2
	    title_baseline = 50

	    # Filled white box behind the title, then the title itself in black
	    box_top_left = (title_left - 10, title_baseline - 30)
	    box_bottom_right = (title_left + title_width + 10, title_baseline + 10)
	    cv2.rectangle(canvas, box_top_left, box_bottom_right, white, -1)
	    cv2.putText(canvas, title, (title_left, title_baseline),
	                typeface, title_scale, black, title_weight)

	    # Caption each half near the bottom edge
	    caption_y = canvas_height - 30
	    for caption, caption_x in (("Original", 50), ("Result", left_width + 50)):
	        cv2.putText(canvas, caption, (caption_x, caption_y),
	                    typeface, 0.7, white, 2)

	    return canvas

	def create_multi_comparison_image(images: List[np.ndarray],
	                                  titles: Optional[List[str]] = None,
	                                  title: str = "Multi-Image Comparison") -> np.ndarray:
	    """
	    Create a comparison image with multiple images side by side

	    Every image is brought to the shape of the first one, the images are
	    stacked horizontally, and a centred main title is drawn on top. Per-image
	    titles are drawn near the bottom edge only when exactly one title per
	    image is supplied; otherwise they are skipped.

	    Args:
	        images: List of images to compare
	        titles: List of titles for each image (optional)
	        title: Main title for the comparison

	    Returns:
	        Comparison image

	    Raises:
	        ValueError: If images is empty
	    """
	    if not images:
	        raise ValueError("At least one image is required")

	    # Ensure all images have the same dimensions
	    target_shape = images[0].shape
	    target_size = (target_shape[1], target_shape[0])  # cv2 wants (width, height)
	    resized_images = [
	        img if img.shape == target_shape else cv2.resize(img, target_size)
	        for img in images
	    ]

	    # Create horizontal stack of images (a new array; inputs stay untouched)
	    comparison = np.hstack(resized_images)

	    # Add main title
	    font = cv2.FONT_HERSHEY_SIMPLEX
	    font_scale = 1.0
	    thickness = 2

	    # Calculate text position for main title
	    text_size = cv2.getTextSize(title, font, font_scale, thickness)[0]
	    text_x = (comparison.shape[1] - text_size[0]) // 2
	    text_y = 50

	    # Add background for main title
	    cv2.rectangle(comparison, (text_x - 10, text_y - 30),
	                  (text_x + text_size[0] + 10, text_y + 10), (255, 255, 255), -1)

	    # Add main title
	    cv2.putText(comparison, title, (text_x, text_y), font, font_scale, (0, 0, 0), thickness)

	    # Add individual image titles if provided
	    if titles and len(titles) == len(images):
	        font_scale_small = 0.7
	        thickness_small = 1

	        # Every tile has the same width after the resize above, so the left
	        # edge of tile i is simply i * tile_width (no per-tile prefix sum)
	        tile_width = target_shape[1]
	        title_y = comparison.shape[0] - 30

	        for i, img_title in enumerate(titles):
	            start_x = i * tile_width

	            # Centre the title within its tile
	            title_size = cv2.getTextSize(img_title, font, font_scale_small, thickness_small)[0]
	            title_x = start_x + (tile_width - title_size[0]) // 2

	            # Add background rectangle
	            cv2.rectangle(comparison, (title_x - 5, title_y - 20),
	                          (title_x + title_size[0] + 5, title_y + 5), (255, 255, 255), -1)

	            # Add image title
	            cv2.putText(comparison, img_title, (title_x, title_y),
	                        font, font_scale_small, (0, 0, 0), thickness_small)

	    return comparison

	def enhance_image_quality(image: np.ndarray,
	                          sharpness: float = 0.3,
	                          contrast: float = 1.1,
	                          saturation: float = 1.1) -> np.ndarray:
	    """
	    Enhance image quality with various filters

	    The steps run in order on a copy of the input: sharpening, contrast,
	    saturation. Each step is skipped at its neutral value (sharpness <= 0,
	    contrast == 1.0, saturation == 1.0).

	    Args:
	        image: Input image (the saturation step converts BGR <-> HSV, so it
	            presumably expects an 8-bit BGR image - confirm against callers)
	        sharpness: Sharpening strength (0.0 to 1.0)
	        contrast: Contrast multiplier (pixel values are scaled by this factor
	            and clipped to 0-255)
	        saturation: Saturation multiplier

	    Returns:
	        Enhanced image
	    """
	    enhanced = image.copy()

	    # Sharpening
	    if sharpness > 0:
	        # identity + sharpness * high-pass. The coefficients always sum to 1,
	        # so overall brightness is preserved for every strength. Scaling the
	        # whole 3x3 sharpen kernel by `sharpness` instead makes it sum to
	        # `sharpness` and darkens the image (to ~30% at the default 0.3).
	        identity = np.array([[0, 0, 0],
	                             [0, 1, 0],
	                             [0, 0, 0]], dtype=np.float32)
	        high_pass = np.array([[-1, -1, -1],
	                              [-1, 8, -1],
	                              [-1, -1, -1]], dtype=np.float32)
	        kernel = identity + sharpness * high_pass
	        enhanced = cv2.filter2D(enhanced, -1, kernel)

	    # Contrast adjustment
	    if contrast != 1.0:
	        enhanced = np.clip(enhanced * contrast, 0, 255).astype(np.uint8)

	    # Saturation adjustment
	    if saturation != 1.0:
	        # Work in float so the scaled S channel can be clipped before the
	        # cast back to uint8
	        hsv = cv2.cvtColor(enhanced, cv2.COLOR_BGR2HSV).astype(np.float32)
	        hsv[:, :, 1] = np.clip(hsv[:, :, 1] * saturation, 0, 255)
	        enhanced = cv2.cvtColor(hsv.astype(np.uint8), cv2.COLOR_HSV2BGR)

	    return enhanced

	def create_progress_bar(total: int, description: str = "Processing") -> Callable[[int], None]:
	    """
	    Create a simple progress bar function

	    The returned function redraws a 30-character text bar on the current
	    terminal line (carriage return, no newline) and emits a final newline
	    once the reported step reaches the total.

	    Args:
	        total: Total number of steps; a total of zero or less is shown as
	            already complete
	        description: Description of the process

	    Returns:
	        Function to update progress
	    """
	    bar_length = 30

	    def update_progress(current: int) -> None:
	        if total > 0:
	            # Clamp so an overshooting or negative step cannot overflow or
	            # underflow the bar
	            done = min(max(current, 0), total)
	            percentage = (done / total) * 100
	            filled_length = int(bar_length * done // total)
	        else:
	            # Nothing to do: avoid dividing by zero and show a full bar
	            percentage = 100.0
	            filled_length = bar_length

	        bar = '█' * filled_length + '-' * (bar_length - filled_length)
	        print(f'\r{description}: |{bar}| {percentage:.1f}% ({current}/{total})', end='')
	        if current >= total:
	            # Finish the line so later output starts on a fresh one
	            print()

	    return update_progress

	def save_metadata(metadata: dict, output_path: str) -> bool:
	    """
	    Save metadata to JSON file

	    Values that json cannot serialise natively are written as their str()
	    representation. Any failure is reported on stdout and turned into a
	    False return value.

	    Args:
	        metadata: Dictionary of metadata
	        output_path: Output file path

	    Returns:
	        True if successful, False otherwise
	    """
	    try:
	        # Serialise first so a serialisation error cannot leave a truncated
	        # file behind
	        payload = json.dumps(metadata, indent=2, default=str)

	        # dirname is "" for a bare filename and os.makedirs("") raises, so
	        # only create the directory when the path actually names one
	        output_dir = os.path.dirname(output_path)
	        if output_dir:
	            os.makedirs(output_dir, exist_ok=True)

	        with open(output_path, 'w', encoding='utf-8') as f:
	            f.write(payload)

	        return True
	    except Exception as e:
	        # Deliberate best-effort boundary: report and signal failure
	        print(f"Error saving metadata to {output_path}: {e}")
	        return False

	def load_metadata(metadata_path: str) -> Optional[dict]:
	    """
	    Load metadata from JSON file

	    Any failure (missing file, unreadable file, invalid JSON) is reported on
	    stdout and turned into a None return value.

	    Args:
	        metadata_path: Path to metadata file

	    Returns:
	        Loaded metadata dictionary or None if failed
	    """
	    try:
	        # Read as UTF-8 explicitly instead of relying on the platform's
	        # locale encoding, which would misread non-ASCII text on some systems
	        with open(metadata_path, 'r', encoding='utf-8') as f:
	            return json.load(f)
	    except Exception as e:
	        # Deliberate best-effort boundary: report and signal failure
	        print(f"Error loading metadata from {metadata_path}: {e}")
	        return None

	def calculate_image_similarity(img1: np.ndarray, img2: np.ndarray) -> float:
	"""
	Calculate similarity between two images using structural similarity

	Args:
	img1: First image
	img2: Second image

	Returns:
	Similarity score (0.0 to 1.0, higher is more similar)
	"""
	try:
	from skimage.metrics import structural_similarity as ssim

	# Ensure same dimensions
	if img1.shape != img2.shape:
	img2 = cv2.resize(img2, (img1.shape[1], img1.shape[0]))

	# Convert to grayscale for SSIM
	gray1 = cv2.cvtColor(img1, cv2.COLOR_BGR2GRAY)
	gray2 = cv2.cvtColor(img2, cv2.COLOR_BGR2GRAY)

	# Calculate SSIM
	similarity = ssim(gray1, gray2)
	return max(0.0, similarity) # Ensure non-negative

	except ImportError:
	# Fallback to simple MSE-based similarity
	if img1.shape != img2.shape:
	img2 = cv2.resize(img2, (img1.shape[1], img1.shape[0]))

	mse = np.mean((img1.astype(np.float32) - img2.astype(np.float32)) ** 2)
	max_mse = 255 ** 2
	similarity = 1.0 - (mse / max_mse)
	return max(0.0, similarity)

	def create_thumbnail(image: np.ndarray, max_size: int = 200) -> np.ndarray:
	    """
	    Create a thumbnail version of an image

	    Images that already fit within max_size x max_size are returned as an
	    unscaled copy. Larger images are shrunk so the longer side equals
	    max_size while the aspect ratio is kept.

	    Args:
	        image: Input image
	        max_size: Maximum dimension size (must be at least 1)

	    Returns:
	        Thumbnail image

	    Raises:
	        ValueError: If max_size is smaller than 1
	    """
	    if max_size < 1:
	        raise ValueError(f"max_size must be at least 1, got {max_size}")

	    height, width = image.shape[:2]

	    if height <= max_size and width <= max_size:
	        return image.copy()

	    # Calculate new dimensions maintaining aspect ratio. The shorter side is
	    # floored at 1 px: for very elongated images the integer truncation would
	    # otherwise give 0, which cv2.resize rejects.
	    if height > width:
	        new_height = max_size
	        new_width = max(1, int(width * max_size / height))
	    else:
	        new_width = max_size
	        new_height = max(1, int(height * max_size / width))

	    # This branch only ever shrinks; INTER_AREA is OpenCV's recommended
	    # interpolation for decimation and avoids aliasing artefacts
	    thumbnail = cv2.resize(image, (new_width, new_height), interpolation=cv2.INTER_AREA)
	    return thumbnail

	def batch_resize_images(images: List[np.ndarray],
	                        target_size: Tuple[int, int]) -> List[np.ndarray]:
	    """
	    Resize a list of images to the same target size

	    Args:
	        images: List of input images
	        target_size: Target size (width, height)

	    Returns:
	        List of resized images, in the same order as the input
	    """
	    # A comprehension replaces the manual append loop
	    return [cv2.resize(image, target_size) for image in images]

	def create_image_grid(images: List[np.ndarray],
	                      grid_size: Optional[Tuple[int, int]] = None) -> np.ndarray:
	    """
	    Create a grid layout of images

	    All images are brought to the size of the first one and laid out row by
	    row. Unused cells are filled with black tiles. If an explicit grid_size
	    has fewer cells than there are images, the surplus images are left out.

	    Args:
	        images: List of images to arrange in grid
	        grid_size: Grid dimensions (rows, cols). If None, auto-calculate a
	            near-square grid

	    Returns:
	        Grid image (an empty array when images is empty)

	    Raises:
	        ValueError: If grid_size contains a value smaller than 1
	    """
	    if not images:
	        return np.array([])

	    if grid_size is None:
	        # Auto-calculate grid size
	        n_images = len(images)
	        cols = int(np.ceil(np.sqrt(n_images)))
	        rows = int(np.ceil(n_images / cols))
	    else:
	        rows, cols = grid_size

	    if rows < 1 or cols < 1:
	        raise ValueError(f"grid_size must contain positive values, got {(rows, cols)}")

	    # Ensure all images have the same size; images that already match the
	    # first one are used as-is instead of going through a no-op resize
	    cell_height, cell_width = images[0].shape[:2]
	    target_size = (cell_width, cell_height)  # cv2 wants (width, height)
	    cells = [
	        img if img.shape[:2] == (cell_height, cell_width) else cv2.resize(img, target_size)
	        for img in images
	    ]

	    # Fill empty space with black. zeros_like copies the channel layout and
	    # dtype of the real tiles, so grayscale or non-uint8 grids stack cleanly
	    # (a hard-coded 3-channel uint8 filler would not).
	    n_cells = rows * cols
	    filler = np.zeros_like(cells[0])
	    cells = cells[:n_cells] + [filler] * (n_cells - len(cells))

	    # Create grid: join each run of `cols` tiles into a row, then stack rows
	    grid_rows = [np.hstack(cells[r * cols:(r + 1) * cols]) for r in range(rows)]
	    return np.vstack(grid_rows)