farjadmalik's picture
Fix spaces
f9630b2
raw
history blame contribute delete
901 Bytes
"""
Configuration variables to centralize parameters and paths.
"""
# Directory where the generated image and captions are saved.
OUTPUT_DIR = "outputs/"

# Image generation settings.
# Size of the generated images.
IMAGE_SIZE = (512, 512)

# Model names, kept in one place so they are easy to change and reuse.
EMBEDDING_MODEL_NAME = "all-MiniLM-L6-v2"
TEXT_MODEL_NAME = "microsoft/phi-2"
# No audio model is selected yet; the empty string is a placeholder to be
# filled in later.
AUDIO_MODEL_NAME = ""

# Stable Diffusion model name.
# NOTE(review): an earlier comment also mentioned a "device to run on", but no
# device setting is defined alongside these constants - confirm where it lives.
IMG_MODEL_NAME = "runwayml/stable-diffusion-v1-5"
# Video model name currently configured.
VIDEO_MODEL_NAME = "cerspense/zeroscope_v2_XL"

# Other image models to try:
#   Qwen/Qwen-Image
#   CompVis/stable-diffusion-v1-4
#   segmind/SSD-1B
#   kandinsky-community/kandinsky-3
#   warp-ai/wuerstchen
# Other video generation models to try:
#   cerspense/zeroscope_v2_576w
#   Wan-Video/Wan2.1

# Font settings for overlay text (currently disabled).
# FONT_PATH = "./fonts/arial.ttf"
# FONT_SIZE = 40