Spaces:

ianshank
/

phi35-moe-demo

Sleeping

App Files Files Community

phi35-moe-demo / prestart.sh

ianshank

🚀 Deploy robust modular solution with comprehensive testing and CPU/GPU support

6510698 verified 3 months ago

raw

history blame contribute delete

3.89 kB

	#!/usr/bin/env bash
	# Prestart setup for the Phi-3.5-MoE demo.
	#
	# Steps performed by this script, in order:
	#   1. verify that a `python` executable is on PATH;
	#   2. load variables from ./.env when that file exists;
	#   3. run an embedded Python script that pip-installs the core dependencies,
	#      installs flash-attn when CUDA is available, and otherwise runs
	#      scripts/select_revision.py.
	#
	# Strict mode: -e exits on an unhandled non-zero status, -u treats unset
	# variables as errors, and pipefail makes a pipeline fail if any stage fails.
	set -euo pipefail

	# Startup banner (plain echo; the timestamped log helper is defined below).
	echo "🚀 Starting Phi-3.5-MoE prestart setup..."

	#######################################
	# Print a message prefixed with the current local time.
	# Arguments: $1 - message text
	# Outputs:   "[YYYY-MM-DD HH:MM:SS] <message>" on stdout
	#######################################
	log() {
	  local -r message=$1
	  printf '[%s] %s\n' "$(date '+%Y-%m-%d %H:%M:%S')" "$message"
	}

	#######################################
	# Test whether a command name resolves in the current shell.
	# Arguments: $1 - command name to look up
	# Outputs:   nothing (lookup output is discarded)
	# Returns:   the status of `command -v`: 0 when found, non-zero otherwise
	#######################################
	command_exists() {
	  local -r candidate=$1
	  command -v "$candidate" &>/dev/null
	}

	# Abort early when no `python` executable can be resolved.
	command_exists python || {
	  log "❌ Python not found"
	  exit 1
	}

	# Report the version of the interpreter that was found.
	log "✅ Python found: $(python --version)"

	#######################################
	# Export KEY=VALUE pairs from a dotenv-style file into the environment.
	#
	# Each line is read verbatim and exported as a single word, so values that
	# contain spaces or glob characters are preserved (the file is never
	# word-split, and never sourced/executed). Blank lines and `#` comment lines
	# are skipped, an optional leading `export ` is accepted, trailing whitespace
	# (including a CR from CRLF files) is trimmed, and one pair of matching
	# surrounding quotes is removed from the value.
	#
	# Arguments: $1 - path to the env file
	# Outputs:   a warning on stderr for each line that is not KEY=VALUE
	#            (only the line number is printed, never the content)
	# Returns:   0 on success; non-zero if the file cannot be opened
	#######################################
	load_env_file() {
	  local -r env_file=$1
	  local -r comment_re='^[[:space:]]*#'
	  local -r assignment_re='^[[:space:]]*(export[[:space:]]+)?([A-Za-z_][A-Za-z0-9_]*)=(.*)$'
	  local -r dquoted_re='^"(.*)"$'
	  local -r squoted_re="^'(.*)'\$"
	  local line key value
	  local lineno=0

	  # `|| [[ -n "$line" ]]` keeps a final line that lacks a trailing newline.
	  while IFS= read -r line || [[ -n "$line" ]]; do
	    lineno=$((lineno + 1))
	    # Trim trailing whitespace.
	    line=${line%"${line##*[![:space:]]}"}
	    if [[ -z "$line" || "$line" =~ $comment_re ]]; then
	      continue
	    fi
	    if [[ "$line" =~ $assignment_re ]]; then
	      key=${BASH_REMATCH[2]}
	      value=${BASH_REMATCH[3]}
	      if [[ "$value" =~ $dquoted_re || "$value" =~ $squoted_re ]]; then
	        value=${BASH_REMATCH[1]}
	      fi
	      export "$key=$value"
	    else
	      printf 'warning: ignoring malformed line %d in %s\n' "$lineno" "$env_file" >&2
	    fi
	  done < "$env_file"
	}

	# Load environment variables if .env exists
	if [[ -f .env ]]; then
	  log "📄 Loading environment variables from .env"
	  load_env_file .env
	fi

	# Run dependency installation and environment setup.
	#
	# The interpreter runs inside the `if` condition so that a failure reaches the
	# error branch below; with `set -e` active, a separate `$?` test placed after
	# the command would never execute because the shell exits first.
	# `<<-` strips leading tabs from the heredoc body and its terminator, so both
	# may be tab-indented; the Python code itself is indented with spaces only.
	if ! python - <<-'PY'
	import logging
	import subprocess
	import sys

	import torch

	# Setup logging
	logging.basicConfig(level=logging.INFO, format='[%(asctime)s] %(levelname)s: %(message)s')
	logger = logging.getLogger(__name__)


	def run_pip_install(packages, description="packages"):
	    """Run ``pip install`` for the current interpreter.

	    Args:
	        packages: List of pip arguments (requirement specifiers and/or flags).
	        description: Label used in the log messages.

	    Returns:
	        True when pip exits with status 0, False when it exits non-zero.
	    """
	    cmd = [sys.executable, "-m", "pip", "install"] + packages
	    logger.info(f"Installing {description}: {' '.join(packages)}")
	    try:
	        # run() drains both pipes while waiting. check_call() with PIPE never
	        # reads them, so the child can block once the OS pipe buffer fills.
	        subprocess.run(
	            cmd,
	            check=True,
	            capture_output=True,
	            text=True,
	            errors="replace",
	        )
	    except subprocess.CalledProcessError as e:
	        logger.error(f"❌ Failed to install {description}: {e}")
	        if e.stderr:
	            # Only the tail is logged to keep the log readable.
	            logger.error(f"pip stderr (tail):\n{e.stderr[-2000:]}")
	        return False
	    logger.info(f"✅ Successfully installed {description}")
	    return True


	def main():
	    """Install dependencies, then configure for a GPU or CPU runtime.

	    Exits with status 1 when the core dependencies cannot be installed.
	    A flash-attn install failure and any revision-selector problem are
	    logged as warnings and do not abort the setup.
	    """
	    logger.info("🔍 Checking environment and installing dependencies...")

	    # Always ensure core dependencies are present
	    core_deps = ["einops>=0.7.0", "transformers==4.46.0", "accelerate>=0.31.0"]
	    if not run_pip_install(core_deps, "core dependencies"):
	        logger.error("❌ Failed to install core dependencies")
	        sys.exit(1)

	    # Check CUDA availability
	    cuda_available = torch.cuda.is_available()
	    logger.info(f"🖥️ CUDA available: {cuda_available}")

	    if cuda_available:
	        logger.info("🚀 GPU runtime detected - installing flash-attn for optimal performance")

	        # Install flash-attn for GPU
	        flash_attn_packages = ["flash-attn>=2.6.0", "--no-build-isolation"]
	        if run_pip_install(flash_attn_packages, "flash-attn (GPU optimization)"):
	            logger.info("✅ GPU environment fully configured")
	        else:
	            logger.warning("⚠️ Flash-attn installation failed, continuing without it")
	    else:
	        logger.info("💻 CPU runtime detected - configuring for CPU-only operation")
	        logger.info("ℹ️ Skipping flash-attn installation (not needed for CPU)")

	        # For CPU, we need to select a safe model revision
	        logger.info("🔍 Checking for CPU-safe model revision...")

	        try:
	            # Run the revision selector (path is relative to the working directory)
	            result = subprocess.run(
	                [sys.executable, "scripts/select_revision.py"],
	                capture_output=True,
	                text=True,
	                timeout=300,
	            )

	            if result.returncode == 0:
	                logger.info("✅ CPU-safe revision configured")
	            else:
	                logger.warning(f"⚠️ Revision selector returned {result.returncode}")
	                logger.warning(f"stdout: {result.stdout}")
	                logger.warning(f"stderr: {result.stderr}")

	        except subprocess.TimeoutExpired:
	            logger.warning("⚠️ Revision selection timed out, continuing with default")
	        except Exception as e:
	            # Best effort: the selector is optional, so any other error is only logged.
	            logger.warning(f"⚠️ Error running revision selector: {e}")

	    logger.info("🎉 Prestart setup completed successfully!")


	if __name__ == "__main__":
	    main()
	PY
	then
	  log "❌ Prestart setup failed"
	  exit 1
	fi

	# Emit the closing status lines, in order, through the timestamped logger.
	for final_msg in \
	  "✅ Prestart setup completed successfully!" \
	  "🚀 Ready to start the application!"; do
	  log "$final_msg"
	done