Spaces:

jameszokah
/

jamiya

Sleeping

App Files Files Community

jameszokah committed on Apr 5

Commit

23beeea

1 Parent(s): 6f1d384

UNDO the update to the path that was causing permission issues in the entire app

Browse files

Files changed (7) hide show

Dockerfile +20 -20
app/api/routes.py +3 -8
app/main.py +6 -7
app/utils/voice_manager.py +5 -10
app/voice_cloning.py +1 -2
app/voice_enhancement.py +5 -5
app/voice_memory.py +2 -3

Dockerfile CHANGED Viewed

@@ -38,32 +38,31 @@ RUN apt-get update && apt-get install -y --no-install-recommends \
     ffmpeg \
     git \
     build-essential \
     && apt-get clean \
     && rm -rf /var/lib/apt/lists/*
-# Create user and set up environment
-RUN useradd -m -u 1000 user
-USER user
-ENV HOME=/home/user \
-    PATH=/home/user/.local/bin:$PATH
 # Set working directory
-WORKDIR $HOME/app
 # Copy requirements first for better caching
 COPY --chown=user:user requirements.txt .
-# Create and set up persistent directories with proper permissions
-RUN mkdir -p $HOME/app/static $HOME/app/models $HOME/app/voice_memories $HOME/app/voice_references \
-    $HOME/app/voice_profiles $HOME/app/cloned_voices $HOME/app/audio_cache $HOME/app/tokenizers $HOME/app/logs && \
-    chmod -R 755 $HOME/app && \
-    chmod -R 777 $HOME/app/voice_references $HOME/app/voice_profiles $HOME/app/voice_memories \
-    $HOME/app/cloned_voices $HOME/app/audio_cache $HOME/app/static $HOME/app/logs $HOME/app/tokenizers $HOME/app/models
-# Copy static files
-COPY --chown=user:user ./static $HOME/app/static
 # Install Python dependencies
 RUN pip3 install --no-cache-dir --upgrade pip && \
@@ -85,11 +84,12 @@ RUN pip3 install -r requirements.txt
 # Install additional dependencies for streaming and voice cloning
 RUN pip3 install yt-dlp openai-whisper
-# Copy application code
-COPY --chown=user:user ./app $HOME/app/app
 # Copy downloaded model from the model-downloader stage
-COPY --chown=user:user --from=model-downloader /model-downloader/models $HOME/app/models
 # Show available models in torchtune
 RUN python3 -c "import torchtune.models; print('Available models in torchtune:', dir(torchtune.models))"

     ffmpeg \
     git \
     build-essential \
+    sudo \
     && apt-get clean \
     && rm -rf /var/lib/apt/lists/*
+# Create user and give sudo access
+RUN useradd -m -s /bin/bash user && \
+    usermod -aG sudo user && \
+    echo "user ALL=(ALL) NOPASSWD:ALL" >> /etc/sudoers
 # Set working directory
+WORKDIR /app
+# Create and set up persistent directories with proper permissions
+RUN mkdir -p /app/static /app/models /app/voice_memories /app/voice_references \
+    /app/voice_profiles /app/cloned_voices /app/audio_cache /app/tokenizers /app/logs && \
+    chown -R user:user /app && \
+    chmod -R 755 /app && \
+    chmod -R 777 /app/voice_references /app/voice_profiles /app/voice_memories \
+    /app/cloned_voices /app/audio_cache /app/static /app/logs /app/tokenizers /app/models
 # Copy requirements first for better caching
 COPY --chown=user:user requirements.txt .
+# Switch to user
+USER user
 # Install Python dependencies
 RUN pip3 install --no-cache-dir --upgrade pip && \
 # Install additional dependencies for streaming and voice cloning
 RUN pip3 install yt-dlp openai-whisper
+# Copy static files and application code
+COPY --chown=user:user ./static /app/static
+COPY --chown=user:user ./app /app/app
 # Copy downloaded model from the model-downloader stage
+COPY --chown=user:user --from=model-downloader /model-downloader/models /app/models
 # Show available models in torchtune
 RUN python3 -c "import torchtune.models; print('Available models in torchtune:', dir(torchtune.models))"

app/api/routes.py CHANGED Viewed

@@ -16,7 +16,7 @@ import numpy as np
 from fastapi import APIRouter, Request, HTTPException, BackgroundTasks, Body, Response, Query
 from fastapi.responses import StreamingResponse
 from app.api.schemas import SpeechRequest, ResponseFormat, Voice
-from app.models import Segment, TTSRequest, TTSResponse, StreamRequest
 from app.api.streaming import AudioChunker
 from app.prompt_engineering import split_into_segments
@@ -24,11 +24,6 @@ from app.prompt_engineering import split_into_segments
 logger = logging.getLogger(__name__)
 router = APIRouter()
-# Constants
-APP_DIR = os.path.join(os.environ['HOME'], 'app')
-AUDIO_CACHE_DIR = os.path.join(APP_DIR, "audio_cache")
-os.makedirs(AUDIO_CACHE_DIR, exist_ok=True)
 # Mapping of response_format to MIME types
 MIME_TYPES = {
     "mp3": "audio/mpeg",
@@ -438,7 +433,7 @@ async def format_audio(audio, response_format, sample_rate, app_state):
         # Generate a hash of the audio tensor for caching
         audio_hash = hashlib.md5(audio.cpu().numpy().tobytes()).hexdigest()
         cache_key = f"{audio_hash}_{response_format}"
-        cache_dir = getattr(app_state, "audio_cache_dir", AUDIO_CACHE_DIR)
         os.makedirs(cache_dir, exist_ok=True)
         cache_path = os.path.join(cache_dir, f"{cache_key}")
@@ -539,7 +534,7 @@ async def format_audio(audio, response_format, sample_rate, app_state):
             # Store in cache if enabled
             if cache_enabled and cache_key:
                 try:
-                    cache_path = os.path.join(getattr(app_state, "audio_cache_dir", AUDIO_CACHE_DIR), f"{cache_key}")
                     with open(cache_path, "wb") as f:
                         f.write(response_data)
                     logger.debug(f"Cached {response_format} audio with key: {cache_key}")

 from fastapi import APIRouter, Request, HTTPException, BackgroundTasks, Body, Response, Query
 from fastapi.responses import StreamingResponse
 from app.api.schemas import SpeechRequest, ResponseFormat, Voice
+from app.models import Segment
 from app.api.streaming import AudioChunker
 from app.prompt_engineering import split_into_segments
 logger = logging.getLogger(__name__)
 router = APIRouter()
 # Mapping of response_format to MIME types
 MIME_TYPES = {
     "mp3": "audio/mpeg",
         # Generate a hash of the audio tensor for caching
         audio_hash = hashlib.md5(audio.cpu().numpy().tobytes()).hexdigest()
         cache_key = f"{audio_hash}_{response_format}"
+        cache_dir = getattr(app_state, "audio_cache_dir", "/app/audio_cache")
         os.makedirs(cache_dir, exist_ok=True)
         cache_path = os.path.join(cache_dir, f"{cache_key}")
             # Store in cache if enabled
             if cache_enabled and cache_key:
                 try:
+                    cache_path = os.path.join(getattr(app_state, "audio_cache_dir", "/app/audio_cache"), f"{cache_key}")
                     with open(cache_path, "wb") as f:
                         f.write(response_data)
                     logger.debug(f"Cached {response_format} audio with key: {cache_key}")

app/main.py CHANGED Viewed

@@ -54,7 +54,7 @@ async def lifespan(app: FastAPI):
     app.state.logger = logger  # Make logger available to routes
     # Create necessary directories - use persistent locations
-    APP_DIR = os.path.join(os.environ['HOME'], 'app')
     os.makedirs(os.path.join(APP_DIR, "models"), exist_ok=True)
     os.makedirs(os.path.join(APP_DIR, "tokenizers"), exist_ok=True)
     os.makedirs(os.path.join(APP_DIR, "voice_memories"), exist_ok=True)
@@ -498,12 +498,11 @@ app.add_middleware(
 )
 # Create static and other required directories
-APP_DIR = os.path.join(os.environ['HOME'], 'app')
-os.makedirs(os.path.join(APP_DIR, "static"), exist_ok=True)
-os.makedirs(os.path.join(APP_DIR, "cloned_voices"), exist_ok=True)
 # Mount the static files directory
-app.mount("/static", StaticFiles(directory=os.path.join(APP_DIR, "static")), name="static")
 # Include routers
 app.include_router(api_router, prefix="/api/v1")
@@ -590,13 +589,13 @@ async def version():
 @app.get("/voice-cloning", include_in_schema=False)
 async def voice_cloning_ui():
     """Voice cloning UI endpoint."""
-    return FileResponse(os.path.join(APP_DIR, "static/voice-cloning.html"))
 # Streaming demo endpoint
 @app.get("/streaming-demo", include_in_schema=False)
 async def streaming_demo():
     """Streaming TTS demo endpoint."""
-    return FileResponse(os.path.join(APP_DIR, "static/streaming-demo.html"))
 @app.get("/", include_in_schema=False)
 async def root():

     app.state.logger = logger  # Make logger available to routes
     # Create necessary directories - use persistent locations
+    APP_DIR = "/app"
     os.makedirs(os.path.join(APP_DIR, "models"), exist_ok=True)
     os.makedirs(os.path.join(APP_DIR, "tokenizers"), exist_ok=True)
     os.makedirs(os.path.join(APP_DIR, "voice_memories"), exist_ok=True)
 )
 # Create static and other required directories
+os.makedirs("/app/static", exist_ok=True)
+os.makedirs("/app/cloned_voices", exist_ok=True)
 # Mount the static files directory
+app.mount("/static", StaticFiles(directory="/app/static"), name="static")
 # Include routers
 app.include_router(api_router, prefix="/api/v1")
 @app.get("/voice-cloning", include_in_schema=False)
 async def voice_cloning_ui():
     """Voice cloning UI endpoint."""
+    return FileResponse("/app/static/voice-cloning.html")
 # Streaming demo endpoint
 @app.get("/streaming-demo", include_in_schema=False)
 async def streaming_demo():
     """Streaming TTS demo endpoint."""
+    return FileResponse("/app/static/streaming-demo.html")
 @app.get("/", include_in_schema=False)
 async def root():

app/utils/voice_manager.py CHANGED Viewed

@@ -8,23 +8,18 @@ from typing import Dict, List, Optional, Any
 logger = logging.getLogger(__name__)
-# Constants
-APP_DIR = os.path.join(os.environ['HOME'], 'app')
-VOICE_REFERENCES_DIR = os.path.join(APP_DIR, "voice_references")
-VOICE_PROFILES_DIR = os.path.join(APP_DIR, "voice_profiles")
-VOICE_MEMORIES_DIR = os.path.join(APP_DIR, "voice_memories")
-VOICE_BACKUPS_DIR = os.path.join(APP_DIR, "voice_backups")
 # Ensure directories exist
 os.makedirs(VOICE_REFERENCES_DIR, exist_ok=True)
 os.makedirs(VOICE_PROFILES_DIR, exist_ok=True)
 os.makedirs(VOICE_MEMORIES_DIR, exist_ok=True)
-os.makedirs(VOICE_BACKUPS_DIR, exist_ok=True)
-def backup_voice_data(backup_dir: str = None):
     """Create a backup of all voice data."""
-    if backup_dir is None:
-        backup_dir = VOICE_BACKUPS_DIR
     os.makedirs(backup_dir, exist_ok=True)
     timestamp = torch.datetime.now().strftime("%Y%m%d_%H%M%S")
     backup_path = os.path.join(backup_dir, f"voice_backup_{timestamp}")

 logger = logging.getLogger(__name__)
+# Define persistent paths
+VOICE_REFERENCES_DIR = "/app/voice_references"
+VOICE_PROFILES_DIR = "/app/voice_profiles"
+VOICE_MEMORIES_DIR = "/app/voice_memories"
 # Ensure directories exist
 os.makedirs(VOICE_REFERENCES_DIR, exist_ok=True)
 os.makedirs(VOICE_PROFILES_DIR, exist_ok=True)
 os.makedirs(VOICE_MEMORIES_DIR, exist_ok=True)
+def backup_voice_data(backup_dir: str = "/app/voice_backups"):
     """Create a backup of all voice data."""
     os.makedirs(backup_dir, exist_ok=True)
     timestamp = torch.datetime.now().strftime("%Y%m%d_%H%M%S")
     backup_path = os.path.join(backup_dir, f"voice_backup_{timestamp}")

app/voice_cloning.py CHANGED Viewed

@@ -27,8 +27,7 @@ from app.models import Segment
 logger = logging.getLogger(__name__)
 # Directory for storing cloned voice data
-APP_DIR = os.path.join(os.environ['HOME'], 'app')
-CLONED_VOICES_DIR = os.path.join(APP_DIR, "cloned_voices")
 os.makedirs(CLONED_VOICES_DIR, exist_ok=True)
 class ClonedVoice(BaseModel):

 logger = logging.getLogger(__name__)
 # Directory for storing cloned voice data
+CLONED_VOICES_DIR = "/app/cloned_voices"
 os.makedirs(CLONED_VOICES_DIR, exist_ok=True)
 class ClonedVoice(BaseModel):

app/voice_enhancement.py CHANGED Viewed

@@ -8,15 +8,13 @@ from typing import Dict, List, Optional, Tuple
 import logging
 from dataclasses import dataclass
 from scipy import signal
-from app.models import Segment
 # Setup logging
 logger = logging.getLogger(__name__)
-# Constants
-APP_DIR = os.path.join(os.environ['HOME'], 'app')
-VOICE_REFERENCES_DIR = os.path.join(APP_DIR, "voice_references")
-VOICE_PROFILES_DIR = os.path.join(APP_DIR, "voice_profiles")
 # Ensure directories exist
 os.makedirs(VOICE_REFERENCES_DIR, exist_ok=True)
@@ -478,6 +476,8 @@ def get_voice_segments(voice_name: str, device: torch.device) -> List:
     Returns:
         List of context segments
     """
     if voice_name not in VOICE_PROFILES:
         logger.warning(f"Voice {voice_name} not found, defaulting to alloy")
         voice_name = "alloy"

 import logging
 from dataclasses import dataclass
 from scipy import signal
 # Setup logging
 logger = logging.getLogger(__name__)
+# Define persistent paths
+VOICE_REFERENCES_DIR = "/app/voice_references"
+VOICE_PROFILES_DIR = "/app/voice_profiles"
 # Ensure directories exist
 os.makedirs(VOICE_REFERENCES_DIR, exist_ok=True)
     Returns:
         List of context segments
     """
+    from app.models import Segment
     if voice_name not in VOICE_PROFILES:
         logger.warning(f"Voice {voice_name} not found, defaulting to alloy")
         voice_name = "alloy"

app/voice_memory.py CHANGED Viewed

@@ -12,9 +12,8 @@ from app.models import Segment
 # Setup logging
 logger = logging.getLogger(__name__)
-# Constants
-APP_DIR = os.path.join(os.environ['HOME'], 'app')
-VOICE_MEMORIES_DIR = os.path.join(APP_DIR, "voice_memories")
 os.makedirs(VOICE_MEMORIES_DIR, exist_ok=True)
 @dataclass

 # Setup logging
 logger = logging.getLogger(__name__)
+# Path to store voice memories - use persistent location
+VOICE_MEMORIES_DIR = "/app/voice_memories"
 os.makedirs(VOICE_MEMORIES_DIR, exist_ok=True)
 @dataclass