
Commit 7919143

Added containerization to the backend services, with both CPU and GPU support; rearranged requirement modules.
1 parent 152fca4 commit 7919143

File tree

5 files changed (+303, -4 lines)


backend/docker/Dockerfile (new file, +121 lines)
# Build-type selector for the final stage (cpu or gpu). Declared before the
# first FROM so docker-compose's BUILD_TYPE build arg can be substituted below.
ARG BUILD_TYPE=cpu

# Start with a universal base image for common setup
FROM ubuntu:22.04 AS universal-base

# Set environment variables
ENV PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    DEBIAN_FRONTEND=noninteractive \
    TZ=UTC

# Install system dependencies
RUN apt-get update && apt-get install -y --no-install-recommends \
    python3.10 \
    python3-pip \
    python3-dev \
    git \
    curl \
    wget \
    ffmpeg \
    libsndfile1 \
    build-essential \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Set working directory
WORKDIR /app

# Create directories for data and models
RUN mkdir -p /app/models /app/datasets /app/logs /app/local_data/tts

# CPU version - built directly from the universal base
FROM universal-base AS cpu

# Copy backend requirements
COPY backend/requirements.txt /app/

# First, install torch and faiss-cpu
RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cpu \
    && pip3 install faiss-cpu

# Next, install the remaining dependencies (filtering out torch and faiss-gpu)
RUN grep -v "torch==.*\|torch-.*\|faiss-gpu" requirements.txt > cpu_requirements.txt \
    && pip3 install --no-cache-dir -r cpu_requirements.txt

# GPU version - use the NVIDIA CUDA image
FROM nvidia/cuda:12.4.0-runtime-ubuntu22.04 AS gpu-base

# Set environment variables
ENV PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    DEBIAN_FRONTEND=noninteractive \
    TZ=UTC

# Install system dependencies
RUN apt-get update && apt-get install -y --no-install-recommends \
    python3.10 \
    python3-pip \
    python3-dev \
    git \
    curl \
    wget \
    ffmpeg \
    libsndfile1 \
    build-essential \
    && apt-get clean \
    && rm -rf /var/lib/apt/lists/*

# Set working directory
WORKDIR /app

# Create directories for data and models
RUN mkdir -p /app/models /app/datasets /app/logs /app/local_data/tts

# Complete GPU setup
FROM gpu-base AS gpu

# Copy backend requirements
COPY backend/requirements.txt backend/gpu-requirements.txt /app/

# Install GPU-specific dependencies
RUN pip3 install --no-cache-dir -r requirements.txt \
    && pip3 install --no-cache-dir -r gpu-requirements.txt

# Common steps for both CPU and GPU - using a separate stage for code copying
FROM ${BUILD_TYPE:-cpu} AS final

# Copy the application code from the backend directory
COPY backend/ /app/

# Create an entrypoint script
RUN echo '#!/bin/bash\n\
if [ ! -f "/app/config.yaml" ]; then\n\
echo "ERROR: Config file not found at /app/config.yaml"\n\
echo "Make sure to mount the config file from the host system:"\n\
echo "  -v /path/to/FluentAI/config.yaml:/app/config.yaml:ro"\n\
exit 1\n\
fi\n\
\n\
# Set config path explicitly\n\
export FLUENTAI_CONFIG_PATH=/app/config.yaml\n\
echo "Using config from: $FLUENTAI_CONFIG_PATH"\n\
\n\
# Check if languages.json exists\n\
if [ ! -f "/app/data/languages.json" ]; then\n\
echo "ERROR: languages.json not found at /app/data/languages.json"\n\
echo "Make sure the data directory is properly mounted:"\n\
echo "  -v /path/to/FluentAI/data:/app/data:ro"\n\
exit 1\n\
fi\n\
\n\
# Start the application using uvicorn\n\
uvicorn fluentai.api.app:app --host 0.0.0.0 --port 8000 "$@"\n\
' > /app/entrypoint.sh && chmod +x /app/entrypoint.sh

# Expose port
EXPOSE 8000

# Set entrypoint
ENTRYPOINT ["/app/entrypoint.sh"]

# Default command
CMD ["--host", "0.0.0.0", "--port", "8000"]

backend/docker/ReadME.md (new file, +78 lines)
# 🐳 Docker Setup for FluentAI Backend

This directory contains Docker configuration files for running the FluentAI backend service.

## 📂 Directory Structure
```
FluentAI/
├── config.yaml              # Root-level configuration file
├── backend/
│   ├── docker/              # This directory
│   │   ├── Dockerfile       # Main Dockerfile for Linux/NVIDIA
│   │   ├── Dockerfile.mac   # Special Dockerfile for Apple Silicon
│   │   ├── docker-compose.yml
│   │   └── README.md
```

## ⚙️ Configuration
The Docker setup uses the project's root-level configuration file at /FluentAI/config.yaml. Make sure this file exists and contains the necessary configuration.

## 🚀 Usage
Run all commands from the docker directory:
```
/FluentAI/backend/docker
```

### Choose the appropriate version for your hardware

#### 🖥️ For Linux/Windows with an NVIDIA GPU:
```
docker-compose up -d fluentai-gpu
```

#### 💻 For Linux/Windows, CPU only:
```
docker-compose up -d fluentai-cpu
```

#### 🍎 For Apple Silicon Macs (⚠️ work in progress 🚧):
```
docker-compose up -d fluentai-apple
```

### 🌐 View logs:
```
docker-compose logs -f
```

### 📊 Accessing the API
- CPU version: http://localhost:8000
- GPU version: http://localhost:8001
- Apple Silicon version: http://localhost:8002

The FastAPI documentation is available at /docs (e.g., http://localhost:8000/docs), or visit: https://fastapi.tiangolo.com/#example-upgrade
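To confirm that a container is actually serving requests, the same check used by the compose healthcheck can be run from the host. A minimal sketch, assuming the CPU variant on port 8000 (adjust the port for the other variants):

```
# -f makes curl exit with a non-zero status on HTTP errors, which is exactly
# how the docker-compose healthcheck probes the service.
curl -f http://localhost:8000/docs
```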
### 🛑 Stopping the Containers
```
docker-compose down
```

### 🔄 Rebuilding after Code Changes
```
docker-compose up -d --build fluentai-[cpu|gpu|apple]
```

### 💾 Data Persistence
The following Docker volumes are used for data persistence:
- models_data: Caches downloaded ML models
- datasets_data: Stores datasets
- local_data: Stores generated files (images, audio, etc.)
- logs_data: Stores application logs
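To see where these volumes live on the host, docker volume inspect can be used. A sketch, assuming the default Compose project name (the directory containing docker-compose.yml, i.e. "docker"), which Compose prepends to volume names:

```
# List the named volumes created by this compose file
docker volume ls | grep models_data
# Inspect one of them; "docker_models_data" assumes the default project name "docker"
docker volume inspect docker_models_data
```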
## ⚠️ Troubleshooting
### Missing or incorrect config file
Make sure the config file exists at /FluentAI/config.yaml. Docker Compose mounts this file directly into the container.
### Out of memory errors
Increase the memory limit for your Docker containers in the Docker Desktop settings.
### GPU not detected
For NVIDIA GPU users, ensure the NVIDIA Container Toolkit is properly installed:
```
docker run --rm --gpus all nvidia/cuda:12.4.0-base-ubuntu22.04 nvidia-smi
```
### Network issues downloading models
If you experience issues downloading models, check your network connectivity and, where authentication is required, make sure your Hugging Face credentials are set up correctly.
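If the models require authentication, one option is to inject a Hugging Face token into the container as an environment variable. A sketch, assuming the backend downloads models through huggingface_hub, which reads HF_TOKEN (or the older HUGGING_FACE_HUB_TOKEN); the token value below is a placeholder:

```
# One-off run with a token injected; --service-ports publishes the mapped port
docker-compose run --rm --service-ports -e HF_TOKEN=hf_xxxxxxxx fluentai-cpu
```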

backend/docker/docker-compose.yml (new file, +98 lines)
services:
  # CPU Version
  fluentai-cpu:
    container_name: fluentai-backend-cpu
    build:
      context: ../..
      dockerfile: backend/docker/Dockerfile
      target: final
      args:
        - BUILD_TYPE=cpu
    ports:
      - "8000:8000"
    volumes:
      - ../../config.yaml:/app/config.yaml:ro
      - models_data:/app/models
      - datasets_data:/app/datasets
      - local_data:/app/local_data
      - logs_data:/app/logs
      - ../../data:/app/data:ro
    environment:
      - FLUENTAI_CONFIG_PATH=/app/config.yaml
    restart: unless-stopped
    healthcheck:
      test: [ "CMD", "curl", "-f", "http://localhost:8000/docs" ]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 40s

  # GPU Version
  fluentai-gpu:
    container_name: fluentai-backend-gpu
    build:
      context: ../..
      dockerfile: backend/docker/Dockerfile
      target: final
      args:
        - BUILD_TYPE=gpu
    ports:
      - "8001:8000"
    volumes:
      - ../../config.yaml:/app/config.yaml:ro
      - models_data:/app/models
      - datasets_data:/app/datasets
      - local_data:/app/local_data
      - logs_data:/app/logs
      - ../../data:/app/data:ro
    environment:
      - FLUENTAI_CONFIG_PATH=/app/config.yaml
    restart: unless-stopped
    deploy:
      resources:
        reservations:
          devices:
            - driver: nvidia
              count: 1
              capabilities: [ gpu ]
    healthcheck:
      test: [ "CMD", "curl", "-f", "http://localhost:8000/docs" ]
      interval: 30s
      timeout: 10s
      retries: 3
      start_period: 40s

  # # Apple Silicon Version
  # fluentai-apple:
  #   container_name: fluentai-backend-mac
  #   build:
  #     context: ../..
  #     dockerfile: backend/docker/Dockerfile.mac
  #   platform: linux/arm64
  #   ports:
  #     - "8002:8000"
  #   volumes:
  #     - ../../config.yaml:/app/config.yaml:ro
  #     - models_data:/app/models
  #     - datasets_data:/app/datasets
  #     - local_data:/app/local_data
  #     - logs_data:/app/logs
  #     - ../../data:/app/data:ro
  #   environment:
  #     - FLUENTAI_CONFIG_PATH=/app/config.yaml
  #   restart: unless-stopped
  #   healthcheck:
  #     test: [ "CMD", "curl", "-f", "http://localhost:8000/docs" ]
  #     interval: 30s
  #     timeout: 10s
  #     retries: 3
  #     start_period: 40s

volumes:
  models_data:
    driver: local
  datasets_data:
    driver: local
  local_data:
    driver: local
  logs_data:
    driver: local
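Once the GPU service is up, a quick way to check that CUDA is actually visible inside the container is to query torch directly. A sketch, assuming the torch wheel pinned in backend/gpu-requirements.txt installed correctly:

```
# Should print "True" when the NVIDIA runtime and the CUDA wheels are working
docker-compose exec fluentai-gpu python3 -c "import torch; print(torch.cuda.is_available())"
```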

backend/gpu-requirements.txt (+2, -1)

@@ -4,4 +4,5 @@ torchaudio==2.5.1+cu124
 torchvision==0.20.1+cu124
 faiss-gpu ; sys_platform == 'linux'
 --extra-index-url https://download.pytorch.org/whl/cu124
-xformers==0.0.29
+xformers==0.0.29
+bitsandbytes==0.45.2

backend/requirements.txt (+4, -3)

@@ -18,7 +18,7 @@ Levenshtein==0.26.1
 pyclts==3.2.0
 panphon==0.21.2
 soundvectors==1.0
-datasets==3.2.0
+datasets==3.3.2
 GitPython==3.1.44
 googletrans==4.0.2
 pycountry==24.6.1
@@ -28,5 +28,6 @@ uvicorn[standard]==0.34.0 # ASGI server for FastAPI
 gtts==2.5.4
 ftfy==6.3.1
 einops==0.8.0
-bitsandbytes==0.45.2
-peft==0.14.0
+bitsandbytes==0.42.0
+peft==0.14.0
+xformers==0.0.29
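For a local (non-Docker) GPU environment, the same split can be reproduced by mirroring the GPU stage of the Dockerfile: install the shared pins first, then overlay the CUDA-specific pins. A sketch, assuming it is run from the repository root inside a virtual environment:

```
# The second install intentionally upgrades packages such as bitsandbytes to
# their CUDA-specific pins, just as the GPU image build does.
pip install --no-cache-dir -r backend/requirements.txt
pip install --no-cache-dir -r backend/gpu-requirements.txt
```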
