FROM nvidia/cuda:11.8-devel-ubuntu20.04

# Set environment variables
ENV PYTHONDONTWRITEBYTECODE=1
ENV PYTHONUNBUFFERED=1
ENV DEBIAN_FRONTEND=noninteractive

# Install system dependencies
RUN apt-get update && apt-get install -y \
    python3 \
    python3-pip \
    python3-dev \
    git \
    wget \
    curl \
    vim \
    htop \
    && rm -rf /var/lib/apt/lists/*

# Set working directory
WORKDIR /workspace/kskt

# Copy requirements first for better Docker caching
COPY requirements.txt .

# Install Python dependencies
RUN pip3 install --no-cache-dir -r requirements.txt

# Install additional dependencies for development
RUN pip3 install --no-cache-dir \
    jupyter \
    tensorboard \
    gradio \
    streamlit

# Copy project files
COPY . .

# Create necessary directories
RUN mkdir -p data/processed checkpoints logs results

# Set Python path
ENV PYTHONPATH=/workspace/kskt:$PYTHONPATH

# Expose ports for Jupyter, TensorBoard, and Gradio
EXPOSE 8888 6006 7860

# Create startup script
RUN echo '#!/bin/bash\n\
echo "KSKT Development Environment"\n\
echo "Available commands:"\n\
echo "  python train_kskt.py --help        # Training"\n\
echo "  python evaluate_kskt.py --help     # Evaluation"\n\
echo "  python inference.py --help         # Inference"\n\
echo "  python -m tests.test_kskt_model    # Run tests"\n\
echo "  jupyter lab --ip=0.0.0.0 --allow-root  # Start Jupyter"\n\
echo ""\n\
/bin/bash' > /start.sh && chmod +x /start.sh

# Set default command
CMD ["/start.sh"]


# ===== docker/docker-compose.yml =====
version: '3.8'

services:
  kskt-dev:
    build:
      context: ..
      dockerfile: docker/Dockerfile
    container_name: kskt-development
    volumes:
      - ../:/workspace/kskt
      - kskt-data:/workspace/kskt/data
      - kskt-checkpoints:/workspace/kskt/checkpoints
      - kskt-results:/workspace/kskt/results
    ports:
      - "8888:8888"  # Jupyter Lab
      - "6006:6006"  # TensorBoard
      - "7860:7860"  # Gradio
      - "8501:8501"  # Streamlit
    environment:
      - CUDA_VISIBLE_DEVICES=0
      - WANDB_API_KEY=${WANDB_API_KEY}
    runtime: nvidia
    shm_size: '2gb'
    stdin_open: true
    tty: true
    command: /bin/bash

  kskt-training:
    build:
      context: ..
      dockerfile: docker/Dockerfile
    container_name: kskt-training
    volumes:
      - ../:/workspace/kskt
      - kskt-data:/workspace/kskt/data
      - kskt-checkpoints:/workspace/kskt/checkpoints
    environment:
      - CUDA_VISIBLE_DEVICES=0,1,2,3
      - WANDB_API_KEY=${WANDB_API_KEY}
    runtime: nvidia
    shm_size: '4gb'
    command: >
      python train_kskt.py
      --train_data data/processed/character_profiles.json
      --val_data data/processed/character_bench_dev.json
      --output_dir checkpoints
      --batch_size 8
      --learning_rate 2e-5
      --wandb_project kskt-training
    profiles:
      - training

volumes:
  kskt-data:
  kskt-checkpoints:
  kskt-results:
