# Use an official Python runtime as a base image
FROM python:3.10-slim

# Set environment variables
ENV TRANSFORMERS_CACHE=/app/cache \
    HF_HOME=/app/cache \
    DEBIAN_FRONTEND=noninteractive

# Set working directory
WORKDIR /app

# Install minimal system dependencies for running the app
RUN apt-get update && apt-get install -y --no-install-recommends \
      libgomp1 \
    && rm -rf /var/lib/apt/lists/*

# Prepare cache directory
RUN mkdir -p /app/cache && chmod -R 777 /app/cache

# Copy requirements and install Python packages
COPY requirements.txt .

# Install most packages from requirements.txt, then llama-cpp-python with binary-only
RUN grep -v "llama-cpp-python" requirements.txt | pip install --no-cache-dir -r /dev/stdin \
    && pip install --no-cache-dir --only-binary=all llama-cpp-python==0.3.14

# Copy application code and data
COPY app.py cv_embeddings.json cv_text.txt ./

# Expose the port your FastAPI app runs on
EXPOSE 7860

# Launch
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]