-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathDockerfile
More file actions
46 lines (35 loc) · 1.73 KB
/
Dockerfile
File metadata and controls
46 lines (35 loc) · 1.73 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
# syntax=docker/dockerfile:1
# Use NVIDIA's official CUDA base image which includes the necessary GPU drivers.
FROM nvidia/cuda:12.1.1-base-ubuntu22.04

# Install Python, pip, venv, and essential build tools.
# --no-install-recommends keeps the layer minimal; the apt list cache is
# removed in the same layer so it never persists in the image.
RUN apt-get update && apt-get install -y --no-install-recommends \
    build-essential \
    git \
    python3-pip \
    python3.10 \
    python3.10-venv \
    && rm -rf /var/lib/apt/lists/*

# Set python3.10 as the default python3 interpreter.
RUN update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.10 1

# Set the working directory inside the container.
WORKDIR /code

# Runtime environment: no .pyc files, unbuffered stdout/stderr (required for
# live log streaming on Cloud Run), and writable cache locations for the
# pre-downloaded models and NLTK data.
ENV PYTHONDONTWRITEBYTECODE=1 \
    PYTHONUNBUFFERED=1 \
    SENTENCE_TRANSFORMERS_HOME=/tmp/sentence_transformers_cache \
    NLTK_DATA=/tmp/nltk_data

# Copy the requirements file first to leverage Docker's layer caching:
# the dependency layer is rebuilt only when requirements.txt changes.
COPY requirements.txt .
# Install the Python dependencies from the requirements.txt file.
RUN pip3 install --no-cache-dir -r requirements.txt

# Pre-download all models and data during the build phase so container cold
# starts do not pay the download cost.
RUN python3 -c "from sentence_transformers import SentenceTransformer, CrossEncoder; import nltk; \
SentenceTransformer('BAAI/bge-small-en-v1.5'); \
CrossEncoder('cross-encoder/ms-marco-MiniLM-L-6-v2'); \
nltk.download('punkt_tab', download_dir='/tmp/nltk_data')"

# Copy the rest of the application's source code into the container.
COPY . .

# Run as a non-root user. It must own the app dir and the model caches so
# the libraries can read (and, if needed, lock/refresh) cached files at runtime.
RUN useradd --system --uid 10001 --create-home appuser \
    && chown -R appuser:appuser /code /tmp/sentence_transformers_cache /tmp/nltk_data
USER appuser

# Documentation only (does not publish the port): 8000 is this app's default.
EXPOSE 8000

# Honor the $PORT environment variable injected by Cloud Run at runtime;
# ${PORT:-8000} falls back to 8000 for local testing. The exec-form sh -c
# wrapper with `exec` expands the variable while still making uvicorn PID 1,
# so it receives SIGTERM directly on `docker stop` / instance shutdown.
CMD ["/bin/sh", "-c", "exec uvicorn main:app --host 0.0.0.0 --port ${PORT:-8000}"]