# Image for the inference service: CUDA 12.1 runtime on Ubuntu 22.04, the
# Python dependencies listed below, and the application copied into /app.
# The container starts `python3 main.py` and documents port 8000.
FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04

WORKDIR /app

# Install system dependencies.
# - update + install + list cleanup stay in one layer so the apt index is
#   never cached stale and never shipped in the image.
# - DEBIAN_FRONTEND is set inline (not via ENV) so it only affects this build
#   step and does not leak into the runtime environment.
# - --no-install-recommends keeps the image small; ca-certificates is listed
#   explicitly because curl/git need it for HTTPS once recommends are skipped.
#   If a Python dependency ever has to be compiled from source, build tools
#   (e.g. build-essential, python3-dev) must be added here.
# NOTE(review): `pip3` (from python3-pip) and `python3` in CMD resolve to the
# distribution's default interpreter (3.10 on Ubuntu 22.04, as far as I know),
# not to python3.11. python3.11 is kept installed to avoid changing the image
# contents, but it looks unused — confirm which interpreter is intended.
RUN apt-get update \
    && DEBIAN_FRONTEND=noninteractive apt-get install -y --no-install-recommends \
        ca-certificates \
        curl \
        git \
        python3-pip \
        python3.11 \
    && rm -rf /var/lib/apt/lists/*

# Install Python dependencies (before copying the source so this expensive
# layer is reused when only application code changes).
# TODO: pin versions (ideally via a requirements/lock file) so rebuilds are
# reproducible; the set below currently floats to whatever is latest.
RUN pip3 install --no-cache-dir \
        accelerate \
        einops \
        fastapi \
        httpx \
        pillow \
        pydantic \
        python-multipart \
        sentencepiece \
        tiktoken \
        torch \
        torchvision \
        transformers \
        uvicorn \
        verovio

# Create an unprivileged user with a fixed UID/GID and a real home directory
# (so anything that writes under $HOME has a writable location), and hand
# /app over to it. Done after the root-only install steps above.
RUN groupadd --system --gid 10001 app \
    && useradd --system --uid 10001 --gid app --create-home --home-dir /home/app app \
    && chown app:app /app

# Copy inference service, owned by the runtime user.
# A .dockerignore is recommended so .git, caches and local secrets are not
# sent with the build context.
COPY --chown=app:app . /app

# Drop root for the running container.
USER app

# Expose port (documentation only; publish it with `docker run -p`).
EXPOSE 8000

# Run inference service (exec form so the process receives signals directly).
CMD ["python3", "main.py"]