# Image definition for the DeepSeek-R1-Distill-Llama-8B FastAPI server.
# Each instruction must sit on its own line: a Dockerfile line that begins
# with '#' is treated entirely as a comment, so collapsing the file onto one
# line leaves the build without any instructions (not even FROM).

# Base image with Python and CUDA support (for GPU)
FROM pytorch/pytorch:2.3.0-cuda11.8-cudnn8-runtime

# Metadata
LABEL maintainer="Shakeel Ahmed "
LABEL description="DeepSeek-R1-Distill-Llama-8B FastAPI Server"

# Create working directory; all relative paths below resolve against /app
WORKDIR /app

# Copy the dependency manifest on its own and install from it before copying
# the application code, so edits to app.py do not invalidate the cached
# dependency layer.
COPY requirements.txt .
RUN pip install --no-cache-dir -r requirements.txt

# Copy app code
COPY app.py .
COPY README.md .

# Optional: environment variables for performance
#   TRANSFORMERS_CACHE / HF_HOME - keep Hugging Face caches under /app
#   PYTHONUNBUFFERED             - write Python stdout/stderr without buffering
# NOTE(review): recent transformers releases deprecate TRANSFORMERS_CACHE in
# favour of HF_HOME; it is kept here so the cache location does not change.
# Confirm against the transformers version pinned in requirements.txt.
ENV TRANSFORMERS_CACHE=/app/cache \
    PYTHONUNBUFFERED=1 \
    HF_HOME=/app/hf_home

# Expose port (documentation only; must match --port in CMD below)
EXPOSE 7860

# Run FastAPI app with Uvicorn, listening on all interfaces
CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]