32 lines
756 B
Docker
32 lines
756 B
Docker
# Local LLM Agent - Inference Engine Dockerfile
#
# Base layer: the slim variant of the official Python 3.11 image.
FROM python:3.11-slim

# Relative paths used by later instructions (COPY destinations, the
# requirements file, the application module path) resolve against /app.
WORKDIR /app

# Install system dependencies
# curl is the only OS package added; the container health probe invokes it.
# The apt package lists are deleted in the same layer that downloads them so
# they are never stored in the image.
RUN apt-get update \
    && apt-get install --yes --no-install-recommends curl \
    && rm -rf /var/lib/apt/lists/*

# Copy requirements and install Python dependencies
# Only the manifest is copied at this point, so the install layer is rebuilt
# when requirements.txt changes rather than on every source edit.
COPY requirements.txt ./
RUN pip install --no-cache-dir --requirement requirements.txt

# Copy source code
# Create an unprivileged account so the service does not run as root.
# A fixed numeric UID/GID is used so runtimes that verify "non-root" by number
# (e.g. Kubernetes runAsNonRoot) can do so. /app is handed to that account so
# the process can still write inside its working directory.
RUN groupadd --gid 10001 app \
    && useradd --uid 10001 --gid app --home-dir /app --no-create-home \
        --shell /usr/sbin/nologin app \
    && chown app:app /app

# Copy the build context into /app, owned by the unprivileged account.
# NOTE(review): this copies the entire context; confirm a .dockerignore excludes
# .git, virtualenvs, and any .env files.
COPY --chown=app:app . .

# Everything from here on (health probe, application process) runs as this
# account. All root-only steps (apt, pip) have already completed above.
USER 10001:10001

# Set environment variables
#   PYTHONUNBUFFERED=1        - Python writes stdout/stderr without buffering.
#   PYTHONDONTWRITEBYTECODE=1 - Python does not write .pyc files.
#   INFERENCE_PORT=3161       - presumably read by the application; note that the
#                               start command and health probe pass 3161 literally
#                               and do not consult this variable.
ENV PYTHONUNBUFFERED=1 \
    PYTHONDONTWRITEBYTECODE=1 \
    INFERENCE_PORT=3161

# Expose port
# Declares the listening port for operators and tooling; it does not publish
# the port by itself.
EXPOSE 3161/tcp

# Health check
# Requests /health on the local port with curl. --fail makes curl return a
# non-zero status on HTTP error responses, and any curl failure is reported to
# Docker as exit code 1.
HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
    CMD curl --fail http://localhost:3161/health || exit 1

# Start the application
# Exec (JSON-array) form: uvicorn is started directly, without a wrapping
# shell. It serves the `app` object from src/main.py on all interfaces,
# port 3161.
CMD ["uvicorn", "src.main:app", \
     "--host", "0.0.0.0", \
     "--port", "3161"]