mirror of
https://github.com/karpathy/nanochat.git
synced 2026-05-08 08:49:53 +00:00
- FastAPI service that manages conversations and messages in PostgreSQL
(SQLAlchemy 2.0 async + asyncpg) and streams assistant responses back
to the client via sse-starlette, forwarding the inference service SSE
contract unchanged.
- Auth guard validates every request against the auth service
/auth/validate endpoint (X-Internal-API-Key) and caches results in an
in-process TTL cache (5 min, 1024 entries) to absorb request bursts.
- Every query filters by authenticated user_id; cross-user access
returns 404. Message send flow auto-titles the first message,
persists the streamed assistant response after the client disconnects,
and records token_count + inference_time_ms.
- /api/models{,/swap} proxies the inference admin surface; swap
requires is_admin on the validated user.
- Structured JSON logging via structlog with trace_id + user_id
ContextVars attached to every log line.
- Test suite (pytest + aiosqlite + respx) covers CRUD, user scoping,
streaming SSE persistence, regenerate, model proxy admin gate,
and the stream proxy error path. 16/16 passing.
Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
35 lines
794 B
Docker
35 lines
794 B
Docker
FROM python:3.12-slim
|
|
|
|
ENV PYTHONDONTWRITEBYTECODE=1 \
|
|
PYTHONUNBUFFERED=1 \
|
|
UV_SYSTEM_PYTHON=1 \
|
|
UV_LINK_MODE=copy
|
|
|
|
RUN apt-get update \
|
|
&& apt-get install -y --no-install-recommends build-essential curl \
|
|
&& rm -rf /var/lib/apt/lists/*
|
|
|
|
RUN pip install --no-cache-dir uv==0.4.30
|
|
|
|
WORKDIR /app
|
|
|
|
COPY pyproject.toml README.md /app/
|
|
|
|
RUN uv pip install --system --no-cache \
|
|
"fastapi>=0.117.1" \
|
|
"uvicorn[standard]>=0.36.0" \
|
|
"pydantic>=2.8.0" \
|
|
"pydantic-settings>=2.4.0" \
|
|
"sqlalchemy[asyncio]>=2.0.36" \
|
|
"asyncpg>=0.29.0" \
|
|
"httpx>=0.27.0" \
|
|
"sse-starlette>=2.1.3" \
|
|
"structlog>=24.4.0" \
|
|
"cachetools>=5.5.0"
|
|
|
|
COPY src /app/src
|
|
|
|
EXPOSE 8002
|
|
|
|
CMD ["uvicorn", "src.main:app", "--host", "0.0.0.0", "--port", "8002"]
|