Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
16 commits
Select commit Hold shift + click to select a range
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 0 additions & 1 deletion .claude

This file was deleted.

3 changes: 3 additions & 0 deletions .env.example
Original file line number Diff line number Diff line change
Expand Up @@ -11,6 +11,9 @@ CODEX_LB_UPSTREAM_BASE_URL=https://chatgpt.com/backend-api
CODEX_LB_UPSTREAM_CONNECT_TIMEOUT_SECONDS=30
CODEX_LB_STREAM_IDLE_TIMEOUT_SECONDS=300

# Anthropic-compatible default reasoning effort (optional)
# CODEX_LB_ANTHROPIC_DEFAULT_REASONING_EFFORT=xhigh

# OAuth / token refresh
CODEX_LB_AUTH_BASE_URL=https://auth.openai.com
CODEX_LB_OAUTH_CLIENT_ID=app_EMoamEEZ73f0CkXaXp7hrann
Expand Down
43 changes: 42 additions & 1 deletion app/core/auth/dependencies.py
Original file line number Diff line number Diff line change
Expand Up @@ -2,7 +2,7 @@

import logging

from fastapi import Request, Security
from fastapi import HTTPException, Request, Security
from fastapi.security import HTTPAuthorizationCredentials, HTTPBearer

from app.core.clients.usage import UsageFetchError, fetch_usage
Expand All @@ -26,6 +26,10 @@ def set_openai_error_format(request: Request) -> None:
request.state.error_format = "openai"


def set_anthropic_error_format(request: Request) -> None:
    """Tag the request state so exception handlers render Anthropic-shaped errors."""
    state = request.state
    state.error_format = "anthropic"


def set_dashboard_error_format(request: Request) -> None:
    """Tag the request state so exception handlers render dashboard-shaped errors."""
    state = request.state
    state.error_format = "dashboard"

Expand All @@ -52,6 +56,26 @@ async def validate_proxy_api_key(
raise ProxyAuthError(str(exc)) from exc


async def validate_anthropic_api_key(
    request: Request,
    credentials: HTTPAuthorizationCredentials | None = Security(_bearer),
) -> ApiKeyData | None:
    """Authenticate an Anthropic-compat request via x-api-key or bearer token.

    Returns None when API-key auth is disabled in settings; otherwise the
    validated key data. Raises HTTPException(401) when the key is missing
    or fails validation.
    """
    settings = await get_settings_cache().get()
    if not settings.api_key_auth_enabled:
        return None

    api_key = _extract_anthropic_api_key(request, credentials)
    if api_key is None:
        raise HTTPException(status_code=401, detail="Missing API key")

    async with get_background_session() as session:
        try:
            return await ApiKeysService(ApiKeysRepository(session)).validate_key(api_key)
        except ApiKeyInvalidError as exc:
            raise HTTPException(status_code=401, detail=str(exc)) from exc


# --- Dashboard session auth ---


Expand Down Expand Up @@ -119,3 +143,20 @@ def _extract_bearer_token(authorization: str | None) -> str | None:
if not token:
return None
return token


def _extract_anthropic_api_key(
    request: Request,
    credentials: HTTPAuthorizationCredentials | None,
) -> str | None:
    """Return the client's API key, preferring the x-api-key header.

    Falls back to the HTTP bearer credentials when the header is absent or
    whitespace-only; returns None when neither yields a non-empty token.
    """
    header_value = request.headers.get("x-api-key")
    if header_value is not None and (stripped := header_value.strip()):
        return stripped
    if credentials is None:
        return None
    bearer_token = credentials.credentials.strip()
    return bearer_token or None
1 change: 1 addition & 0 deletions app/core/clients/proxy.py
Original file line number Diff line number Diff line change
Expand Up @@ -27,6 +27,7 @@
"content-length",
"host",
"forwarded",
"x-api-key",
"x-real-ip",
"true-client-ip",
}
Expand Down
11 changes: 11 additions & 0 deletions app/core/config/settings.py
Original file line number Diff line number Diff line change
Expand Up @@ -71,6 +71,7 @@ class Settings(BaseSettings):
log_proxy_request_shape: bool = False
log_proxy_request_shape_raw_cache_key: bool = False
log_proxy_request_payload: bool = False
anthropic_default_reasoning_effort: str | None = None
max_decompressed_body_bytes: int = Field(default=32 * 1024 * 1024, gt=0)
image_inline_fetch_enabled: bool = True
image_inline_allowed_hosts: Annotated[list[str], NoDecode] = Field(default_factory=list)
Expand Down Expand Up @@ -115,6 +116,16 @@ def _normalize_image_inline_allowed_hosts(cls, value: object) -> list[str]:
return normalized
raise TypeError("image_inline_allowed_hosts must be a list or comma-separated string")

@field_validator("anthropic_default_reasoning_effort")
@classmethod
def _normalize_anthropic_default_reasoning_effort(cls, value: str | None) -> str | None:
    """Trim surrounding whitespace; pass None through; reject empty values."""
    if value is None:
        return None
    stripped = value.strip()
    if stripped:
        return stripped
    raise ValueError("anthropic_default_reasoning_effort must be a non-empty string")


@lru_cache(maxsize=1)
def get_settings() -> Settings:
Expand Down
14 changes: 14 additions & 0 deletions app/core/errors.py
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,16 @@ class OpenAIErrorEnvelope(TypedDict):
error: OpenAIErrorDetail


class AnthropicErrorDetail(TypedDict):
    """Inner ``error`` object of an Anthropic-style error response."""

    # Anthropic error type string, e.g. "invalid_request_error" or "api_error".
    type: str
    # Human-readable description of the failure.
    message: str


class AnthropicErrorEnvelope(TypedDict):
    """Top-level Anthropic error payload: ``{"type": "error", "error": {...}}``."""

    # Always the literal string "error" in this envelope shape.
    type: Literal["error"]
    error: AnthropicErrorDetail


class DashboardErrorDetail(TypedDict):
    """Inner ``error`` object of a dashboard error response."""

    # Machine-readable code, e.g. "validation_error" or "http_404".
    code: str
    # Human-readable description of the failure.
    message: str
Expand Down Expand Up @@ -45,6 +55,10 @@ def openai_error(code: str, message: str, error_type: str = "server_error") -> O
return {"error": {"message": message, "type": error_type, "code": code}}


def anthropic_error(error_type: str, message: str) -> AnthropicErrorEnvelope:
    """Build an Anthropic-style error envelope from a type string and message."""
    detail: AnthropicErrorDetail = {"type": error_type, "message": message}
    return {"type": "error", "error": detail}


def dashboard_error(code: str, message: str) -> DashboardErrorEnvelope:
    """Build a dashboard-style error envelope from a code and message."""
    detail: DashboardErrorDetail = {"code": code, "message": message}
    return {"error": detail}

Expand Down
39 changes: 38 additions & 1 deletion app/core/handlers/exceptions.py
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@
from fastapi.responses import JSONResponse, Response
from starlette.exceptions import HTTPException as StarletteHTTPException

from app.core.errors import dashboard_error, openai_error
from app.core.errors import anthropic_error, dashboard_error, openai_error
from app.core.exceptions import (
AppError,
DashboardAuthError,
Expand Down Expand Up @@ -44,6 +44,18 @@
DashboardRateLimitError,
)

_ANTHROPIC_V1_PATH_PREFIXES: tuple[str, ...] = (
"/v1/messages",
"/v1/messages/count_tokens",
)


def _is_anthropic_v1_path(path: str) -> bool:
for prefix in _ANTHROPIC_V1_PATH_PREFIXES:
if path == prefix or path.startswith(f"{prefix}/"):
return True
return False


def _error_format(request: Request) -> str | None:
fmt = getattr(request.state, "error_format", None)
Expand All @@ -53,6 +65,10 @@ def _error_format(request: Request) -> str | None:
path = request.url.path
if path.startswith("/api/"):
return "dashboard"
if path.startswith("/anthropic/"):
return "anthropic"
if _is_anthropic_v1_path(path):
return "anthropic"
if path.startswith("/v1/") or path.startswith("/backend-api/"):
return "openai"
Comment on lines 72 to 73
Copy link
Copy Markdown

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

P2 Badge Route /v1/messages validation failures to Anthropic envelope

The fallback format detection still treats every /v1/* path as OpenAI, so requests like malformed JSON to /v1/messages (or /v1/messages/count_tokens) can bypass set_anthropic_error_format and return the OpenAI error shape instead of Anthropic's {"type":"error",...} envelope. Because JSON/body parsing errors are raised before route dependencies run, Anthropic clients can receive an incompatible error contract on exactly the endpoints this change adds.

Useful? React with 👍 / 👎.

return None
Expand Down Expand Up @@ -99,6 +115,11 @@ async def validation_error_handler(
status_code=422,
content=dashboard_error("validation_error", "Invalid request payload"),
)
if fmt == "anthropic":
return JSONResponse(
status_code=400,
content=anthropic_error("invalid_request_error", "Invalid request payload"),
)
if fmt == "openai":
error = openai_error("invalid_request_error", "Invalid request payload", error_type="invalid_request_error")
if exc.errors():
Expand All @@ -123,6 +144,17 @@ async def http_error_handler(
status_code=exc.status_code,
content=dashboard_error(f"http_{exc.status_code}", detail),
)
if fmt == "anthropic":
error_type = "invalid_request_error"
if exc.status_code == 401:
error_type = "authentication_error"
elif exc.status_code == 403:
error_type = "permission_error"
elif exc.status_code == 429:
error_type = "rate_limit_error"
elif exc.status_code >= 500:
error_type = "api_error"
return JSONResponse(status_code=exc.status_code, content=anthropic_error(error_type, detail))
if fmt == "openai":
error_type = "invalid_request_error"
code = "invalid_request_error"
Expand Down Expand Up @@ -155,6 +187,11 @@ async def unhandled_error_handler(request: Request, exc: Exception) -> JSONRespo
status_code=500,
content=dashboard_error("internal_error", "Unexpected error"),
)
if fmt == "anthropic":
return JSONResponse(
status_code=500,
content=anthropic_error("api_error", "Internal server error"),
)
if fmt == "openai":
return JSONResponse(
status_code=500,
Expand Down
7 changes: 6 additions & 1 deletion app/core/openai/message_coercion.py
Original file line number Diff line number Diff line change
Expand Up @@ -258,7 +258,12 @@ def _normalize_content_part(part: dict[str, JsonValue], role: str = "user") -> J
if part_type in ("text", "input_text", "output_text"):
text = part.get("text")
if isinstance(text, str):
return {"type": text_type, "text": text}
# Preserve cache-related and metadata fields while normalizing
# text part type for the target role.
normalized = dict(part)
normalized["type"] = text_type
normalized["text"] = text
return normalized
return part
if role == "assistant":
return part
Expand Down
1 change: 1 addition & 0 deletions app/core/openai/requests.py
Original file line number Diff line number Diff line change
Expand Up @@ -298,6 +298,7 @@ class ResponsesRequest(BaseModel):
previous_response_id: str | None = None
truncation: str | None = None
prompt_cache_key: str | None = None
prompt_cache_retention: str | None = None
text: ResponsesTextControls | None = None

@field_validator("input")
Expand Down
1 change: 1 addition & 0 deletions app/core/openai/v1_requests.py
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,7 @@ class V1ResponsesRequest(BaseModel):
previous_response_id: str | None = None
truncation: str | None = None
prompt_cache_key: str | None = None
prompt_cache_retention: str | None = None
text: ResponsesTextControls | None = None

@field_validator("input")
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,51 @@
"""add codex session/conversation hashes to request_logs

Revision ID: 013_add_request_logs_codex_session_hashes
Revises: 012_add_import_without_overwrite_and_drop_accounts_email_unique
Create Date: 2026-02-22
"""

from __future__ import annotations

import sqlalchemy as sa
from alembic import op
from sqlalchemy.engine import Connection

# revision identifiers, used by Alembic.
revision = "013_add_request_logs_codex_session_hashes"
down_revision = "012_add_import_without_overwrite_and_drop_accounts_email_unique"
branch_labels = None  # no named branch labels for this migration
depends_on = None  # no cross-branch dependencies


def _columns(connection: Connection, table_name: str) -> set[str]:
    """Return the column names of *table_name*, or an empty set when the table is absent."""
    inspector = sa.inspect(connection)
    if not inspector.has_table(table_name):
        return set()
    found: set[str] = set()
    for column in inspector.get_columns(table_name):
        name = column.get("name")
        if name is not None:
            found.add(str(name))
    return found


def upgrade() -> None:
    """Add nullable codex session/conversation hash columns when missing."""
    existing = _columns(op.get_bind(), "request_logs")
    if not existing:
        # request_logs table absent; nothing to alter.
        return

    with op.batch_alter_table("request_logs") as batch_op:
        for name in ("codex_session_hash", "codex_conversation_hash"):
            if name not in existing:
                batch_op.add_column(sa.Column(name, sa.String(), nullable=True))


def downgrade() -> None:
    """Drop the codex hash columns added by upgrade(), when present."""
    existing = _columns(op.get_bind(), "request_logs")
    if not existing:
        # request_logs table absent; nothing to alter.
        return

    with op.batch_alter_table("request_logs") as batch_op:
        for name in ("codex_conversation_hash", "codex_session_hash"):
            if name in existing:
                batch_op.drop_column(name)
2 changes: 2 additions & 0 deletions app/db/models.py
Original file line number Diff line number Diff line change
Expand Up @@ -83,6 +83,8 @@ class RequestLog(Base):
account_id: Mapped[str] = mapped_column(String, ForeignKey("accounts.id", ondelete="CASCADE"), nullable=False)
api_key_id: Mapped[str | None] = mapped_column(String, nullable=True)
request_id: Mapped[str] = mapped_column(String, nullable=False)
codex_session_hash: Mapped[str | None] = mapped_column(String, nullable=True)
codex_conversation_hash: Mapped[str | None] = mapped_column(String, nullable=True)
requested_at: Mapped[datetime] = mapped_column(DateTime, server_default=func.now(), nullable=False)
model: Mapped[str] = mapped_column(String, nullable=False)
input_tokens: Mapped[int | None] = mapped_column(Integer, nullable=True)
Expand Down
12 changes: 12 additions & 0 deletions app/dependencies.py
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@
from app.db.session import get_background_session, get_session
from app.modules.accounts.repository import AccountsRepository
from app.modules.accounts.service import AccountsService
from app.modules.anthropic_compat.service import AnthropicCompatService
from app.modules.api_keys.repository import ApiKeysRepository
from app.modules.api_keys.service import ApiKeysService
from app.modules.dashboard.repository import DashboardRepository
Expand Down Expand Up @@ -66,6 +67,11 @@ class ApiKeysContext:
service: ApiKeysService


@dataclass(slots=True)
class AnthropicCompatContext:
    """Dependency-injection bundle for the Anthropic-compat endpoints."""

    # Anthropic-compat service; constructed over the shared ProxyService
    # (see get_anthropic_compat_context).
    service: AnthropicCompatService


@dataclass(slots=True)
class RequestLogsContext:
session: AsyncSession
Expand Down Expand Up @@ -164,6 +170,12 @@ def get_api_keys_context(
return ApiKeysContext(session=session, repository=repository, service=service)


def get_anthropic_compat_context() -> AnthropicCompatContext:
    """Assemble the Anthropic-compat dependency context.

    Builds a fresh ProxyService with the shared repo factory and wraps it
    in an AnthropicCompatService.
    """
    compat_service = AnthropicCompatService(ProxyService(repo_factory=_proxy_repo_context))
    return AnthropicCompatContext(service=compat_service)


def get_request_logs_context(
session: AsyncSession = Depends(get_session),
) -> RequestLogsContext:
Expand Down
5 changes: 4 additions & 1 deletion app/main.py
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@
from app.core.usage.refresh_scheduler import build_usage_refresh_scheduler
from app.db.session import close_db, init_db
from app.modules.accounts import api as accounts_api
from app.modules.anthropic_compat import api as anthropic_compat_api
from app.modules.api_keys import api as api_keys_api
from app.modules.dashboard import api as dashboard_api
from app.modules.dashboard_auth import api as dashboard_auth_api
Expand Down Expand Up @@ -66,6 +67,8 @@ def create_app() -> FastAPI:
app.include_router(proxy_api.router)
app.include_router(proxy_api.v1_router)
app.include_router(proxy_api.usage_router)
app.include_router(anthropic_compat_api.router)
app.include_router(anthropic_compat_api.anthropic_router)
app.include_router(accounts_api.router)
app.include_router(dashboard_api.router)
app.include_router(usage_api.router)
Expand All @@ -80,7 +83,7 @@ def create_app() -> FastAPI:
index_html = static_dir / "index.html"
static_root = static_dir.resolve()
frontend_build_hint = "Frontend assets are missing. Run `cd frontend && bun run build`."
excluded_prefixes = ("api/", "v1/", "backend-api/", "health")
excluded_prefixes = ("api/", "v1/", "backend-api/", "anthropic/", "health")

def _is_static_asset_path(path: str) -> bool:
if path.startswith("assets/"):
Expand Down
1 change: 1 addition & 0 deletions app/modules/anthropic_compat/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@

Loading
Loading