-
Notifications
You must be signed in to change notification settings - Fork 2
Expand file tree
/
Copy pathmain.py
More file actions
122 lines (96 loc) · 4.42 KB
/
main.py
File metadata and controls
122 lines (96 loc) · 4.42 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
"""Claude Code xAI Bridge -- Anthropic Messages API to xAI Grok proxy.
Receives Claude Code traffic on /v1/messages, translates to xAI Responses
API format, forwards to xAI, translates response back. Enrichment hooks
inject Agentic API Standard context.
As of issue #51, ALL models default to /v1/responses (Responses API).
As of issue #52, the Chat Completions handler delegates to the Responses
handler — both code paths now use the same translation and transport.
Set XAI_USE_CHAT_COMPLETIONS=true to force the legacy entry point (which
still delegates to Responses API internally).
"""
from fastapi import FastAPI, Request
from fastapi.responses import JSONResponse
import httpx
import os
import json
import time
from dotenv import load_dotenv
from bridge.logging_config import configure_logging, get_logger
from translation.forward import strip_thinking
from translation.config import TranslationConfig
from translation.model_routing import detect_endpoint, XAIEndpoint, use_legacy_chat_completions
from translation.tools import set_tool_enrichment_hook, reset_enrichment_overhead
from enrichment.factory import create_enricher
from handlers.chat_completions import handle_chat_completions
from handlers.responses import handle_responses
# --- Module-level startup: executed once at import time. ---
load_dotenv()
configure_logging()
logger = get_logger("main")
app = FastAPI(title="xai-agentic-claude-bridge")

# Missing key is logged but non-fatal so the server can still boot;
# upstream calls will fail until it is set.
XAI_API_KEY = os.getenv("XAI_API_KEY", "")
if not XAI_API_KEY:
    logger.warning("XAI_API_KEY not set. Requests to xAI will fail.")

# One shared async HTTP client for all upstream xAI traffic (120s timeout).
client = httpx.AsyncClient(base_url="https://api.x.ai/v1", timeout=120.0)

# Enrichment hook: injects Agentic API Standard context into tool definitions.
enricher = create_enricher()
set_tool_enrichment_hook(enricher.enrich)
logger.info("Enrichment mode: %s", enricher.config.mode)

# Translation settings (model aliases etc.) shared by the request handler.
_config = TranslationConfig()

# Log the default API path at startup.
if use_legacy_chat_completions():
    logger.info("API path: Chat Completions (legacy, XAI_USE_CHAT_COMPLETIONS=true)")
else:
    logger.info("API path: Responses API (default, issue #51 migration)")
@app.head("/")
@app.get("/")
async def root() -> dict:
    """Liveness endpoint; Claude Code probes connectivity with HEAD /."""
    payload = {"status": "ok"}
    return payload
@app.get("/manifest")
async def get_manifest() -> dict:
    """Serve the bridge's manifest from `manifest.json` on disk.

    Re-read on every request so manifest edits are picked up without a
    restart. A missing or malformed file raises (surfaced as a 500 by
    FastAPI); there is no caching.
    """
    # Explicit encoding: JSON should be decoded as UTF-8 regardless of
    # the platform's default codec (fix: original relied on the default).
    with open("manifest.json", encoding="utf-8") as f:
        return json.load(f)
@app.get("/health")
async def health() -> dict:
    """Report service health plus the active model and enrichment mode."""
    model_name = os.getenv("GROK_MODEL", "grok-4.20-reasoning-latest")
    status_report = {
        "status": "healthy",
        "model": model_name,
        "enrichment_mode": enricher.config.mode,
    }
    return status_report
@app.post("/v1/messages", response_model=None)
async def messages(request: Request):
    """Anthropic Messages endpoint: translate and proxy the request to xAI.

    Pipeline: parse body -> strip unsupported thinking blocks -> resolve
    the model alias -> route to the Chat Completions or Responses handler.
    All failures are returned in Anthropic's error envelope rather than
    leaking raw exceptions.
    """
    start = time.time()
    reset_enrichment_overhead()
    try:
        # Parse inside the try so a malformed JSON body produces a
        # structured error envelope instead of an unhandled exception
        # (fix: the original awaited request.json() before the try).
        body = await request.json()
        msg_count = len(body.get("messages", []))
        tool_count = len(body.get("tools", []) or [])
        has_thinking = "thinking" in body
        is_stream = bool(body.get("stream"))
        logger.info(
            "POST /v1/messages model=%s messages=%d tools=%d thinking=%s stream=%s",
            body.get("model", "?"), msg_count, tool_count, has_thinking, is_stream,
        )
        # strip_thinking mutates body in place and reports degraded features.
        bridge_warnings = strip_thinking(body)
        if bridge_warnings:
            for w in bridge_warnings:
                logger.debug("Degraded feature: %s", w)
        resolved_model = _config.resolve_model(body.get("model", ""))
        endpoint = detect_endpoint(resolved_model)
        logger.debug("Routing model=%s to %s", resolved_model, endpoint.value)
        if endpoint == XAIEndpoint.CHAT_COMPLETIONS:
            return await handle_chat_completions(body, bridge_warnings, start, client, XAI_API_KEY)
        return await handle_responses(body, bridge_warnings, start, client, XAI_API_KEY)
    except json.JSONDecodeError as e:
        # Client sent a non-JSON body: reply 400, not a generic 500.
        logger.warning("Invalid JSON body: %s", e)
        return JSONResponse(status_code=400, content={
            "type": "error", "error": {"type": "invalid_request_error",
            "message": f"Request body is not valid JSON: {e}"}})
    except NotImplementedError as e:
        # Handlers raise NotImplementedError for features the bridge
        # deliberately does not translate.
        logger.warning("Unsupported feature: %s", e)
        return JSONResponse(status_code=400, content={
            "type": "error", "error": {"type": "invalid_request_error", "message": str(e),
            "suggestion": "Use native Anthropic API for this feature."}})
    except Exception as e:
        # Last-resort boundary: log the traceback and return Anthropic's
        # api_error shape with HATEOAS-style retry/manifest links.
        logger.exception("Bridge error: %s", e)
        return JSONResponse(status_code=500, content={
            "type": "error", "error": {"type": "api_error", "message": str(e),
            "suggestion": "Retry the request. Check XAI_API_KEY."},
            "_links": {"retry": {"href": "/v1/messages", "method": "POST"}, "manifest": {"href": "/manifest"}}})
if __name__ == "__main__":
    # Local development entry point; deployments run an external ASGI server.
    import uvicorn

    bind_host = os.getenv("HOST", "0.0.0.0")
    bind_port = int(os.getenv("PORT", "4000"))
    uvicorn.run(app, host=bind_host, port=bind_port)