duckdb-data-api/cache_middleware.py at main · senthilsweb/duckdb-data-api · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
"""
cache_middleware.py

Implements caching for FastAPI requests to enhance performance and response times.
The middleware utilizes Upstash Redis due to limitations encountered with vercel-kv
in the Python environment. Vercel-kv offers native support for JavaScript but not for Python.

Caching is particularly important for this application as it uses MotherDuck, a serverless
version of DuckDB. While DuckDB is performant, deploying it at the edge with Vercel's hobby
plan introduces constraints such as memory and RAM limitations, and a function timeout of 10 seconds.
To mitigate these limitations and improve response times, a Redis cache was implemented.
Upstash Redis was chosen for its ease of integration with Vercel, offering 500 MB of free cache
storage under the hobby plan.

Cache keys are consistently lowercased and prefixed with 'duckdb-data-api:' to ensure
uniformity and to avoid case-sensitive cache misses. Only GET requests and a specific POST
request for executing SQL are cached.

For the POST method specific to the "/execute/sql" route, the caching strategy involves generating
a unique cache key based on the content of the request body. This is achieved by computing an MD5 checksum
of the POST body, ensuring that different contents produce different cache keys, thereby accurately
caching responses based on the actual query being executed. This method addresses the challenge of caching
dynamic content that could vary significantly with each request.
"""


from fastapi import Request
from starlette.middleware.base import BaseHTTPMiddleware
from starlette.responses import Response
from upstash_redis.asyncio import Redis
import hashlib

# Load environment variables
from dotenv import load_dotenv
load_dotenv()

# Initialize Upstash Redis using environment variables
redis = Redis.from_env()

class CacheMiddleware(BaseHTTPMiddleware):
    """
    Middleware to cache GET and specific POST request responses using Upstash Redis.
    Generates unique cache keys based on the request method, path, query parameters, and
    for POST requests, the content of the request body.
    """

    async def dispatch(self, request: Request, call_next):
        """
        Process an incoming request by checking if it's cached. If not, call the next
        request handler and cache the response if applicable.
        """
        # Construct the base cache key from the method and path
        base_key = f"{request.method}-{request.url.path}"

        # Special handling for POST to "/execute/sql"
        if request.method == "POST" and request.url.path == "/execute/sql":
            # Read and then reset the request body for hashing and processing
            body = await request.body()
            request._body = body  # Reset body after reading

            # Create a checksum of the body to use in the cache key
            checksum = hashlib.md5(body).hexdigest()
            cache_key = f"duckdb-data-api:{base_key}?{checksum}".lower()
        elif request.method == "GET":
            # Use query parameters to distinguish GET requests
            cache_key = f"duckdb-data-api:{base_key}?{request.query_params}".lower()
        else:
            cache_key = None

        # Try to retrieve the cached response
        if cache_key:
            cached_response = await redis.get(cache_key)
            if cached_response:
                print(f"Cache hit for key: {cache_key}")
                return Response(content=cached_response, status_code=200, media_type='application/json')
            print(f"Cache miss for key: {cache_key}")

        # Proceed with the actual request handling if no cache is found
        response = await call_next(request)

        # Cache the response if the status code is 200 and we have a cache key
        if response.status_code == 200 and cache_key:
            body = b''.join([chunk async for chunk in response.body_iterator])
            cache_content = body.decode()
            headers = {"Content-Length": str(len(cache_content))}
            await redis.set(cache_key, cache_content)
            print(f"Cached response for key: {cache_key}")
            return Response(content=cache_content, status_code=200, media_type='application/json', headers=headers)

        return response