duckdb-data-api/main.py at main · senthilsweb/duckdb-data-api · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
"""
File Name: main.py
Author(s): Sernthilnathan Karuppaiah and ChatGPT4 :-)
Date: 14-Mar-2024
Description: This FastAPI application serves as a data proxy to DuckDB, offering endpoints for basic database
             operations such as listing tables, reading table data with optional filtering, sorting, and pagination,
             and a debug endpoint to check database connectivity. It is designed for dynamic usage, following
             the ActiveRecord design pattern akin to a Rails-type microORM, and utilizes SQLAlchemy for
             database interaction.
"""

from fastapi import FastAPI, Depends, HTTPException, Request, Query, Path, Body
from fastapi.encoders import jsonable_encoder
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import JSONResponse
import sqlglot
from sqlglot import parse_one, exp
from sqlglot.optimizer import optimize
from sqlalchemy import create_engine, text
from sqlalchemy.orm import sessionmaker, Session
from typing import List, Dict, Any
from pydantic import BaseModel
from datetime import datetime
from cache_middleware import CacheMiddleware
import os
from dotenv import load_dotenv
import math
from decimal import Decimal
from sqlalchemy.sql import text


# Initialize environment variables and set HOME for duckDB compatibility in serverless environments.
# Only load .env file if running locally and not in Vercel
if os.environ.get('VERCEL', None) != '1':
    # Clear all environment variables
    os.environ.clear()
    load_dotenv()

os.environ['HOME'] = '/tmp'
# Initialize environment variables and set HOME for duckDB compatibility in serverless environments.
# Only load .env file if running locally and not in Vercel
if os.environ.get('VERCEL', None) != '1':
    load_dotenv()

# Configuration variables
DATABASE_URL = os.getenv("DUCKDB_DATABASE_URL", default="duckdb:///tickit.duckdb")
print(f"DATABASE_URL = [{DATABASE_URL}]")
SCHEMA_NAME = os.getenv("DUCKDB_SCHEMA_NAME", default="main")
print(f"SCHEMA_NAME = [{SCHEMA_NAME}]")
BLACKLIST_KEYWORDS = [keyword for keyword in os.getenv("QUERY_BLACKLIST", "").split(",") if keyword]


# Database engine setup
engine = create_engine(DATABASE_URL)
SessionLocal = sessionmaker(autocommit=False, autoflush=False, bind=engine)

app = FastAPI()
#app.add_middleware(CacheMiddleware)

# Dependency to get the database session
def get_db():
    db = SessionLocal()
    try:
        yield db
    finally:
        db.close()

app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],  # Allow all origins
    allow_credentials=True,
    allow_methods=["*"],  # Allow all methods
    allow_headers=["*"],  # Allow all headers
)

@app.get("/")
async def root():
    """Root endpoint returning welcome message."""
    return {"message": "Welcome to DuckDB Data Proxy!"}

@app.get("/health")
async def health_check():
    """Health check endpoint."""
    return {"message": "I am doing great!"}

@app.get("/debug/connection")
def debug_connection(db: Session = Depends(get_db)):
    """
    Debug endpoint to test database connection.

    Attempts a simple query to verify database connectivity.
    """
    try:
        result = db.execute(text("SELECT 1"))
        return {"status": "success", "message": "Database connection established successfully."}
    except Exception as e:
        return {"status": "error", "message": str(e)}


def prepare_where_clauses(request: Request):
    """
    Prepares WHERE clauses for SQL queries based on request query parameters.

    Supports various operators like .eq, .gt, .gte, .lt, .lte, .neq, and .like.
    """
    where_clauses = []
    params = {}
    for key, value in request.query_params.items():
        if key not in ["select", "limit", "offset", "order"]:
            operator = "="  # Default operator
            if key.endswith(".eq"):
                operator = "="
                key = key[:-3]
            elif key.endswith(".gt"):
                operator = ">"
                key = key[:-3]
            elif key.endswith(".gte"):
                operator = ">="
                key = key[:-4]
            elif key.endswith(".lt"):
                operator = "<"
                key = key[:-3]
            elif key.endswith(".lte"):
                operator = "<="
                key = key[:-4]
            elif key.endswith(".neq"):
                operator = "<>"
                key = key[:-4]
            elif key.endswith(".like"):
                operator = "ILIKE"
                key = key[:-5]
            where_clauses.append(f"{key} {operator} :{key}")
            params[key] = value
    return " AND ".join(where_clauses), params

@app.get("/entity/{table_name}", response_model=List[Dict[str, Any]])
def get_entities(table_name: str, request: Request, select: str = Query("*"),
                    order: str = Query(None), skip: int = Query(0, alias="offset"),
                    limit: int = Query(100), db: Session = Depends(get_db)):
    """
    Endpoint to read data from a specified table with optional filtering, sorting, and pagination.

    Validates table name against existing tables to prevent SQL injection.
    """
    # Validate table name
    if table_name not in list_tables(db):
        raise HTTPException(status_code=404, detail="Table not found")

    # Construct query with optional WHERE, ORDER BY, and pagination
    base_query = f"SELECT {select} FROM  {SCHEMA_NAME}.{table_name}"
    where_clauses, params = prepare_where_clauses(request)
    if where_clauses:
        base_query += f" WHERE {where_clauses}"
        count_query = f"SELECT COUNT(*) FROM {SCHEMA_NAME}.{table_name} WHERE {where_clauses}"

    else:
        count_query = f"SELECT COUNT(*) FROM {SCHEMA_NAME}.{table_name}"

    if order:
        base_query += f" ORDER BY {order}"
    base_query += " LIMIT :limit OFFSET :offset"
    print(f"base_query = {base_query}")
    params.update({"limit": limit, "offset": skip})
    print(f"params = {params}")
    # Execute query and handle results
    try:
        result_proxy = db.execute(text(base_query), params)
        results = result_proxy.fetchall()
        # Use params for count query as well to respect WHERE conditions
        total_count = db.execute(text(count_query), params).scalar()
        page_number = math.ceil(skip / limit) + 1
        total_pages = math.ceil(total_count / limit)
        response_data = {
            "total_rows": total_count,
            "total_pages": total_pages,
            "limit": limit,
            "offset": skip,
            "current_page": page_number,
            "data": [{key: (value.isoformat() if isinstance(value, datetime) else value)
                      for key, value in dict(zip(result_proxy.keys(), row)).items()} for row in results]
        }
        return JSONResponse(content=response_data)
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))

@app.get("/entity/{table_name}/{id}", response_model=Dict[str, Any])
def get_entity(table_name: str, id: int = Path(..., description="The ID of the entity to retrieve"),
               db: Session = Depends(get_db)):
    """
    Dynamically fetches a single entity by its ID from a specified table.

    Parameters:
    - table_name: str - The name of the table from which to retrieve the entity.
    - id: int - The unique identifier of the entity to retrieve.

    Returns a single entity matching the given ID from the specified table, with datetime fields properly serialized.
    """
    # Validate table name
    if table_name not in list_tables(db):
        raise HTTPException(status_code=404, detail="Table not found")

    query = text(f"SELECT * FROM {SCHEMA_NAME}.{table_name} WHERE id = :id")
    result = db.execute(query, {"id": id}).fetchone()

    if result is None:
        raise HTTPException(status_code=404, detail=f"Record [{id}] not found in [{SCHEMA_NAME}.{table_name}]")

    # Convert the RowProxy object to a dictionary
    result_dict = {key: value for key, value in result._mapping.items()}

    # Serialize using jsonable_encoder to handle datetime and other complex types
    return jsonable_encoder(result_dict)

@app.delete("/entity/{table_name}/{id}", response_model=Dict[str, Any])
def delete_entity(table_name: str, id: int = Path(..., description="The ID of the entity to delete"),
                  db: Session = Depends(get_db)):
    """
    Deletes a single entity by its ID from a specified table.
    """
   # Validate table name
    if table_name not in list_tables(db):
        raise HTTPException(status_code=404, detail="Table not found")

    # Check if the entity exists
    exists_query = text(f"SELECT EXISTS(SELECT 1 FROM {SCHEMA_NAME}.{table_name} WHERE id = :id)")
    exists = db.execute(exists_query, {"id": id}).scalar()

    if not exists:
        raise HTTPException(status_code=404, detail=f"Record [{id}] not found in [{SCHEMA_NAME}.{table_name}]")

    # Delete the entity
    delete_query = text(f"DELETE FROM {SCHEMA_NAME}.{table_name} WHERE id = :id")
    db.execute(delete_query, {"id": id})
    db.commit()

    return {"message": f"Record [{id}] deleted successfully from [{SCHEMA_NAME}.{table_name}]"}

@app.post("/entity/{table_name}", response_model=Dict[str, Any])
def create_entity(table_name: str, entity_data: Dict[str, Any] = Body(...),
                  db: Session = Depends(get_db)):
    """
    Creates a new entity in the specified table with the provided data.
    """
    # Validate table name
    if table_name not in list_tables(db):
        raise HTTPException(status_code=404, detail="Table not found")

    # Constructing SQL INSERT statement dynamically based on entity_data
    columns = ', '.join(entity_data.keys())
    values = ', '.join([f":{key}" for key in entity_data.keys()])
    insert_query = text(f"INSERT INTO {SCHEMA_NAME}.{table_name} ({columns}) VALUES ({values}) RETURNING *")

    # Execute the query and fetch the newly created entity
    result = db.execute(insert_query, entity_data).fetchone()
    db.commit()

    if result is None:
        raise HTTPException(status_code=500, detail="Failed to create record")

    # Convert the RowProxy object to a dictionary
    result_dict = {key: value for key, value in result._mapping.items()}

    # Serialize using jsonable_encoder to handle datetime and other complex types
    return jsonable_encoder(result_dict)

@app.patch("/entity/{table_name}/{id}", response_model=Dict[str, Any])
def update_entity(table_name: str, id: int, update_data: Dict[str, Any] = Body(...),
                  db: Session = Depends(get_db)):
    """
    Updates an existing entity in the specified table with the provided data.
    """
    # Validate table name
    if table_name not in list_tables(db):
        raise HTTPException(status_code=404, detail="Table not found")

    # First, check if the entity exists
    exists_query = text(f"SELECT EXISTS(SELECT 1 FROM {SCHEMA_NAME}.{table_name} WHERE id = :id)")
    exists = db.execute(exists_query, {"id": id}).scalar()
    if not exists:
        raise HTTPException(status_code=404, detail="Entity not found")

    # Constructing SQL UPDATE statement dynamically based on update_data
    set_clauses = ', '.join([f"{key} = :{key}" for key in update_data.keys()])
    update_query = text(f"UPDATE {SCHEMA_NAME}.{table_name} SET {set_clauses} WHERE id = :id RETURNING *")

    # Execute the query and fetch the updated entity
    result = db.execute(update_query, {**update_data, "id": id}).fetchone()
    db.commit()

    if result is None:
        raise HTTPException(status_code=500, detail="Failed to update record [{id}] in [{table_name}]")

    # Convert the result row to a dict to ensure compatibility with FastAPI's response_model
    updated_entity = {column: value for column, value in result._mapping.items()}
    return updated_entity

@app.put("/entity/{table_name}/{id}", response_model=Dict[str, Any])
def replace_entity(table_name: str, id: int, new_data: Dict[str, Any] = Body(...),
                   db: Session = Depends(get_db)):

    if table_name not in list_tables(db):
        raise HTTPException(status_code=404, detail="Table not found")

    # First, check if the entity exists
    exists_query = text(f"SELECT EXISTS(SELECT 1 FROM {SCHEMA_NAME}.{table_name} WHERE id = :id)")
    exists = db.execute(exists_query, {"id": id}).scalar()
    if not exists:
        raise HTTPException(status_code=404, detail="Table not found")

    # Assuming all fields must be provided for a PUT operation, construct a dynamic UPDATE statement
    set_clauses = ', '.join([f"{key} = :{key}" for key in new_data.keys()])
    update_query = text(f"UPDATE {SCHEMA_NAME}.{table_name} SET {set_clauses} WHERE id = :id RETURNING *")

    # Execute the query and fetch the updated entity
    result = db.execute(update_query, {**new_data, "id": id}).fetchone()
    db.commit()

    if result is None:
        raise HTTPException(status_code=500, detail="Failed to replace record [{id}] in [{table_name}]")

    # Convert the result row to a dict to ensure compatibility with FastAPI's response_model
    replaced_entity = {column: value for column, value in result._mapping.items()}
    return replaced_entity

def is_query_blacklisted(query: str) -> bool:
    # Check if BLACKLIST_KEYWORDS is actually empty or contains only an empty string
    if not BLACKLIST_KEYWORDS or BLACKLIST_KEYWORDS == ['']:
        return False

    query_lower = query.lower()
    for keyword in BLACKLIST_KEYWORDS:
        # Skip empty strings which might be a result of splitting an empty environment variable
        if keyword and keyword in query_lower:
            return True
    return False

@app.post("/execute/sql")
def execute_custom_query(query: str = Body(..., embed=True), db: Session = Depends(get_db)):
    """
    Executes a custom SQL query, which can be a SELECT statement or a DDL statement.
    Checks against a blacklist for prohibited keywords.

    Parameters:
    - query: str - The SQL query to execute.

    If the query is a SELECT statement, returns the fetched data.
    For DDL statements, returns a confirmation message.
    """
    #query = query.strip().lower()
    query = query.strip()
    if is_query_blacklisted(query):
        raise HTTPException(status_code=403, detail="The query contains prohibited keywords.")

    if query.startswith("select") or query.startswith("SELECT"):
        # It's a select query
        return execute_select_query(query, db)
    else:
        # It's a DDL query
        return execute_ddl_query(query, db)


@app.get("/metadata/databases", response_model=List[Dict[str, Any]])
def get_md_duckdb_databases(db: Session = Depends(get_db)):
    return execute_metadata_query("SELECT * FROM duckdb_databases", db)

@app.get("/metadata/schemas", response_model=List[Dict[str, Any]])
def get_md_duckdb_databases(db: Session = Depends(get_db)):
    return execute_metadata_query("SELECT * FROM duckdb_schemas", db)

@app.get("/metadata/tables", response_model=List[Dict[str, Any]])
def get_md_duckdb_databases(db: Session = Depends(get_db)):
    return execute_metadata_query("SELECT * FROM duckdb_columns", db)

@app.get("/metadata/columns", response_model=List[Dict[str, Any]])
def get_md_duckdb_databases(db: Session = Depends(get_db)):
    return execute_metadata_query("SELECT * FROM duckdb_columns", db)

@app.get("/metadata/views", response_model=List[Dict[str, Any]])
def get_md_duckdb_databases(db: Session = Depends(get_db)):
    return execute_metadata_query("SELECT * FROM duckdb_views", db)

@app.get("/metadata/constraints", response_model=List[Dict[str, Any]])
def get_md_duckdb_databases(db: Session = Depends(get_db)):
    return execute_metadata_query("SELECT * FROM duckdb_constraints", db)

@app.get("/metadata/{path:path}", response_model=List[Dict[str, Any]])
def handle_metadata_routes(path: str, db: Session = Depends(get_db)):
    """
    Handles metadata routes dynamically for DuckDB catalogs, schemas, tables, and columns.
    Retrieves all available fields from the information schema.
    """
    parts = path.split("/")  # Split the path into components

    if len(parts) == 1:  # Matches /metadata/{catalog}
        catalog = parts[0]
        query = f"""
            SELECT *
            FROM information_schema.schemata
            WHERE catalog_name = '{catalog}';
        """

    elif len(parts) == 2:  # Matches /metadata/{catalog}/{schema}
        catalog, schema = parts
        query = f"""
            SELECT *
            FROM information_schema.tables
            WHERE table_catalog = '{catalog}' AND table_schema = '{schema}';
        """

    elif len(parts) == 3:  # Matches /metadata/{catalog}/{schema}/{table}
        catalog, schema, table = parts
        query = f"""
            SELECT *
            FROM information_schema.columns
            WHERE table_catalog = '{catalog}' AND table_schema = '{schema}' AND table_name = '{table}';
        """

    elif len(parts) == 4:  # Matches /metadata/{catalog}/{schema}/{table}/{column}
        catalog, schema, table, column = parts
        query = f"""
            SELECT *
            FROM information_schema.columns
            WHERE table_catalog = '{catalog}' AND table_schema = '{schema}' AND table_name = '{table}' AND column_name = '{column}';
        """

    else:
        # Return a 400 error if the path format is invalid
        raise HTTPException(status_code=400, detail="Invalid route format. Check the number of parts.")

    # Execute the query and return results
    return execute_metadata_query(query, db)

@app.get("/describe", response_model=List[Dict[str, Any]])
def describe_object(object: str = Query(..., description="The object to describe, in the format 'db.schema.table'"),
                    db: Session = Depends(get_db)):
    """
    Fetches metadata for the specified object (table).
    Query parameter format: 'db.schema.table'.
    """
    # Split the object into components
    try:
        catalog, schema, table = object.split(".")
    except ValueError:
        raise HTTPException(status_code=400, detail="Invalid object format. Use 'db.schema.table'.")

    # Construct the query
    query = f"DESCRIBE TABLE {catalog}.{schema}.{table}"

    # Execute and return the result
    return execute_metadata_query(query, db)


@app.get("/profile", response_model=List[Dict[str, Any]])
def profile_object(object: str = Query(..., description="The object to profile, in the format 'db.schema.table' or 'db.schema.table.column'"),
                   db: Session = Depends(get_db)):
    """
    Fetches profile metadata for the specified object.
    Query parameter format: 'db.schema.table' (for table) or 'db.schema.table.column' (for specific column).
    """
    parts = object.split(".")
    if len(parts) == 3:
        # Table-level profile
        catalog, schema, table = parts
        query = f"SUMMARIZE TABLE {catalog}.{schema}.{table}"
        return execute_profile_query(query, db)
    elif len(parts) == 4:
        # Column-level profile
        catalog, schema, table, column = parts
        query = f"SUMMARIZE TABLE {catalog}.{schema}.{table}"
        all_columns = execute_profile_query(query, db)

        # Filter for the specific column
        column_summary = [col for col in all_columns if col["column_name"] == column]
        if not column_summary:
            raise HTTPException(status_code=404, detail=f"Column '{column}' not found in table '{table}'.")
        return column_summary
    else:
        raise HTTPException(status_code=400, detail="Invalid object format. Use 'db.schema.table' or 'db.schema.table.column'.")


def execute_profile_query(query: str, db: Session) -> List[Dict[str, Any]]:
    """
    Executes a profile-specific query (e.g., SUMMARIZE TABLE) and handles Decimal objects for JSON serialization.
    """
    try:
        # Use SQLAlchemy's text() to wrap raw SQL queries
        result_proxy = db.execute(text(query))
        results = result_proxy.fetchall()

        # Convert results to JSON-serializable format
        serialized_results = []
        for row in results:
            serialized_row = {}
            for key, value in zip(result_proxy.keys(), row):
                # Handle Decimal conversion for SUMMARIZE TABLE results
                if isinstance(value, Decimal):
                    serialized_row[key] = float(value)
                else:
                    serialized_row[key] = value
            serialized_results.append(serialized_row)

        return serialized_results
    except Exception as e:
        # Log and raise an HTTP exception for errors
        raise HTTPException(status_code=500, detail=f"Error executing profile query: {str(e)}")

def execute_metadata_query(query: str, db: Session) -> List[Dict[str, Any]]:
    """
    Executes a metadata query and formats the results.

    Parameters:
    - query: str - The SQL query to execute.
    - db: Session - The database session to use for query execution.

    Returns:
    - A list of dictionaries where each dictionary represents a row of query results.
    """
    print(query)  # Log the query for debugging purposes
    try:
        # Execute the query using the database session
        result_proxy = db.execute(text(query))
        results = result_proxy.fetchall()

        # Convert query results into a structured format
        response_data = {
            "data": [
                {key: (value.isoformat() if isinstance(value, datetime) else value)
                 for key, value in dict(zip(result_proxy.keys(), row)).items()}
                for row in results
            ]
        }
        # Return the formatted response data as JSON
        return JSONResponse(content=response_data)
    except Exception as e:
        # Handle any exceptions that occur during query execution
        raise HTTPException(status_code=500, detail=str(e))


def execute_select_query(query: str, db: Session):

    print(query)

    try:
        result_proxy = db.execute(text(query))
        results = result_proxy.mappings().all()  # Convert to list of dictionaries
        # Serialize the results using jsonable_encoder to handle special data types like datetime
        json_compatible_data = jsonable_encoder(results)
        return JSONResponse(content={"data": json_compatible_data, "total_rows": len(results)})
    except Exception as e:
        raise HTTPException(status_code=400, detail=str(e))

def execute_ddl_query(query: str, db: Session):
    try:
        db.execute(text(query))
        db.commit()  # Make sure to commit the transaction for DDL operations
        return JSONResponse(content={"message": "Query executed successfully"})
    except Exception as e:
        db.rollback()  # Rollback the transaction in case of failure
        raise HTTPException(status_code=400, detail=str(e))

@app.post("/sqlglot/transpile")
async def sqlglot_transpile_sql(request: Request):
    try:
        # Parse JSON dynamically without a Pydantic model
        body = await request.json()
        sql = body.get("sql")
        transpile_to = body.get("transpile_to")

        if not sql:
            raise ValueError("No SQL provided for transpilation.")
        if not transpile_to:
            raise ValueError("No target language provided for transpilation.")

        # Transpile the provided SQL to the specified target language
        transpiled_sql = sqlglot.transpile(sql, write=transpile_to, identify=True, pretty=True)[0]
        return {"result_sql": transpiled_sql}
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e))
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"An error occurred while transpiling: {e}")

@app.post("/sqlglot/prettify")
async def sqlglot_prettify_sql(request: Request):
    try:
        # Parse JSON dynamically without a Pydantic model
        body = await request.json()
        sql = body.get("sql")

        if not sql:
            raise ValueError("No SQL provided for prettify.")

        # Transpile the provided SQL to the specified target language
        prettified_sql = sqlglot.optimizer.optimize(sql).sql(pretty=True)
        return {"result_sql": prettified_sql}
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e))
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"An error occurred while prettify: {e}")

@app.post("/sqlglot/extract/column")
async def sqlglot_extract_columns(request: Request):
    try:
        body = await request.json()
        sql = body.get("sql")

        if not sql:
            raise ValueError("No SQL provided.")

        parsed_sql = parse_one(sql)

        # Extract columns
        columns = [column.alias_or_name for column in parsed_sql.find_all(exp.Column)]

        return {"data": columns}
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e))
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"An error occurred while extracting columns: {e}")

@app.post("/sqlglot/extract/table")
async def sqlglot_extract_tables(request: Request):
    try:
        body = await request.json()
        sql = body.get("sql")

        if not sql:
            raise ValueError("No SQL provided.")

        parsed_sql = parse_one(sql)

        # Extract tables
        tables = [table.name for table in parsed_sql.find_all(exp.Table)]

        return {"data": tables}
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e))
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"An error occurred while extracting tables: {e}")

@app.post("/sqlglot/extract/projection")
async def sqlglot_extract_projections(request: Request):
    try:
        body = await request.json()
        sql = body.get("sql")

        if not sql:
            raise ValueError("No SQL provided.")

        parsed_sql = parse_one(sql)

        # Extract projections
        projections = []
        for select in parsed_sql.find_all(exp.Select):
            projections.extend([projection.alias_or_name for projection in select.expressions])

        return {"data": projections}
    except ValueError as e:
        raise HTTPException(status_code=400, detail=str(e))
    except Exception as e:
        raise HTTPException(status_code=500, detail=f"An error occurred while extracting projections: {e}")