From 45ad56ab7863bd95c9ccd6b5e66397e06c39ea04 Mon Sep 17 00:00:00 2001 From: Lee Penkman Date: Fri, 11 Jul 2025 15:20:22 +1200 Subject: [PATCH] Add speech to text demo route and nav links --- README.md | 12 ++++++++++++ main.py | 10 ++++++++++ static/templates/shared/header.jinja2 | 2 ++ static/templates/shared/header_new.jinja2 | 2 ++ static/templates/shared/header_old.jinja2 | 2 ++ 5 files changed, 28 insertions(+) diff --git a/README.md b/README.md index cb10908..8793d96 100644 --- a/README.md +++ b/README.md @@ -218,6 +218,18 @@ PYTHONPATH=$(pwd):$(pwd)/OFA GOOGLE_APPLICATION_CREDENTIALS=secrets/google-crede PYTHONPATH=$HOME/code/20-questions:$HOME/code/20-questions/OFA:$HOME/code/20-questions/OFA/fairseq GOOGLE_APPLICATION_CREDENTIALS=secrets/google-credentials.json gunicorn -k uvicorn.workers.UvicornWorker -b :9080 questions.inference_server.inference_server:app --timeout 180000 --workers 1 ``` Then go to localhost:9080/docs to use the API + +### Speech To Text Endpoint + +The API supports transcription of audio via the `/api/v1/audio-extraction` and `/api/v1/audio-file-extraction` routes. +Example usage with `curl`: + +```bash +curl -X POST "http://localhost:9080/api/v1/audio-extraction" \ + -H "Content-Type: application/json" \ + -d '{"audio_url": "AUDIO_URL", "translate_to_english": false}' +``` + #### run audio server only Just the Parakeet speech to text part. 
diff --git a/main.py b/main.py
index 0c0dabd..09b18b7 100644
--- a/main.py
+++ b/main.py
@@ -878,6 +878,16 @@ async def text_to_speech(request: Request):
         "templates/text-to-speech.jinja2", base_vars,
     )
 
+
+@app.get("/speech-to-text")
+async def speech_to_text(request: Request):
+    """Render the speech-to-text demo page with the shared base template vars."""
+    base_vars = get_base_template_vars(request)
+    return templates.TemplateResponse(
+        "templates/speech-to-text.jinja2",
+        base_vars,
+    )
+
 @app.get("/use-cases/{usecase}")
 async def use_case_route(request: Request, usecase: str):
     use_case_data = deepcopy(fixtures.use_cases.get(usecase))
diff --git a/static/templates/shared/header.jinja2 b/static/templates/shared/header.jinja2
index f35da56..035bf3e 100644
--- a/static/templates/shared/header.jinja2
+++ b/static/templates/shared/header.jinja2
@@ -14,6 +14,7 @@
 Tools Text To Speech
+ Speech To Text
 Bulk Generator Playground
@@ -38,6 +39,7 @@
 play_arrow Playground edit AI Text Editor volume_up Text To Speech
+ graphic_eq Speech To Text
 android Docs login Login payments Subscribe
diff --git a/static/templates/shared/header_new.jinja2 b/static/templates/shared/header_new.jinja2
index 0f4f36f..6d6502c 100644
--- a/static/templates/shared/header_new.jinja2
+++ b/static/templates/shared/header_new.jinja2
@@ -14,6 +14,7 @@
 Tools Text To Speech
+ Speech To Text
 Bulk Generator Playground
@@ -38,6 +39,7 @@
 play_arrow Playground edit AI Text Editor volume_up Text To Speech
+ graphic_eq Speech To Text
 android Docs login Login payments Subscribe
diff --git a/static/templates/shared/header_old.jinja2 b/static/templates/shared/header_old.jinja2
index 05e644f..458b4d3 100755
--- a/static/templates/shared/header_old.jinja2
+++ b/static/templates/shared/header_old.jinja2
@@ -14,6 +14,7 @@
 Tools Text To Speech
+ Speech To Text
 Bulk Generator Playground
@@ -38,6 +39,7 @@
 play_arrow Playground edit AI Text Editor volume_up Text To Speech
+ graphic_eq Speech To Text
 android Docs login Login payments Subscribe