From 2d469752e03580bf4d459ebe1cd2a8ebf441dc2b Mon Sep 17 00:00:00 2001 From: Virginia Partridge Date: Wed, 7 Jan 2026 19:37:33 +0100 Subject: [PATCH 1/3] Updated website links and added TIMIT model fine-tuned to web app --- CHANGELOG.md | 6 ++++++ README.md | 4 ++-- src/autoipaalign/web/app.py | 7 ++++--- 3 files changed, 12 insertions(+), 5 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index fae5399..3418f0a 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -6,6 +6,12 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 ## [Unreleased] +### Changed +- Updated project links in web app and README + +### Added +- Added best TIMIT model fine-tuned on Buckeye to model list in web app + ## [v1.0.0] - 2025-12-16 ### Added diff --git a/README.md b/README.md index 3838eaa..19ca463 100644 --- a/README.md +++ b/README.md @@ -2,11 +2,11 @@ Automatically transcribe audio into the International Phonetic Alphabet (IPA) and perform forced alignment. This toolkit includes a command line interface, comparison tools, and interactive web tool. -The AutoIPA project is a collaboration between Virginia Partridge of the UMass Center for Data Science and Artificial +The Wav2IPA project is a collaboration between Virginia Partridge of the UMass Center for Data Science and Artificial Intelligence and Joe Pater of UMass Linguistics. Its goal is to make automated IPA transcription more useful to linguists (and others!). Please reach out to us if you have any questions or comments about our work or have related work to share! -More details are on our [project website](https://websites.umass.edu/comphon/autoipa-automated-ipa-transcription/). +More details are on our [project website](https://websites.umass.edu/comphon/wav2ipa-automated-ipa-transcription/). 
If you use our software, please cite our AMP paper: diff --git a/src/autoipaalign/web/app.py b/src/autoipaalign/web/app.py index 0f66b50..8c79a33 100644 --- a/src/autoipaalign/web/app.py +++ b/src/autoipaalign/web/app.py @@ -13,7 +13,7 @@ TEXTGRID_DOWNLOAD_TEXT = "Download TextGrid file" TEXTGRID_NAME_INPUT_LABEL = "TextGrid file name" -TITLE = "AutoIPA: Automated IPA transcription" +TITLE = "Wav2IPA: Automated IPA transcription" INTRO_BLOCK = f"""# {TITLE} Experiment with producing @@ -26,7 +26,7 @@ Our first step was to fine-tune a Wav2Vec 2.0 model on the Buckeye corpus, which you can try out here. Our next steps will be to extend our work to other varieties of English and other languages. Please reach out to us if you have any questions or comments about our work or have related work to share! -More details are on our [project website](https://websites.umass.edu/comphon/autoipa-automated-ipa-transcription/). +More details are on our [project website](https://websites.umass.edu/comphon/wav2ipa-automated-ipa-transcription/). If you use our software, please cite our AMP paper: Partridge, Virginia, Joe Pater, Parth Bhangla, Ali Nirheche and Brandon Prickett. 2025/to appear. [AI-assisted analysis of phonological variation in English](https://docs.google.com/presentation/d/1IJrfokvX5T_fKkiFXmcYEgRI2ZRwgFU4zU1tNC-iYl0/edit?usp=sharing). Special session on Deep Phonology, AMP 2025, UC Berkeley. To appear in the Proceedings of AMP 2025. 
@@ -52,6 +52,7 @@ "ctaguchi/wav2vec2-large-xlsr-japlmthufielta-ipa1000-ns", "excalibur12/wav2vec2-large-lv60_phoneme-timit_english_timit-4k", "excalibur12/wav2vec2-large-lv60_phoneme-timit_english_timit-4k_simplified", + "ginic/wav2vec2-large-lv60_phoneme-timit_english_timit-4k_buckeye-4k_bs32_3", "ginic/full_dataset_train_1_wav2vec2-large-xlsr-53-buckeye-ipa", "ginic/full_dataset_train_2_wav2vec2-large-xlsr-53-buckeye-ipa", "ginic/full_dataset_train_3_wav2vec2-large-xlsr-53-buckeye-ipa", @@ -240,7 +241,7 @@ def launch_demo(): VALID_MODELS, value=DEFAULT_MODEL, label="IPA transcription ASR model", - info="Select the model to use for prediction.", + info="Select the model to use for prediction. For details about each one, visit its model page on the Hugging Face Hub.", ) # Dropdown for transcription type selection From 7b8895c32fed01f2f957a1d846d85202ca8f21cb Mon Sep 17 00:00:00 2001 From: Virginia Partridge Date: Wed, 7 Jan 2026 19:38:22 +0100 Subject: [PATCH 2/3] Bump version number --- CHANGELOG.md | 2 ++ pyproject.toml | 2 +- 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 3418f0a..2cec4d5 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -6,6 +6,8 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 ## [Unreleased] +## [v1.0.1] - 2026-01-07 + ### Changed - Updated project links in web app and README diff --git a/pyproject.toml b/pyproject.toml index 718bf3a..99e1347 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -1,6 +1,6 @@ [project] name = "autoipaalign" -version = "1.0.0" +version = "1.0.1" description = "Automatic IPA alignment workspace with CLI, comparison tools, and web interface" requires-python = ">=3.10,<3.14" readme = "README.md" From 78aaef9f39375b2d35136c7762e87f473e91810e Mon Sep 17 00:00:00 2001 From: Virginia Partridge Date: Wed, 7 Jan 2026 19:46:17 +0100 Subject: [PATCH 3/3] Sync uv lock --- uv.lock | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git 
a/uv.lock b/uv.lock index 66b75b4..e2402db 100644 --- a/uv.lock +++ b/uv.lock @@ -124,7 +124,7 @@ wheels = [ [[package]] name = "autoipaalign" -version = "1.0.0" +version = "1.0.1" source = { editable = "." } dependencies = [ { name = "librosa" },