BasedHardware · beastoin · Jan 22, 2026 · Jan 22, 2026 · Jan 22, 2026 · Jan 22, 2026
diff --git a/backend/test.sh b/backend/test.sh
@@ -8,6 +8,7 @@ export ENCRYPTION_SECRET="omi_ZwB2ZNqB2HHpMK6wStk7sTpavJiPTFg7gXUHnc4tFABPU6pZ2c
 
 pytest tests/unit/test_transcript_segment.py -v
 pytest tests/unit/test_text_similarity.py -v
+pytest tests/unit/test_text_containment.py -v
 pytest tests/unit/test_speaker_sample.py -v
 pytest tests/unit/test_speaker_sample_migration.py -v
 pytest tests/unit/test_users_add_sample_transaction.py -v
diff --git a/backend/tests/unit/test_speaker_sample.py b/backend/tests/unit/test_speaker_sample.py
@@ -31,9 +31,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript is None
     assert is_valid is False
@@ -52,9 +50,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript is None
     assert is_valid is False
@@ -72,9 +68,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript is None
     assert is_valid is False
@@ -119,9 +113,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript is None
     assert is_valid is False
@@ -137,11 +129,11 @@ def test_verify_and_transcribe_sample_text_mismatch(monkeypatch):
     def fake_deepgram(*_args, **_kwargs):
         return words
 
-    def fake_similarity(_text1, _text2):
+    def fake_containment(_text1, _text2):
         return 0.5
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
-    monkeypatch.setattr(speaker_sample, "compute_text_similarity", fake_similarity)
+    monkeypatch.setattr(speaker_sample, "compute_text_containment", fake_containment)
 
     transcript, is_valid, reason = asyncio.run(
         speaker_sample.verify_and_transcribe_sample(
@@ -151,7 +143,7 @@ def fake_similarity(_text1, _text2):
 
     assert transcript == "good morning thanks for coming"
     assert is_valid is False
-    assert reason == "text_mismatch: similarity=0.50"
+    assert reason == "text_mismatch: containment=0.50"
 
 
 def test_verify_and_transcribe_sample_text_mismatch_just_below(monkeypatch):
@@ -163,21 +155,19 @@ def test_verify_and_transcribe_sample_text_mismatch_just_below(monkeypatch):
     def fake_deepgram(*_args, **_kwargs):
         return words
 
-    def fake_similarity(_text1, _text2):
-        return 0.59
+    def fake_containment(_text1, _text2):
+        return 0.89
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
-    monkeypatch.setattr(speaker_sample, "compute_text_similarity", fake_similarity)
+    monkeypatch.setattr(speaker_sample, "compute_text_containment", fake_containment)
 
     transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(
-            b"audio", 16000, expected_text="galaxy salsa party"
-        )
+        speaker_sample.verify_and_transcribe_sample(b"audio", 16000, expected_text="galaxy salsa party")
     )
 
     assert transcript == "galaxy salsa makes the party loud"
     assert is_valid is False
-    assert reason == "text_mismatch: similarity=0.59"
+    assert reason == "text_mismatch: containment=0.89"
 
 
 def test_verify_and_transcribe_sample_success(monkeypatch):
@@ -186,19 +176,39 @@ def test_verify_and_transcribe_sample_success(monkeypatch):
     def fake_deepgram(*_args, **_kwargs):
         return words
 
-    def fake_similarity(_text1, _text2):
-        return 0.9
+    def fake_containment(_text1, _text2):
+        return 0.95
+
+    monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
+    monkeypatch.setattr(speaker_sample, "compute_text_containment", fake_containment)
+
+    transcript, is_valid, reason = asyncio.run(
+        speaker_sample.verify_and_transcribe_sample(b"audio", 16000, expected_text="thanks for joining the meeting")
+    )
+
+    assert transcript == "thanks for joining the meeting"
+    assert is_valid is True
+    assert reason == "ok"
+
+
+def test_verify_and_transcribe_sample_containment_real_function(monkeypatch):
+    words = _make_words(
+        ["orbiting", "satellites", "drift", "above", "quietly"],
+        speakers=["SPEAKER_00"] * 5,
+    )
+
+    def fake_deepgram(*_args, **_kwargs):
+        return words
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
-    monkeypatch.setattr(speaker_sample, "compute_text_similarity", fake_similarity)
 
     transcript, is_valid, reason = asyncio.run(
         speaker_sample.verify_and_transcribe_sample(
-            b"audio", 16000, expected_text="thanks for joining the meeting"
+            b"audio", 16000, expected_text="today orbiting satellites drift above quietly"
         )
     )
 
-    assert transcript == "thanks for joining the meeting"
+    assert transcript == "orbiting satellites drift above quietly"
     assert is_valid is True
     assert reason == "ok"
 
@@ -214,9 +224,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript == "party on planet pizza night"
     assert is_valid is True
@@ -244,16 +252,14 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript == " ".join(texts)
     assert is_valid is True
     assert reason == "ok"
 
 
-def test_verify_and_transcribe_sample_similarity_boundary(monkeypatch):
+def test_verify_and_transcribe_sample_containment_boundary(monkeypatch):
     words = _make_words(
         ["space", "pirates", "sail", "the", "neon", "seas"],
         speakers=["SPEAKER_00"] * 6,
@@ -262,16 +268,14 @@ def test_verify_and_transcribe_sample_similarity_boundary(monkeypatch):
     def fake_deepgram(*_args, **_kwargs):
         return words
 
-    def fake_similarity(_text1, _text2):
-        return 0.6
+    def fake_containment(_text1, _text2):
+        return 0.9
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
-    monkeypatch.setattr(speaker_sample, "compute_text_similarity", fake_similarity)
+    monkeypatch.setattr(speaker_sample, "compute_text_containment", fake_containment)
 
     transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(
-            b"audio", 16000, expected_text="space pirates sail neon seas"
-        )
+        speaker_sample.verify_and_transcribe_sample(b"audio", 16000, expected_text="space pirates sail neon seas")
     )
 
     assert transcript == "space pirates sail the neon seas"
@@ -287,9 +291,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript == "just a solo astronaut report"
     assert is_valid is True
@@ -307,9 +309,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript == "blank speaker tag shows up"
     assert is_valid is True
@@ -326,10 +326,10 @@ def fake_deepgram(*_args, **_kwargs):
         return words
 
     def fail_similarity(*_args, **_kwargs):
-        raise AssertionError("compute_text_similarity should not be called")
+        raise AssertionError("compute_text_containment should not be called")
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
-    monkeypatch.setattr(speaker_sample, "compute_text_similarity", fail_similarity)
+    monkeypatch.setattr(speaker_sample, "compute_text_containment", fail_similarity)
 
     transcript, is_valid, reason = asyncio.run(
         speaker_sample.verify_and_transcribe_sample(b"audio", 16000, expected_text="")
@@ -350,10 +350,10 @@ def fake_deepgram(*_args, **_kwargs):
         return words
 
     def fail_similarity(*_args, **_kwargs):
-        raise AssertionError("compute_text_similarity should not be called")
+        raise AssertionError("compute_text_containment should not be called")
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
-    monkeypatch.setattr(speaker_sample, "compute_text_similarity", fail_similarity)
+    monkeypatch.setattr(speaker_sample, "compute_text_containment", fail_similarity)
 
     transcript, is_valid, reason = asyncio.run(
         speaker_sample.verify_and_transcribe_sample(b"audio", 16000, expected_text=None)
@@ -370,9 +370,7 @@ def fake_deepgram(*_args, **_kwargs):
 
     monkeypatch.setattr(speaker_sample, "deepgram_prerecorded_from_bytes", fake_deepgram)
 
-    transcript, is_valid, reason = asyncio.run(
-        speaker_sample.verify_and_transcribe_sample(b"audio", 16000)
-    )
+    transcript, is_valid, reason = asyncio.run(speaker_sample.verify_and_transcribe_sample(b"audio", 16000))
 
     assert transcript is None
     assert is_valid is False

diff --git a/backend/tests/unit/test_text_containment.py b/backend/tests/unit/test_text_containment.py
@@ -0,0 +1,54 @@
+"""
+Unit tests for compute_text_containment function.
+Tests character trigram containment across multiple languages.
+"""
+
+from utils.text_utils import compute_text_containment
+
+
+class TestComputeTextContainment:
+    """Tests for compute_text_containment(transcript, expected); the cases pin scores of 0.0, 1.0 and below 0.9."""
+
+    def test_transcript_fully_contained(self):
+        transcript = "hello world nice day"
+        expected = "greetings hello world nice day everyone"
+        assert compute_text_containment(transcript, expected) == 1.0  # extra words in expected are not penalized
+
+    def test_transcript_not_contained(self):
+        transcript = "hello world nice day"
+        expected = "greetings hello world pleasant evening"
+        containment = compute_text_containment(transcript, expected)
+        assert containment < 0.9  # 0.9 is MIN_CONTAINMENT in utils/speaker_sample.py
+
+    def test_empty_transcript(self):
+        assert compute_text_containment("", "hello") == 0.0  # empty transcript scores 0.0 instead of raising
+
+    def test_short_transcript_contained(self):
+        assert compute_text_containment("hi", "oh hi there") == 1.0  # "hi" is shorter than one trigram (3 chars)
+
+    def test_short_transcript_not_contained(self):
+        assert compute_text_containment("hi", "hello there") == 0.0
+
+    def test_case_and_whitespace_normalization(self):
+        transcript = "Hello   World"
+        expected = "greetings hello world everyone"
+        assert compute_text_containment(transcript, expected) == 1.0  # casing and repeated spaces do not matter
+
+    def test_chinese_contained(self):
+        transcript = "你好世界"
+        expected = "今天你好世界朋友"
+        assert compute_text_containment(transcript, expected) == 1.0  # text without spaces between words
+
+    def test_thai_contained(self):
+        transcript = "สวัสดีครับ"
+        expected = "วันนี้สวัสดีครับเพื่อนๆ"
+        assert compute_text_containment(transcript, expected) == 1.0  # text without spaces between words
+
+    def test_expected_empty_returns_zero(self):
+        assert compute_text_containment("hello", "") == 0.0  # empty expected text scores 0.0 instead of raising
+
+    def test_trigram_length_boundary_contained(self):
+        assert compute_text_containment("hey", "oh hey there") == 1.0  # "hey" is exactly one trigram long
+
+    def test_trigram_length_boundary_not_contained(self):
+        assert compute_text_containment("hey", "oh he there") == 0.0  # only the prefix "he" appears in expected
diff --git a/backend/utils/speaker_sample.py b/backend/utils/speaker_sample.py
@@ -12,10 +12,10 @@
 
 from utils.other.storage import delete_speech_profile_blob, download_speech_profile_bytes
 from utils.stt.pre_recorded import deepgram_prerecorded_from_bytes
-from utils.text_utils import compute_text_similarity
+from utils.text_utils import compute_text_containment
 
 MIN_WORDS = 5
-MIN_SIMILARITY = 0.6
+MIN_CONTAINMENT = 0.9
 MIN_DOMINANT_SPEAKER_RATIO = 0.7
 
 
@@ -30,7 +30,7 @@ async def verify_and_transcribe_sample(
     Checks:
     1. Transcription has at least MIN_WORDS words
     2. Dominant speaker accounts for >= MIN_DOMINANT_SPEAKER_RATIO of words (via diarization)
-    3. Transcribed text has >= MIN_SIMILARITY with expected text (if provided)
+    3. Transcribed text has >= MIN_CONTAINMENT containment in expected text (if provided)
 
     Args:
         audio_bytes: WAV format audio bytes
@@ -66,9 +66,9 @@ async def verify_and_transcribe_sample(
     transcript = ' '.join(w.get('text', '') for w in words)
 
     if expected_text:
-        similarity = compute_text_similarity(transcript, expected_text)
-        if similarity < MIN_SIMILARITY:
-            return transcript, False, f"text_mismatch: similarity={similarity:.2f}"
+        containment = compute_text_containment(transcript, expected_text)
+        if containment < MIN_CONTAINMENT:
+            return transcript, False, f"text_mismatch: containment={containment:.2f}"
 
     return transcript, True, "ok"