From a56a3bed93d4cce0330441cb4d2436639b971f3f Mon Sep 17 00:00:00 2001
From: Chris0Jeky <jeky.tck@gmail.com>
Date: Tue, 31 Mar 2026 04:10:00 +0100
Subject: [PATCH 1/6] Increase default MaxTokens from 1024 to 2048

The previous 1024 limit was too low, causing LLM responses to be
truncated mid-JSON when structured output was requested. Fixes #616.
---
 backend/src/Taskdeck.Application/Services/ILlmProvider.cs | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/backend/src/Taskdeck.Application/Services/ILlmProvider.cs b/backend/src/Taskdeck.Application/Services/ILlmProvider.cs
index 946a91309..3c8e14ca0 100644
--- a/backend/src/Taskdeck.Application/Services/ILlmProvider.cs
+++ b/backend/src/Taskdeck.Application/Services/ILlmProvider.cs
@@ -10,7 +10,7 @@ public interface ILlmProvider
 
 public record ChatCompletionRequest(
     List<ChatCompletionMessage> Messages,
-    int MaxTokens = 1024,
+    int MaxTokens = 2048,
     double Temperature = 0.7,
     LlmRequestAttribution? Attribution = null,
     string? SystemPrompt = null,

From ca2fabcbd3899a0cfd0ef24513f0d527aeb06d50 Mon Sep 17 00:00:00 2001
From: Chris0Jeky <jeky.tck@gmail.com>
Date: Tue, 31 Mar 2026 04:11:12 +0100
Subject: [PATCH 2/6] Add finish_reason and JSON truncation detection to OpenAI
 provider

Extract finish_reason from the OpenAI response. When it is "length",
mark the result as degraded with reason "Response was truncated".
Also treat invalid JSON as truncation when JSON mode was requested,
since it indicates the response was cut off before the model could
produce valid output.
---
 .../Services/OpenAiLlmProvider.cs             | 58 ++++++++++++++++++-
 1 file changed, 56 insertions(+), 2 deletions(-)

diff --git a/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs b/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs
index e77f590a4..035239379 100644
--- a/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs
+++ b/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs
@@ -52,12 +52,43 @@ public async Task<LlmCompletionResult> CompleteAsync(ChatCompletionRequest reque
                 return BuildFallbackResult(lastUserMessage, "Live provider request failed.", GetConfiguredModelOrDefault());
             }
 
-            if (!TryParseResponse(body, out var content, out var tokensUsed))
+            if (!TryParseResponse(body, out var content, out var tokensUsed, out var finishReason))
             {
                 _logger.LogWarning("OpenAI completion response could not be parsed.");
                 return BuildFallbackResult(lastUserMessage, "Live provider response parsing failed.", GetConfiguredModelOrDefault());
             }
 
+            // Detect truncation: OpenAI returns finish_reason "length" when the
+            // response was cut off by the max_tokens limit.
+            if (string.Equals(finishReason, "length", StringComparison.OrdinalIgnoreCase))
+            {
+                _logger.LogWarning("OpenAI response was truncated (finish_reason=length).");
+                return new LlmCompletionResult(
+                    content,
+                    tokensUsed,
+                    IsActionable: false,
+                    Provider: "OpenAI",
+                    Model: GetConfiguredModelOrDefault(),
+                    IsDegraded: true,
+                    DegradedReason: "Response was truncated");
+            }
+
+            // When JSON mode was requested but the response is not valid JSON,
+            // the output was likely truncated before the model could finish.
+            var useInstructionExtraction = request.SystemPrompt is null;
+            if (useInstructionExtraction && !IsValidJson(content))
+            {
+                _logger.LogWarning("OpenAI JSON-mode response is not valid JSON; treating as truncated.");
+                return new LlmCompletionResult(
+                    content,
+                    tokensUsed,
+                    IsActionable: false,
+                    Provider: "OpenAI",
+                    Model: GetConfiguredModelOrDefault(),
+                    IsDegraded: true,
+                    DegradedReason: "Response was truncated");
+            }
+
             // Try to parse structured instruction extraction from the LLM response
             if (LlmInstructionExtractionPrompt.TryParseStructuredResponse(
                     content,
@@ -227,10 +258,11 @@ private object BuildRequestPayload(ChatCompletionRequest request)
         return payload;
     }
 
-    private static bool TryParseResponse(string responseBody, out string content, out int tokensUsed)
+    private static bool TryParseResponse(string responseBody, out string content, out int tokensUsed, out string? finishReason)
     {
         content = string.Empty;
         tokensUsed = 0;
+        finishReason = null;
 
         if (string.IsNullOrWhiteSpace(responseBody))
         {
@@ -259,6 +291,12 @@ private static bool TryParseResponse(string responseBody, out string content, ou
                 return false;
             }
 
+            if (first.TryGetProperty("finish_reason", out var finishReasonElement) &&
+                finishReasonElement.ValueKind == JsonValueKind.String)
+            {
+                finishReason = finishReasonElement.GetString();
+            }
+
             if (root.TryGetProperty("usage", out var usage) &&
                 usage.TryGetProperty("total_tokens", out var totalTokens) &&
                 totalTokens.TryGetInt32(out var parsedTokens))
@@ -308,6 +346,22 @@ private static LlmCompletionResult BuildFallbackResult(string userMessage, strin
             Instructions: instructions);
     }
 
+    private static bool IsValidJson(string text)
+    {
+        if (string.IsNullOrWhiteSpace(text))
+            return false;
+
+        try
+        {
+            using var doc = JsonDocument.Parse(text);
+            return true;
+        }
+        catch (JsonException)
+        {
+            return false;
+        }
+    }
+
     private static int EstimateTokens(string text)
     {
         if (string.IsNullOrWhiteSpace(text))

From 1eb85488eefc09773a2b20b1c61634c50dcce105 Mon Sep 17 00:00:00 2001
From: Chris0Jeky <jeky.tck@gmail.com>
Date: Tue, 31 Mar 2026 04:12:13 +0100
Subject: [PATCH 3/6] Add finish_reason and JSON truncation detection to Gemini
 provider

Extract finishReason from the Gemini response candidates. When it is
"MAX_TOKENS", mark the result as degraded with reason "Response was
truncated". Also detect invalid JSON when JSON mode was requested.
---
 .../Services/GeminiLlmProvider.cs             | 58 ++++++++++++++++++-
 1 file changed, 56 insertions(+), 2 deletions(-)

diff --git a/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs b/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs
index 534aeb381..911ba355d 100644
--- a/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs
+++ b/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs
@@ -81,12 +81,42 @@ public async Task<LlmCompletionResult> CompleteAsync(ChatCompletionRequest reque
                 return BuildFallbackResult(lastUserMessage, "Live provider request failed.", GetConfiguredModelOrDefault());
             }
 
-            if (!TryParseResponse(body, out var content, out var tokensUsed))
+            if (!TryParseResponse(body, out var content, out var tokensUsed, out var finishReason))
             {
                 _logger.LogWarning("Gemini completion response could not be parsed.");
                 return BuildFallbackResult(lastUserMessage, "Live provider response parsing failed.", GetConfiguredModelOrDefault());
             }
 
+            // Detect truncation: Gemini returns finishReason "MAX_TOKENS" when the
+            // response was cut off by the maxOutputTokens limit.
+            if (string.Equals(finishReason, "MAX_TOKENS", StringComparison.OrdinalIgnoreCase))
+            {
+                _logger.LogWarning("Gemini response was truncated (finishReason=MAX_TOKENS).");
+                return new LlmCompletionResult(
+                    content,
+                    tokensUsed,
+                    IsActionable: false,
+                    Provider: "Gemini",
+                    Model: GetConfiguredModelOrDefault(),
+                    IsDegraded: true,
+                    DegradedReason: "Response was truncated");
+            }
+
+            // When JSON mode was requested but the response is not valid JSON,
+            // the output was likely truncated before the model could finish.
+            if (useInstructionExtraction && !IsValidJson(content))
+            {
+                _logger.LogWarning("Gemini JSON-mode response is not valid JSON; treating as truncated.");
+                return new LlmCompletionResult(
+                    content,
+                    tokensUsed,
+                    IsActionable: false,
+                    Provider: "Gemini",
+                    Model: GetConfiguredModelOrDefault(),
+                    IsDegraded: true,
+                    DegradedReason: "Response was truncated");
+            }
+
             // Try to parse structured instruction extraction from the LLM response
             if (LlmInstructionExtractionPrompt.TryParseStructuredResponse(
                     content,
@@ -225,10 +255,11 @@ private static object MapMessage(ChatCompletionMessage message)
         };
     }
 
-    private static bool TryParseResponse(string responseBody, out string content, out int tokensUsed)
+    private static bool TryParseResponse(string responseBody, out string content, out int tokensUsed, out string? finishReason)
     {
         content = string.Empty;
         tokensUsed = 0;
+        finishReason = null;
 
         if (string.IsNullOrWhiteSpace(responseBody))
         {
@@ -248,6 +279,13 @@ private static bool TryParseResponse(string responseBody, out string content, ou
             }
 
             var firstCandidate = candidates[0];
+
+            if (firstCandidate.TryGetProperty("finishReason", out var finishReasonElement) &&
+                finishReasonElement.ValueKind == JsonValueKind.String)
+            {
+                finishReason = finishReasonElement.GetString();
+            }
+
             if (!firstCandidate.TryGetProperty("content", out var candidateContent) ||
                 !candidateContent.TryGetProperty("parts", out var parts) ||
                 parts.ValueKind != JsonValueKind.Array ||
@@ -324,6 +362,22 @@ private static LlmCompletionResult BuildFallbackResult(string userMessage, strin
             Instructions: instructions);
     }
 
+    private static bool IsValidJson(string text)
+    {
+        if (string.IsNullOrWhiteSpace(text))
+            return false;
+
+        try
+        {
+            using var doc = JsonDocument.Parse(text);
+            return true;
+        }
+        catch (JsonException)
+        {
+            return false;
+        }
+    }
+
     private static int EstimateTokens(string text)
     {
         if (string.IsNullOrWhiteSpace(text))

From d6bc4110ae73057532664968809d2f9d8cd8d193 Mon Sep 17 00:00:00 2001
From: Chris0Jeky <jeky.tck@gmail.com>
Date: Tue, 31 Mar 2026 04:13:59 +0100
Subject: [PATCH 4/6] Detect truncated JSON in chat and show friendly notice

When an assistant or system message starts with '{' but is not valid
JSON, the frontend now shows "This response was cut short. Try a simpler
question or rephrase." instead of rendering the raw broken JSON.
---
 .../src/views/AutomationChatView.vue          | 27 ++++++++++++++++++-
 1 file changed, 26 insertions(+), 1 deletion(-)

diff --git a/frontend/taskdeck-web/src/views/AutomationChatView.vue b/frontend/taskdeck-web/src/views/AutomationChatView.vue
index 33cc09f54..fd1a14176 100644
--- a/frontend/taskdeck-web/src/views/AutomationChatView.vue
+++ b/frontend/taskdeck-web/src/views/AutomationChatView.vue
@@ -28,6 +28,20 @@ function renderMarkdown(content: string): string {
   return DOMPurify.sanitize(marked.parse(content, { async: false }))
 }
 
+function isTruncatedJson(content: string): boolean {
+  if (!content) return false
+  const trimmed = content.trim()
+  if (!trimmed.startsWith('{')) return false
+  try {
+    JSON.parse(trimmed)
+    return false
+  } catch {
+    return true
+  }
+}
+
+const truncationNotice = 'This response was cut short. Try a simpler question or rephrase.'
+
 const router = useRouter()
 const route = useRoute()
 const toast = useToastStore()
@@ -661,7 +675,13 @@ watch(
               </template>
               <template v-else>
                 <div
-                  v-if="isAssistantOrSystemMessage(message)"
+                  v-if="isAssistantOrSystemMessage(message) && isTruncatedJson(message.content)"
+                  class="td-message-content td-message-content--truncated"
+                >
+                  {{ truncationNotice }}
+                </div>
+                <div
+                  v-else-if="isAssistantOrSystemMessage(message)"
                   class="td-message-content td-message-content--markdown"
                   v-html="renderMarkdown(message.content)"
                 ></div>
@@ -930,6 +950,11 @@ watch(
   font-size: var(--td-font-sm);
 }
 
+.td-message-content--truncated {
+  color: var(--td-text-secondary);
+  font-style: italic;
+}
+
 .td-message-content--markdown {
   white-space: normal;
 }

From a463641b0907a638a48c50297bdfb2009bb57735 Mon Sep 17 00:00:00 2001
From: Chris0Jeky <jeky.tck@gmail.com>
Date: Tue, 31 Mar 2026 04:17:21 +0100
Subject: [PATCH 5/6] Refine JSON truncation check to only flag partial JSON
 objects

Plain-text LLM responses should still fall through to the static
classifier. Only flag content that starts with '{' but fails JSON
parsing, which indicates truncated structured output.
---
 .../Services/GeminiLlmProvider.cs             | 22 +++++++++++++------
 .../Services/OpenAiLlmProvider.cs             | 22 +++++++++++++------
 2 files changed, 30 insertions(+), 14 deletions(-)

diff --git a/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs b/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs
index 911ba355d..1ce8762f3 100644
--- a/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs
+++ b/backend/src/Taskdeck.Application/Services/GeminiLlmProvider.cs
@@ -102,9 +102,9 @@ public async Task<LlmCompletionResult> CompleteAsync(ChatCompletionRequest reque
                     DegradedReason: "Response was truncated");
             }
 
-            // When JSON mode was requested but the response is not valid JSON,
-            // the output was likely truncated before the model could finish.
-            if (useInstructionExtraction && !IsValidJson(content))
+            // When JSON mode was requested and the response starts with '{' but
+            // does not parse as valid JSON, the output was likely truncated.
+            if (useInstructionExtraction && LooksLikeTruncatedJson(content))
             {
                 _logger.LogWarning("Gemini JSON-mode response is not valid JSON; treating as truncated.");
                 return new LlmCompletionResult(
@@ -362,19 +362,27 @@ private static LlmCompletionResult BuildFallbackResult(string userMessage, strin
             Instructions: instructions);
     }
 
-    private static bool IsValidJson(string text)
+    /// <summary>
+    /// Returns true when <paramref name="text"/> starts with '{' but does not
+    /// parse as valid JSON — a strong signal the response was cut off mid-output.
+    /// </summary>
+    internal static bool LooksLikeTruncatedJson(string text)
     {
         if (string.IsNullOrWhiteSpace(text))
             return false;
 
+        var trimmed = text.TrimStart();
+        if (!trimmed.StartsWith('{'))
+            return false;
+
         try
         {
-            using var doc = JsonDocument.Parse(text);
-            return true;
+            using var doc = JsonDocument.Parse(trimmed);
+            return false;
         }
         catch (JsonException)
         {
-            return false;
+            return true;
         }
     }
 
diff --git a/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs b/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs
index 035239379..c8a161bb3 100644
--- a/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs
+++ b/backend/src/Taskdeck.Application/Services/OpenAiLlmProvider.cs
@@ -73,10 +73,10 @@ public async Task<LlmCompletionResult> CompleteAsync(ChatCompletionRequest reque
                     DegradedReason: "Response was truncated");
             }
 
-            // When JSON mode was requested but the response is not valid JSON,
-            // the output was likely truncated before the model could finish.
+            // When JSON mode was requested and the response starts with '{' but
+            // does not parse as valid JSON, the output was likely truncated.
             var useInstructionExtraction = request.SystemPrompt is null;
-            if (useInstructionExtraction && !IsValidJson(content))
+            if (useInstructionExtraction && LooksLikeTruncatedJson(content))
             {
                 _logger.LogWarning("OpenAI JSON-mode response is not valid JSON; treating as truncated.");
                 return new LlmCompletionResult(
@@ -346,19 +346,27 @@ private static LlmCompletionResult BuildFallbackResult(string userMessage, strin
             Instructions: instructions);
     }
 
-    private static bool IsValidJson(string text)
+    /// <summary>
+    /// Returns true when <paramref name="text"/> starts with '{' but does not
+    /// parse as valid JSON — a strong signal the response was cut off mid-output.
+    /// </summary>
+    internal static bool LooksLikeTruncatedJson(string text)
     {
         if (string.IsNullOrWhiteSpace(text))
             return false;
 
+        var trimmed = text.TrimStart();
+        if (!trimmed.StartsWith('{'))
+            return false;
+
         try
         {
-            using var doc = JsonDocument.Parse(text);
-            return true;
+            using var doc = JsonDocument.Parse(trimmed);
+            return false;
         }
         catch (JsonException)
         {
-            return false;
+            return true;
         }
     }
 

From 5d51b68b42a752d00b66f0441be586f22f198b58 Mon Sep 17 00:00:00 2001
From: Chris0Jeky <jeky.tck@gmail.com>
Date: Tue, 31 Mar 2026 04:23:50 +0100
Subject: [PATCH 6/6] Add tests for finish_reason and truncated JSON detection

Cover OpenAI finish_reason=length, Gemini finishReason=MAX_TOKENS, and
OpenAI JSON-mode truncation, and add LooksLikeTruncatedJson unit tests
for both providers.
---
 .../Services/GeminiLlmProviderTests.cs        | 49 ++++++++++++
 .../Services/OpenAiLlmProviderTests.cs        | 79 +++++++++++++++++++
 2 files changed, 128 insertions(+)

diff --git a/backend/tests/Taskdeck.Application.Tests/Services/GeminiLlmProviderTests.cs b/backend/tests/Taskdeck.Application.Tests/Services/GeminiLlmProviderTests.cs
index 3971b5272..9d5d7021e 100644
--- a/backend/tests/Taskdeck.Application.Tests/Services/GeminiLlmProviderTests.cs
+++ b/backend/tests/Taskdeck.Application.Tests/Services/GeminiLlmProviderTests.cs
@@ -432,6 +432,55 @@ await provider.CompleteAsync(new ChatCompletionRequest(
         hasSystemInstruction.Should().BeFalse("empty system prompt should not produce system_instruction field");
     }
 
+    [Fact]
+    public async Task CompleteAsync_ShouldReturnDegraded_WhenFinishReasonIsMaxTokens()
+    {
+        var settings = BuildSettings();
+        var handler = new StubHttpMessageHandler(_ =>
+        {
+            return new HttpResponseMessage(HttpStatusCode.OK)
+            {
+                Content = new StringContent(
+                    """
+                    {
+                      "candidates": [
+                        {
+                          "content": {
+                            "parts": [{ "text": "partial response" }]
+                          },
+                          "finishReason": "MAX_TOKENS"
+                        }
+                      ],
+                      "usageMetadata": { "totalTokenCount": 50 }
+                    }
+                    """,
+                    Encoding.UTF8,
+                    "application/json")
+            };
+        });
+
+        var provider = new GeminiLlmProvider(new HttpClient(handler), settings, NullLogger<GeminiLlmProvider>.Instance);
+        var result = await provider.CompleteAsync(new ChatCompletionRequest(
+            [new ChatCompletionMessage("User", "tell me something")],
+            SystemPrompt: string.Empty));
+
+        result.IsDegraded.Should().BeTrue();
+        result.DegradedReason.Should().Be("Response was truncated");
+        result.Content.Should().Be("partial response");
+        result.IsActionable.Should().BeFalse();
+    }
+
+    [Theory]
+    [InlineData("{\"reply\":\"incomplete", true)]
+    [InlineData("{}", false)]
+    [InlineData("plain text response", false)]
+    [InlineData("", false)]
+    [InlineData("  { broken json", true)]
+    public void LooksLikeTruncatedJson_ShouldDetectPartialJson(string input, bool expected)
+    {
+        GeminiLlmProvider.LooksLikeTruncatedJson(input).Should().Be(expected);
+    }
+
     private static LlmProviderSettings BuildSettings()
     {
         return new LlmProviderSettings
diff --git a/backend/tests/Taskdeck.Application.Tests/Services/OpenAiLlmProviderTests.cs b/backend/tests/Taskdeck.Application.Tests/Services/OpenAiLlmProviderTests.cs
index c29c75273..df3dca0c5 100644
--- a/backend/tests/Taskdeck.Application.Tests/Services/OpenAiLlmProviderTests.cs
+++ b/backend/tests/Taskdeck.Application.Tests/Services/OpenAiLlmProviderTests.cs
@@ -269,6 +269,85 @@ public async Task CompleteAsync_ShouldRedactSensitiveDetails_WhenUnexpectedExcep
         message.Should().Contain($"Authorization: Bearer {SensitiveDataRedactor.RedactedValue}");
     }
 
+    [Fact]
+    public async Task CompleteAsync_ShouldReturnDegraded_WhenFinishReasonIsLength()
+    {
+        var settings = BuildSettings();
+        var handler = new StubHttpMessageHandler(_ =>
+        {
+            return new HttpResponseMessage(HttpStatusCode.OK)
+            {
+                Content = new StringContent(
+                    """
+                    {
+                      "choices": [
+                        {
+                          "message": { "content": "partial response" },
+                          "finish_reason": "length"
+                        }
+                      ],
+                      "usage": { "total_tokens": 50 }
+                    }
+                    """,
+                    Encoding.UTF8,
+                    "application/json")
+            };
+        });
+
+        var provider = new OpenAiLlmProvider(new HttpClient(handler), settings, NullLogger<OpenAiLlmProvider>.Instance);
+        var result = await provider.CompleteAsync(new ChatCompletionRequest(
+            [new ChatCompletionMessage("User", "tell me something")],
+            SystemPrompt: string.Empty));
+
+        result.IsDegraded.Should().BeTrue();
+        result.DegradedReason.Should().Be("Response was truncated");
+        result.Content.Should().Be("partial response");
+        result.IsActionable.Should().BeFalse();
+    }
+
+    [Fact]
+    public async Task CompleteAsync_ShouldReturnDegraded_WhenJsonModeResponseIsInvalidJson()
+    {
+        var settings = BuildSettings();
+        // Build a valid OpenAI response whose content value is truncated JSON.
+        // The inner content must be JSON-escaped so the outer envelope parses.
+        var truncatedContent = "{\\\"reply\\\":\\\"this is cut off";
+        var responseBody = $@"{{
+  ""choices"": [{{
+    ""message"": {{ ""content"": ""{truncatedContent}"" }},
+    ""finish_reason"": ""stop""
+  }}],
+  ""usage"": {{ ""total_tokens"": 50 }}
+}}";
+        var handler = new StubHttpMessageHandler(_ =>
+        {
+            return new HttpResponseMessage(HttpStatusCode.OK)
+            {
+                Content = new StringContent(responseBody, Encoding.UTF8, "application/json")
+            };
+        });
+
+        var provider = new OpenAiLlmProvider(new HttpClient(handler), settings, NullLogger<OpenAiLlmProvider>.Instance);
+
+        // SystemPrompt defaults to null -> JSON mode is requested
+        var result = await provider.CompleteAsync(new ChatCompletionRequest(
+            [new ChatCompletionMessage("User", "tell me something")]));
+
+        result.IsDegraded.Should().BeTrue();
+        result.DegradedReason.Should().Be("Response was truncated");
+    }
+
+    [Theory]
+    [InlineData("{\"reply\":\"incomplete", true)]
+    [InlineData("{}", false)]
+    [InlineData("plain text response", false)]
+    [InlineData("", false)]
+    [InlineData("  { broken json", true)]
+    public void LooksLikeTruncatedJson_ShouldDetectPartialJson(string input, bool expected)
+    {
+        OpenAiLlmProvider.LooksLikeTruncatedJson(input).Should().Be(expected);
+    }
+
     private static LlmProviderSettings BuildSettings()
     {
         return new LlmProviderSettings