fix: strip R1 think blocks before JSON extraction

DeepSeek-R1 models emit <think>...</think> before their actual response. The brace-counting extractor would grab the first { inside the thinking block (which contains partial JSON fragments) rather than the final strategy JSON. strip_think_blocks() removes all <think>...</think> sections including unterminated blocks (truncated responses), leaving only the final output for extract_json to process. Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>
2026-03-09 18:17:06 +02:00
parent b947f48b01
commit 185cb4586e
1 changed files with 28 additions and 2 deletions
--- a/src/claude.rs
+++ b/src/claude.rs
@@ -98,9 +98,13 @@ impl ClaudeClient {
    }
 }

-/// Extract a JSON object from Claude's response text.
-/// Looks for the first `{` ... `}` block, handling markdown code fences.
+/// Extract a JSON object from a model response text.
+/// Handles markdown code fences and R1-style `<think>...</think>` blocks.
 pub fn extract_json(text: &str) -> Result<Value> {
+    // Strip R1-style thinking blocks before looking for JSON
+    let text = strip_think_blocks(text);
+    let text = text.as_ref();
+
    // Strip markdown fences if present
    let cleaned = text
        .replace("```json", "")
@@ -137,3 +141,25 @@ pub fn extract_json(text: &str) -> Result<Value> {

    serde_json::from_str(&cleaned[s..e]).context("parse extracted JSON")
 }
+
+/// Remove `<think>...</think>` blocks emitted by R1-family reasoning models.
+/// Handles nested tags and unterminated blocks (truncated responses).
+fn strip_think_blocks(text: &str) -> std::borrow::Cow<'_, str> {
+    if !text.contains("<think>") {
+        return std::borrow::Cow::Borrowed(text);
+    }
+    let mut out = String::with_capacity(text.len());
+    let mut rest = text;
+    while let Some(start) = rest.find("<think>") {
+        out.push_str(&rest[..start]);
+        rest = &rest[start + "<think>".len()..];
+        if let Some(end) = rest.find("</think>") {
+            rest = &rest[end + "</think>".len()..];
+        } else {
+            // Unterminated — discard the rest (truncated thinking block)
+            rest = "";
+        }
+    }
+    out.push_str(rest);
+    std::borrow::Cow::Owned(out)
+}