From aca4a027baf58c2f810456f5ee7cd516c4b9db53 Mon Sep 17 00:00:00 2001
From: Hyungi Ahn <hyungiahn@Hyungiui-MacBookPro.local>
Date: Thu, 26 Mar 2026 13:39:05 +0900
Subject: [PATCH] =?UTF-8?q?fix:=20LLM=20thinking=20=ED=97=88=EC=9A=A9=20+?=
 =?UTF-8?q?=20=EB=A7=88=EC=A7=80=EB=A7=89=20=EC=9C=A0=ED=9A=A8=20JSON=20?=
 =?UTF-8?q?=EC=B6=94=EC=B6=9C=20=EB=B0=A9=EC=8B=9D=EC=9C=BC=EB=A1=9C=20?=
 =?UTF-8?q?=EB=B3=80=EA=B2=BD?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
---
 scripts/pkm_utils.py | 38 +++++++++++++++++++-------------------
 1 file changed, 19 insertions(+), 19 deletions(-)
diff --git a/scripts/pkm_utils.py b/scripts/pkm_utils.py
index eb66b45..cf525d9 100644
--- a/scripts/pkm_utils.py
+++ b/scripts/pkm_utils.py
@@ -109,32 +109,32 @@ def llm_generate(prompt: str, model: str = "mlx-community/Qwen3.5-35B-A3B-4bit",
                  host: str = "http://localhost:8800", json_mode: bool = False) -> str:
     """MLX 서버 API 호출 (OpenAI 호환)"""
     import requests
-    messages = []
-    if json_mode:
-        messages.append({"role": "system", "content": "IMPORTANT: Output ONLY valid JSON. No thinking process, no explanation, no markdown fences. Start your response with { and end with }."})
-    messages.append({"role": "user", "content": prompt})
+    messages = [{"role": "user", "content": prompt}]
     resp = requests.post(f"{host}/v1/chat/completions", json={
         "model": model,
         "messages": messages,
-        "temperature": 0.1 if json_mode else 0.3,
-        "max_tokens": 2048,
-    }, timeout=180)
+        "temperature": 0.3,
+        "max_tokens": 4096,
+    }, timeout=300)
     resp.raise_for_status()
     content = resp.json()["choices"][0]["message"]["content"]
-    # thinking 블록 제거 (Qwen3.5 thinking 모델 대응)
-    if "<think>" in content and "</think>" in content:
-        content = content.split("</think>")[-1].strip()
-    # JSON 블록 추출
-    if "```json" in content:
-        content = content.split("```json")[1].split("```")[0].strip()
-    elif "```" in content:
-        content = content.split("```")[1].split("```")[0].strip()
-    # { 로 시작하는 JSON 추출
+    if not json_mode:
+        return content
+    # JSON 모드: thinking 허용 → 마지막 유효 JSON 객체 추출
     import re
+    import json as _json
+    # 배열이 포함된 JSON 객체 매칭
+    all_jsons = re.findall(r'\{[^{}]*(?:\[[^\]]*\])?[^{}]*\}', content)
+    for j in reversed(all_jsons):
+        try:
+            parsed = _json.loads(j)
+            if any(k in parsed for k in ("domain_db", "tags", "domain", "classification")):
+                return j
+        except _json.JSONDecodeError:
+            continue
+    # 폴백: 전체에서 가장 큰 JSON 추출
     json_match = re.search(r'\{[\s\S]*\}', content)
-    if json_match:
-        content = json_match.group(0)
-    return content
+    return json_match.group(0) if json_match else content
 
 
 # 하위호환 별칭