fix: MLX 서버(localhost:8800) 대응 — Ollama API 호출을 OpenAI 호환 API로 변경

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-03-26 13:31:52 +09:00
parent 084d3a8c63
commit a77477140b
4 changed files with 29 additions and 23 deletions
@@ -2,7 +2,7 @@

 ## 시스템 개요

-Mac mini M4 Pro(64GB RAM, 4TB SSD)를 중심으로, DEVONthink를 **중앙 지식 허브**로 두고, Omni 제품군으로 **실행/계획**, Synology NAS로 **저장/백업**, AI(Claude API + Ollama)로 **지능화**하는 통합 PKM 시스템.
+Mac mini M4 Pro(64GB RAM, 4TB SSD)를 중심으로, DEVONthink를 **중앙 지식 허브**로 두고, Omni 제품군으로 **실행/계획**, Synology NAS로 **저장/백업**, AI(Claude API + MLX/Ollama)로 **지능화**하는 통합 PKM 시스템.

 ```
 ┌─────────────────────────────────────────────────────────────┐
@@ -279,10 +279,10 @@ on performSmartRule(theRecords)
            set docText to text 1 thru 4000 of docText
        end if

-        -- Step 1: Mac mini 35B → 태그 + 분류 대상 DB/그룹 생성
-        set shellCmd to "curl -s http://localhost:11434/api/generate -d '{" & ¬
-            "\"model\": \"qwen3.5:35b-a3b-q4_K_M\"," & ¬
-            "\"prompt\": \"다음 문서를 분석하고 JSON으로 응답해줘.\\n" & ¬
+        -- Step 1: Mac mini MLX 35B → 태그 + 분류 대상 DB/그룹 생성
+        set shellCmd to "curl -s http://localhost:8800/v1/chat/completions -H 'Content-Type: application/json' -d '{" & ¬
+            "\"model\": \"mlx-community/Qwen3.5-35B-A3B-4bit\"," & ¬
+            "\"messages\": [{\"role\":\"user\",\"content\":\"다음 문서를 분석하고 JSON으로 응답해줘.\\n" & ¬
            "{\\\"tags\\\": [최대5개_한글태그],\\n" & ¬
            " \\\"domain_db\\\": \\\"DB이름\\\",\\n" & ¬
            " \\\"sub_group\\\": \\\"하위그룹경로\\\"}\\n\\n" & ¬
@@ -910,11 +910,10 @@ tell application id "DNtp"
 end tell

 -- AI로 액션 아이템 추출
-set extractCmd to "curl -s http://localhost:11434/api/generate -d '{" & ¬
-    "\"model\":\"qwen3.5:35b-a3b-q4_K_M\"," & ¬
-    "\"prompt\":\"다음 텍스트에서 할 일(TODO)만 추출해서 " & ¬
-    "한 줄에 하나씩 출력해줘:\\n" & docText & "\"," & ¬
-    "\"stream\":false}'"
+set extractCmd to "curl -s http://localhost:8800/v1/chat/completions -H 'Content-Type: application/json' -d '{" & ¬
+    "\"model\":\"mlx-community/Qwen3.5-35B-A3B-4bit\"," & ¬
+    "\"messages\":[{\"role\":\"user\",\"content\":\"다음 텍스트에서 할 일(TODO)만 추출해서 " & ¬
+    "한 줄에 하나씩 출력해줘:\\n" & docText & "\"}]}'"
 set aiResult to do shell script extractCmd

 -- OmniFocus에 작업 생성
@@ -1325,7 +1324,7 @@ OmniFocus                      0.5GB      낮음
 OmniPlan                       0.5GB      낮음
 OmniOutliner                   0.3GB      낮음
 OmniGraffle                    0.5GB      낮음
-Ollama (Qwen3.5-35B-A3B 4Q)   ~20GB      중간         MoE: 3B만 활성
+MLX (Qwen3.5-35B-A3B 4bit)    ~20GB      중간         MoE: 3B만 활성
 ChromaDB                       1-2GB      낮음
 Roon Core                      2-4GB      낮음
 Komga                          0.5GB      낮음