diff --git a/nanoclaude/services/worker.py b/nanoclaude/services/worker.py index 2e50cc1..d694e5c 100644 --- a/nanoclaude/services/worker.py +++ b/nanoclaude/services/worker.py @@ -366,7 +366,8 @@ async def run(job: Job) -> None: elif action == "route" and settings.pipeline_enabled and backend_registry.is_healthy("reasoner"): # === ROUTE: Gemma reasoning === reasoning_model = backend_registry.reasoner.model - rewritten_message = (route_prompt or job.message)[:MAX_PROMPT_LENGTH] + # 원본 사용자 메시지를 그대로 전달 (route_prompt는 신뢰 안 함 — EXAONE이 답변까지 미리 작성하는 문제) + rewritten_message = job.message[:MAX_PROMPT_LENGTH] job.rewritten_message = rewritten_message # Gemma busy 안내 (Hybrid 부하 판단 — inference 강제 측정 안 함)