diff --git a/config.yaml b/config.yaml index 9be6e5e..a6f8b3f 100644 --- a/config.yaml +++ b/config.yaml @@ -1,8 +1,6 @@ # hyungi_Document_Server 설정 ai: - gateway: - endpoint: "http://ai-gateway:8080" models: # ─── 단일 generation 호스트 routing (2026-05-14 GPU LLM 제거) ─── diff --git a/docker-compose.yml b/docker-compose.yml index 8bcf06d..4b986d5 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -168,19 +168,6 @@ services: start_period: 120s restart: unless-stopped - ai-gateway: - build: ./gpu-server/services/ai-gateway - ports: - - "127.0.0.1:8081:8080" - environment: - - PRIMARY_ENDPOINT=http://100.76.254.116:8801/v1/chat/completions - - FALLBACK_ENDPOINT=http://ollama:11434/v1/chat/completions - - CLAUDE_API_KEY=${CLAUDE_API_KEY:-} - - DAILY_BUDGET_USD=${DAILY_BUDGET_USD:-5.00} - # depends_on: ollama 제거 (2026-06-08) — ollama 서비스가 standalone 으로 이관됨. - # FALLBACK_ENDPOINT 의 ollama:11434 는 standalone(동일 hostname, DS 망 부착)으로 해소. - restart: unless-stopped - fastapi: build: ./app ports: