동작하는 최소 코드 수준의 v2 스캐폴딩:

- docker-compose.yml: postgres, fastapi, kordoc, frontend, caddy
- app/: FastAPI 백엔드 (main, core, models, ai, prompts)
- services/kordoc/: Node.js 문서 파싱 마이크로서비스
- gpu-server/: AI Gateway + GPU docker-compose
- frontend/: SvelteKit 기본 구조
- migrations/: PostgreSQL 초기 스키마 (documents, tasks, processing_queue)
- tests/: pytest conftest 기본 설정
- config.yaml, Caddyfile, credentials.env.example 갱신

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
49 lines
1.1 KiB
YAML
49 lines
1.1 KiB
YAML
# hyungi_Document_Server configuration

ai:
  # AI backend settings. Each entry under `models` carries its own
  # endpoint/model pair, so the nesting is significant: flattened, the repeated
  # `endpoint`/`model` keys would collide as duplicates.
  gateway:
    # Base URL of the gateway on the `gpu-server` host.
    endpoint: "http://gpu-server:8080"

  models:
    # Chat-completions endpoint reached through the Docker host
    # (`host.docker.internal`).
    primary:
      endpoint: "http://host.docker.internal:8800/v1/chat/completions"
      model: "mlx-community/Qwen3.5-35B-A3B-4bit"
      max_tokens: 4096
      # NOTE(review): unit is presumably seconds — confirm against the loader.
      timeout: 60

    # Chat-completions endpoint on `gpu-server`.
    # NOTE(review): presumably used when `primary` is unavailable — confirm.
    fallback:
      endpoint: "http://gpu-server:11434/v1/chat/completions"
      model: "qwen3.5:35b-a3b"
      max_tokens: 4096
      # NOTE(review): unit is presumably seconds — confirm against the loader.
      timeout: 120

    # Hosted Anthropic Messages API. No credential is stored in this block.
    premium:
      endpoint: "https://api.anthropic.com/v1/messages"
      model: "claude-sonnet-4-20250514"
      max_tokens: 8192
      # NOTE(review): presumably a spend cap in USD per day — confirm where it
      # is enforced.
      daily_budget_usd: 5.00
      # NOTE(review): presumably prevents automatic use of this model —
      # confirm against the caller.
      require_explicit_trigger: true

    embedding:
      endpoint: "http://gpu-server:11434/api/embeddings"
      model: "nomic-embed-text"

    vision:
      endpoint: "http://gpu-server:11434/api/generate"
      model: "Qwen2.5-VL-7B"

    rerank:
      endpoint: "http://gpu-server:11434/api/rerank"
      model: "bge-reranker-v2-m3"

nas:
  # Document storage paths; `pkm_root` is a subdirectory of `mount_path`.
  # NOTE(review): presumably container-side paths of the NAS mount — confirm
  # against the compose volume definitions.
  mount_path: "/documents"
  pkm_root: "/documents/PKM"

schedule:
  # Job timings. Clock times stay quoted so they load as strings: an unquoted
  # digits-and-colon value can be read as a sexagesimal integer by YAML 1.1
  # parsers.
  # NOTE(review): no timezone is given here — confirm which one the scheduler
  # applies.
  law_monitor: "07:00"
  mailplus_archive: ["07:00", "18:00"]
  daily_digest: "20:00"
  # Intervals are in minutes, per the key names.
  file_watcher_interval_minutes: 5
  queue_consumer_interval_minutes: 10