From 53a30449e27a4d56f09e13550045bc544df3655d Mon Sep 17 00:00:00 2001 From: hyungi Date: Wed, 10 Jun 2026 13:47:18 +0900 Subject: [PATCH] =?UTF-8?q?fix(news):=20crawl=5Fpoliteness=20logger=20?= =?UTF-8?q?=EB=A5=BC=20setup=5Flogger=20=EB=A1=9C=20=EC=A0=95=ED=95=A9?= =?UTF-8?q?=ED=99=94=20=E2=80=94=20INFO=20=EB=8C=80=EA=B8=B0=20=EB=A1=9C?= =?UTF-8?q?=EA=B7=B8=20=EA=B0=80=EC=8B=9C=ED=99=94?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Co-Authored-By: Claude Fable 5 --- app/core/crawl_politeness.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/app/core/crawl_politeness.py b/app/core/crawl_politeness.py index d54687d..d61e030 100644 --- a/app/core/crawl_politeness.py +++ b/app/core/crawl_politeness.py @@ -12,7 +12,6 @@ SSRF 차단은 core.url_validator.validate_feed_url 재사용 (redirect target """ import asyncio -import logging import random import time import urllib.robotparser @@ -21,8 +20,10 @@ from urllib.parse import urljoin, urlparse import httpx from core.url_validator import validate_feed_url +from core.utils import setup_logger -logger = logging.getLogger("crawl_politeness") +# bare getLogger 는 root(WARNING) 상속이라 INFO 대기/차단 로그가 드랍됨 — 타 워커와 동일 설정 +logger = setup_logger("crawl_politeness") # 정직 식별 UA + 연락처 — 차단 전 연락 통로 (A-4) CRAWL_UA = "HyungiPKM-Archiver/1.0 (personal archive; +mailto:hyun49196@gmail.com)"