fix(agent-office/lotto): deep CuratorError fallthrough + urgent 발송 재시도

결함1: deep signal-check에서 curate_weekly가 CuratorError면 전체 check가 abort돼 sim/drift 시그널이 미평가되던 문제 → try/except로 confidence만 포기하고 sim/drift는 계속(curate_result=None fallthrough). 결함2: send_urgent_signal 실패가 outer except로 빠져 task 실패+미마킹이던 문제 → _send_urgent_with_retry(3회/60s) 추출, 최종 실패해도 raise 안 함(시그널 평가·태스크 보존), 성공 시에만 mark_signal_notified. TDD 3 신규 테스트. Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
2026-06-11 08:48:08 +09:00
parent 2c2828c8f0
commit 3c11b75a5f
2 changed files with 115 additions and 9 deletions
--- a/agent-office/app/agents/lotto.py
+++ b/agent-office/app/agents/lotto.py
@@ -2,6 +2,10 @@ from .base import BaseAgent
 from ..db import create_task, update_task_status, add_log
 from ..curator.pipeline import curate_weekly, CuratorError

+# Retry policy for urgent Telegram sends (so a send failure does not abort signal evaluation or the task)
+URGENT_SEND_MAX_ATTEMPTS = 3  # total send attempts, counting the first one
+URGENT_SEND_RETRY_SEC = 60  # seconds slept between consecutive attempts
+

 class LottoAgent(BaseAgent):
    agent_id = "lotto"
@@ -54,10 +58,16 @@ class LottoAgent(BaseAgent):

            if source == "deep":
                from ..curator.pipeline import curate_weekly
-                cw = await curate_weekly(source="signal_deep")
-                curate_result = {"confidence": cw.get("confidence")}
-                if cw.get("draw_no"):
-                    current_draw_no = cw.get("draw_no")
+                try:
+                    cw = await curate_weekly(source="signal_deep")
+                    curate_result = {"confidence": cw.get("confidence")}
+                    if cw.get("draw_no"):
+                        current_draw_no = cw.get("draw_no")
+                except CuratorError as e:
+                    # 큐레이션 실패는 confidence 시그널만 포기 — sim/drift 평가는 계속(fallthrough)
+                    add_log("lotto", f"deep curate_weekly 실패 → sim/drift만 평가: {e}",
+                            level="warning", task_id=task_id)
+                    curate_result = None

            outcome = await run_signal_check(
                source=source,
@@ -88,11 +98,7 @@ class LottoAgent(BaseAgent):
                            "triggered_at": datetime.now(timezone.utc).isoformat(),
                            "results": outcome["results"],
                        }
-                        await send_urgent_signal(event)
-                        for r in outcome["results"]:
-                            if r["fire_level"] in ("normal", "urgent"):
-                                mark_signal_notified(r["signal_id"])
-                        add_log("lotto", f"urgent 텔레그램 발송 ({len(outcome['results'])}개 시그널)", task_id=task_id)
+                        await self._send_urgent_with_retry(event, outcome["results"], task_id)

            fired_metrics = [
                r["metric"] for r in outcome["results"]
@@ -111,6 +117,31 @@ class LottoAgent(BaseAgent):
            add_log("lotto", f"signal_check 예외: {e}", level="error", task_id=task_id)
            return {"ok": False, "message": f"{type(e).__name__}: {e}"}

+    async def _send_urgent_with_retry(self, event: dict, results: list, task_id: str) -> bool:
+        """Send the urgent Telegram alert; only the send is retried, and a final send failure returns False (no raise).
+        After a successful send, fired signals are marked notified; an error there propagates instead of re-sending."""
+        import asyncio
+        from ..db import add_log, mark_signal_notified
+        from ..notifiers.telegram_lotto import send_urgent_signal
+        for attempt in range(1, URGENT_SEND_MAX_ATTEMPTS + 1):
+            try:
+                await send_urgent_signal(event)
+            except Exception as e:
+                if attempt < URGENT_SEND_MAX_ATTEMPTS:
+                    add_log("lotto", f"urgent 발송 실패(attempt {attempt}) → {URGENT_SEND_RETRY_SEC}s 후 재시도: {e}",
+                            level="warning", task_id=task_id)
+                    await asyncio.sleep(URGENT_SEND_RETRY_SEC)
+                    continue
+                add_log("lotto", f"urgent 발송 {URGENT_SEND_MAX_ATTEMPTS}회 실패 — 미발송: {e}",
+                        level="error", task_id=task_id)
+                return False
+            for r in results:  # outside the try: a bookkeeping error must not re-send a delivered alert
+                if r["fire_level"] in ("normal", "urgent"):
+                    mark_signal_notified(r["signal_id"])
+            add_log("lotto", f"urgent 텔레그램 발송 ({len(results)}개 시그널, attempt {attempt})", task_id=task_id)
+            return True
+        return False
+
    async def run_daily_digest(self) -> dict:
        """일일 요약 — 지난 24h normal/urgent 발화 텔레그램 1통. task_id wrap."""
        from ..db import (