fix(insta-lab): 프롬프트 템플릿 GET이 미저장 시 코드 기본값 반환

slate_writer/category_seeds가 DB에 없으면 404 대신 생성 파이프라인이 실제 폴백하는 코드 기본값(card_writer.DEFAULT_PROMPT, DEFAULT_CATEGORY_SEEDS)을 is_default=true로 반환. 편집 UI가 마스터 프롬프트를 표시·수정 가능. 미지정 이름은 여전히 404. 테스트 4건. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
feat(agent-office): 인스타 큐레이터 후보를 중복 제거 + 신뢰도 0.7+ 필터
2026-05-23 02:50:33 +09:00 · 2026-05-23 02:50:33 +09:00 · 2026-05-23 02:50:18 +09:00
7 changed files with 257 additions and 14 deletions
--- a/agent-office/app/agents/insta.py
+++ b/agent-office/app/agents/insta.py
@@ -18,6 +18,26 @@ from ..telegram import messaging
 logger = logging.getLogger(__name__)
 # 텔레그램 후보 푸시 시 "확실한 것만" 보내기 위한 최소 신뢰도 (키워드 score 0~1)
 KEYWORD_MIN_SCORE = 0.7
 def _dedup_and_filter_keywords(
    keywords: List[Dict[str, Any]], min_score: float = KEYWORD_MIN_SCORE,
 ) -> List[Dict[str, Any]]:
    """score >= min_score 인 키워드만 남기고, 동일 keyword 중복 제거(최고 score 유지).
    결과는 score 내림차순. 텔레그램 후보 푸시 전 정리용."""
    best: Dict[str, Dict[str, Any]] = {}
    for k in keywords:
        if float(k.get("score", 0)) < min_score:
            continue
        name = str(k.get("keyword", "")).strip()
        if not name:
            continue
        if name not in best or k["score"] > best[name]["score"]:
            best[name] = k
    return sorted(best.values(), key=lambda k: -k["score"])
 async def _send_media_group(media: List[Dict[str, Any]], caption: str = "") -> Dict[str, Any]:
    """텔레그램 sendMediaGroup. media는 InputMediaPhoto dicts.
@@ -89,14 +109,18 @@ class InstaAgent(BaseAgent):
        raise TimeoutError(f"{step} timeout {timeout_sec}s")
    async def _push_keyword_candidates(self, keywords: List[Dict[str, Any]]) -> None:
-        by_cat: Dict[str, List[Dict[str, Any]]] = {}
+        # 중복 제거 + 신뢰도(score) 임계값 이상만 — "확실한 것만" 정리해서 전송
-        for k in keywords:
+        filtered = _dedup_and_filter_keywords(keywords)
-            by_cat.setdefault(k["category"], []).append(k)
+        if not filtered:
-        if not by_cat:
+            await messaging.send_raw(
-            await messaging.send_raw("📰 [인스타 큐레이터] 오늘은 추천할 키워드가 없습니다.")
+                f"📰 [인스타 큐레이터] 오늘은 확실한 추천 키워드가 없습니다 (신뢰도 {KEYWORD_MIN_SCORE:.1f}+ 기준)."
            )
            return
        by_cat: Dict[str, List[Dict[str, Any]]] = {}
        for k in filtered:
            by_cat.setdefault(k["category"], []).append(k)
        rows: List[List[Dict[str, Any]]] = []
-        text_lines = ["📰 <b>[인스타 큐레이터]</b> 오늘의 키워드 후보"]
+        text_lines = [f"📰 <b>[인스타 큐레이터]</b> 오늘의 키워드 후보 (신뢰도 {KEYWORD_MIN_SCORE:.1f}+)"]
        for cat, items in by_cat.items():
            text_lines.append(f"\n<b>{cat}</b>")
            for k in items[:5]:
--- a/agent-office/tests/test_insta_keyword_filter.py
+++ b/agent-office/tests/test_insta_keyword_filter.py
@@ -0,0 +1,55 @@
 import os
 import sys
 import tempfile
 _fd, _TMP = tempfile.mkstemp(suffix=".db")
 os.close(_fd)
 os.unlink(_TMP)
 os.environ["AGENT_OFFICE_DB_PATH"] = _TMP
 sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.abspath(__file__))))
 from app.agents.insta import _dedup_and_filter_keywords, KEYWORD_MIN_SCORE
 def test_filters_below_threshold():
    """score < 임계값(0.7) 키워드는 제외."""
    kws = [
        {"id": 1, "keyword": "금리인하", "category": "경제", "score": 0.9},
        {"id": 2, "keyword": "환율", "category": "경제", "score": 0.6},  # 컷
        {"id": 3, "keyword": "반도체", "category": "경제", "score": 0.71},
    ]
    out = _dedup_and_filter_keywords(kws, min_score=0.7)
    kept = {k["keyword"] for k in out}
    assert kept == {"금리인하", "반도체"}
 def test_dedup_keeps_highest_score():
    """동일 keyword 중복 시 최고 score 1개만 유지."""
    kws = [
        {"id": 1, "keyword": "AI", "category": "경제", "score": 0.75},
        {"id": 2, "keyword": "AI", "category": "기술", "score": 0.92},  # 같은 키워드, 더 높음
    ]
    out = _dedup_and_filter_keywords(kws, min_score=0.7)
    assert len(out) == 1
    assert out[0]["id"] == 2
    assert out[0]["score"] == 0.92
 def test_sorted_by_score_desc():
    kws = [
        {"id": 1, "keyword": "a", "category": "c", "score": 0.72},
        {"id": 2, "keyword": "b", "category": "c", "score": 0.95},
        {"id": 3, "keyword": "c", "category": "c", "score": 0.80},
    ]
    out = _dedup_and_filter_keywords(kws, min_score=0.7)
    assert [k["keyword"] for k in out] == ["b", "c", "a"]
 def test_empty_when_all_below_threshold():
    kws = [{"id": 1, "keyword": "x", "category": "c", "score": 0.4}]
    assert _dedup_and_filter_keywords(kws, min_score=0.7) == []
 def test_default_threshold_is_0_7():
    assert KEYWORD_MIN_SCORE == 0.7
--- a/insta-lab/app/main.py
+++ b/insta-lab/app/main.py
@@ -271,12 +271,40 @@ class TemplateBody(BaseModel):
    description: str = ""
 def _default_prompt_templates() -> dict:
    """DB에 저장된 override가 없을 때 노출할 코드 기본값.
    생성 파이프라인이 실제로 폴백하는 값과 동일한 단일 소스를 사용."""
    return {
        "slate_writer": {
            "template": card_writer.DEFAULT_PROMPT,
            "description": "카드 10페이지 카피 생성 마스터 프롬프트 (Claude Sonnet). "
                           "{category}/{keyword}/{articles} 치환자 필수.",
        },
        "category_seeds": {
            "template": json.dumps(DEFAULT_CATEGORY_SEEDS, ensure_ascii=False, indent=2),
            "description": "트렌드 수집·분류용 카테고리별 시드 키워드 (JSON). "
                           "최상위 키가 분류 라벨로도 쓰임.",
        },
    }
@app.get("/api/insta/templates/prompts/{name}")
 def get_prompt(name: str):
    pt = db.get_prompt_template(name)
-    if not pt:
+    if pt:
        raise HTTPException(404)
        return pt
    # DB override 없음 → 코드 기본값 노출 (편집 UI가 마스터 프롬프트를 보고 수정 가능)
    defaults = _default_prompt_templates()
    if name in defaults:
        d = defaults[name]
        return {
            "name": name,
            "template": d["template"],
            "description": d["description"],
            "updated_at": None,
            "is_default": True,
        }
    raise HTTPException(404)
@app.put("/api/insta/templates/prompts/{name}")
--- a/insta-lab/tests/test_main_prompt_defaults.py
+++ b/insta-lab/tests/test_main_prompt_defaults.py
@@ -0,0 +1,63 @@
 import os
 import gc
 import json
 import tempfile
 import pytest
 from fastapi.testclient import TestClient
 from app import db as db_module
@pytest.fixture
 def client(monkeypatch):
    fd, path = tempfile.mkstemp(suffix=".db")
    os.close(fd)
    monkeypatch.setattr(db_module, "DB_PATH", path)
    db_module.init_db()
    from app import main
    monkeypatch.setattr(main, "DB_PATH", path)
    with TestClient(main.app) as c:
        yield c
    gc.collect()
    for ext in ("", "-wal", "-shm"):
        try:
            os.remove(path + ext)
        except OSError:
            pass
 def test_get_slate_writer_returns_default_when_unset(client):
    """DB에 없으면 코드 기본 마스터 프롬프트를 200으로 반환 (404 아님)."""
    resp = client.get("/api/insta/templates/prompts/slate_writer")
    assert resp.status_code == 200
    body = resp.json()
    assert body["is_default"] is True
    assert "{keyword}" in body["template"]
    assert "{category}" in body["template"]
 def test_get_category_seeds_returns_default_when_unset(client):
    """category_seeds 기본값은 유효한 JSON (카테고리→시드 배열)."""
    resp = client.get("/api/insta/templates/prompts/category_seeds")
    assert resp.status_code == 200
    body = resp.json()
    assert body["is_default"] is True
    seeds = json.loads(body["template"])
    assert "economy" in seeds and isinstance(seeds["economy"], list)
 def test_get_unknown_prompt_still_404(client):
    resp = client.get("/api/insta/templates/prompts/does_not_exist")
    assert resp.status_code == 404
 def test_saved_template_overrides_default(client):
    """PUT로 저장하면 이후 GET은 저장본(is_default 없음)을 반환."""
    client.put("/api/insta/templates/prompts/slate_writer",
               json={"template": "내 커스텀 프롬프트", "description": "custom"})
    resp = client.get("/api/insta/templates/prompts/slate_writer")
    assert resp.status_code == 200
    body = resp.json()
    assert body["template"] == "내 커스텀 프롬프트"
    assert not body.get("is_default")
--- a/stock/app/screener/ai_news/analyzer.py
+++ b/stock/app/screener/ai_news/analyzer.py
@@ -15,9 +15,15 @@ PROMPT_TEMPLATE = """다음은 종목 {name}({ticker})에 대한 최근 뉴스 {
 {news_block}
-이 뉴스들이 종목에 호재인지 악재인지 평가하세요.
+이 뉴스들이 종목 주가에 호재인지 악재인지 종합 평가하세요.
-score: -10(매우 강한 악재) ~ +10(매우 강한 호재) 사이의 실수. 0은 중립.
+
-reason: 30자 이내 한 줄 근거.
+규칙:
 - score: -10(매우 강한 악재) ~ +10(매우 강한 호재) 사이의 실수. 명확한 방향성이 없으면 0(중립).
 - 뉴스가 호재·악재로 섞여 있으면 주가에 더 우세한 쪽을 기준으로 부호를 정하세요.
 - reason은 반드시 score 부호와 같은 방향의 근거만 쓰세요.
  · score가 양수(호재)면 호재 근거만, 음수(악재)면 악재 근거만 적습니다.
  · 호재 평가에 악재 내용을, 악재 평가에 호재 내용을 섞지 마세요.
 - reason: 30자 이내 한 줄.
 JSON으로만 응답하세요. 다른 텍스트 금지:
 {{"score": <float>, "reason": "<string>"}}"""
--- a/stock/app/screener/ai_news/pipeline.py
+++ b/stock/app/screener/ai_news/pipeline.py
@@ -124,8 +124,10 @@ async def refresh_daily(
    if successes:
        _upsert_news_sentiment(conn, asof, successes, source="articles")
-    top_pos = sorted(successes, key=lambda r: -r["score_raw"])[:5]
+    # 부호 게이트: 호재(score>0)·악재(score<0)만 분류. score 미만 종목이 5개 미만이어도
-    top_neg = sorted(successes, key=lambda r: r["score_raw"])[:5]
+    # 반대 부호 종목으로 채우지 않음 (양수 종목이 악재란에 섞이는 문제 방지). 중립(0)은 제외.
    top_pos = sorted([r for r in successes if r["score_raw"] > 0], key=lambda r: -r["score_raw"])[:5]
    top_neg = sorted([r for r in successes if r["score_raw"] < 0], key=lambda r: r["score_raw"])[:5]
    return {
        "asof": asof.isoformat(),
--- a/stock/tests/test_ai_news_pipeline.py
+++ b/stock/tests/test_ai_news_pipeline.py
@@ -140,6 +140,71 @@ async def test_refresh_daily_no_match_ticker_skipped(conn):
    assert {r["ticker"] for r in rows} == {"005930"}
@pytest.mark.asyncio
 async def test_refresh_daily_sign_gate_no_positive_in_neg(conn):
    """전 종목 양수 점수면 top_neg는 비어야 함 (호재 종목이 악재란에 채워지면 안 됨)."""
    asof = dt.date(2026, 5, 13)
    fake_articles_by_ticker = {
        "005930": [{"title": "h", "summary": "", "press": "", "pub_date": ""}],
        "000660": [{"title": "h", "summary": "", "press": "", "pub_date": ""}],
        "373220": [{"title": "h", "summary": "", "press": "", "pub_date": ""}],
    }
    fake_stats = {"total_articles": 3, "matched_pairs": 3, "hit_tickers": 3}
    scores = {"005930": 6.0, "000660": 2.0, "373220": 0.5}  # 모두 양수
    async def fake_score(llm, ticker, news, *, name=None, model="m"):
        return {
            "ticker": ticker, "score_raw": scores[ticker], "reason": "r",
            "news_count": 1, "tokens_input": 1, "tokens_output": 1, "model": model,
        }
    with patch.object(pipeline, "articles_source") as mas, \
         patch.object(pipeline, "_analyzer") as ma, \
         patch.object(pipeline, "_make_llm") as ml:
        mas.gather_articles_for_tickers = MagicMock(return_value=(fake_articles_by_ticker, fake_stats))
        ma.score_sentiment = fake_score
        ml.return_value.__aenter__.return_value = AsyncMock()
        ml.return_value.__aexit__.return_value = None
        result = await pipeline.refresh_daily(conn, asof, concurrency=3)
    assert len(result["top_pos"]) == 3
    assert result["top_neg"] == []  # 양수 종목이 악재란에 들어가면 안 됨
@pytest.mark.asyncio
 async def test_refresh_daily_sign_gate_excludes_neutral(conn):
    """score=0(중립)은 호재·악재 어디에도 포함되지 않음."""
    asof = dt.date(2026, 5, 13)
    fake_articles_by_ticker = {
        "005930": [{"title": "h", "summary": "", "press": "", "pub_date": ""}],
        "000660": [{"title": "h", "summary": "", "press": "", "pub_date": ""}],
        "373220": [{"title": "h", "summary": "", "press": "", "pub_date": ""}],
    }
    fake_stats = {"total_articles": 3, "matched_pairs": 3, "hit_tickers": 3}
    scores = {"005930": 3.0, "000660": 0.0, "373220": -3.0}
    async def fake_score(llm, ticker, news, *, name=None, model="m"):
        return {
            "ticker": ticker, "score_raw": scores[ticker], "reason": "r",
            "news_count": 1, "tokens_input": 1, "tokens_output": 1, "model": model,
        }
    with patch.object(pipeline, "articles_source") as mas, \
         patch.object(pipeline, "_analyzer") as ma, \
         patch.object(pipeline, "_make_llm") as ml:
        mas.gather_articles_for_tickers = MagicMock(return_value=(fake_articles_by_ticker, fake_stats))
        ma.score_sentiment = fake_score
        ml.return_value.__aenter__.return_value = AsyncMock()
        ml.return_value.__aexit__.return_value = None
        result = await pipeline.refresh_daily(conn, asof, concurrency=3)
    pos_tickers = {r["ticker"] for r in result["top_pos"]}
    neg_tickers = {r["ticker"] for r in result["top_neg"]}
    assert pos_tickers == {"005930"}
    assert neg_tickers == {"373220"}
    assert "000660" not in pos_tickers and "000660" not in neg_tickers
 def test_top_market_cap_tickers(conn):
    out = pipeline._top_market_cap_tickers(conn, n=2)
    assert out == ["005930", "000660"]