feat(reco): gate cold_start engines by nsessions (FFM-1161) (#248)

ohld · web-flow · commit bb14d0adf363 · 2026-05-11T08:47:29.000+08:00
Diagnostic in FFM-1107 showed cold_start_adapt was serving users averaging
198 days old with 2 lifetime sessions — dormant returners, not fresh users.
Continuation was only 5% despite a healthy 50% LR at position 1, because
the engine optimizes for users with zero history while the population had
stale preferences.

Add an nsessions gate behind COLD_START_NSESSIONS_GATE_ENABLED:
- pulls nsessions from user_stats into the cached user_info payload
- restricts cold_start_explore / cold_start_adapt to nsessions <= 1
- dormant returners (nmemes_sent < 30, nsessions >= 2) fall through to
  the growing-user blender, which has stale-but-real signal to work with

Feature flag defaults off so this lands behind a config toggle and stays
disjoint from the recently_liked_blender_v2 read (FFM-1094, May 17-18).
diff --git a/experiments/log.jsonl b/experiments/log.jsonl
@@ -50,3 +50,4 @@
 {"timestamp":"2026-04-20T03:40:00Z","agent":"ceo","action":"experiment_created","status":"success","summary":"Created early-channel-popup experiment: move popup.telegram_channel from meme #50 to #5 with conversion tracking","details":{"experiment":"2026-04-20-early-channel-popup","reason":"75% of new users leave before meme #5, channel popup at #50 reaches almost nobody. Channel = retention anchor via TG feed. Approved by founder.","impact":"Expected: 10%+ subscribe rate (vs ~0% at #50), improved D7 retention for subscribers","cto_task":"FFM-590","analyst_task":"FFM-591"},"error":null}
 {"timestamp":"2026-04-20T09:30:00Z","agent":"ceo","action":"daily_review","status":"success","summary":"Weekly CEO review. Retro: 22 commits, 1.0k LOC, 8 PRs, 59% fix ratio, 5-day streak. WAU 589 (-13% WoW) is #1 concern. Goat experiment Day 7/14 all green (LR 41.9% vs 39.4% baseline). Early-channel-popup waiting on deploy. describe_memes structurally rate-limited (0.7% coverage). 31 stale QA issues need cleanup.","details":{"north_star":30,"wau":589,"wau_change":"-13%","active_experiments":["goat-recency-filter (Day 7/14, all green, conclude Apr 27)","early-channel-popup (code ready, FFM-590 in_review, not deployed)"],"retro":{"commits":22,"fix_ratio":"59%","test_ratio":"3%","streak_days":5,"ship_of_week":"goat recency filter PR #169 + describe_memes hardening (6 commits)"},"actions":["experiment_continue: goat-recency-filter — all metrics passing, Day 7/14","task_created: FFM-598 CTO — deploy early-channel-popup branch (HIGH)","task_created: FFM-599 CTO — structural fix for describe_memes rate limiting (HIGH)","task_created: FFM-600 CTO — batch close 31 stale QA issues (LOW)","todos_updated: marked goat recency filter as DONE in TODOS.md"],"priorities_next_week":["1. Deploy early-channel-popup (retention lever for WAU decline)","2. Fix describe_memes structurally (content quality)","3. Monitor goat experiment through Apr 27","4. Clean up stale issues"]},"error":null}
 {"timestamp":"2026-05-01T07:15:11Z","agent":"comms-manager","action":"daily_channel_post","status":"success","summary":"Published meme-of-April kulich highlight to @fastfoodmemes: 44% like rate, 60 likes from 133 sends.","details":{"task":"FFM-866","channel":"@fastfoodmemes","url":"https://t.me/fastfoodmemes/12590","telegram_message_id":12590,"editorial_post_id":1,"category":"E","entity_id":"meme:top_lr_10119534","note":"Fun meme findings may target the main RU meme channel; build-in-public/product/process posts target @ffmemes."},"error":null}
+{"timestamp":"2026-05-11T00:00:00Z","agent":"cto","action":"experiment_started","status":"success","summary":"FFM-1161: cold-start nsessions gate + feature flag shipped to PR. Adds nsessions to user_info, gates cold_start_explore/adapt to nsessions<=1 behind COLD_START_NSESSIONS_GATE_ENABLED. Dormant returners (nmemes_sent<30 but nsessions>=2) fall through to growing-user blender.","details":{"issue":"FFM-1161","experiment":"2026-05-11-cold-start-routing-fix","feature_flag":"COLD_START_NSESSIONS_GATE_ENABLED","files":["src/config.py","src/tgbot/service.py","src/recommendations/meme_queue.py","tests/recommendations/test_meme_queue.py"],"tests":"19/19 mocked tests green; DB integration tests require Docker","coordination":"Do not deploy until recently_liked_blender_v2 (FFM-1094) May 17-18 read is in flight — coordinate with Release Engineer."},"error":null}
diff --git a/src/config.py b/src/config.py
@@ -49,6 +49,11 @@ class Config(BaseSettings):
     DEEPSEEK_BASE_URL: str = "https://api.deepseek.com"
     CHAT_AGENT_ENABLED: bool = False
 
+    # FFM-1161: gate cold_start engines so they only serve genuinely-new users
+    # (nsessions <= 1). Dormant returners with nmemes_sent < 30 but multiple
+    # sessions fall through to the growing-user blender instead.
+    COLD_START_NSESSIONS_GATE_ENABLED: bool = False
+
     PREFECT_API_URL: str | None = None
     PREFECT_AUTH_STRING: str | None = None
 
diff --git a/src/recommendations/meme_queue.py b/src/recommendations/meme_queue.py
@@ -6,6 +6,7 @@
 from sqlalchemy import text
 
 from src import redis
+from src.config import settings
 from src.database import fetch_all
 from src.recommendations.blender import blend
 from src.recommendations.blender_experiments import (
@@ -95,6 +96,11 @@ async def generate_recommendations(
     if nmemes_sent is None:
         nmemes_sent = user_info["nmemes_sent"]
 
+    # FFM-1161: nsessions gate. cold_start engines were designed for first-session
+    # users; the cached user_info may predate the gate (1h TTL) — treat missing as 0
+    # so stale entries keep the pre-gate cold_start routing until the cache refreshes.
+    nsessions = user_info.get("nsessions") or 0
+
     queue_key = redis.get_meme_queue_key(user_id)
 
     meme_ids_in_queue = []
@@ -149,10 +155,19 @@ async def get_candidates(user_id, limit, use_recently_liked_blender_v2: bool = T
           Phase 3 (16-30): Transition — blend adapt + growing engines
 
         Fallback chain: phase engine -> lr_smoothed -> best_uploaded_memes
+
+        FFM-1161: when COLD_START_NSESSIONS_GATE_ENABLED, cold_start is only
+        used for first-session users (nsessions <= 1). Dormant returners
+        (nsessions >= 2, nmemes_sent < 30) fall through to the growing-user
+        blender below — they have stale signal, not zero signal.
         """
 
+        in_cold_start_window = nmemes_sent < 30
+        if settings.COLD_START_NSESSIONS_GATE_ENABLED:
+            in_cold_start_window = in_cold_start_window and nsessions <= 1
+
         # Cold start: 3-phase adaptive
-        if nmemes_sent < 30:
+        if in_cold_start_window:
             if nmemes_sent < 6:
                 # Phase 1: diverse exploration from top sources
                 engine = "cold_start_explore"
diff --git a/src/tgbot/service.py b/src/tgbot/service.py
@@ -358,6 +358,7 @@ async def get_user_info(
         SELECT
             type,
             COALESCE(nmemes_sent, 0) nmemes_sent,
+            COALESCE(nsessions, 0) nsessions,
             COALESCE(memes_watched_today, 0) memes_watched_today,
             UIL.interface_lang
         FROM "user" AS U
diff --git a/tests/recommendations/test_meme_queue.py b/tests/recommendations/test_meme_queue.py
@@ -13,6 +13,15 @@
 TEST_USER_ID = 99999
 
 
+def _patch_user_info(nsessions: int = 0, nmemes_sent: int = 0, **extra):
+    user_info = defaultdict(int, {"nmemes_sent": nmemes_sent, "nsessions": nsessions, **extra})
+    return patch(
+        "src.recommendations.meme_queue.get_user_info",
+        new_callable=AsyncMock,
+        return_value=user_info,
+    )
+
+
 @pytest.fixture(autouse=True)
 def mock_redis():
     """Mock Redis and user_info calls — these tests validate blending logic, not Redis."""
@@ -488,3 +497,151 @@ class TestRetriever(CandidatesRetriever):
     for nmemes in [0, 3, 8, 12, 20, 25]:
         candidates = await generate_recommendations(TEST_USER_ID, 10, nmemes, TestRetriever())
         assert len(candidates) == 0, f"Expected empty at nmemes_sent={nmemes}"
+
+
+# ── FFM-1161: nsessions gate ──
+
+
+def _growing_retriever_class():
+    """Retriever covering both cold_start engines and the growing-user blender."""
+
+    async def cold_start_explore(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 101, "recommended_by": "cold_start_explore"}]
+
+    async def cold_start_adapt(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 201, "recommended_by": "cold_start_adapt"}]
+
+    async def lr_smoothed(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 301, "recommended_by": "lr_smoothed"}]
+
+    async def best_uploaded_memes(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 401, "recommended_by": "best_uploaded_memes"}]
+
+    async def like_spread_and_recent_memes(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 501, "recommended_by": "like_spread_and_recent_memes"}]
+
+    async def recently_liked(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 601, "recommended_by": "recently_liked"}]
+
+    async def goat(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 701, "recommended_by": "goat"}]
+
+    async def es_ranked(self, user_id, limit=10, exclude_meme_ids=[], **kw):
+        return [{"id": 801, "recommended_by": "es_ranked"}]
+
+    class TestRetriever(CandidatesRetriever):
+        engine_map = {
+            "cold_start_explore": cold_start_explore,
+            "cold_start_adapt": cold_start_adapt,
+            "lr_smoothed": lr_smoothed,
+            "best_uploaded_memes": best_uploaded_memes,
+            "like_spread_and_recent_memes": like_spread_and_recent_memes,
+            "recently_liked": recently_liked,
+            "goat": goat,
+            "es_ranked": es_ranked,
+        }
+
+    return TestRetriever
+
+
+@pytest.mark.asyncio
+async def test_gate_off_dormant_returner_still_uses_cold_start():
+    """Default (gate disabled): nsessions is ignored — cold_start still routes by nmemes_sent."""
+    retriever = _growing_retriever_class()()
+    with (
+        _patch_user_info(nsessions=5, nmemes_sent=8),
+        patch("src.config.settings.COLD_START_NSESSIONS_GATE_ENABLED", False),
+    ):
+        candidates = await generate_recommendations(
+            TEST_USER_ID, 10, nmemes_sent=8, retriever=retriever
+        )
+    assert any(c["recommended_by"] == "cold_start_adapt" for c in candidates)
+
+
+@pytest.mark.asyncio
+async def test_gate_on_first_session_routes_to_cold_start_explore():
+    """Gate on + nsessions<=1 + nmemes_sent<6 → cold_start_explore (Phase 1)."""
+    retriever = _growing_retriever_class()()
+    with (
+        _patch_user_info(nsessions=0, nmemes_sent=0),
+        patch("src.config.settings.COLD_START_NSESSIONS_GATE_ENABLED", True),
+    ):
+        candidates = await generate_recommendations(
+            TEST_USER_ID, 10, nmemes_sent=0, retriever=retriever
+        )
+    assert len(candidates) == 1
+    assert candidates[0]["recommended_by"] == "cold_start_explore"
+
+
+@pytest.mark.asyncio
+async def test_gate_on_first_session_phase2_routes_to_cold_start_adapt():
+    """Gate on + nsessions<=1 + 6<=nmemes_sent<16 → cold_start_adapt (Phase 2)."""
+    retriever = _growing_retriever_class()()
+    with (
+        _patch_user_info(nsessions=1, nmemes_sent=8),
+        patch("src.config.settings.COLD_START_NSESSIONS_GATE_ENABLED", True),
+    ):
+        candidates = await generate_recommendations(
+            TEST_USER_ID, 10, nmemes_sent=8, retriever=retriever
+        )
+    assert any(c["recommended_by"] == "cold_start_adapt" for c in candidates)
+
+
+@pytest.mark.asyncio
+async def test_gate_on_dormant_returner_falls_through_to_growing_blender():
+    """Gate on + nsessions>=2 + nmemes_sent<30 → growing-user blender, NO cold_start engines."""
+    retriever = _growing_retriever_class()()
+    with (
+        _patch_user_info(nsessions=3, nmemes_sent=12),
+        patch("src.config.settings.COLD_START_NSESSIONS_GATE_ENABLED", True),
+    ):
+        candidates = await generate_recommendations(
+            TEST_USER_ID, 10, nmemes_sent=12, retriever=retriever, random_seed=42
+        )
+    sources = {c["recommended_by"] for c in candidates}
+    assert "cold_start_explore" not in sources
+    assert "cold_start_adapt" not in sources
+    # Growing blender is pinned at lr_smoothed in position 0
+    assert candidates[0]["recommended_by"] == "lr_smoothed"
+
+
+@pytest.mark.asyncio
+async def test_gate_on_mature_user_unchanged():
+    """Gate on + mature user (nmemes_sent>=100) → blender_v2 path, untouched by gate."""
+    retriever = _growing_retriever_class()()
+    with (
+        _patch_user_info(nsessions=5, nmemes_sent=120),
+        patch("src.config.settings.COLD_START_NSESSIONS_GATE_ENABLED", True),
+        patch(
+            "src.recommendations.meme_queue.get_recently_liked_blender_v2_weights",
+            new_callable=AsyncMock,
+            return_value=MATURE_BLENDER_TREATMENT_WEIGHTS,
+        ) as get_weights,
+    ):
+        candidates = await generate_recommendations(
+            TEST_USER_ID, 10, nmemes_sent=120, retriever=retriever, random_seed=42
+        )
+    sources = {c["recommended_by"] for c in candidates}
+    assert "cold_start_explore" not in sources
+    assert "cold_start_adapt" not in sources
+    get_weights.assert_awaited_once_with(TEST_USER_ID)
+
+
+@pytest.mark.asyncio
+async def test_gate_on_missing_nsessions_treated_as_zero():
+    """Stale cache without nsessions key → treated as 0, cold_start still applies."""
+    retriever = _growing_retriever_class()()
+    # user_info lacks 'nsessions' (defaultdict(int) returns 0)
+    stale_info = defaultdict(int, {"nmemes_sent": 4})
+    with (
+        patch(
+            "src.recommendations.meme_queue.get_user_info",
+            new_callable=AsyncMock,
+            return_value=stale_info,
+        ),
+        patch("src.config.settings.COLD_START_NSESSIONS_GATE_ENABLED", True),
+    ):
+        candidates = await generate_recommendations(
+            TEST_USER_ID, 10, nmemes_sent=4, retriever=retriever
+        )
+    assert candidates[0]["recommended_by"] == "cold_start_explore"