market-aware AI cadence + incremental log updates

Two changes that together cut OpenRouter spend ~50% and give the daily log temporal awareness.

1. CadencePolicy (app/services/cadence.py): expensive AI jobs only fire hourly during the EU/US active window (Mon-Fri 07-21 UTC). Off-hours weekdays throttle to every 4h; weekends to every 12h. ai_log_job and indicator_summary_job both consult the policy before doing real work; market/news/portfolio ingest jobs stay hourly (cheap, no API cost). Skipped runs land in job_runs with status 'skipped' and the throttle reason in the error column.

2. Update mode for ai_log_job: when an earlier log exists for the current UTC day, it's passed to the model as 'Earlier log from today (generated HH:MM UTC)'. The system prompt grows an Update mode section instructing the model to revise — not restart — and anchor on what has CHANGED since the earlier draft. The TL;DR leads with intra-day change when meaningful, the watch list evolves rather than restarts. PROMPT_VERSION bumped to 5.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
2026-05-16 10:17:39 +01:00 · 2026-05-16 10:17:39 +01:00 · 40cfb50e37
commit 40cfb50e37
parent 2f223b75a3
4 changed files with 157 additions and 6 deletions
--- a/app/jobs/ai_log_job.py
+++ b/app/jobs/ai_log_job.py
@ -13,7 +13,8 @@ from sqlalchemy import desc, func, select
 from app.config import get_settings
 from app.db import utcnow
 from app.jobs._helpers import job_lifecycle, log
-from app.models import AICall, Headline, Quote, StrategicLog
+from app.models import AICall, Headline, JobRun, Quote, StrategicLog
+from app.services.cadence import DEFAULT_POLICY
 from app.services.openrouter import (
    PROMPT_VERSION,
    build_system_prompt,
@ -102,6 +103,20 @@ async def run() -> None:
            jr.status = "skipped"
            return

+        # Cadence: hourly during EU/US active hours; throttled off-hours.
+        last_success = (await session.execute(
+            select(func.max(JobRun.finished_at)).where(
+                JobRun.name == "ai_log_job",
+                JobRun.status == "success",
+            )
+        )).scalar()
+        should_run, reason = DEFAULT_POLICY.should_run(last_success)
+        if not should_run:
+            log.info("ai_log.cadence_skip", reason=reason)
+            jr.status = "skipped"
+            jr.error = reason
+            return
+
        spent = await _month_spend(session)
        if spent >= s.OPENROUTER_MONTHLY_CAP_USD:
            log.warning("ai_log.cap_reached", spent=spent,
@ -117,6 +132,17 @@ async def run() -> None:
            jr.status = "skipped"
            return

+        # Look up the most recent log generated today (UTC) so the model can
+        # update it rather than start from scratch. This gives the model
+        # temporal awareness — "since this morning's read, X has changed".
+        today_start = utcnow().replace(hour=0, minute=0, second=0, microsecond=0)
+        previous_log = (await session.execute(
+            select(StrategicLog)
+            .where(StrategicLog.generated_at >= today_start)
+            .order_by(desc(StrategicLog.generated_at))
+            .limit(1)
+        )).scalar_one_or_none()
+
        anchor = s.CASSANDRA_ANCHOR_DATE or None
        user_prompt = build_user_prompt(
            today=utcnow(),
@ -124,6 +150,7 @@ async def run() -> None:
            quotes_by_group=quotes,
            headlines_by_bucket=news,
            reference_line=REFERENCE_LINE,
+            previous_log=previous_log,
        )

        system_prompt = build_system_prompt(s.CASSANDRA_TONE, s.CASSANDRA_ANALYSIS)
--- a/app/jobs/indicator_summary_job.py
+++ b/app/jobs/indicator_summary_job.py
@ -13,7 +13,8 @@ from sqlalchemy import desc, func, select
 from app.config import get_settings, load_groups
 from app.db import utcnow
 from app.jobs._helpers import job_lifecycle, log
-from app.models import AICall, IndicatorSummary, Quote
+from app.models import AICall, IndicatorSummary, JobRun, Quote
+from app.services.cadence import DEFAULT_POLICY
 from app.services.openrouter import (
    PROMPT_VERSION,
    build_aggregate_summary_system_prompt,
@ -234,6 +235,21 @@ async def run() -> None:
            jr.status = "skipped"
            return

+        # Cadence — same policy as ai_log_job: hourly during EU/US active,
+        # throttled off-hours and weekends.
+        last_success = (await session.execute(
+            select(func.max(JobRun.finished_at)).where(
+                JobRun.name == "indicator_summary_job",
+                JobRun.status == "success",
+            )
+        )).scalar()
+        should_run, reason = DEFAULT_POLICY.should_run(last_success)
+        if not should_run:
+            log.info("ind_summary.cadence_skip", reason=reason)
+            jr.status = "skipped"
+            jr.error = reason
+            return
+
        spent = await _month_spend(session)
        if spent >= s.OPENROUTER_MONTHLY_CAP_USD:
            jr.status = "skipped"
--- a/app/services/cadence.py
+++ b/app/services/cadence.py
@ -0,0 +1,66 @@
+"""When should expensive AI jobs fire?
+
+Markets matter. The scheduler wakes every hour, but there's no point spending
+OpenRouter tokens at 03:00 UTC on a Sunday when nothing has moved. This module
+encodes a single policy: weekday active hours (LSE open through NYSE close,
+roughly 07:00-21:00 UTC) get the full hourly cadence; off-hours and weekends
+get throttled.
+
+Used by ai_log_job and indicator_summary_job to decide whether to run NOW or
+skip until enough time has passed since the last successful run. Market /
+news / portfolio ingestion jobs keep running hourly — they're cheap.
+"""
+from __future__ import annotations
+
+from dataclasses import dataclass
+from datetime import datetime, timezone
+
+
+@dataclass(frozen=True)
+class CadencePolicy:
+    # Active window in UTC. LSE opens 08:00 London time → 07:00 UTC in summer
+    # (BST), 08:00 UTC in winter. NYSE closes 16:00 ET → 20:00 UTC in summer
+    # (EDT), 21:00 UTC in winter (EST). 07:00-21:00 UTC covers both year-round.
+    active_start_hour: int = 7
+    active_end_hour: int = 21
+    # Minimum gap between successful runs outside the active window.
+    off_hours_gap_h: float = 4.0
+    weekend_gap_h: float = 12.0
+
+    def is_active_window(self, now: datetime | None = None) -> bool:
+        now = now or datetime.now(timezone.utc)
+        if now.weekday() >= 5:  # Saturday / Sunday
+            return False
+        return self.active_start_hour <= now.hour < self.active_end_hour
+
+    def min_gap_hours(self, now: datetime | None = None) -> float:
+        now = now or datetime.now(timezone.utc)
+        if now.weekday() >= 5:
+            return self.weekend_gap_h
+        if self.is_active_window(now):
+            return 0.0  # always run during the active window
+        return self.off_hours_gap_h
+
+    def should_run(
+        self,
+        last_success_at: datetime | None,
+        now: datetime | None = None,
+    ) -> tuple[bool, str]:
+        """Returns (should_run, reason). The reason is human-readable for logs
+        and the job_runs.error column when a run is skipped."""
+        now = now or datetime.now(timezone.utc)
+        if self.is_active_window(now):
+            return True, "active window"
+        min_gap = self.min_gap_hours(now)
+        if last_success_at is None:
+            return True, "no prior successful run"
+        # Normalise tz; DB returns naive but we treat it as UTC.
+        if last_success_at.tzinfo is None:
+            last_success_at = last_success_at.replace(tzinfo=timezone.utc)
+        age_h = (now - last_success_at).total_seconds() / 3600.0
+        if age_h >= min_gap:
+            return True, f"off-hours but last run {age_h:.1f}h ago (≥ {min_gap}h)"
+        return False, f"off-hours throttled — last run {age_h:.1f}h ago (< {min_gap}h)"
+
+
+DEFAULT_POLICY = CadencePolicy()
--- a/app/services/openrouter.py
+++ b/app/services/openrouter.py
@ -20,7 +20,7 @@ OPENROUTER_URL = "https://openrouter.ai/api/v1/chat/completions"
 # Bump when the composed prompt changes meaningfully. Stored on every
 # StrategicLog row so historical logs can be linked to the prompt that produced
 # them.
-PROMPT_VERSION = 4
+PROMPT_VERSION = 5


 # --- Core: invariant across tone/analysis settings ----------------------------
@ -99,7 +99,23 @@ Close the log with a single sentence on a line of its own, formatted exactly:

 This is the line a reader who only sees the watch list scrolls down to. Make \
 it earn its place: cite real signals (HY OAS, breadth, VIX, valuation, real \
-yields), not vibes."""
+yields), not vibes.
+
+# Update mode (when an earlier log from today is provided)
+If the user message includes a section labelled "Earlier log from today \
+(generated HH:MM UTC)", treat that as YOUR OWN earlier draft. You are \
+UPDATING it for the current data, not starting from scratch.
+- Don't restate context that hasn't changed. Anchor on what's moved SINCE \
+that timestamp: confirmations, refutations, new emergent patterns.
+- The TL;DR should lead with the move since the earlier read when there \
+was a meaningful intra-day change ("Since this morning's read, …") — \
+otherwise stay regime-level.
+- The watch list should evolve: drop items that triggered or settled, add \
+items that emerged. Keep items still load-bearing.
+- Preserve any insights from the earlier draft that remain valid; sharpen \
+or revise the ones that don't. Avoid contradicting yourself silently — if \
+you change a stance, name it briefly ("Earlier I read X; with Y now, the \
+read shifts to Z")."""


 # --- Tone: audience-shaping block --------------------------------------------
@ -312,8 +328,11 @@ def build_user_prompt(
    quotes_by_group: dict[str, list[dict]],
    headlines_by_bucket: dict[str, list[dict]],
    reference_line: str | None = None,
+    previous_log: object | None = None,
 ) -> str:
-    """Assemble the user message from already-fetched-and-persisted data."""
+    """Assemble the user message from already-fetched-and-persisted data.
+    If `previous_log` is a StrategicLog from earlier today, it's included
+    as 'Update mode' context — the model will revise rather than restart."""
    parts = [f"# Strategic log request — {today.strftime('%Y-%m-%d')}"]
    if anchor:
        parts.append(f"Anchor reference date: {anchor}")
@ -322,6 +341,20 @@ def build_user_prompt(
            "\n## Reference snapshot (when the macro thesis was authored)"
            f"\n{reference_line}\nCompare live readings against it."
        )
+
+    if previous_log is not None:
+        gen = getattr(previous_log, "generated_at", None)
+        ts = gen.strftime("%H:%M UTC") if gen else "earlier today"
+        parts.append(
+            f"\n## Earlier log from today (generated {ts})\n"
+            "Treat this as YOUR OWN earlier draft for today. Update it for\n"
+            "the current data — don't restate unchanged context. See the\n"
+            "'Update mode' section of the system prompt for how to handle it.\n"
+            "```markdown\n"
+            f"{previous_log.content}\n"
+            "```"
+        )
+
    parts.append("\n## Live market data (per group)")
    parts.append("```json\n" + json.dumps(quotes_by_group, indent=2, default=str) + "\n```")
    parts.append("\n## News flow (last 24h, filtered by bucket)")
@ -331,11 +364,20 @@ def build_user_prompt(
        parts.append(f"\n### {label.upper()}")
        for h in items[:30]:
            parts.append(f"- [{h['when'][:16].replace('T',' ')}] [{h['source']}] {h['title']}")
-    parts.append(
+
+    task_line = (
        "\n## Task\nWrite the daily strategic log in ~800 words, following "
        "the discipline in the system prompt. No preamble; begin directly "
        "with the date header."
    )
+    if previous_log is not None:
+        task_line = (
+            "\n## Task\nUpdate the earlier log above for the current data. "
+            "Keep the same structure (date header, TL;DR, sections, watch "
+            "list, system temperature) but anchor on what has CHANGED since "
+            "the earlier draft's timestamp. ~800 words. No preamble."
+        )
+    parts.append(task_line)
    return "\n".join(parts)