market-aware AI cadence + incremental log updates

Two changes that together cut OpenRouter spend ~50% and give the daily
log temporal awareness.

1. CadencePolicy (app/services/cadence.py): expensive AI jobs only
   fire hourly during the EU/US active window (Mon-Fri 07-21 UTC).
   Off-hours weekdays throttle to every 4h; weekends to every 12h.
   ai_log_job and indicator_summary_job both consult the policy before
   doing real work; market/news/portfolio ingest jobs stay hourly
   (cheap, no API cost). Skipped runs land in job_runs with status
   'skipped' and the throttle reason in error.

2. Update mode for ai_log_job: when an earlier log exists for the
   current UTC day, it's passed to the model as 'Earlier log from
   today (generated HH:MM UTC)'. The system prompt grows an Update
   mode section instructing the model to revise — not restart — and
   anchor on what has CHANGED since the earlier draft. The TL;DR
   leads with intra-day change when meaningful, the watch list evolves
   rather than restarts. PROMPT_VERSION bumped to 5.

Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
This commit is contained in:
Giorgio Gilestro 2026-05-16 10:17:39 +01:00
parent 2f223b75a3
commit 40cfb50e37
4 changed files with 157 additions and 6 deletions

View file

@ -13,7 +13,8 @@ from sqlalchemy import desc, func, select
from app.config import get_settings from app.config import get_settings
from app.db import utcnow from app.db import utcnow
from app.jobs._helpers import job_lifecycle, log from app.jobs._helpers import job_lifecycle, log
from app.models import AICall, Headline, Quote, StrategicLog from app.models import AICall, Headline, JobRun, Quote, StrategicLog
from app.services.cadence import DEFAULT_POLICY
from app.services.openrouter import ( from app.services.openrouter import (
PROMPT_VERSION, PROMPT_VERSION,
build_system_prompt, build_system_prompt,
@ -102,6 +103,20 @@ async def run() -> None:
jr.status = "skipped" jr.status = "skipped"
return return
# Cadence: hourly during EU/US active hours; throttled off-hours.
last_success = (await session.execute(
select(func.max(JobRun.finished_at)).where(
JobRun.name == "ai_log_job",
JobRun.status == "success",
)
)).scalar()
should_run, reason = DEFAULT_POLICY.should_run(last_success)
if not should_run:
log.info("ai_log.cadence_skip", reason=reason)
jr.status = "skipped"
jr.error = reason
return
spent = await _month_spend(session) spent = await _month_spend(session)
if spent >= s.OPENROUTER_MONTHLY_CAP_USD: if spent >= s.OPENROUTER_MONTHLY_CAP_USD:
log.warning("ai_log.cap_reached", spent=spent, log.warning("ai_log.cap_reached", spent=spent,
@ -117,6 +132,17 @@ async def run() -> None:
jr.status = "skipped" jr.status = "skipped"
return return
# Look up the most recent log generated today (UTC) so the model can
# update it rather than start from scratch. This gives the model
# temporal awareness — "since this morning's read, X has changed".
today_start = utcnow().replace(hour=0, minute=0, second=0, microsecond=0)
previous_log = (await session.execute(
select(StrategicLog)
.where(StrategicLog.generated_at >= today_start)
.order_by(desc(StrategicLog.generated_at))
.limit(1)
)).scalar_one_or_none()
anchor = s.CASSANDRA_ANCHOR_DATE or None anchor = s.CASSANDRA_ANCHOR_DATE or None
user_prompt = build_user_prompt( user_prompt = build_user_prompt(
today=utcnow(), today=utcnow(),
@ -124,6 +150,7 @@ async def run() -> None:
quotes_by_group=quotes, quotes_by_group=quotes,
headlines_by_bucket=news, headlines_by_bucket=news,
reference_line=REFERENCE_LINE, reference_line=REFERENCE_LINE,
previous_log=previous_log,
) )
system_prompt = build_system_prompt(s.CASSANDRA_TONE, s.CASSANDRA_ANALYSIS) system_prompt = build_system_prompt(s.CASSANDRA_TONE, s.CASSANDRA_ANALYSIS)

View file

@ -13,7 +13,8 @@ from sqlalchemy import desc, func, select
from app.config import get_settings, load_groups from app.config import get_settings, load_groups
from app.db import utcnow from app.db import utcnow
from app.jobs._helpers import job_lifecycle, log from app.jobs._helpers import job_lifecycle, log
from app.models import AICall, IndicatorSummary, Quote from app.models import AICall, IndicatorSummary, JobRun, Quote
from app.services.cadence import DEFAULT_POLICY
from app.services.openrouter import ( from app.services.openrouter import (
PROMPT_VERSION, PROMPT_VERSION,
build_aggregate_summary_system_prompt, build_aggregate_summary_system_prompt,
@ -234,6 +235,21 @@ async def run() -> None:
jr.status = "skipped" jr.status = "skipped"
return return
# Cadence — same policy as ai_log_job: hourly during EU/US active,
# throttled off-hours and weekends.
last_success = (await session.execute(
select(func.max(JobRun.finished_at)).where(
JobRun.name == "indicator_summary_job",
JobRun.status == "success",
)
)).scalar()
should_run, reason = DEFAULT_POLICY.should_run(last_success)
if not should_run:
log.info("ind_summary.cadence_skip", reason=reason)
jr.status = "skipped"
jr.error = reason
return
spent = await _month_spend(session) spent = await _month_spend(session)
if spent >= s.OPENROUTER_MONTHLY_CAP_USD: if spent >= s.OPENROUTER_MONTHLY_CAP_USD:
jr.status = "skipped" jr.status = "skipped"

66
app/services/cadence.py Normal file
View file

@ -0,0 +1,66 @@
"""When should expensive AI jobs fire?
Markets matter. The scheduler wakes every hour, but there's no point spending
OpenRouter tokens at 03:00 UTC on a Sunday when nothing has moved. This module
encodes a single policy: weekday active hours (LSE open through NYSE close,
roughly 07:00-21:00 UTC) get the full hourly cadence; off-hours and weekends
get throttled.
Used by ai_log_job and indicator_summary_job to decide whether to run NOW or
skip until enough time has passed since the last successful run. Market /
news / portfolio ingestion jobs keep running hourly they're cheap.
"""
from __future__ import annotations
from dataclasses import dataclass
from datetime import datetime, timezone
@dataclass(frozen=True)
class CadencePolicy:
# Active window in UTC. LSE opens 07:00 BST → 07:00 UTC summer, 08:00 UTC
# winter. NYSE closes 16:00 ET → 21:00 UTC summer, 21:00 UTC winter. The
# combined EU/US trading window is well covered by 07:00-21:00 UTC.
active_start_hour: int = 7
active_end_hour: int = 21
# Minimum gap between successful runs outside the active window.
off_hours_gap_h: float = 4.0
weekend_gap_h: float = 12.0
def is_active_window(self, now: datetime | None = None) -> bool:
now = now or datetime.now(timezone.utc)
if now.weekday() >= 5: # Saturday / Sunday
return False
return self.active_start_hour <= now.hour < self.active_end_hour
def min_gap_hours(self, now: datetime | None = None) -> float:
now = now or datetime.now(timezone.utc)
if now.weekday() >= 5:
return self.weekend_gap_h
if self.is_active_window(now):
return 0.0 # always run during the active window
return self.off_hours_gap_h
def should_run(
self,
last_success_at: datetime | None,
now: datetime | None = None,
) -> tuple[bool, str]:
"""Returns (should_run, reason). The reason is human-readable for logs
and the job_runs.error column when a run is skipped."""
now = now or datetime.now(timezone.utc)
if self.is_active_window(now):
return True, "active window"
min_gap = self.min_gap_hours(now)
if last_success_at is None:
return True, "no prior successful run"
# Normalise tz; DB returns naive but we treat it as UTC.
if last_success_at.tzinfo is None:
last_success_at = last_success_at.replace(tzinfo=timezone.utc)
age_h = (now - last_success_at).total_seconds() / 3600.0
if age_h >= min_gap:
return True, f"off-hours but last run {age_h:.1f}h ago (≥ {min_gap}h)"
return False, f"off-hours throttled — last run {age_h:.1f}h ago (< {min_gap}h)"
DEFAULT_POLICY = CadencePolicy()

View file

@ -20,7 +20,7 @@ OPENROUTER_URL = "https://openrouter.ai/api/v1/chat/completions"
# Bump when the composed prompt changes meaningfully. Stored on every # Bump when the composed prompt changes meaningfully. Stored on every
# StrategicLog row so historical logs can be linked to the prompt that produced # StrategicLog row so historical logs can be linked to the prompt that produced
# them. # them.
PROMPT_VERSION = 4 PROMPT_VERSION = 5
# --- Core: invariant across tone/analysis settings ---------------------------- # --- Core: invariant across tone/analysis settings ----------------------------
@ -99,7 +99,23 @@ Close the log with a single sentence on a line of its own, formatted exactly:
This is the line a reader who only sees the watch list scrolls down to. Make \ This is the line a reader who only sees the watch list scrolls down to. Make \
it earn its place: cite real signals (HY OAS, breadth, VIX, valuation, real \ it earn its place: cite real signals (HY OAS, breadth, VIX, valuation, real \
yields), not vibes.""" yields), not vibes.
# Update mode (when an earlier log from today is provided)
If the user message includes a section labelled "Earlier log from today \
(generated HH:MM UTC)", treat that as YOUR OWN earlier draft. You are \
UPDATING it for the current data, not starting from scratch.
- Don't restate context that hasn't changed. Anchor on what's moved SINCE \
that timestamp: confirmations, refutations, new emergent patterns.
- The TL;DR should lead with the move since the earlier read when there \
was a meaningful intra-day change ("Since this morning's read, …") \
otherwise stay regime-level.
- The watch list should evolve: drop items that triggered or settled, add \
items that emerged. Keep items still load-bearing.
- Preserve any insights from the earlier draft that remain valid; sharpen \
or revise the ones that don't. Avoid contradicting yourself silently — if \
you change a stance, name it briefly ("Earlier I read X; with Y now, the \
read shifts to Z")."""
# --- Tone: audience-shaping block -------------------------------------------- # --- Tone: audience-shaping block --------------------------------------------
@ -312,8 +328,11 @@ def build_user_prompt(
quotes_by_group: dict[str, list[dict]], quotes_by_group: dict[str, list[dict]],
headlines_by_bucket: dict[str, list[dict]], headlines_by_bucket: dict[str, list[dict]],
reference_line: str | None = None, reference_line: str | None = None,
previous_log: object | None = None,
) -> str: ) -> str:
"""Assemble the user message from already-fetched-and-persisted data.""" """Assemble the user message from already-fetched-and-persisted data.
If `previous_log` is a StrategicLog from earlier today, it's included
as 'Update mode' context the model will revise rather than restart."""
parts = [f"# Strategic log request — {today.strftime('%Y-%m-%d')}"] parts = [f"# Strategic log request — {today.strftime('%Y-%m-%d')}"]
if anchor: if anchor:
parts.append(f"Anchor reference date: {anchor}") parts.append(f"Anchor reference date: {anchor}")
@ -322,6 +341,20 @@ def build_user_prompt(
"\n## Reference snapshot (when the macro thesis was authored)" "\n## Reference snapshot (when the macro thesis was authored)"
f"\n{reference_line}\nCompare live readings against it." f"\n{reference_line}\nCompare live readings against it."
) )
if previous_log is not None:
gen = getattr(previous_log, "generated_at", None)
ts = gen.strftime("%H:%M UTC") if gen else "earlier today"
parts.append(
f"\n## Earlier log from today (generated {ts})\n"
"Treat this as YOUR OWN earlier draft for today. Update it for\n"
"the current data — don't restate unchanged context. See the\n"
"'Update mode' section of the system prompt for how to handle it.\n"
"```markdown\n"
f"{previous_log.content}\n"
"```"
)
parts.append("\n## Live market data (per group)") parts.append("\n## Live market data (per group)")
parts.append("```json\n" + json.dumps(quotes_by_group, indent=2, default=str) + "\n```") parts.append("```json\n" + json.dumps(quotes_by_group, indent=2, default=str) + "\n```")
parts.append("\n## News flow (last 24h, filtered by bucket)") parts.append("\n## News flow (last 24h, filtered by bucket)")
@ -331,11 +364,20 @@ def build_user_prompt(
parts.append(f"\n### {label.upper()}") parts.append(f"\n### {label.upper()}")
for h in items[:30]: for h in items[:30]:
parts.append(f"- [{h['when'][:16].replace('T',' ')}] [{h['source']}] {h['title']}") parts.append(f"- [{h['when'][:16].replace('T',' ')}] [{h['source']}] {h['title']}")
parts.append(
task_line = (
"\n## Task\nWrite the daily strategic log in ~800 words, following " "\n## Task\nWrite the daily strategic log in ~800 words, following "
"the discipline in the system prompt. No preamble; begin directly " "the discipline in the system prompt. No preamble; begin directly "
"with the date header." "with the date header."
) )
if previous_log is not None:
task_line = (
"\n## Task\nUpdate the earlier log above for the current data. "
"Keep the same structure (date header, TL;DR, sections, watch "
"list, system temperature) but anchor on what has CHANGED since "
"the earlier draft's timestamp. ~800 words. No preamble."
)
parts.append(task_line)
return "\n".join(parts) return "\n".join(parts)