Files
worldmonitor/api/seed-health.js
Elie Habib d3836ba49b feat(sentiment): add AAII investor sentiment survey (#2930)
* feat(sentiment): add AAII investor sentiment survey

Weekly bull/bear/neutral sentiment from AAII (1987-present). Shows
current reading, bull-bear spread, and 52-week historical chart.
Seeder fetches from AAII CSV, stores last 52 weeks in Redis.

* fix(aaii): wire panel loading + mark fallback data explicitly

* fix(aaii): keep panel live across refreshes + surface in health monitoring

- fetchData now falls back to /api/bootstrap?keys=aaiiSentiment on
  refresh (getHydratedData is one-shot and returns undefined after
  the first read, causing a permanent spinner on hourly refresh)
- Shows an error state with auto-retry when both hydrated and
  bootstrap-fetch miss, matching the WsbTickerScannerPanel pattern
- Registered aaiiSentiment in api/health.js BOOTSTRAP_KEYS and
  api/seed-health.js SEED_DOMAINS so rollout failures and
  fallback-only operation are observable in the monitoring dashboards

* fix(sentiment): handle BIFF8 SST trailing bytes and use UTC for AAII Thursday calc

Two P2 greptile fixes from PR #2930 review:

1. BIFF8 SST parser was reading the rich-text run count (cRun, flags & 0x08)
   and extended-string size (cbExtRst, flags & 0x04) to advance past those
   header fields, but never skipped the trailing bytes AFTER the char data:
   4 * cRun formatting-run bytes and cbExtRst ext-rst bytes. If any string
   before the column header was rich-text formatted, every subsequent SST
   entry parsed from the wrong offset, silently breaking XLS extraction and
   falling back to HTML scraping.

2. parseHtmlSentiment() computed last-Thursday via today.getDay() +
   setDate(today.getDate() - daysToThursday), both local-TZ-dependent. On
   Railway (non-UTC TZ) the inferred Thursday could drift by a day, causing
   the HTML-derived row to mismatch the XLS historical rows. Switched to
   getUTCDay() + Date.UTC() for TZ-stable arithmetic.
2026-04-11 17:05:39 +04:00

159 lines
10 KiB
JavaScript

import { getCorsHeaders, isDisallowedOrigin } from './_cors.js';
import { validateApiKey } from './_api-key.js';
import { jsonResponse } from './_json-response.js';
// @ts-expect-error — JS module, no declaration file
import { redisPipeline } from './_upstash-json.js';
export const config = { runtime: 'edge' };
const SEED_DOMAINS = {
// Phase 1 — Snapshot endpoints
'seismology:earthquakes': { key: 'seed-meta:seismology:earthquakes', intervalMin: 15 },
'wildfire:fires': { key: 'seed-meta:wildfire:fires', intervalMin: 60 },
'infra:outages': { key: 'seed-meta:infra:outages', intervalMin: 15 },
'climate:anomalies': { key: 'seed-meta:climate:anomalies', intervalMin: 120 },
'climate:disasters': { key: 'seed-meta:climate:disasters', intervalMin: 360 },
'climate:zone-normals': { key: 'seed-meta:climate:zone-normals', intervalMin: 44640 },
'climate:co2-monitoring': { key: 'seed-meta:climate:co2-monitoring', intervalMin: 1440 }, // daily cron; health.js maxStaleMin:4320 (3x) is intentionally higher — it's an alarm threshold, not the cron cadence
'climate:ocean-ice': { key: 'seed-meta:climate:ocean-ice', intervalMin: 1440 }, // daily cron; health.js maxStaleMin:2880 (2x) tolerates one missed run
'climate:news-intelligence': { key: 'seed-meta:climate:news-intelligence', intervalMin: 30 },
// Phase 2 — Parameterized endpoints
'unrest:events': { key: 'seed-meta:unrest:events', intervalMin: 15 },
'cyber:threats': { key: 'seed-meta:cyber:threats', intervalMin: 240 },
'market:crypto': { key: 'seed-meta:market:crypto', intervalMin: 15 },
'market:etf-flows': { key: 'seed-meta:market:etf-flows', intervalMin: 30 },
'market:gulf-quotes': { key: 'seed-meta:market:gulf-quotes', intervalMin: 15 },
'market:stablecoins': { key: 'seed-meta:market:stablecoins', intervalMin: 30 },
// Phase 3 — Hybrid endpoints
'natural:events': { key: 'seed-meta:natural:events', intervalMin: 60 },
'displacement:summary': { key: 'seed-meta:displacement:summary', intervalMin: 360 },
// Aligned with health.js SEED_META (intervalMin = maxStaleMin / 2)
'market:stocks': { key: 'seed-meta:market:stocks', intervalMin: 15 },
'market:commodities': { key: 'seed-meta:market:commodities', intervalMin: 15 },
'market:sectors': { key: 'seed-meta:market:sectors', intervalMin: 15 },
'aviation:faa': { key: 'seed-meta:aviation:faa', intervalMin: 45 },
'news:insights': { key: 'seed-meta:news:insights', intervalMin: 15 },
'positive-events:geo': { key: 'seed-meta:positive-events:geo', intervalMin: 30 },
'risk:scores:sebuf': { key: 'seed-meta:risk:scores:sebuf', intervalMin: 15 },
'conflict:iran-events': { key: 'seed-meta:conflict:iran-events', intervalMin: 5040 },
'conflict:ucdp-events': { key: 'seed-meta:conflict:ucdp-events', intervalMin: 210 },
'weather:alerts': { key: 'seed-meta:weather:alerts', intervalMin: 15 },
'economic:spending': { key: 'seed-meta:economic:spending', intervalMin: 60 },
'intelligence:gpsjam': { key: 'seed-meta:intelligence:gpsjam', intervalMin: 360 },
'intelligence:satellites': { key: 'seed-meta:intelligence:satellites', intervalMin: 90 },
'military:flights': { key: 'seed-meta:military:flights', intervalMin: 8 },
'military-forecast-inputs': { key: 'seed-meta:military-forecast-inputs', intervalMin: 8 },
'infra:service-statuses': { key: 'seed-meta:infra:service-statuses', intervalMin: 60 },
'supply_chain:shipping': { key: 'seed-meta:supply_chain:shipping', intervalMin: 120 },
'supply_chain:chokepoints': { key: 'seed-meta:supply_chain:chokepoints', intervalMin: 30 },
'cable-health': { key: 'seed-meta:cable-health', intervalMin: 30 },
'prediction:markets': { key: 'seed-meta:prediction:markets', intervalMin: 8 },
'aviation:intl': { key: 'seed-meta:aviation:intl', intervalMin: 15 },
'theater-posture': { key: 'seed-meta:theater-posture', intervalMin: 8 },
'economic:worldbank-techreadiness': { key: 'seed-meta:economic:worldbank-techreadiness:v1', intervalMin: 5040 },
'economic:worldbank-progress': { key: 'seed-meta:economic:worldbank-progress:v1', intervalMin: 5040 },
'economic:worldbank-renewable': { key: 'seed-meta:economic:worldbank-renewable:v1', intervalMin: 5040 },
'research:tech-events': { key: 'seed-meta:research:tech-events', intervalMin: 240 },
'intelligence:gdelt-intel': { key: 'seed-meta:intelligence:gdelt-intel', intervalMin: 210 }, // 420min maxStaleMin / 2 — aligned with health.js (6h cron + 1h grace)
'correlation:cards': { key: 'seed-meta:correlation:cards', intervalMin: 5 },
'intelligence:advisories': { key: 'seed-meta:intelligence:advisories', intervalMin: 60 },
'intelligence:wsb-tickers': { key: 'seed-meta:intelligence:wsb-tickers', intervalMin: 15 }, // 10min relay loop; intervalMin = maxStaleMin / 2 (30 / 2)
'trade:customs-revenue': { key: 'seed-meta:trade:customs-revenue', intervalMin: 720 },
'thermal:escalation': { key: 'seed-meta:thermal:escalation', intervalMin: 180 },
'radiation:observations': { key: 'seed-meta:radiation:observations', intervalMin: 15 },
'sanctions:pressure': { key: 'seed-meta:sanctions:pressure', intervalMin: 360 },
'health:air-quality': { key: 'seed-meta:health:air-quality', intervalMin: 60 }, // hourly cron (shared seeder writes health + climate keys)
'economic:grocery-basket': { key: 'seed-meta:economic:grocery-basket', intervalMin: 5040 }, // weekly seed; intervalMin = maxStaleMin / 2
'economic:bigmac': { key: 'seed-meta:economic:bigmac', intervalMin: 5040 }, // weekly seed; intervalMin = maxStaleMin / 2
'resilience:static': { key: 'seed-meta:resilience:static', intervalMin: 288000 }, // annual October snapshot; intervalMin = health.js maxStaleMin / 2 (400d alert threshold)
'resilience:intervals': { key: 'seed-meta:resilience:intervals', intervalMin: 10080 }, // weekly cron; intervalMin = health.js maxStaleMin / 2 (20160 / 2)
'regulatory:actions': { key: 'seed-meta:regulatory:actions', intervalMin: 120 }, // 2h cron; intervalMin = maxStaleMin / 3
'economic:owid-energy-mix': { key: 'seed-meta:economic:owid-energy-mix', intervalMin: 25200 }, // monthly cron on 1st; intervalMin = health.js maxStaleMin / 2 (50400 / 2)
'economic:fao-ffpi': { key: 'seed-meta:economic:fao-ffpi', intervalMin: 43200 }, // monthly seed; intervalMin = health.js maxStaleMin / 2 (86400 / 2)
'product-catalog': { key: 'seed-meta:product-catalog', intervalMin: 360 }, // relay loop every 6h; intervalMin = health.js maxStaleMin / 3 (1080 / 3)
'portwatch:chokepoints-ref': { key: 'seed-meta:portwatch:chokepoints-ref', intervalMin: 1440 }, // daily cron (0 0 * * *)
'supply_chain:portwatch-ports': { key: 'seed-meta:supply_chain:portwatch-ports', intervalMin: 720 }, // 12h cron (0 */12 * * *); intervalMin = maxStaleMin / 3 (2160 / 3)
'energy:chokepoint-flows': { key: 'seed-meta:energy:chokepoint-flows', intervalMin: 360 }, // 6h relay loop; intervalMin = maxStaleMin / 2 (720 / 2)
'energy:spine': { key: 'seed-meta:energy:spine', intervalMin: 1440 }, // daily cron (0 6 * * *); intervalMin = maxStaleMin / 2 (2880 / 2)
'energy:ember': { key: 'seed-meta:energy:ember', intervalMin: 1440 }, // daily cron (0 8 * * *); intervalMin = maxStaleMin / 2 (2880 / 2)
'energy:spr-policies': { key: 'seed-meta:energy:spr-policies', intervalMin: 288000 }, // annual static registry; intervalMin = health.js maxStaleMin / 2 (576000 / 2)
'market:aaii-sentiment': { key: 'seed-meta:market:aaii-sentiment', intervalMin: 10080 }, // weekly cron; intervalMin = maxStaleMin / 2 (20160 / 2)
};
async function getMetaBatch(keys) {
const pipeline = keys.map((k) => ['GET', k]);
const data = await redisPipeline(pipeline, 3000);
if (!data) throw new Error('Redis not configured');
const result = new Map();
for (let i = 0; i < keys.length; i++) {
const raw = data[i]?.result;
if (raw) {
try { result.set(keys[i], JSON.parse(raw)); } catch { /* skip */ }
}
}
return result;
}
export default async function handler(req) {
if (isDisallowedOrigin(req))
return new Response('Forbidden', { status: 403 });
const cors = getCorsHeaders(req);
if (req.method === 'OPTIONS')
return new Response(null, { status: 204, headers: cors });
const apiKeyResult = validateApiKey(req);
if (apiKeyResult.required && !apiKeyResult.valid)
return jsonResponse({ error: apiKeyResult.error }, 401, cors);
const now = Date.now();
const entries = Object.entries(SEED_DOMAINS);
const metaKeys = entries.map(([, v]) => v.key);
let metaMap;
try {
metaMap = await getMetaBatch(metaKeys);
} catch {
return jsonResponse({ error: 'Redis unavailable' }, 503, cors);
}
const seeds = {};
let staleCount = 0;
let missingCount = 0;
for (const [domain, cfg] of entries) {
const meta = metaMap.get(cfg.key);
const maxStalenessMs = cfg.intervalMin * 2 * 60 * 1000;
if (!meta) {
seeds[domain] = { status: 'missing', fetchedAt: null, recordCount: null, stale: true };
missingCount++;
continue;
}
const ageMs = now - (meta.fetchedAt || 0);
const isError = meta.status === 'error';
const stale = ageMs > maxStalenessMs || isError;
if (stale) staleCount++;
seeds[domain] = {
status: stale ? (isError ? 'error' : 'stale') : 'ok',
fetchedAt: meta.fetchedAt,
recordCount: meta.recordCount ?? null,
sourceVersion: meta.sourceVersion || null,
ageMinutes: Math.round(ageMs / 60000),
stale,
};
}
const overall = missingCount > 0 ? 'degraded' : staleCount > 0 ? 'warning' : 'healthy';
const httpStatus = overall === 'healthy' ? 200 : overall === 'warning' ? 200 : 503;
return jsonResponse({ overall, seeds, checkedAt: now }, httpStatus, {
...cors,
'Cache-Control': 'no-cache',
});
}