mirror of
https://github.com/koala73/worldmonitor.git
synced 2026-04-25 17:14:57 +02:00
* feat(seeds): shared FX rate cache + BigMac WoW guards - Extract SHARED_FX_FALLBACKS to _seed-utils.mjs as single source of truth, eliminating duplicated FX fallback tables across seed-bigmac, seed-grocery-basket, and seed-fx-rates - Add getSharedFxRates() / fetchYahooFxRates() to _seed-utils.mjs so all seeds share one Redis-cached rate set (shared:fx-rates:v1, 4h TTL) instead of each making ~46 independent Yahoo Finance calls per run - Add seed-fx-rates.mjs: dedicated daily Railway cron that pre-warms the shared FX cache, saving ~90 Yahoo calls per weekly bigmac+grocery-basket cycle - Add WoW minimum-age guard (6 days): prevents week-on-week display when previous snapshot is less than 6 days old (fixes -98.5% France WoW on first seed run) - Add per-country WoW anomaly filter (+-20%): nulls suspicious entries and logs admin alert with country name and delta for Railway log monitoring - Fix global WoW anomaly check to use unfiltered raw average so it can actually exceed +-20% (filtered average was mathematically bounded and never triggered) - Add USD price sanity range guard ($1.50-$12.00): drops prices from bad scrapes before they reach Redis (would have caught the $470 France value) - Move WOW_ANOMALY_THRESHOLD, MIN_WOW_AGE_MS, USD_MIN, USD_MAX to module scope * fix(seed-fx): address PR review — TTL mismatch and partial write-back risk - Extend shared:fx-rates:v1 TTL from 4h to 25h so cache stays warm between daily cron runs (with 1h drift buffer) - Make getSharedFxRates() read-only: remove write-back on partial cache hit and on cache miss; only seed-fx-rates.mjs owns writes to this key, preventing a subset consumer from silently overwriting a fuller cache
278 lines
12 KiB
JavaScript
278 lines
12 KiB
JavaScript
#!/usr/bin/env node
|
|
|
|
import { loadEnvFile, CHROME_UA, runSeed, sleep, readSeedSnapshot, getSharedFxRates, SHARED_FX_FALLBACKS } from './_seed-utils.mjs';
|
|
|
|
loadEnvFile(import.meta.url);
|
|
|
|
const CANONICAL_KEY = 'economic:bigmac:v1';
|
|
const CACHE_TTL = 864000; // 10 days — weekly seed with 3-day cron-drift buffer
|
|
const EXA_DELAY_MS = 150;
|
|
|
|
const FX_FALLBACKS = SHARED_FX_FALLBACKS;
|
|
|
|
// WoW validation thresholds
|
|
const MIN_WOW_AGE_MS = 6 * 24 * 60 * 60 * 1000; // 6 days minimum between snapshots
|
|
const WOW_ANOMALY_THRESHOLD = 20; // % change that signals a data bug
|
|
|
|
// USD price sanity range for a Big Mac globally
|
|
const USD_MIN = 1.50;
|
|
const USD_MAX = 12.00;
|
|
|
|
const COUNTRIES = [
|
|
// Americas
|
|
{ code: 'US', name: 'United States', currency: 'USD', flag: '🇺🇸' },
|
|
{ code: 'CA', name: 'Canada', currency: 'CAD', flag: '🇨🇦' },
|
|
{ code: 'MX', name: 'Mexico', currency: 'MXN', flag: '🇲🇽' },
|
|
{ code: 'BR', name: 'Brazil', currency: 'BRL', flag: '🇧🇷' },
|
|
{ code: 'AR', name: 'Argentina', currency: 'ARS', flag: '🇦🇷' },
|
|
{ code: 'CO', name: 'Colombia', currency: 'COP', flag: '🇨🇴' },
|
|
{ code: 'CL', name: 'Chile', currency: 'CLP', flag: '🇨🇱' },
|
|
// Europe
|
|
{ code: 'GB', name: 'UK', currency: 'GBP', flag: '🇬🇧' },
|
|
{ code: 'DE', name: 'Germany', currency: 'EUR', flag: '🇩🇪' },
|
|
{ code: 'FR', name: 'France', currency: 'EUR', flag: '🇫🇷' },
|
|
{ code: 'IT', name: 'Italy', currency: 'EUR', flag: '🇮🇹' },
|
|
{ code: 'ES', name: 'Spain', currency: 'EUR', flag: '🇪🇸' },
|
|
{ code: 'CH', name: 'Switzerland', currency: 'CHF', flag: '🇨🇭' },
|
|
{ code: 'NO', name: 'Norway', currency: 'NOK', flag: '🇳🇴' },
|
|
{ code: 'SE', name: 'Sweden', currency: 'SEK', flag: '🇸🇪' },
|
|
{ code: 'DK', name: 'Denmark', currency: 'DKK', flag: '🇩🇰' },
|
|
{ code: 'PL', name: 'Poland', currency: 'PLN', flag: '🇵🇱' },
|
|
{ code: 'CZ', name: 'Czechia', currency: 'CZK', flag: '🇨🇿' },
|
|
{ code: 'HU', name: 'Hungary', currency: 'HUF', flag: '🇭🇺' },
|
|
{ code: 'RO', name: 'Romania', currency: 'RON', flag: '🇷🇴' },
|
|
{ code: 'UA', name: 'Ukraine', currency: 'UAH', flag: '🇺🇦' },
|
|
// Asia-Pacific
|
|
{ code: 'CN', name: 'China', currency: 'CNY', flag: '🇨🇳' },
|
|
{ code: 'JP', name: 'Japan', currency: 'JPY', flag: '🇯🇵' },
|
|
{ code: 'KR', name: 'South Korea', currency: 'KRW', flag: '🇰🇷' },
|
|
{ code: 'AU', name: 'Australia', currency: 'AUD', flag: '🇦🇺' },
|
|
{ code: 'NZ', name: 'New Zealand', currency: 'NZD', flag: '🇳🇿' },
|
|
{ code: 'SG', name: 'Singapore', currency: 'SGD', flag: '🇸🇬' },
|
|
{ code: 'HK', name: 'Hong Kong', currency: 'HKD', flag: '🇭🇰' },
|
|
{ code: 'TW', name: 'Taiwan', currency: 'TWD', flag: '🇹🇼' },
|
|
{ code: 'TH', name: 'Thailand', currency: 'THB', flag: '🇹🇭' },
|
|
{ code: 'MY', name: 'Malaysia', currency: 'MYR', flag: '🇲🇾' },
|
|
{ code: 'ID', name: 'Indonesia', currency: 'IDR', flag: '🇮🇩' },
|
|
{ code: 'PH', name: 'Philippines', currency: 'PHP', flag: '🇵🇭' },
|
|
{ code: 'VN', name: 'Vietnam', currency: 'VND', flag: '🇻🇳' },
|
|
{ code: 'IN', name: 'India', currency: 'INR', flag: '🇮🇳' },
|
|
{ code: 'PK', name: 'Pakistan', currency: 'PKR', flag: '🇵🇰' },
|
|
// Middle East
|
|
{ code: 'AE', name: 'UAE', currency: 'AED', flag: '🇦🇪' },
|
|
{ code: 'SA', name: 'Saudi Arabia', currency: 'SAR', flag: '🇸🇦' },
|
|
{ code: 'QA', name: 'Qatar', currency: 'QAR', flag: '🇶🇦' },
|
|
{ code: 'KW', name: 'Kuwait', currency: 'KWD', flag: '🇰🇼' },
|
|
{ code: 'BH', name: 'Bahrain', currency: 'BHD', flag: '🇧🇭' },
|
|
{ code: 'OM', name: 'Oman', currency: 'OMR', flag: '🇴🇲' },
|
|
{ code: 'EG', name: 'Egypt', currency: 'EGP', flag: '🇪🇬' },
|
|
{ code: 'JO', name: 'Jordan', currency: 'JOD', flag: '🇯🇴' },
|
|
{ code: 'LB', name: 'Lebanon', currency: 'LBP', flag: '🇱🇧' },
|
|
{ code: 'IL', name: 'Israel', currency: 'ILS', flag: '🇮🇱' },
|
|
// Africa
|
|
{ code: 'ZA', name: 'South Africa', currency: 'ZAR', flag: '🇿🇦' },
|
|
{ code: 'NG', name: 'Nigeria', currency: 'NGN', flag: '🇳🇬' },
|
|
{ code: 'KE', name: 'Kenya', currency: 'KES', flag: '🇰🇪' },
|
|
];
|
|
|
|
const FX_SYMBOLS = Object.fromEntries(
|
|
[...new Set(COUNTRIES.map(c => c.currency))].map(ccy => [ccy, `${ccy}USD=X`])
|
|
);
|
|
|
|
// Handle both plain numbers and thousands-separated (480,000 LBP or 12,000 KRW)
|
|
const NUM = '\\d{1,3}(?:[,\\s]\\d{3})*(?:\\.\\d{1,3})?';
|
|
const CCY = 'USD|GBP|EUR|JPY|CHF|CNY|INR|AUD|CAD|NZD|BRL|MXN|ZAR|TRY|KRW|SGD|HKD|TWD|THB|IDR|NOK|SEK|DKK|PLN|CZK|HUF|RON|PHP|VND|MYR|PKR|ILS|ARS|COP|CLP|UAH|NGN|KES|AED|SAR|QAR|KWD|BHD|OMR|EGP|JOD|LBP';
|
|
const PRICE_PATTERNS = [
|
|
new RegExp(`(${NUM})\\s*(${CCY})`, 'i'),
|
|
new RegExp(`(${CCY})\\s*(${NUM})`, 'i'),
|
|
];
|
|
|
|
function parseNum(s) { return parseFloat(s.replace(/[,\s]/g, '')); }
|
|
|
|
function matchPrice(text, url) {
|
|
for (const re of PRICE_PATTERNS) {
|
|
const match = text.match(re);
|
|
if (match) {
|
|
const [price, currency] = /^\d/.test(match[1])
|
|
? [parseNum(match[1]), match[2].toUpperCase()]
|
|
: [parseNum(match[2]), match[1].toUpperCase()];
|
|
if (price > 0 && price < 10_000_000) return { price, currency, source: url || '' };
|
|
}
|
|
}
|
|
return null;
|
|
}
|
|
|
|
async function searchExa(query, includeDomains = null) {
|
|
const apiKey = (process.env.EXA_API_KEYS || process.env.EXA_API_KEY || '').split(/[\n,]+/)[0].trim();
|
|
if (!apiKey) throw new Error('EXA_API_KEYS or EXA_API_KEY not set');
|
|
|
|
const body = {
|
|
query,
|
|
numResults: 5,
|
|
type: 'auto',
|
|
contents: { summary: { query: 'What is the current Big Mac price in local currency and USD?' } },
|
|
};
|
|
if (includeDomains) body.includeDomains = includeDomains;
|
|
|
|
const resp = await fetch('https://api.exa.ai/search', {
|
|
method: 'POST',
|
|
headers: { 'x-api-key': apiKey, 'Content-Type': 'application/json', 'User-Agent': CHROME_UA },
|
|
body: JSON.stringify(body),
|
|
signal: AbortSignal.timeout(15_000),
|
|
});
|
|
|
|
if (!resp.ok) {
|
|
const text = await resp.text().catch(() => '');
|
|
console.warn(` EXA ${resp.status}: ${text.slice(0, 100)}`);
|
|
return null;
|
|
}
|
|
return resp.json();
|
|
}
|
|
|
|
async function fetchBigMacPrices(prevSnapshot) {
|
|
const fxRates = await getSharedFxRates(FX_SYMBOLS, FX_FALLBACKS);
|
|
const results = [];
|
|
|
|
for (const country of COUNTRIES) {
|
|
await sleep(EXA_DELAY_MS);
|
|
console.log(`\n Processing ${country.flag} ${country.name} (${country.currency})...`);
|
|
|
|
const fxRate = fxRates[country.currency] ?? FX_FALLBACKS[country.currency] ?? null;
|
|
let localPrice = null;
|
|
let usdPrice = null;
|
|
let sourceSite = '';
|
|
|
|
try {
|
|
// Include currency code in query — helps EXA find per-country specialist pages
|
|
const query = `Big Mac price ${country.name} ${country.currency}`;
|
|
const SPECIALIST_SITES = ['theburgerindex.com', 'eatmyindex.com'];
|
|
|
|
// Specialist Big Mac Index sites only — clean, verified per-country data
|
|
const exaResult = await searchExa(query, SPECIALIST_SITES);
|
|
await sleep(EXA_DELAY_MS);
|
|
|
|
if (exaResult?.results?.length) {
|
|
for (const result of exaResult.results) {
|
|
const summary = result?.summary;
|
|
if (!summary || typeof summary !== 'string') continue;
|
|
const hit = matchPrice(summary, result.url || '');
|
|
if (hit?.currency === country.currency) {
|
|
localPrice = hit.price;
|
|
sourceSite = hit.source;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
} catch (err) {
|
|
console.warn(` [${country.code}] EXA error: ${err.message}`);
|
|
}
|
|
|
|
if (usdPrice === null) {
|
|
usdPrice = localPrice !== null && fxRate ? +(localPrice * fxRate).toFixed(4) : null;
|
|
}
|
|
|
|
// Sanity check: Big Mac USD price must be in a plausible global range
|
|
if (usdPrice !== null && (usdPrice < USD_MIN || usdPrice > USD_MAX)) {
|
|
console.warn(` [PRICE] ANOMALY ${country.flag} ${country.name}: $${usdPrice} out of range [$${USD_MIN}-$${USD_MAX}] — dropping price`);
|
|
usdPrice = null;
|
|
localPrice = null;
|
|
}
|
|
|
|
const status = localPrice !== null ? `${localPrice} ${country.currency} = $${usdPrice}` : 'N/A';
|
|
console.log(` Big Mac: ${status}`);
|
|
|
|
results.push({
|
|
code: country.code,
|
|
name: country.name,
|
|
currency: country.currency,
|
|
flag: country.flag,
|
|
localPrice: localPrice !== null ? +localPrice.toFixed(4) : null,
|
|
usdPrice,
|
|
fxRate: fxRate || 0,
|
|
sourceSite,
|
|
available: usdPrice !== null,
|
|
});
|
|
}
|
|
|
|
const withData = results.filter(r => r.usdPrice != null);
|
|
const cheapest = withData.length ? withData.reduce((a, b) => a.usdPrice < b.usdPrice ? a : b).code : '';
|
|
const mostExpensive = withData.length ? withData.reduce((a, b) => a.usdPrice > b.usdPrice ? a : b).code : '';
|
|
|
|
// Compute WoW per country — requires at least 6 days between snapshots
|
|
const prevAge = prevSnapshot?.fetchedAt ? Date.now() - new Date(prevSnapshot.fetchedAt).getTime() : 0;
|
|
const hasPrevData = prevSnapshot?.countries?.length > 0;
|
|
const prevTooRecent = prevAge > 0 && prevAge < MIN_WOW_AGE_MS;
|
|
|
|
if (hasPrevData && prevTooRecent) {
|
|
console.warn(` [WoW] Skipping WoW — previous snapshot is only ${Math.round(prevAge / 3600000)}h old (need 144h+)`);
|
|
}
|
|
|
|
let wowAvailable = hasPrevData && !prevTooRecent;
|
|
let suspiciousCount = 0;
|
|
let suspiciousNames = '';
|
|
|
|
if (wowAvailable) {
|
|
const prevMap = Object.fromEntries(prevSnapshot.countries.map(c => [c.code, c.usdPrice]));
|
|
const rawWowValues = []; // unfiltered — used for global anomaly check
|
|
|
|
for (const r of results) {
|
|
if (r.usdPrice != null && prevMap[r.code] != null && prevMap[r.code] > 0) {
|
|
const raw = +((r.usdPrice - prevMap[r.code]) / prevMap[r.code] * 100).toFixed(2);
|
|
rawWowValues.push(raw);
|
|
if (Math.abs(raw) > WOW_ANOMALY_THRESHOLD) {
|
|
console.warn(` [WoW] ANOMALY ${r.flag} ${r.name}: ${raw}% (prev=$${prevMap[r.code]} now=$${r.usdPrice}) — hiding WoW for this country`);
|
|
suspiciousCount++;
|
|
suspiciousNames += (suspiciousNames ? ', ' : '') + `${r.name} ${raw}%`;
|
|
r.wowPct = null;
|
|
} else {
|
|
r.wowPct = raw;
|
|
}
|
|
} else {
|
|
r.wowPct = null;
|
|
}
|
|
}
|
|
|
|
if (suspiciousCount > 0) {
|
|
console.error(` [WoW] ADMIN ALERT: ${suspiciousCount} country/ies had anomalous WoW (>±${WOW_ANOMALY_THRESHOLD}%): ${suspiciousNames}`);
|
|
}
|
|
|
|
// Global check uses unfiltered average — individual filtering bounds each value to ≤20%
|
|
// so the filtered average can never exceed the threshold (dead check). Use raw values instead.
|
|
const rawAvg = rawWowValues.length > 0
|
|
? +(rawWowValues.reduce((s, v) => s + v, 0) / rawWowValues.length).toFixed(2)
|
|
: 0;
|
|
if (Math.abs(rawAvg) > WOW_ANOMALY_THRESHOLD) {
|
|
console.error(` [WoW] ADMIN ALERT: Global WoW raw avg ${rawAvg}% exceeds ±${WOW_ANOMALY_THRESHOLD}% — disabling WoW entirely, likely systematic data bug`);
|
|
wowAvailable = false;
|
|
}
|
|
}
|
|
|
|
const wowCountries = wowAvailable ? results.filter(r => r.wowPct != null) : [];
|
|
const wowAvgPct = wowCountries.length > 0
|
|
? +(wowCountries.reduce((s, r) => s + r.wowPct, 0) / wowCountries.length).toFixed(2)
|
|
: 0;
|
|
|
|
return {
|
|
countries: results,
|
|
fetchedAt: new Date().toISOString(),
|
|
cheapestCountry: cheapest,
|
|
mostExpensiveCountry: mostExpensive,
|
|
wowAvgPct,
|
|
wowAvailable,
|
|
prevFetchedAt: wowAvailable ? (prevSnapshot.fetchedAt ?? '') : '',
|
|
};
|
|
}
|
|
|
|
const prevSnapshot = await readSeedSnapshot(CANONICAL_KEY);
|
|
|
|
await runSeed('economic', 'bigmac', CANONICAL_KEY, () => fetchBigMacPrices(prevSnapshot), {
|
|
ttlSeconds: CACHE_TTL,
|
|
validateFn: (data) => data?.countries?.length > 0,
|
|
recordCount: (data) => data?.countries?.filter(c => c.available).length || 0,
|
|
extraKeys: prevSnapshot ? [{
|
|
key: `${CANONICAL_KEY}:prev`,
|
|
transform: () => prevSnapshot, // write PRE-overwrite snapshot; ignore new data
|
|
ttl: CACHE_TTL * 2,
|
|
}] : undefined,
|
|
});
|