mirror of
https://github.com/koala73/worldmonitor.git
synced 2026-04-25 17:14:57 +02:00
The weight rebalance (PR #3144) amplified a prompt gap: domestic mass shootings (e.g. "8 children killed in Louisiana") scored 88 because the LLM classified them as "critical" (mass-casualty 10+ killed) and the 55% severity weight pushed them into the critical gate. But WorldMonitor is a geopolitical monitor — domestic tragedies are terrible but not geopolitically destabilizing. Prompt change (both ais-relay.cjs + classify-event.ts): - "critical" now explicitly requires GEOPOLITICAL scope: "events that destabilize international order, threaten cross-border security, or disrupt global systems" - Domestic mass-casualty events (mass shootings, industrial accidents) moved to "high" — still important, but not critical-sensitivity alerts - Added counterexamples: "8 children killed in mass shooting in Louisiana → domestic mass-casualty → high" and "23 killed in fireworks factory explosion → industrial accident → high" - Retained: "700 killed in Sudan drone strikes → geopolitical mass- casualty in active civil war → critical" Classify cache: v2→v3 (bust stale entries that lack geopolitical scope). Shadow-log: v4→v5 (clean dataset for recalibration under the scoped prompt). 🤖 Generated with Claude Opus 4.6 via Claude Code Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
135 lines
5.9 KiB
TypeScript
135 lines
5.9 KiB
TypeScript
import type {
|
|
ServerContext,
|
|
ClassifyEventRequest,
|
|
ClassifyEventResponse,
|
|
SeverityLevel,
|
|
} from '../../../../src/generated/server/worldmonitor/intelligence/v1/service_server';
|
|
|
|
import { cachedFetchJson } from '../../../_shared/redis';
|
|
import { markNoCacheResponse } from '../../../_shared/response-headers';
|
|
import { UPSTREAM_TIMEOUT_MS, buildClassifyCacheKey } from './_shared';
|
|
import { callLlm } from '../../../_shared/llm';
|
|
|
|
// ========================================================================
|
|
// Constants
|
|
// ========================================================================
|
|
|
|
const CLASSIFY_CACHE_TTL = 86400;
|
|
const VALID_LEVELS = ['critical', 'high', 'medium', 'low', 'info'];
|
|
const VALID_CATEGORIES = [
|
|
'conflict', 'protest', 'disaster', 'diplomatic', 'economic',
|
|
'terrorism', 'cyber', 'health', 'environmental', 'military',
|
|
'crime', 'infrastructure', 'tech', 'general',
|
|
];
|
|
|
|
// ========================================================================
|
|
// Helpers
|
|
// ========================================================================
|
|
|
|
function mapLevelToSeverity(level: string): SeverityLevel {
|
|
if (level === 'critical' || level === 'high') return 'SEVERITY_LEVEL_HIGH';
|
|
if (level === 'medium') return 'SEVERITY_LEVEL_MEDIUM';
|
|
return 'SEVERITY_LEVEL_LOW';
|
|
}
|
|
|
|
// ========================================================================
|
|
// RPC handler
|
|
// ========================================================================
|
|
|
|
export async function classifyEvent(
|
|
ctx: ServerContext,
|
|
req: ClassifyEventRequest,
|
|
): Promise<ClassifyEventResponse> {
|
|
// Input sanitization (M-14 fix): limit title length
|
|
const MAX_TITLE_LEN = 500;
|
|
const title = typeof req.title === 'string' ? req.title.slice(0, MAX_TITLE_LEN) : '';
|
|
if (!title) { markNoCacheResponse(ctx.request); return { classification: undefined }; }
|
|
|
|
const cacheKey = await buildClassifyCacheKey(title);
|
|
|
|
const systemPrompt = `You classify news headlines into threat level and category. Return ONLY valid JSON, no other text.
|
|
|
|
Levels: critical, high, medium, low, info
|
|
Categories: conflict, protest, disaster, diplomatic, economic, terrorism, cyber, health, environmental, military, crime, infrastructure, tech, general
|
|
|
|
Guidelines for LEVEL assignment (geopolitical scope required for critical):
|
|
- critical: Active military strikes with international implications, geopolitical mass-casualty events (10+ killed in conflict/terrorism/state action), ceasefire agreements/collapses, nuclear incidents, pandemic declarations, coups, strait/waterway closures
|
|
- high: Armed conflict updates, major diplomatic actions, sanctions packages, significant natural disasters, blockades, terrorist attacks, domestic mass-casualty events (mass shootings, industrial disasters)
|
|
- medium: Ongoing conflict analysis, economic impact reports, protest movements, regional policy changes, military exercises
|
|
- low: Diplomatic meetings, trade discussions, humanitarian aid, election updates, peacekeeping deployments
|
|
- info: Opinion/editorial pieces, analysis/explainer articles, historical retrospectives, lifestyle, entertainment, routine local news, tutorials
|
|
|
|
Key distinction: "critical" requires GEOPOLITICAL scope — events that destabilize international order, threaten cross-border security, or disrupt global systems. Domestic tragedies are "high" unless they trigger international diplomatic responses.
|
|
- "8 children killed in mass shooting in Louisiana" → domestic mass-casualty → high
|
|
- "23 killed in fireworks factory explosion" → industrial accident → high
|
|
- "700 killed in Sudan drone strikes" → geopolitical mass-casualty → critical
|
|
- "Iran closes Strait of Hormuz" → global trade disruption → critical
|
|
- "Man killed his estranged wife" → domestic crime → info
|
|
- "How to Crack the SAM Database" → tutorial → info
|
|
|
|
Focus: geopolitical events, conflicts, disasters, diplomacy.
|
|
Classify by real-world event severity, not headline sentiment.
|
|
|
|
Return: {"level":"...","category":"..."}`;
|
|
|
|
let cached: { level: string; category: string; timestamp: number } | null = null;
|
|
try {
|
|
cached = await cachedFetchJson<{ level: string; category: string; timestamp: number }>(
|
|
cacheKey,
|
|
CLASSIFY_CACHE_TTL,
|
|
async () => {
|
|
let validatedResult: { level: string; category: string } | null = null;
|
|
|
|
const result = await callLlm({
|
|
messages: [
|
|
{ role: 'system', content: systemPrompt },
|
|
{ role: 'user', content: title },
|
|
],
|
|
temperature: 0,
|
|
maxTokens: 50,
|
|
timeoutMs: UPSTREAM_TIMEOUT_MS,
|
|
validate: (content) => {
|
|
try {
|
|
let parsed: { level?: string; category?: string };
|
|
try {
|
|
parsed = JSON.parse(content);
|
|
} catch {
|
|
const jsonMatch = content.match(/\{[\s\S]*\}/);
|
|
if (!jsonMatch) return false;
|
|
parsed = JSON.parse(jsonMatch[0]);
|
|
}
|
|
const level = VALID_LEVELS.includes(parsed.level ?? '') ? parsed.level! : null;
|
|
const category = VALID_CATEGORIES.includes(parsed.category ?? '') ? parsed.category! : null;
|
|
if (!level || !category) return false;
|
|
validatedResult = { level, category };
|
|
return true;
|
|
} catch {
|
|
return false;
|
|
}
|
|
},
|
|
});
|
|
|
|
if (!result || !validatedResult) return null;
|
|
const vr = validatedResult as { level: string; category: string };
|
|
return { level: vr.level, category: vr.category, timestamp: Date.now() };
|
|
},
|
|
);
|
|
} catch {
|
|
markNoCacheResponse(ctx.request);
|
|
return { classification: undefined };
|
|
}
|
|
|
|
if (!cached?.level || !cached?.category) { markNoCacheResponse(ctx.request); return { classification: undefined }; }
|
|
|
|
return {
|
|
classification: {
|
|
category: cached.category,
|
|
subcategory: cached.level,
|
|
severity: mapLevelToSeverity(cached.level),
|
|
confidence: 0.9,
|
|
analysis: '',
|
|
entities: [],
|
|
},
|
|
};
|
|
}
|