"""
main.py
Production-Ready Real-Time Intelligence Platform Backend
- Uses combinedAgentGraph for multi-agent orchestration
- Threading for concurrent graph execution and WebSocket server
- Database-driven feed updates with polling
- Duplicate prevention
- District-based feed categorization for map display
Updated: Resilient WebSocket handling for long scraping operations (60s+ cycles)
"""
from fastapi import FastAPI, WebSocket, WebSocketDisconnect
from fastapi.middleware.cors import CORSMiddleware
from pydantic import BaseModel
from typing import Dict, Any, List, Set, Optional
import asyncio
import json
from datetime import datetime, timedelta, timezone
import sys
import os
import logging
import threading
import time
import uuid  # used to generate event_id values for graph feeds
def utc_now() -> datetime:
"""Return current UTC time (Python 3.12+ compatible)."""
return datetime.now(timezone.utc)
sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), '..', '..')))
from src.graphs.combinedAgentGraph import graph
from src.states.combinedAgentState import CombinedAgentState
from src.storage.storage_manager import StorageManager
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger("Roger_api")
# ============================================
# AUTO-TRAINING: Check and train models if missing
# ============================================
def check_and_train_models():
"""
Check if ML models are trained. If not, trigger training in background.
Called on startup to ensure models are available.
"""
from pathlib import Path
import subprocess
PROJECT_ROOT = Path(__file__).parent
# Define model checks: (name, model_path, train_command)
model_checks = [
{
"name": "Anomaly Detection",
"check_paths": [
PROJECT_ROOT / "models" / "anomaly-detection" / "artifacts" / "models",
],
"check_files": ["*.joblib", "*.pkl"],
"train_cmd": [
sys.executable,
str(PROJECT_ROOT / "models" / "anomaly-detection" / "main.py")
]
},
{
"name": "Weather Prediction",
"check_paths": [
PROJECT_ROOT / "models" / "weather-prediction" / "artifacts" / "models",
],
"check_files": ["*.h5", "*.keras"],
"train_cmd": [
sys.executable,
str(PROJECT_ROOT / "models" / "weather-prediction" / "main.py"),
"--mode", "full"
]
},
{
"name": "Currency Prediction",
"check_paths": [
PROJECT_ROOT / "models" / "currency-volatility-prediction"
/ "artifacts" / "models",
],
"check_files": ["*.h5", "*.keras"],
"train_cmd": [
sys.executable,
str(PROJECT_ROOT / "models" / "currency-volatility-prediction"
/ "main.py"),
"--mode", "full"
]
},
{
"name": "Stock Prediction",
"check_paths": [
PROJECT_ROOT / "models" / "stock-price-prediction"
/ "Artifacts",
],
"check_files": ["*.pkl", "*.h5", "*.keras"],
"train_cmd": [
sys.executable,
str(PROJECT_ROOT / "models" / "stock-price-prediction"
/ "main.py")
]
},
]
def has_trained_model(check_paths, check_files):
"""Check if any trained model files exist."""
for path in check_paths:
if path.exists():
for pattern in check_files:
if list(path.glob(pattern)):
return True
# Also check subdirectories
if list(path.glob(f"**/{pattern}")):
return True
return False
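    # Illustrative call (paths/patterns drawn from the model_checks list above,
    # not new configuration):
    #   has_trained_model([PROJECT_ROOT / "models" / "anomaly-detection" / "artifacts" / "models"],
    #                     ["*.joblib", "*.pkl"])
    # -> True as soon as any pattern matches in the directory or any subdirectory.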
def train_in_background(name, cmd):
"""Run training in a background thread."""
def _train():
logger.info(f"[AUTO-TRAIN] Starting {name} training...")
try:
result = subprocess.run(
cmd,
cwd=str(PROJECT_ROOT),
capture_output=True,
text=True,
timeout=1800 # 30 min timeout
)
if result.returncode == 0:
logger.info(f"[AUTO-TRAIN] ✓ {name} training complete!")
else:
logger.warning(f"[AUTO-TRAIN] ⚠ {name} training failed: {result.stderr[:500]}")
except subprocess.TimeoutExpired:
logger.error(f"[AUTO-TRAIN] ✗ {name} training timed out (30 min)")
except Exception as e:
logger.error(f"[AUTO-TRAIN] ✗ {name} training error: {e}")
thread = threading.Thread(target=_train, daemon=True, name=f"train_{name}")
thread.start()
return thread
# Check each model
training_threads = []
for model in model_checks:
if has_trained_model(model["check_paths"], model["check_files"]):
logger.info(f"[MODEL CHECK] ✓ {model['name']} - Model found")
else:
logger.warning(f"[MODEL CHECK] ⚠ {model['name']} - No model found, starting training...")
thread = train_in_background(model["name"], model["train_cmd"])
training_threads.append((model["name"], thread))
if training_threads:
logger.info(f"[AUTO-TRAIN] Started {len(training_threads)} background training jobs")
else:
logger.info("[MODEL CHECK] All models found - no training needed")
return training_threads
# Run model check on module load (startup)
logger.info("=" * 60)
logger.info("[STARTUP] Checking ML models...")
logger.info("=" * 60)
_training_threads = check_and_train_models()
app = FastAPI(title="Roger Intelligence Platform API")
app.add_middleware(
CORSMiddleware,
allow_origins=["*"],
allow_credentials=True,
allow_methods=["*"],
allow_headers=["*"],
)
# Global state
current_state: Dict[str, Any] = {
"final_ranked_feed": [],
"risk_dashboard_snapshot": {
"logistics_friction": 0.0,
"compliance_volatility": 0.0,
"market_instability": 0.0,
"opportunity_index": 0.0,
"avg_confidence": 0.0,
"high_priority_count": 0,
"total_events": 0,
"last_updated": utc_now().isoformat()
},
"run_count": 0,
"status": "initializing",
"first_run_complete": False # Track first graph execution
}
# Thread-safe communication
feed_update_queue = asyncio.Queue()
seen_event_ids: Set[str] = set() # Duplicate prevention
# Global event loop reference for cross-thread broadcasting
main_event_loop = None
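# main_event_loop is captured in startup_event(); run_graph_loop() uses it to hand
# coroutines back to the async side via asyncio.run_coroutine_threadsafe(...).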
# Storage manager
storage_manager = StorageManager()
# WebSocket settings - ULTRA-RESILIENT for long scraping operations
# Heavy graph cycles can take 2-3 minutes, so we need high tolerance
HEARTBEAT_INTERVAL = 60.0 # Send ping every 60s (increased from 45s)
HEARTBEAT_TIMEOUT = 45.0 # Wait 45s for pong (increased from 30s)
HEARTBEAT_MISS_THRESHOLD = 5 # Allow 5 misses = ~5 minutes tolerance
SEND_TIMEOUT = 15.0 # Increased for slow networks/heavy load
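# Heartbeat contract, client side -- a minimal sketch, not part of this module.
# It assumes the WebSocket route (defined later in this file) updates last_pong
# when a {"type": "pong"} message arrives, and that the third-party `websockets`
# client package is available:
#
#   import asyncio, json, websockets
#
#   async def client():
#       async with websockets.connect("ws://localhost:8000/ws") as ws:
#           async for raw in ws:
#               msg = json.loads(raw)
#               if msg.get("type") == "ping":
#                   await ws.send(json.dumps({"type": "pong"}))
#               # ...otherwise handle broadcast feed payloads...
#
#   asyncio.run(client())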
class ConnectionManager:
"""Manages active WebSocket with heartbeat"""
def __init__(self):
self.active_connections: Dict[WebSocket, Dict[str, Any]] = {}
self._lock = asyncio.Lock()
async def connect(self, websocket: WebSocket):
await websocket.accept()
async with self._lock:
meta = {
"heartbeat_task": asyncio.create_task(self._heartbeat_loop(websocket)),
"last_pong": utc_now(),
"misses": 0
}
self.active_connections[websocket] = meta
logger.info(f"[WebSocket] Connected. Total: {len(self.active_connections)}")
async def disconnect(self, websocket: WebSocket):
async with self._lock:
meta = self.active_connections.pop(websocket, None)
if meta:
task = meta.get("heartbeat_task")
if task and not task.done():
task.cancel()
try:
await task
except asyncio.CancelledError:
pass
try:
await websocket.close()
except Exception:
pass
logger.info(f"[WebSocket] Disconnected. Total: {len(self.active_connections)}")
async def _send_with_timeout(self, websocket: WebSocket, message_json: str):
try:
await asyncio.wait_for(websocket.send_text(message_json), timeout=SEND_TIMEOUT)
return True
except Exception as e:
logger.debug(f"[WebSocket] Send failed: {e}")
return False
async def _heartbeat_loop(self, websocket: WebSocket):
"""Per-connection heartbeat task"""
try:
while True:
await asyncio.sleep(HEARTBEAT_INTERVAL)
if websocket not in self.active_connections:
break
ping_payload = json.dumps({"type": "ping"})
ok = await self._send_with_timeout(websocket, ping_payload)
if not ok:
async with self._lock:
meta = self.active_connections.get(websocket)
if meta is not None:
meta['misses'] += 1
else:
waited = 0.0
sleep_step = 0.5
pong_received = False
while waited < HEARTBEAT_TIMEOUT:
await asyncio.sleep(sleep_step)
waited += sleep_step
async with self._lock:
meta = self.active_connections.get(websocket)
if meta is None:
return
last_pong = meta.get("last_pong")
if last_pong and (utc_now() - last_pong).total_seconds() < (HEARTBEAT_INTERVAL + HEARTBEAT_TIMEOUT):
pong_received = True
meta['misses'] = 0
break
if not pong_received:
async with self._lock:
meta = self.active_connections.get(websocket)
if meta is not None:
meta['misses'] += 1
async with self._lock:
meta = self.active_connections.get(websocket)
if meta is None:
return
if meta.get('misses', 0) >= HEARTBEAT_MISS_THRESHOLD:
logger.warning("[WebSocket] Miss threshold exceeded, disconnecting")
try:
await websocket.close(code=1001)
except Exception:
pass
await self.disconnect(websocket)
return
except asyncio.CancelledError:
return
except Exception as e:
logger.exception(f"[WebSocket] Heartbeat error: {e}")
try:
await self.disconnect(websocket)
except Exception:
pass
async def broadcast(self, message: dict):
"""Broadcast to all connections"""
async with self._lock:
conns = list(self.active_connections.keys())
if not conns:
return
message_json = json.dumps(message, default=str)
dead: List[WebSocket] = []
for conn in conns:
ok = await self._send_with_timeout(conn, message_json)
if not ok:
dead.append(conn)
for conn in dead:
logger.info("[WebSocket] Removing dead connection")
await self.disconnect(conn)
manager = ConnectionManager()
def categorize_feed_by_district(feed: Dict[str, Any]) -> str:
"""
Categorize feed by Sri Lankan district based on summary text.
    Returns a single district name, or "National" if the feed is not district-specific.
    NOTE: when several districts match, the one returned is arbitrary (matching is
    set-based); use get_all_matching_districts() for multi-district feeds.
"""
districts = get_all_matching_districts(feed)
return districts[0] if districts else "National"
def get_all_matching_districts(feed: Dict[str, Any]) -> List[str]:
"""
Get ALL districts mentioned in a feed (direct or via province).
Supports:
- Direct district names (Colombo, Kandy, etc.)
- Province names that map to multiple districts
- Commonly referenced regions
Returns list of all matching district names.
"""
summary = feed.get("summary", "").lower()
# Sri Lankan districts
districts = [
"Colombo", "Gampaha", "Kalutara", "Kandy", "Matale", "Nuwara Eliya",
"Galle", "Matara", "Hambantota", "Jaffna", "Kilinochchi", "Mannar",
"Vavuniya", "Mullaitivu", "Batticaloa", "Ampara", "Trincomalee",
"Kurunegala", "Puttalam", "Anuradhapura", "Polonnaruwa", "Badulla",
"Moneragala", "Ratnapura", "Kegalle"
]
# Province to districts mapping
province_mapping = {
"western province": ["Colombo", "Gampaha", "Kalutara"],
"western": ["Colombo", "Gampaha", "Kalutara"],
"central province": ["Kandy", "Matale", "Nuwara Eliya"],
"central": ["Kandy", "Matale", "Nuwara Eliya"],
"southern province": ["Galle", "Matara", "Hambantota"],
"southern provinces": ["Galle", "Matara", "Hambantota"],
"southern": ["Galle", "Matara", "Hambantota"],
"south": ["Galle", "Matara", "Hambantota"],
"northern province": ["Jaffna", "Kilinochchi", "Mannar", "Vavuniya", "Mullaitivu"],
"northern": ["Jaffna", "Kilinochchi", "Mannar", "Vavuniya", "Mullaitivu"],
"north": ["Jaffna", "Kilinochchi", "Mannar", "Vavuniya", "Mullaitivu"],
"eastern province": ["Batticaloa", "Ampara", "Trincomalee"],
"eastern": ["Batticaloa", "Ampara", "Trincomalee"],
"east": ["Batticaloa", "Ampara", "Trincomalee"],
"north western province": ["Kurunegala", "Puttalam"],
"north western": ["Kurunegala", "Puttalam"],
"north central province": ["Anuradhapura", "Polonnaruwa"],
"north central": ["Anuradhapura", "Polonnaruwa"],
"uva province": ["Badulla", "Moneragala"],
"uva": ["Badulla", "Moneragala"],
"sabaragamuwa province": ["Ratnapura", "Kegalle"],
"sabaragamuwa": ["Ratnapura", "Kegalle"],
}
matched_districts = set()
# Check for province mentions first
for province, province_districts in province_mapping.items():
if province in summary:
matched_districts.update(province_districts)
# Check for direct district mentions
for district in districts:
if district.lower() in summary:
matched_districts.add(district)
return list(matched_districts)
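# Illustrative behaviour (result order is not guaranteed -- matching is set-based):
#   get_all_matching_districts({"summary": "Flood warning for the Western Province and Kandy"})
#   -> ["Colombo", "Gampaha", "Kalutara", "Kandy"] in some order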
def run_graph_loop():
"""
Graph execution in separate thread.
Runs the combinedAgentGraph every 60 seconds (non-blocking pattern).
UPDATED: Graph now runs single cycles and this loop handles the 60s interval
externally, making the pattern non-blocking and interruptible.
"""
REFRESH_INTERVAL_SECONDS = 60
shutdown_event = threading.Event()
logger.info("="*80)
logger.info("[GRAPH THREAD] Starting Roger combinedAgentGraph loop (60s interval)")
logger.info("="*80)
cycle_count = 0
while not shutdown_event.is_set():
cycle_count += 1
cycle_start = time.time()
logger.info(f"[GRAPH THREAD] Starting cycle #{cycle_count}")
initial_state = CombinedAgentState(
domain_insights=[],
final_ranked_feed=[],
run_count=cycle_count,
max_runs=1, # Single cycle mode
route=None
)
try:
# Run a single graph cycle (non-blocking since router now returns END)
config = {"recursion_limit": 100}
for event in graph.stream(initial_state, config=config):
logger.info(f"[GRAPH] Event nodes: {list(event.keys())}")
for node_name, node_output in event.items():
# Extract feed data
if hasattr(node_output, 'final_ranked_feed'):
feeds = node_output.final_ranked_feed
elif isinstance(node_output, dict):
feeds = node_output.get('final_ranked_feed', [])
else:
continue
if feeds:
logger.info(f"[GRAPH] {node_name} produced {len(feeds)} feeds")
# FIELD_NORMALIZATION: Transform graph format to frontend format
for feed_item in feeds:
if isinstance(feed_item, dict):
event_data = feed_item
else:
event_data = feed_item.__dict__ if hasattr(feed_item, '__dict__') else {}
# Normalize field names: graph uses content_summary/target_agent, frontend expects summary/domain
event_id = event_data.get("event_id", str(uuid.uuid4()))
summary = event_data.get("content_summary") or event_data.get("summary", "")
domain = event_data.get("target_agent") or event_data.get("domain", "unknown")
severity = event_data.get("severity", "medium")
impact_type = event_data.get("impact_type", "risk")
confidence = event_data.get("confidence_score", event_data.get("confidence", 0.5))
timestamp = event_data.get("timestamp", utc_now().isoformat())
# Check for duplicates
is_dup, _, _ = storage_manager.is_duplicate(summary)
if not is_dup:
try:
storage_manager.store_event(
event_id=event_id,
summary=summary,
domain=domain,
severity=severity,
impact_type=impact_type,
confidence_score=confidence
)
logger.info(f"[GRAPH] Stored new feed: {summary[:60]}...")
except Exception as storage_error:
logger.warning(f"[GRAPH] Storage error (continuing): {storage_error}")
# DIRECT_BROADCAST_FIX: Set first_run_complete and broadcast
if not current_state.get('first_run_complete'):
current_state['first_run_complete'] = True
current_state['status'] = 'operational'
logger.info("[GRAPH] FIRST RUN COMPLETE - Broadcasting to frontend!")
# Trigger broadcast from sync thread to async loop
if main_event_loop:
asyncio.run_coroutine_threadsafe(
manager.broadcast(current_state),
main_event_loop
)
except RuntimeError as e:
if "cannot schedule new futures after interpreter shutdown" in str(e):
logger.warning("[GRAPH THREAD] Interpreter shutting down, stopping graph loop gracefully")
break # Exit the loop cleanly
else:
logger.error(f"[GRAPH THREAD] RuntimeError in cycle #{cycle_count}: {e}", exc_info=True)
except Exception as e:
logger.error(f"[GRAPH THREAD] Error in cycle #{cycle_count}: {e}", exc_info=True)
# Calculate time spent in this cycle
cycle_duration = time.time() - cycle_start
logger.info(f"[GRAPH THREAD] Cycle #{cycle_count} completed in {cycle_duration:.1f}s")
# Wait for remaining time to complete 60s interval (interruptible)
wait_time = max(0, REFRESH_INTERVAL_SECONDS - cycle_duration)
if wait_time > 0:
logger.info(f"[GRAPH THREAD] Waiting {wait_time:.1f}s before next cycle...")
# Use Event.wait() for interruptible sleep instead of time.sleep()
shutdown_event.wait(timeout=wait_time)
logger.info("[GRAPH THREAD] Graph loop stopped")
async def database_polling_loop():
"""
Polls database for new feeds and broadcasts via WebSocket.
Runs concurrently with graph thread.
"""
global current_state
last_check = utc_now()
logger.info("[DB_POLLER] Starting database polling loop")
while True:
try:
await asyncio.sleep(2.0) # Poll every 2 seconds
# Get new feeds since last check
new_feeds = storage_manager.get_feeds_since(last_check)
last_check = utc_now()
if new_feeds:
logger.info(f"[DB_POLLER] Found {len(new_feeds)} new feeds")
# Filter duplicates (by event_id)
unique_feeds = []
for feed in new_feeds:
event_id = feed.get("event_id")
if event_id and event_id not in seen_event_ids:
seen_event_ids.add(event_id)
# Add district categorization for map
feed["district"] = categorize_feed_by_district(feed)
unique_feeds.append(feed)
if unique_feeds:
# Update current state
current_state['final_ranked_feed'] = unique_feeds + current_state.get('final_ranked_feed', [])
current_state['final_ranked_feed'] = current_state['final_ranked_feed'][:100] # Keep last 100
current_state['status'] = 'operational'
current_state['last_update'] = utc_now().isoformat()
# Mark first run as complete (frontend loading screen can now hide)
if not current_state.get('first_run_complete'):
current_state['first_run_complete'] = True
logger.info("[DB_POLLER] First graph run complete! Frontend loading screen can now hide.")
# Broadcast to WebSocket clients
await manager.broadcast(current_state)
logger.info(f"[DB_POLLER] Broadcasted {len(unique_feeds)} unique feeds")
except Exception as e:
logger.error(f"[DB_POLLER] Error: {e}")
@app.on_event("startup")
async def startup_event():
global main_event_loop
    main_event_loop = asyncio.get_running_loop()  # get_event_loop() is deprecated inside coroutines
logger.info("[API] Starting Roger API...")
# Start graph execution in separate thread
graph_thread = threading.Thread(target=run_graph_loop, daemon=True)
graph_thread.start()
logger.info("[API] Graph thread started")
# Start database polling loop
asyncio.create_task(database_polling_loop())
logger.info("[API] Database polling started")
@app.get("/")
def read_root():
return {
"service": "Roger Intelligence Platform",
"status": current_state.get("status"),
"version": "2.0.0 (Database-Driven)"
}
@app.get("/api/status")
def get_status():
return {
"status": current_state.get("status"),
"run_count": current_state.get("run_count"),
"last_update": current_state.get("last_update"),
"active_connections": len(manager.active_connections),
"total_events": len(current_state.get("final_ranked_feed", []))
}
@app.get("/api/dashboard")
def get_dashboard():
return current_state.get("risk_dashboard_snapshot", {})
@app.get("/api/feed")
def get_feed():
"""Get current feed from memory"""
return {
"events": current_state.get("final_ranked_feed", []),
"total": len(current_state.get("final_ranked_feed", []))
}
@app.get("/api/feeds")
def get_feeds_from_db(limit: int = 100):
"""Get feeds directly from database (for initial load)"""
try:
feeds = storage_manager.get_recent_feeds(limit=limit)
# FIELD_NORMALIZATION + district categorization
normalized_feeds = []
for feed in feeds:
# Ensure frontend-compatible field names
normalized = {
"event_id": feed.get("event_id"),
"summary": feed.get("summary", ""),
"domain": feed.get("domain", "unknown"),
"severity": feed.get("severity", "medium"),
"impact_type": feed.get("impact_type", "risk"),
"confidence": feed.get("confidence", 0.5),
"timestamp": feed.get("timestamp"),
"district": categorize_feed_by_district(feed)
}
normalized_feeds.append(normalized)
return {
"events": normalized_feeds,
"total": len(normalized_feeds),
"source": "database"
}
except Exception as e:
logger.error(f"[API] Error fetching feeds: {e}")
return {"events": [], "total": 0, "error": str(e)}
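# Example initial-load fetch -- illustrative only; assumes the API is served on
# localhost:8000 and the `requests` package is installed:
#
#   import requests
#   data = requests.get("http://localhost:8000/api/feeds", params={"limit": 50}).json()
#   for event in data["events"]:
#       print(event["district"], "-", event["summary"][:60])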
@app.get("/api/feeds/by_district/{district}")
def get_feeds_by_district(district: str, limit: int = 50):
"""Get feeds for specific district"""
try:
all_feeds = storage_manager.get_recent_feeds(limit=200)
# Filter by district
district_feeds = []
for feed in all_feeds:
feed["district"] = categorize_feed_by_district(feed)
if feed["district"].lower() == district.lower():
district_feeds.append(feed)
if len(district_feeds) >= limit:
break
return {
"district": district,
"events": district_feeds,
"total": len(district_feeds)
}
except Exception as e:
logger.error(f"[API] Error fetching district feeds: {e}")
return {"events": [], "total": 0, "error": str(e)}
@app.get("/api/rivernet")
def get_rivernet_status():
"""Get real-time river monitoring data from RiverNet.lk"""
try:
from src.utils.utils import tool_rivernet_status
river_data = tool_rivernet_status()
return river_data
except Exception as e:
logger.error(f"[API] Error fetching rivernet data: {e}")
return {
"rivers": [],
"alerts": [],
"summary": {"total_monitored": 0, "overall_status": "error", "has_alerts": False},
"error": str(e)
}
@app.get("/api/weather/historical")
def get_historical_climate_data():
"""
Get 30-year historical flood pattern analysis.
Returns climate trend data including:
- Average annual rainfall
- Maximum daily rainfall records
- Heavy/extreme rain day counts
- Decadal comparison (1995-2025)
- Key climate change findings
"""
try:
from src.utils.utils import tool_floodwatch_historical
historical_data = tool_floodwatch_historical()
return {
"status": "success",
"data": historical_data
}
except Exception as e:
logger.error(f"[API] Error fetching historical data: {e}")
return {
"status": "error",
"error": str(e)
}
@app.get("/api/weather/threat")
def get_national_threat_score():
"""
Get national flood threat score (0-100).
Aggregates river status, DMC alerts, and seasonal factors
to compute an overall threat level for Sri Lanka.
Returns:
- national_threat_score (0-100)
- threat_level (CRITICAL/HIGH/MODERATE/LOW)
- breakdown by category
- risk district lists
"""
try:
from src.utils.utils import tool_rivernet_status, tool_calculate_national_threat, tool_dmc_alerts
# Get river data
river_data = None
try:
river_data = tool_rivernet_status()
except Exception as e:
logger.warning(f"[ThreatAPI] RiverNet unavailable: {e}")
# Get DMC alerts
dmc_data = None
try:
dmc_result = tool_dmc_alerts()
dmc_data = dmc_result.get("alerts", [])
except Exception as e:
logger.warning(f"[ThreatAPI] DMC unavailable: {e}")
# Calculate threat score
threat_data = tool_calculate_national_threat(
river_data=river_data,
dmc_alerts=dmc_data
)
return {
"status": "success",
**threat_data
}
except Exception as e:
logger.error(f"[API] Error calculating threat: {e}")
return {
"status": "error",
"national_threat_score": 0,
"threat_level": "UNKNOWN",
"error": str(e)
}
# ============================================
# INTEL CONFIG API - User Keywords & Profiles
# ============================================
# Global intel config (loaded from file)
INTEL_CONFIG_PATH = os.path.join(os.path.dirname(__file__), "data", "intel_config.json")
# Default config structure
DEFAULT_INTEL_CONFIG = {
"user_profiles": {
"twitter": [],
"facebook": [],
"linkedin": []
},
"user_keywords": [],
"user_products": []
}
def load_intel_config() -> dict:
"""Load intel config from JSON file."""
try:
if os.path.exists(INTEL_CONFIG_PATH):
with open(INTEL_CONFIG_PATH, "r", encoding="utf-8") as f:
return json.load(f)
except Exception as e:
logger.warning(f"[Intel Config] Error loading config: {e}")
return DEFAULT_INTEL_CONFIG.copy()
def save_intel_config(config: dict) -> bool:
"""Save intel config to JSON file."""
try:
os.makedirs(os.path.dirname(INTEL_CONFIG_PATH), exist_ok=True)
with open(INTEL_CONFIG_PATH, "w", encoding="utf-8") as f:
json.dump(config, f, indent=2, ensure_ascii=False)
return True
except Exception as e:
logger.error(f"[Intel Config] Error saving config: {e}")
return False
# Load config on startup
intel_config = load_intel_config()
@app.get("/api/intel/config")
def get_intel_config():
"""
Get current intelligence configuration.
Returns user-defined keywords, products, and social profiles to monitor.
"""
global intel_config
intel_config = load_intel_config() # Refresh from file
return {
"status": "success",
"config": intel_config
}
class IntelConfigUpdate(BaseModel):
    user_profiles: Optional[Dict[str, List[str]]] = None
    user_keywords: Optional[List[str]] = None
    user_products: Optional[List[str]] = None
@app.post("/api/intel/config")
def update_intel_config(config_update: IntelConfigUpdate):
"""
Update intelligence configuration.
Accepts user-defined keywords, products, and social profiles.
Changes take effect on the next agent collection cycle.
"""
global intel_config
try:
# Update fields if provided
if config_update.user_profiles is not None:
intel_config["user_profiles"] = config_update.user_profiles
if config_update.user_keywords is not None:
intel_config["user_keywords"] = config_update.user_keywords
if config_update.user_products is not None:
intel_config["user_products"] = config_update.user_products
# Save to file
if save_intel_config(intel_config):
logger.info(f"[Intel Config] Updated: {len(intel_config.get('user_keywords', []))} keywords, "
f"{sum(len(v) for v in intel_config.get('user_profiles', {}).values())} profiles")
return {
"status": "updated",
"config": intel_config
}
else:
return {"status": "error", "error": "Failed to save configuration"}
except Exception as e:
logger.error(f"[Intel Config] Update error: {e}")
return {"status": "error", "error": str(e)}
def get_user_intel_config() -> dict:
"""
Get the current intel config for use by agents.
This function is called by social agents to get user-defined keywords and profiles.
"""
global intel_config
return intel_config
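# Sketch of agent-side usage (hypothetical agent code, shown only to document the
# expected shape of the config dict):
#
#   cfg = get_user_intel_config()
#   keywords = cfg.get("user_keywords", [])                      # e.g. ["Colombo Port"]
#   twitter_profiles = cfg.get("user_profiles", {}).get("twitter", [])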
# ============================================
# SITUATIONAL AWARENESS API ENDPOINTS (NEW)
# ============================================
@app.get("/api/power")
def get_power_status():
"""
Get CEB power outage / load shedding status.
Returns current power supply status, active load shedding schedules,
and any CEB announcements.
"""
try:
from src.utils.utils import tool_ceb_power_status
power_data = tool_ceb_power_status()
return {
"status": "success",
**power_data
}
except Exception as e:
logger.error(f"[API] Error fetching power status: {e}")
return {
"status": "error",
"load_shedding_active": False,
"error": str(e)
}
@app.get("/api/fuel")
def get_fuel_prices():
"""
Get current fuel prices in Sri Lanka.
Returns prices for Petrol 92/95, Diesel, Super Diesel, and Kerosene.
"""
try:
from src.utils.utils import tool_fuel_prices
fuel_data = tool_fuel_prices()
return {
"status": "success",
**fuel_data
}
except Exception as e:
logger.error(f"[API] Error fetching fuel prices: {e}")
return {
"status": "error",
"prices": {},
"error": str(e)
}
@app.get("/api/economy")
def get_economic_indicators():
"""
Get key economic indicators from CBSL.
Returns inflation rates, policy rates, exchange rates, and forex reserves.
"""
try:
from src.utils.utils import tool_cbsl_indicators
economy_data = tool_cbsl_indicators()
return {
"status": "success",
**economy_data
}
except Exception as e:
logger.error(f"[API] Error fetching economic indicators: {e}")
return {
"status": "error",
"indicators": {},
"error": str(e)
}
@app.get("/api/health")
def get_health_alerts():
"""
Get health alerts and disease information.
Returns current health alerts, dengue case data, and health advisories.
"""
try:
from src.utils.utils import tool_health_alerts
health_data = tool_health_alerts()
return {
"status": "success",
**health_data
}
except Exception as e:
logger.error(f"[API] Error fetching health data: {e}")
return {
"status": "error",
"alerts": [],
"dengue": {},
"error": str(e)
}
@app.get("/api/commodities")
def get_commodity_prices():
"""
Get prices for essential commodities.
Returns current prices for rice, sugar, dhal, milk powder, and other staples.
"""
try:
from src.utils.utils import tool_commodity_prices
commodity_data = tool_commodity_prices()
return {
"status": "success",
**commodity_data
}
except Exception as e:
logger.error(f"[API] Error fetching commodity prices: {e}")
return {
"status": "error",
"commodities": [],
"error": str(e)
}
@app.get("/api/water")
def get_water_supply_status():
"""
Get water supply disruption alerts from NWSDB.
Returns active disruptions, affected areas, and restoration estimates.
"""
try:
from src.utils.utils import tool_water_supply_alerts
water_data = tool_water_supply_alerts()
return {
"status": "success",
**water_data
}
except Exception as e:
logger.error(f"[API] Error fetching water status: {e}")
return {
"status": "error",
"active_disruptions": [],
"error": str(e)
}
# NOTE: Weather predictions endpoint moved to async version below (line ~1540)
# NOTE: Currency prediction endpoint moved to async version below (line ~1680)
@app.get("/api/currency/history")
def get_currency_history(days: int = 7):
"""
Get historical USD/LKR exchange rate data.
Args:
days: Number of days of history to return (default 7)
Returns:
List of historical rates with date and close price.
"""
try:
from pathlib import Path
import pandas as pd
# Path to currency data
data_dir = Path(__file__).parent / "models" / "currency-volatility-prediction" / "artifacts" / "data"
# Find the data file
data_files = list(data_dir.glob("currency_data_*.csv")) if data_dir.exists() else []
if data_files:
            # Pick the newest file; the date-stamped filenames sort lexicographically
            latest_file = max(data_files, key=lambda p: p.stem)
df = pd.read_csv(latest_file)
# Get last N days
df['date'] = pd.to_datetime(df['date'])
df = df.sort_values('date', ascending=False).head(days)
df = df.sort_values('date', ascending=True)
history = []
for _, row in df.iterrows():
history.append({
"date": row['date'].strftime("%Y-%m-%d"),
"close": float(row['close']),
"high": float(row.get('high', row['close'])),
"low": float(row.get('low', row['close']))
})
return {
"status": "success",
"history": history,
"days": len(history)
}
return {
"status": "no_data",
"message": "No historical data available. Run data ingestion first.",
"history": []
}
except Exception as e:
logger.error(f"[CurrencyAPI] Error fetching history: {e}")
return {
"status": "error",
"error": str(e),
"history": []
}
# ============================================
# TRENDING DETECTION ENDPOINTS
# ============================================
@app.get("/api/trending")
def get_trending_topics(limit: int = 10):
"""
Get currently trending topics.
Returns topics with momentum > 2x (gaining traction).
"""
try:
from src.utils.trending_detector import get_trending_now, get_spikes
        # storage_manager is the module-level instance initialized near the top of this file.
trending = get_trending_now(limit=limit)
spikes = get_spikes()
# Enrich top 5 trending topics with related feeds
for topic in trending[:5]:
keyword = topic["topic"]
# Search for relevant feeds (limit 2 per topic to keep payload small)
try:
related = storage_manager.search_feeds(keyword, limit=2)
topic["related_feeds"] = related
except Exception as e:
logger.warning(f"Error searching feeds for topic {keyword}: {e}")
topic["related_feeds"] = []
return {
"status": "success",
"trending_topics": trending,
"spike_alerts": spikes,
"total_trending": len(trending),
"total_spikes": len(spikes)
}
except Exception as e:
logger.error(f"[TrendingAPI] Error: {e}")
return {
"status": "error",
"error": str(e),
"trending_topics": [],
"spike_alerts": []
}
@app.get("/api/trending/topic/{topic}")
def get_topic_history(topic: str, hours: int = 24):
"""
Get hourly mention history for a specific topic.
Args:
topic: Topic name to get history for
hours: Number of hours of history to return (default 24)
"""
try:
from src.utils.trending_detector import get_trending_detector
detector = get_trending_detector()
history = detector.get_topic_history(topic, hours=hours)
momentum = detector.get_momentum(topic)
is_spike = detector.is_spike(topic)
return {
"status": "success",
"topic": topic,
"momentum": momentum,
"is_spike": is_spike,
"history": history
}
except Exception as e:
logger.error(f"[TrendingAPI] Error getting history for {topic}: {e}")
return {
"status": "error",
"error": str(e),
"topic": topic,
"momentum": 1.0,
"is_spike": False,
"history": []
}
@app.post("/api/trending/record")
def record_topic_mention(topic: str, source: str = "manual", domain: str = "general"):
"""
Record a topic mention (for testing/manual tracking).
Args:
topic: Topic/keyword being mentioned
source: Source of the mention (twitter, news, etc.)
domain: Domain category (political, economical, etc.)
"""
try:
from src.utils.trending_detector import record_topic_mention as record_mention
record_mention(topic=topic, source=source, domain=domain)
# Get updated momentum
from src.utils.trending_detector import get_trending_detector
detector = get_trending_detector()
momentum = detector.get_momentum(topic)
return {
"status": "success",
"message": f"Recorded mention for '{topic}'",
"current_momentum": momentum,
"is_spike": detector.is_spike(topic)
}
except Exception as e:
logger.error(f"[TrendingAPI] Error recording mention: {e}")
return {
"status": "error",
"error": str(e)
}
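# Example manual record -- illustrative; parameters go in the query string, not a
# JSON body, given the endpoint signature above:
#
#   import requests
#   requests.post("http://localhost:8000/api/trending/record",
#                 params={"topic": "fuel prices", "source": "news", "domain": "economical"})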
# ============================================
# ANOMALY DETECTION ENDPOINTS
# ============================================
# Lazy-loaded anomaly detection components
_anomaly_models = {} # {language: model}
_vectorizer = None
_language_detector = None
def _load_anomaly_components():
"""Load per-language anomaly detection models and vectorizer"""
global _anomaly_models, _vectorizer, _language_detector
if _anomaly_models:
return True
try:
import joblib
from pathlib import Path
# Model directories
output_dir = Path(__file__).parent / "models" / "anomaly-detection" / "output"
artifacts_dir = Path(__file__).parent / "models" / "anomaly-detection" / "artifacts" / "model_trainer"
# Load per-language models
for lang in ["english", "sinhala", "tamil"]:
for search_dir in [artifacts_dir, output_dir]:
model_path = search_dir / f"isolation_forest_{lang}.joblib"
if model_path.exists():
_anomaly_models[lang] = joblib.load(model_path)
logger.info(f"[AnomalyAPI] Loaded {lang} model from {model_path.name}")
break
# Fallback to legacy model if no per-language models found
if not _anomaly_models:
legacy_paths = [
output_dir / "isolation_forest_embeddings_only.joblib",
output_dir / "isolation_forest_model.joblib",
]
for legacy_path in legacy_paths:
if legacy_path.exists():
_anomaly_models["english"] = joblib.load(legacy_path)
logger.info(f"[AnomalyAPI] Loaded legacy model: {legacy_path.name}")
break
if not _anomaly_models:
logger.warning("[AnomalyAPI] No trained models found. Run training first.")
return False
# Load vectorizer and language detector
from models.anomaly_detection.src.utils.vectorizer import get_vectorizer
from models.anomaly_detection.src.utils.language_detector import detect_language
_vectorizer = get_vectorizer()
_language_detector = detect_language
logger.info(f"[AnomalyAPI] ✓ Loaded models for: {list(_anomaly_models.keys())}")
return True
except Exception as e:
logger.error(f"[AnomalyAPI] Failed to load components: {e}")
return False
@app.post("/api/predict")
def predict_anomaly(texts: Optional[List[str]] = None, text: Optional[str] = None):
"""
Run anomaly detection on text(s) using per-language models.
Args:
texts: List of texts to analyze
text: Single text to analyze (alternative to texts)
Returns:
Predictions with anomaly scores
"""
try:
# Handle input
if text and not texts:
texts = [text]
if not texts:
return {"error": "No text provided. Use 'text' or 'texts' field.", "predictions": []}
# Load components
if not _load_anomaly_components():
# If no model, return scores based on heuristics
return {
"predictions": [
{
"text": t[:100] + "..." if len(t) > 100 else t,
"is_anomaly": False,
"anomaly_score": 0.0,
"method": "heuristic"
}
for t in texts
],
"model_status": "not_trained",
"message": "Model not trained yet. Using default scores."
}
# Process texts with per-language models
predictions = []
for t in texts:
try:
# Detect language
lang, lang_conf = _language_detector(t)
# Vectorize
vector = _vectorizer.vectorize(t, lang)
# Select appropriate model
if lang in _anomaly_models:
model = _anomaly_models[lang]
method = f"isolation_forest_{lang}"
elif "english" in _anomaly_models:
model = _anomaly_models["english"]
method = "isolation_forest_english_fallback"
else:
# No model available
predictions.append({
"text": t[:100] + "..." if len(t) > 100 else t,
"is_anomaly": False,
"anomaly_score": 0.0,
"language": lang,
"method": "no_model"
})
continue
# Predict: -1 = anomaly, 1 = normal
prediction = model.predict([vector])[0]
# Get anomaly score
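                # sklearn's IsolationForest.decision_function is positive for inliers
                # and negative for outliers; negating it makes higher mean "more anomalous".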
if hasattr(model, 'decision_function'):
score = -model.decision_function([vector])[0]
elif hasattr(model, 'score_samples'):
score = -model.score_samples([vector])[0]
else:
score = 1.0 if prediction == -1 else 0.0
predictions.append({
"text": t[:100] + "..." if len(t) > 100 else t,
"is_anomaly": prediction == -1,
"anomaly_score": float(score),
"language": lang,
"method": method
})
except Exception as e:
logger.error(f"[AnomalyAPI] Error predicting: {e}")
predictions.append({
"text": t[:100] + "..." if len(t) > 100 else t,
"is_anomaly": False,
"anomaly_score": 0.0,
"error": str(e)
})
return {
"predictions": predictions,
"total": len(predictions),
"anomalies_found": sum(1 for p in predictions if p.get("is_anomaly")),
"model_status": "loaded",
"models_available": list(_anomaly_models.keys())
}
except Exception as e:
logger.error(f"[AnomalyAPI] Predict error: {e}", exc_info=True)
return {"error": str(e), "predictions": []}
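# Example request -- illustrative; with the signature above, `text`/`texts` arrive
# as query parameters:
#
#   import requests
#   resp = requests.post("http://localhost:8000/api/predict",
#                        params={"text": "Breaking: flood emergency in Colombo"}).json()
#   print(resp["predictions"][0]["is_anomaly"], resp["predictions"][0]["anomaly_score"])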
@app.get("/api/anomalies")
def get_anomalies(limit: int = 20, threshold: float = 0.5):
"""
Get recent feeds that are flagged as anomalies.
Args:
limit: Max number of results
threshold: Anomaly score threshold (0-1)
Returns:
List of anomalous events
"""
try:
# Get recent feeds
feeds = storage_manager.get_recent_feeds(limit=100)
if not feeds:
# No feeds yet - return helpful message
return {
"anomalies": [],
"total": 0,
"model_status": "no_data",
"message": "No feed data available yet. Wait for graph execution to complete."
}
if not _load_anomaly_components():
# Use severity + keyword-based scoring as intelligent fallback
anomalies = []
anomaly_keywords = ["emergency", "crisis", "breaking", "urgent", "alert",
"warning", "critical", "disaster", "flood", "protest"]
for f in feeds:
score = 0.0
summary = str(f.get("summary", "")).lower()
severity = f.get("severity", "low")
# Severity-based scoring
if severity == "critical": score = 0.9
elif severity == "high": score = 0.75
elif severity == "medium": score = 0.5
else: score = 0.25
# Keyword boosting
keyword_matches = sum(1 for kw in anomaly_keywords if kw in summary)
if keyword_matches > 0:
score = min(1.0, score + (keyword_matches * 0.1))
# Only include if above threshold
if score >= threshold:
anomalies.append({
**f,
"anomaly_score": round(score, 3),
"is_anomaly": score >= 0.7
})
# Sort by anomaly score
anomalies.sort(key=lambda x: x.get("anomaly_score", 0), reverse=True)
return {
"anomalies": anomalies[:limit],
"total": len(anomalies),
"threshold": threshold,
"model_status": "fallback_scoring",
"message": "Using severity + keyword scoring. Train ML model for advanced detection."
}
# ML Models are loaded - use per-language models for scoring
anomalies = []
per_lang_counts = {"english": 0, "sinhala": 0, "tamil": 0}
for feed in feeds:
summary = feed.get("summary", "")
if not summary:
continue
try:
lang, _ = _language_detector(summary)
vector = _vectorizer.vectorize(summary, lang)
# Select appropriate model
if lang in _anomaly_models:
model = _anomaly_models[lang]
method = f"isolation_forest_{lang}"
elif "english" in _anomaly_models:
model = _anomaly_models["english"]
method = "isolation_forest_english_fallback"
else:
continue
per_lang_counts[lang] = per_lang_counts.get(lang, 0) + 1
prediction = model.predict([vector])[0]
if hasattr(model, 'decision_function'):
score = -model.decision_function([vector])[0]
else:
score = 1.0 if prediction == -1 else 0.0
# Normalize score to 0-1 range
normalized_score = max(0, min(1, (score + 0.5)))
if prediction == -1 or normalized_score >= threshold:
anomalies.append({
**feed,
"anomaly_score": float(round(normalized_score, 3)),
"is_anomaly": prediction == -1,
"language": lang,
"detection_method": method
})
if len(anomalies) >= limit:
break
except Exception as e:
logger.debug(f"[AnomalyAPI] Error scoring feed: {e}")
continue
# Sort by anomaly score
anomalies.sort(key=lambda x: x.get("anomaly_score", 0), reverse=True)
return {
"anomalies": anomalies,
"total": len(anomalies),
"threshold": threshold,
"model_status": "ml_active",
"models_loaded": list(_anomaly_models.keys()),
"per_language_counts": per_lang_counts
}
except Exception as e:
logger.error(f"[AnomalyAPI] Get anomalies error: {e}")
return {"anomalies": [], "total": 0, "error": str(e)}
@app.get("/api/model/status")
def get_model_status():
"""Get anomaly detection model status"""
try:
from pathlib import Path
output_dir = Path(__file__).parent / "models" / "anomaly-detection" / "output"
models_found = []
if output_dir.exists():
for f in output_dir.glob("*.joblib"):
models_found.append(f.name)
        loaded = bool(_anomaly_models)  # per-language model dict populated by _load_anomaly_components()
return {
"model_loaded": loaded,
"models_available": models_found,
"vectorizer_loaded": _vectorizer is not None,
"batch_threshold": int(os.getenv("BATCH_THRESHOLD", "1000")),
"output_directory": str(output_dir)
}
except Exception as e:
return {"error": str(e), "model_loaded": False}
# ============================================
# RAG CHATBOT ENDPOINTS
# ============================================
# Lazy-loaded RAG instance
_rag_instance = None
def _get_rag():
"""Get or create RAG instance"""
global _rag_instance
if _rag_instance is None:
try:
from src.rag import RogerRAG
_rag_instance = RogerRAG()
logger.info("[RAG API] ✓ RAG instance initialized")
except Exception as e:
logger.error(f"[RAG API] Failed to initialize RAG: {e}")
return None
return _rag_instance
class ChatRequest(BaseModel):
message: str
domain_filter: Optional[str] = None
use_history: bool = True
class ChatResponse(BaseModel):
answer: str
sources: List[Dict[str, Any]] = []
reformulated: Optional[str] = None
docs_found: int = 0
error: Optional[str] = None
@app.post("/api/rag/chat", response_model=ChatResponse)
def rag_chat(request: ChatRequest):
"""
Chat with the RAG system.
Args:
message: User's question
domain_filter: Optional domain (political, economic, weather, social, intelligence)
use_history: Whether to use chat history for context (default: True)
Returns:
AI response with sources
"""
try:
rag = _get_rag()
if not rag:
return ChatResponse(
answer="RAG system not available. Please check server logs.",
error="RAG initialization failed"
)
result = rag.query(
question=request.message,
domain_filter=request.domain_filter,
use_history=request.use_history
)
return ChatResponse(
answer=result.get("answer", "No response generated."),
sources=result.get("sources", []),
reformulated=result.get("reformulated"),
docs_found=result.get("docs_found", 0),
error=result.get("error")
)
except Exception as e:
logger.error(f"[RAG API] Chat error: {e}", exc_info=True)
return ChatResponse(
answer=f"Error processing your request: {str(e)}",
error=str(e)
)
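# Example chat call -- illustrative; the JSON body mirrors ChatRequest above:
#
#   import requests
#   resp = requests.post("http://localhost:8000/api/rag/chat",
#                        json={"message": "Any flood alerts today?", "domain_filter": "weather"}).json()
#   print(resp["answer"])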
@app.get("/api/rag/stats")
def rag_stats():
"""Get RAG system statistics"""
try:
rag = _get_rag()
if not rag:
return {"error": "RAG not available", "status": "offline"}
stats = rag.get_stats()
stats["status"] = "online"
return stats
except Exception as e:
return {"error": str(e), "status": "error"}
@app.post("/api/rag/clear")
def rag_clear_history():
"""Clear RAG chat history"""
try:
rag = _get_rag()
if rag:
rag.clear_history()
return {"message": "Chat history cleared", "success": True}
return {"message": "RAG not available", "success": False}
except Exception as e:
return {"error": str(e), "success": False}
# =============================================================================
# INTELLIGENCE CONFIG ENDPOINTS (User-defined monitoring targets)
# =============================================================================
# Reuses the INTEL_CONFIG_PATH defined earlier so every intel-config endpoint
# reads and writes the same file.
def _ensure_intel_config() -> str:
"""Ensure config directory and file exist with default structure"""
os.makedirs(os.path.dirname(INTEL_CONFIG_PATH), exist_ok=True)
if not os.path.exists(INTEL_CONFIG_PATH):
default_config = {
"user_profiles": {"twitter": [], "facebook": [], "linkedin": []},
"user_keywords": [],
"user_products": []
}
with open(INTEL_CONFIG_PATH, "w", encoding="utf-8") as f:
json.dump(default_config, f, indent=2)
logger.info(f"[IntelConfig] Created default config at {INTEL_CONFIG_PATH}")
return INTEL_CONFIG_PATH
@app.post("/api/intel/config/add")
def add_intel_target(target_type: str, value: str, platform: Optional[str] = None):
"""
Add a single monitoring target.
Args:
target_type: "keyword", "product", or "profile"
value: The value to add
platform: Required for "profile" type (twitter, facebook, linkedin)
Example:
POST /api/intel/config/add?target_type=keyword&value=Colombo+Port
POST /api/intel/config/add?target_type=profile&value=CompetitorX&platform=twitter
"""
try:
path = _ensure_intel_config()
with open(path, "r", encoding="utf-8") as f:
config = json.load(f)
added = False
if target_type == "keyword":
if value not in config.get("user_keywords", []):
config.setdefault("user_keywords", []).append(value)
added = True
elif target_type == "product":
if value not in config.get("user_products", []):
config.setdefault("user_products", []).append(value)
added = True
elif target_type == "profile":
if not platform:
return {"status": "error", "error": "platform is required for profile type"}
profiles = config.setdefault("user_profiles", {})
platform_list = profiles.setdefault(platform, [])
if value not in platform_list:
platform_list.append(value)
added = True
else:
return {"status": "error", "error": f"Invalid target_type: {target_type}"}
if added:
with open(path, "w", encoding="utf-8") as f:
json.dump(config, f, indent=2)
logger.info(f"[IntelConfig] Added {target_type}: {value}")
return {"status": "added" if added else "already_exists", "config": config}
except Exception as e:
logger.error(f"[IntelConfig] Error adding target: {e}")
return {"status": "error", "error": str(e)}
@app.delete("/api/intel/config/remove")
def remove_intel_target(target_type: str, value: str, platform: Optional[str] = None):
"""
Remove a monitoring target.
Args:
target_type: "keyword", "product", or "profile"
value: The value to remove
platform: Required for "profile" type
"""
try:
path = _ensure_intel_config()
with open(path, "r", encoding="utf-8") as f:
config = json.load(f)
removed = False
if target_type == "keyword":
if value in config.get("user_keywords", []):
config["user_keywords"].remove(value)
removed = True
elif target_type == "product":
if value in config.get("user_products", []):
config["user_products"].remove(value)
removed = True
elif target_type == "profile":
if not platform:
return {"status": "error", "error": "platform is required for profile type"}
if platform in config.get("user_profiles", {}) and value in config["user_profiles"][platform]:
config["user_profiles"][platform].remove(value)
removed = True
else:
return {"status": "error", "error": f"Invalid target_type: {target_type}"}
if removed:
with open(path, "w", encoding="utf-8") as f:
json.dump(config, f, indent=2)
logger.info(f"[IntelConfig] Removed {target_type}: {value}")
return {"status": "removed" if removed else "not_found", "config": config}
except Exception as e:
logger.error(f"[IntelConfig] Error removing target: {e}")
return {"status": "error", "error": str(e)}
# =============================================================================
# WEATHER PREDICTION ENDPOINTS
# =============================================================================
# Lazy-loaded weather predictor
_weather_predictor = None
def get_weather_predictor():
"""Lazy-load the weather predictor using isolated import."""
global _weather_predictor
if _weather_predictor is not None:
return _weather_predictor
try:
import importlib.util
from pathlib import Path
import json
# Use importlib.util for fully isolated import (avoids package collisions)
weather_src = Path(__file__).parent / "models" / "weather-prediction" / "src"
predictor_path = weather_src / "components" / "predictor.py"
if not predictor_path.exists():
logger.error(f"[WeatherAPI] predictor.py not found at {predictor_path}")
return None
# CRITICAL: Remove any conflicting paths (currency-volatility-prediction/src)
# to avoid entity.config_entity collision
currency_src = str(Path(__file__).parent / "models" / "currency-volatility-prediction" / "src")
stock_src = str(Path(__file__).parent / "models" / "stock-price-prediction" / "src")
anomaly_src = str(Path(__file__).parent / "models" / "anomaly-detection" / "src")
original_path = sys.path.copy()
sys.path = [p for p in sys.path if currency_src not in p and stock_src not in p and anomaly_src not in p]
# CRITICAL: Clear cached entity modules that may have been imported from wrong path
        modules_to_clear = [k for k in sys.modules.keys() if 'entity' in k.lower()]
saved_modules = {}
for mod_name in modules_to_clear:
saved_modules[mod_name] = sys.modules.pop(mod_name, None)
# Add weather src to path FIRST for relative imports
weather_src_str = str(weather_src)
if weather_src_str not in sys.path:
sys.path.insert(0, weather_src_str)
try:
# Now load predictor module
spec = importlib.util.spec_from_file_location(
"weather_predictor_module",
str(predictor_path)
)
module = importlib.util.module_from_spec(spec)
spec.loader.exec_module(module)
_weather_predictor = module.WeatherPredictor()
logger.info("[WeatherAPI] ✓ Weather predictor initialized via isolated import")
finally:
# Restore original path
sys.path = original_path
# Restore saved modules (to avoid breaking other parts of the system)
for mod_name, mod in saved_modules.items():
if mod is not None:
sys.modules[mod_name] = mod
return _weather_predictor
except Exception as e:
logger.error(f"[WeatherAPI] Failed to initialize predictor: {e}")
import traceback
logger.error(f"[WeatherAPI] Full traceback:\n{traceback.format_exc()}")
return None
@app.get("/api/weather/predictions")
async def get_weather_predictions():
"""
Get weather predictions for all 25 Sri Lankan districts.
Returns next-day predictions including:
- Temperature (high/low)
- Rainfall (amount and probability)
- Flood risk
- Severity classification
"""
predictor = get_weather_predictor()
if predictor is None:
return {
"status": "unavailable",
"message": "Weather prediction model not loaded",
"predictions": None
}
try:
# Try to get latest predictions from file
predictions = predictor.get_latest_predictions()
if predictions is None:
# Generate new predictions
logger.info("[WeatherAPI] Generating new predictions...")
predictions = predictor.predict_all_districts()
predictor.save_predictions(predictions)
return {
"status": "success",
"prediction_date": predictions.get("prediction_date"),
"generated_at": predictions.get("generated_at"),
"districts": predictions.get("districts", {}),
"total_districts": len(predictions.get("districts", {}))
}
except Exception as e:
logger.error(f"[WeatherAPI] Error getting predictions: {e}")
return {"status": "error", "message": str(e)}
@app.get("/api/weather/predictions/{district}")
async def get_district_weather(district: str):
"""Get weather prediction for a specific district."""
predictor = get_weather_predictor()
if predictor is None:
return {"status": "unavailable", "message": "Weather predictor not loaded"}
try:
predictions = predictor.get_latest_predictions()
if predictions is None:
predictions = predictor.predict_all_districts()
districts = predictions.get("districts", {})
# Case-insensitive lookup
district_key = None
for d in districts.keys():
if d.lower() == district.lower():
district_key = d
break
if district_key is None:
return {
"status": "not_found",
"message": f"District '{district}' not found",
"available_districts": list(districts.keys())
}
return {
"status": "success",
"district": district_key,
"prediction_date": predictions.get("prediction_date"),
"prediction": districts[district_key]
}
except Exception as e:
return {"status": "error", "message": str(e)}
@app.get("/api/weather/model/status")
async def get_weather_model_status():
"""Get weather prediction model status and training info."""
from pathlib import Path
models_dir = Path(__file__).parent / "models" / "weather-prediction" / "artifacts" / "models"
predictions_dir = Path(__file__).parent / "models" / "weather-prediction" / "output" / "predictions"
model_files = list(models_dir.glob("lstm_*.h5")) if models_dir.exists() else []
prediction_files = list(predictions_dir.glob("predictions_*.json")) if predictions_dir.exists() else []
latest_prediction = None
if prediction_files:
latest = max(prediction_files, key=lambda p: p.stat().st_mtime)
latest_prediction = {
"file": latest.name,
"modified": datetime.fromtimestamp(latest.stat().st_mtime).isoformat()
}
return {
"status": "available" if model_files else "not_trained",
"models_trained": len(model_files),
"trained_stations": [f.stem.replace("lstm_", "").upper() for f in model_files],
"latest_prediction": latest_prediction,
"predictions_available": len(prediction_files)
}
# =============================================================================
# CURRENCY PREDICTION ENDPOINTS
# =============================================================================
# Lazy-loaded currency predictor
_currency_predictor = None
def get_currency_predictor():
"""Lazy-load the currency predictor."""
global _currency_predictor
if _currency_predictor is None:
try:
import sys
from pathlib import Path
currency_path = Path(__file__).parent / "models" / "currency-volatility-prediction" / "src"
sys.path.insert(0, str(currency_path))
from components.predictor import CurrencyPredictor
_currency_predictor = CurrencyPredictor()
logger.info("[CurrencyAPI] Currency predictor initialized")
except Exception as e:
logger.warning(f"[CurrencyAPI] Failed to initialize predictor: {e}")
_currency_predictor = None
return _currency_predictor
@app.get("/api/currency/prediction")
async def get_currency_prediction():
"""
Get USD/LKR currency prediction for next day.
Returns:
- Current rate
- Predicted rate
- Expected change percentage
- Direction (strengthening/weakening)
- Volatility classification
"""
predictor = get_currency_predictor()
if predictor is None:
# Generate fallback prediction inline
import numpy as np
current_rate = 298.0
np.random.seed(int(datetime.now().timestamp()) % 2**31)
change_pct = np.random.normal(0.05, 0.3)
predicted_rate = current_rate * (1 + change_pct / 100)
return {
"status": "success",
"prediction": {
"prediction_date": (datetime.now() + timedelta(days=1)).strftime("%Y-%m-%d"),
"generated_at": datetime.now().isoformat(),
"model_version": "fallback",
"is_fallback": True,
"current_rate": round(current_rate, 2),
"predicted_rate": round(predicted_rate, 2),
"expected_change": round(predicted_rate - current_rate, 2),
"expected_change_pct": round(change_pct, 3),
"direction": "strengthening" if change_pct < 0 else "weakening",
"direction_emoji": "📈" if change_pct < 0 else "📉",
"volatility_class": "low",
"note": "Using fallback - model initializing"
}
}
try:
# Try to get latest prediction from file
prediction = predictor.get_latest_prediction()
if prediction is None:
# Generate fallback
logger.info("[CurrencyAPI] No prediction found, generating fallback...")
prediction = predictor.generate_fallback_prediction()
predictor.save_prediction(prediction)
return {
"status": "success",
"prediction": prediction
}
except Exception as e:
logger.error(f"[CurrencyAPI] Error: {e}")
return {"status": "error", "message": str(e)}
@app.get("/api/currency/history")
async def get_currency_history(days: int = 30):
"""Get historical USD/LKR rates."""
from pathlib import Path
import pandas as pd
try:
data_dir = Path(__file__).parent / "models" / "currency-volatility-prediction" / "artifacts" / "data"
csv_files = list(data_dir.glob("currency_data_*.csv")) if data_dir.exists() else []
if not csv_files:
return {"status": "no_data", "message": "No currency data available"}
latest = max(csv_files, key=lambda p: p.stat().st_mtime)
df = pd.read_csv(latest, parse_dates=["date"])
# Get last N days
df = df.tail(days)
history = []
for _, row in df.iterrows():
history.append({
"date": row["date"].strftime("%Y-%m-%d") if hasattr(row["date"], "strftime") else str(row["date"]),
"close": round(row["close"], 2),
"high": round(row.get("high", row["close"]), 2),
"low": round(row.get("low", row["close"]), 2),
"daily_return_pct": round(row.get("daily_return", 0) * 100, 3)
})
return {
"status": "success",
"days": len(history),
"history": history
}
except Exception as e:
return {"status": "error", "message": str(e)}
@app.get("/api/currency/model/status")
async def get_currency_model_status():
"""Get currency prediction model status."""
from pathlib import Path
models_dir = Path(__file__).parent / "models" / "currency-volatility-prediction" / "artifacts" / "models"
predictions_dir = Path(__file__).parent / "models" / "currency-volatility-prediction" / "output" / "predictions"
model_exists = (models_dir / "gru_usd_lkr.h5").exists() if models_dir.exists() else False
prediction_files = list(predictions_dir.glob("currency_prediction_*.json")) if predictions_dir.exists() else []
latest_prediction = None
if prediction_files:
latest = max(prediction_files, key=lambda p: p.stat().st_mtime)
latest_prediction = {
"file": latest.name,
"modified": datetime.fromtimestamp(latest.stat().st_mtime).isoformat()
}
return {
"status": "available" if model_exists else "not_trained",
"model_type": "GRU",
"target": "USD/LKR",
"latest_prediction": latest_prediction,
"predictions_available": len(prediction_files)
}
# =============================================================================
# STOCK PREDICTION ENDPOINTS
# =============================================================================
# Lazy-loaded stock predictor
_stock_predictor = None
def get_stock_predictor():
"""Lazy-load the stock predictor."""
global _stock_predictor
if _stock_predictor is None:
try:
import sys
from pathlib import Path
            stock_path = Path(__file__).parent / "models" / "stock-price-prediction" / "src"
            # Guard against duplicate sys.path entries on repeated init attempts
            if str(stock_path) not in sys.path:
                sys.path.insert(0, str(stock_path))
from components.predictor import StockPredictor
_stock_predictor = StockPredictor()
logger.info("[StockAPI] Stock predictor initialized")
except Exception as e:
logger.warning(f"[StockAPI] Failed to initialize predictor: {e}")
_stock_predictor = None
return _stock_predictor
@app.get("/api/stocks/predictions")
async def get_stock_predictions():
"""
Get stock price predictions for all configured stocks.
Returns predictions for 10 popular stocks with:
- Current price
- Predicted next-day price
- Expected change percentage
- Trend classification (bullish/bearish/neutral)
- Model architecture used
"""
predictor = get_stock_predictor()
if predictor is None:
# Generate fallback even without predictor
try:
import sys
from pathlib import Path
            stock_path = Path(__file__).parent / "models" / "stock-price-prediction" / "src"
            if str(stock_path) not in sys.path:
                sys.path.insert(0, str(stock_path))
from constants.training_pipeline import STOCKS_TO_TRAIN
            predictions = {
                "prediction_date": utc_now().strftime("%Y-%m-%d"),
                "generated_at": utc_now().isoformat(),
                "stocks": {},
                "summary": {"total_stocks": len(STOCKS_TO_TRAIN), "bullish": 0, "bearish": 0, "neutral": 0}
            }
            import numpy as np
            import zlib
            for code, info in STOCKS_TO_TRAIN.items():
                # hash() is salted per process (PYTHONHASHSEED), so seed from a
                # stable CRC32 of the symbol to keep fallback values reproducible
                np.random.seed(zlib.crc32(code.encode()) % 2**31)
                change_pct = np.random.normal(0.1, 1.0)
                trend = "bullish" if change_pct > 0.5 else "bearish" if change_pct < -0.5 else "neutral"
                predictions["summary"][trend] = predictions["summary"].get(trend, 0) + 1
predictions["stocks"][code] = {
"symbol": code,
"name": info.get("name", code),
"sector": info.get("sector", "Unknown"),
"current_price": 100.0,
"predicted_price": 100.0 * (1 + change_pct / 100),
"expected_change_pct": round(change_pct, 3),
"trend": trend,
"trend_emoji": "📈" if trend == "bullish" else "📉" if trend == "bearish" else "➡️",
"confidence": round(np.random.uniform(0.65, 0.85), 2),
"is_fallback": True
}
return {"status": "success", "predictions": predictions}
except Exception as e:
return {"status": "unavailable", "message": f"Stock prediction model not loaded: {e}"}
try:
# Try to get latest predictions from file
predictions = predictor.get_latest_predictions()
if predictions is None:
# Generate fallback predictions
logger.info("[StockAPI] No predictions found, generating fallback...")
predictions = predictor.predict_all_stocks()
            # The dict literal below is evaluated before the reassignment, so
            # "stocks" and len() still refer to the raw per-stock results
            predictions = {
                "prediction_date": utc_now().strftime("%Y-%m-%d"),
                "generated_at": utc_now().isoformat(),
                "stocks": predictions,
                "summary": {"total_stocks": len(predictions)}
            }
return {
"status": "success",
"predictions": predictions
}
except Exception as e:
logger.error(f"[StockAPI] Error: {e}")
return {"status": "error", "message": str(e)}
@app.get("/api/stocks/predictions/{symbol}")
async def get_stock_prediction_by_symbol(symbol: str):
"""Get prediction for a specific stock symbol."""
predictor = get_stock_predictor()
if predictor is None:
return {"status": "unavailable", "message": "Stock prediction model not loaded"}
try:
predictions = predictor.get_latest_predictions()
if predictions and symbol.upper() in predictions.get("stocks", {}):
return {
"status": "success",
"prediction": predictions["stocks"][symbol.upper()]
}
else:
# Generate fallback
return {
"status": "success",
"prediction": predictor._generate_fallback_prediction(symbol.upper())
}
except Exception as e:
return {"status": "error", "message": str(e)}
@app.get("/api/stocks/model/status")
async def get_stock_model_status():
"""Get stock prediction model status for all stocks."""
    from pathlib import Path
models_dir = Path(__file__).parent / "models" / "stock-price-prediction" / "artifacts" / "models"
predictions_dir = Path(__file__).parent / "models" / "stock-price-prediction" / "output" / "predictions"
model_files = list(models_dir.glob("*_model.h5")) if models_dir.exists() else []
prediction_files = list(predictions_dir.glob("stock_predictions_*.json")) if predictions_dir.exists() else []
# Get training summary
    summary_path = models_dir / "training_summary.json" if models_dir.exists() else None
    training_summary = None
    if summary_path and summary_path.exists():
        try:
            with open(summary_path) as f:
                training_summary = json.load(f)
        except (OSError, json.JSONDecodeError) as e:
            logger.warning(f"[StockAPI] Could not read training summary: {e}")
latest_prediction = None
if prediction_files:
latest = max(prediction_files, key=lambda p: p.stat().st_mtime)
latest_prediction = {
"file": latest.name,
"modified": datetime.fromtimestamp(latest.stat().st_mtime).isoformat()
}
return {
"status": "available" if model_files else "not_trained",
"models_trained": len(model_files),
"trained_stocks": [f.stem.replace("_model", "").upper() for f in model_files],
"training_summary": training_summary,
"latest_prediction": latest_prediction,
"predictions_available": len(prediction_files)
}
@app.websocket("/ws")
async def websocket_endpoint(websocket: WebSocket):
await manager.connect(websocket)
try:
        # Send initial state
        try:
            await websocket.send_text(json.dumps(current_state, default=str))
        except Exception as e:
            logger.debug(f"[WS] Initial send failed: {e}")
            # The finally block below already handles the disconnect
            return
# Main receive loop
while True:
try:
txt = await websocket.receive_text()
except WebSocketDisconnect:
logger.info("[WS] Client disconnected")
break
except Exception as e:
logger.debug(f"[WS] Receive error: {e}")
break
# Handle pong responses
try:
payload = json.loads(txt)
if isinstance(payload, dict) and payload.get("type") == "pong":
async with manager._lock:
meta = manager.active_connections.get(websocket)
if meta is not None:
meta['last_pong'] = utc_now()
meta['misses'] = 0
continue
except json.JSONDecodeError:
continue
finally:
await manager.disconnect(websocket)
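# Minimal client sketch for the keepalive protocol (hypothetical; assumes the
# ConnectionManager broadcasts {"type": "ping"} frames, which the pong handling
# above implies, and that the "websockets" package is installed):
#
#   import asyncio, json, websockets
#
#   async def listen():
#       async with websockets.connect("ws://localhost:8000/ws") as ws:
#           async for raw in ws:
#               msg = json.loads(raw)
#               if isinstance(msg, dict) and msg.get("type") == "ping":
#                   await ws.send(json.dumps({"type": "pong"}))
#               else:
#                   print("state update:", msg)
#
#   asyncio.run(listen())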
if __name__ == "__main__":
    import uvicorn
    uvicorn.run(app, host="0.0.0.0", port=8000, log_level="info")