Spaces:

mv63
/

Satintel

Running

Vedant Jigarbhai Mehta commited on 10 days ago

Commit

9e6e107

0 Parent(s):

Deploy FastAPI backend with satellite data for HF Spaces

- FastAPI app with ML analytics (Isolation Forest, DBSCAN, ARIMA)
- Pre-fetched satellite data for 18+ cities
- Docker setup: Python 3.11, port 7860, DATA_DIR env var
- Large harmonized JSONs tracked via Git LFS

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

.gitattributes +37 -0
.gitignore +6 -0
Dockerfile +27 -0
README.md +11 -0
app/__init__.py +0 -0
app/agents/__init__.py +0 -0
app/agents/action_plan_agent.py +39 -0
app/agents/analysis_agent.py +40 -0
app/agents/data_agent.py +40 -0
app/agents/orchestrator.py +98 -0
app/config.py +22 -0
app/main.py +123 -0
app/middleware/__init__.py +0 -0
app/middleware/auth_middleware.py +19 -0
app/ml/__init__.py +0 -0
app/ml/anomaly_detector.py +44 -0
app/ml/hotspot_clusterer.py +51 -0
app/ml/lstm_predictor.py +150 -0
app/ml/ndvi_lst_regression.py +69 -0
app/models/__init__.py +0 -0
app/models/db_models.py +151 -0
app/models/schemas.py +126 -0
app/routes/__init__.py +0 -0
app/routes/action_plan.py +15 -0
app/routes/analysis.py +46 -0
app/routes/analytics.py +22 -0
app/routes/auth.py +21 -0
app/routes/data.py +8 -0
app/routes/green_gap.py +11 -0
app/routes/health.py +7 -0
app/routes/maps.py +17 -0
app/routes/satellite.py +250 -0
app/routes/time_machine.py +16 -0
app/routes/users.py +9 -0
app/services/__init__.py +0 -0
app/services/action_plan_service.py +526 -0
app/services/alert_service.py +125 -0
app/services/auth_service.py +70 -0
app/services/cache_service.py +129 -0
app/services/db_service.py +188 -0
app/services/farmland_service.py +83 -0
app/services/green_gap_service.py +155 -0
app/services/health_score_service.py +133 -0
app/services/heat_service.py +84 -0
app/services/land_conversion_service.py +81 -0
app/services/ml_service.py +399 -0
app/services/satellite_service.py +403 -0
app/services/time_machine_service.py +192 -0
app/services/vegetation_service.py +79 -0
app/utils/__init__.py +0 -0

.gitattributes ADDED Viewed

	@@ -0,0 +1,37 @@

+*.7z filter=lfs diff=lfs merge=lfs -text
+*.arrow filter=lfs diff=lfs merge=lfs -text
+*.bin filter=lfs diff=lfs merge=lfs -text
+*.bz2 filter=lfs diff=lfs merge=lfs -text
+*.ckpt filter=lfs diff=lfs merge=lfs -text
+*.ftz filter=lfs diff=lfs merge=lfs -text
+*.gz filter=lfs diff=lfs merge=lfs -text
+*.h5 filter=lfs diff=lfs merge=lfs -text
+*.joblib filter=lfs diff=lfs merge=lfs -text
+*.lfs.* filter=lfs diff=lfs merge=lfs -text
+*.mlmodel filter=lfs diff=lfs merge=lfs -text
+*.model filter=lfs diff=lfs merge=lfs -text
+*.msgpack filter=lfs diff=lfs merge=lfs -text
+*.npy filter=lfs diff=lfs merge=lfs -text
+*.npz filter=lfs diff=lfs merge=lfs -text
+*.onnx filter=lfs diff=lfs merge=lfs -text
+*.ot filter=lfs diff=lfs merge=lfs -text
+*.parquet filter=lfs diff=lfs merge=lfs -text
+*.pb filter=lfs diff=lfs merge=lfs -text
+*.pickle filter=lfs diff=lfs merge=lfs -text
+*.pkl filter=lfs diff=lfs merge=lfs -text
+*.pt filter=lfs diff=lfs merge=lfs -text
+*.pth filter=lfs diff=lfs merge=lfs -text
+*.rar filter=lfs diff=lfs merge=lfs -text
+*.safetensors filter=lfs diff=lfs merge=lfs -text
+saved_model/**/* filter=lfs diff=lfs merge=lfs -text
+*.tar.* filter=lfs diff=lfs merge=lfs -text
+*.tar filter=lfs diff=lfs merge=lfs -text
+*.tflite filter=lfs diff=lfs merge=lfs -text
+*.tgz filter=lfs diff=lfs merge=lfs -text
+*.wasm filter=lfs diff=lfs merge=lfs -text
+*.xz filter=lfs diff=lfs merge=lfs -text
+*.zip filter=lfs diff=lfs merge=lfs -text
+*.zst filter=lfs diff=lfs merge=lfs -text
+*tfevents* filter=lfs diff=lfs merge=lfs -text
+data/ahmedabad/lst_harmonized.json filter=lfs diff=lfs merge=lfs -text
+data/ahmedabad/ndvi_harmonized.json filter=lfs diff=lfs merge=lfs -text

.gitignore ADDED Viewed

	@@ -0,0 +1,6 @@

+.env
+__pycache__/
+*.pyc
+gee_service_account.json
+venv/
+.venv/

Dockerfile ADDED Viewed

	@@ -0,0 +1,27 @@

+FROM python:3.11-slim
+# HF Spaces runs as uid 1000
+RUN useradd -m -u 1000 user
+WORKDIR /app
+# Install dependencies first (layer caching)
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+# Copy application code
+COPY app/ ./app/
+# Copy satellite data
+COPY data/ ./data/
+# Tell the app where data lives inside the container
+ENV DATA_DIR=/app/data
+# city_generator writes new city dirs at runtime — needs write access
+RUN chown -R user:user /app
+USER user
+EXPOSE 7860
+CMD ["uvicorn", "app.main:app", "--host", "0.0.0.0", "--port", "7860"]

README.md ADDED Viewed

	@@ -0,0 +1,11 @@

+---
+title: SatIntel API
+emoji: 🛰️
+colorFrom: blue
+colorTo: green
+sdk: docker
+pinned: false
+app_port: 7860
+---
+Satellite Environmental Intelligence Platform — FastAPI backend serving satellite data analytics, ML-powered anomaly detection, and environment action plan generation for smart cities.

app/__init__.py ADDED Viewed

File without changes

app/agents/__init__.py ADDED Viewed

File without changes

app/agents/action_plan_agent.py ADDED Viewed

	@@ -0,0 +1,39 @@

+"""
+Action Plan Agent — generates city-specific environmental recommendations using LLM.
+Part of the multi-agent pipeline: Data → Analysis → Action Plan.
+"""
+import logging
+from app.services import action_plan_service
+logger = logging.getLogger(__name__)
+async def run(city: str, analysis: dict) -> dict:
+    """Generate Environment Action Plan from analysis results."""
+    logger.info(f"[ActionPlanAgent] Generating action plan for {city}")
+    # Restructure analysis data for the action plan service
+    plan_analysis = {}
+    for param, param_data in analysis.items():
+        if "error" in param_data:
+            continue
+        anomaly_data = param_data.get("anomalies", {})
+        hotspot_data = param_data.get("hotspots", {})
+        plan_analysis[param] = {
+            "statistics": param_data.get("statistics", {}),
+            "anomalies": anomaly_data.get("anomalies", [])[:5],
+            "anomaly_count": anomaly_data.get("anomaly_count", 0),
+            "hotspots": hotspot_data.get("hotspots", [])[:5],
+            "hotspot_count": hotspot_data.get("cluster_count", 0),
+        }
+    # Use the action plan service's template generator
+    plan = action_plan_service._generate_template_plan(city, plan_analysis)
+    plan["source"] = "agent_pipeline"
+    logger.info(f"[ActionPlanAgent] Generated plan with {len(plan.get('findings', []))} findings, "
+                f"{len(plan.get('recommendations', []))} recommendations")
+    return plan

app/agents/analysis_agent.py ADDED Viewed

	@@ -0,0 +1,40 @@

+"""
+Analysis Agent — runs ML models on harmonized satellite data.
+Part of the multi-agent pipeline: Data → Analysis → Action Plan.
+"""
+import logging
+from app.services import ml_service
+logger = logging.getLogger(__name__)
+async def run(satellite_data: dict, city: str = "Ahmedabad") -> dict:
+    """Run ML analytics on harmonized satellite data."""
+    logger.info(f"[AnalysisAgent] Running ML analytics for {city}")
+    results = {}
+    for param, param_data in satellite_data.items():
+        if "error" in param_data:
+            results[param] = {"error": param_data["error"]}
+            continue
+        try:
+            anomalies = ml_service.detect_anomalies(param, city)
+            trend = ml_service.predict_trend(param, city)
+            hotspots = ml_service.find_hotspots(param, city)
+            results[param] = {
+                "anomalies": anomalies,
+                "trend": trend,
+                "hotspots": hotspots,
+                "statistics": param_data.get("statistics", {}),
+            }
+            logger.info(
+                f"[AnalysisAgent] {param}: {anomalies.get('anomaly_count', 0)} anomalies, "
+                f"{hotspots.get('cluster_count', 0)} hotspots, trend: {trend.get('trend_direction', 'N/A')}"
+            )
+        except Exception as e:
+            logger.error(f"[AnalysisAgent] Error analyzing {param}: {e}")
+            results[param] = {"error": str(e)}
+    return results

app/agents/data_agent.py ADDED Viewed

	@@ -0,0 +1,40 @@

+"""
+Data Agent — fetches and harmonizes satellite data from multiple sources.
+Part of the multi-agent pipeline: Data → Analysis → Action Plan.
+"""
+import logging
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+async def run(city: str, parameters: list[str], date_range: dict) -> dict:
+    """Fetch and harmonize satellite data for the given city and parameters."""
+    logger.info(f"[DataAgent] Fetching data for {city}: {parameters}")
+    results = {}
+    for param in parameters:
+        try:
+            data = satellite_service._load_data(param)
+            start = date_range.get("start_date", "2023-01-01")
+            end = date_range.get("end_date", "2024-12-31")
+            filtered = [d for d in data if start <= d.get("date", "") <= end]
+            stats = satellite_service.get_statistics(param)
+            timeseries = satellite_service.get_timeseries(param, city)
+            heatmap = satellite_service.get_heatmap_data(param, city)
+            results[param] = {
+                "raw_data": filtered,
+                "count": len(filtered),
+                "statistics": stats,
+                "timeseries": timeseries.get("timeseries", []),
+                "heatmap": heatmap,
+                "metadata": satellite_service.PARAMETERS.get(param, {}),
+            }
+            logger.info(f"[DataAgent] {param}: {len(filtered)} points loaded")
+        except Exception as e:
+            logger.error(f"[DataAgent] Error fetching {param}: {e}")
+            results[param] = {"error": str(e)}
+    return results

app/agents/orchestrator.py ADDED Viewed

	@@ -0,0 +1,98 @@

+"""
+Multi-Agent Orchestrator — coordinates data collection, analysis, and action plan generation.
+Pipeline: Data Agent → Analysis Agent → Action Plan Agent
+This is the innovation differentiator — demonstrates multi-agent architecture
+applied to satellite environmental intelligence.
+"""
+import logging
+import time
+from app.agents import data_agent, analysis_agent, action_plan_agent
+logger = logging.getLogger(__name__)
+async def run_analysis(
+    city: str = "Ahmedabad",
+    parameters: list[str] = None,
+    date_range: dict = None,
+) -> dict:
+    """Run the full multi-agent analysis pipeline.
+    Pipeline:
+    1. Data Agent — fetches + harmonizes satellite data from GEE/files
+    2. Analysis Agent — runs ML models (anomaly, trend, clustering)
+    3. Action Plan Agent — generates city-specific recommendations
+    Returns combined results from all agents.
+    """
+    if parameters is None:
+        parameters = ["LST", "NDVI", "NO2", "SOIL_MOISTURE"]
+    if date_range is None:
+        date_range = {"start_date": "2023-01-01", "end_date": "2024-12-31"}
+    start_time = time.time()
+    pipeline_log = []
+    # Step 1: Data Agent
+    logger.info(f"[Orchestrator] Step 1/3: Data Agent — fetching satellite data for {city}")
+    pipeline_log.append({"step": 1, "agent": "DataAgent", "status": "running", "message": "Fetching satellite data..."})
+    satellite_data = await data_agent.run(city, parameters, date_range)
+    data_time = time.time() - start_time
+    pipeline_log[-1]["status"] = "complete"
+    pipeline_log[-1]["duration_s"] = round(data_time, 2)
+    logger.info(f"[Orchestrator] Data Agent complete in {data_time:.1f}s")
+    # Step 2: Analysis Agent
+    logger.info(f"[Orchestrator] Step 2/3: Analysis Agent — running ML models")
+    pipeline_log.append({"step": 2, "agent": "AnalysisAgent", "status": "running", "message": "Running ML analytics..."})
+    analysis = await analysis_agent.run(satellite_data, city)
+    analysis_time = time.time() - start_time - data_time
+    pipeline_log[-1]["status"] = "complete"
+    pipeline_log[-1]["duration_s"] = round(analysis_time, 2)
+    logger.info(f"[Orchestrator] Analysis Agent complete in {analysis_time:.1f}s")
+    # Step 3: Action Plan Agent
+    logger.info(f"[Orchestrator] Step 3/3: Action Plan Agent — generating recommendations")
+    pipeline_log.append({"step": 3, "agent": "ActionPlanAgent", "status": "running", "message": "Generating action plan..."})
+    action_plan = await action_plan_agent.run(city, analysis)
+    plan_time = time.time() - start_time - data_time - analysis_time
+    pipeline_log[-1]["status"] = "complete"
+    pipeline_log[-1]["duration_s"] = round(plan_time, 2)
+    logger.info(f"[Orchestrator] Action Plan Agent complete in {plan_time:.1f}s")
+    total_time = time.time() - start_time
+    logger.info(f"[Orchestrator] Full pipeline complete in {total_time:.1f}s")
+    return {
+        "city": city,
+        "parameters": parameters,
+        "date_range": date_range,
+        "satellite_data": {
+            param: {
+                "count": pdata.get("count", 0),
+                "statistics": pdata.get("statistics", {}),
+                "heatmap": pdata.get("heatmap", {}),
+            }
+            for param, pdata in satellite_data.items()
+        },
+        "analysis": {
+            param: {
+                "anomaly_count": adata.get("anomalies", {}).get("anomaly_count", 0),
+                "hotspot_count": adata.get("hotspots", {}).get("cluster_count", 0),
+                "trend_direction": adata.get("trend", {}).get("trend_direction", "unknown"),
+                "top_anomalies": adata.get("anomalies", {}).get("anomalies", [])[:3],
+                "top_hotspots": adata.get("hotspots", {}).get("hotspots", [])[:3],
+            }
+            for param, adata in analysis.items()
+            if "error" not in adata
+        },
+        "action_plan": action_plan,
+        "pipeline": {
+            "total_duration_s": round(total_time, 2),
+            "steps": pipeline_log,
+        },
+    }

app/config.py ADDED Viewed

	@@ -0,0 +1,22 @@

+from pydantic_settings import BaseSettings
+from functools import lru_cache
+class Settings(BaseSettings):
+    mongodb_url: str = "mongodb://localhost:27017"
+    database_name: str = "satellite_intel"
+    jwt_secret: str = "hackathon-aetrix-2026-satellite-intel-secret-key"
+    jwt_algorithm: str = "HS256"
+    jwt_expiry_hours: int = 24
+    database_url: str = ""  # e.g. "postgresql+asyncpg://user:pass@localhost:5432/satellite_intel"
+    gee_service_account_email: str = ""
+    gee_key_file: str = "gee_service_account.json"
+    redis_url: str = ""
+    anthropic_api_key: str = ""
+    openai_api_key: str = ""
+    class Config:
+        env_file = ".env"
+@lru_cache()
+def get_settings() -> Settings:
+    return Settings()

app/main.py ADDED Viewed

	@@ -0,0 +1,123 @@

+from fastapi import FastAPI
+from fastapi.middleware.cors import CORSMiddleware
+from app.routes import auth, users, satellite, analytics, maps, action_plan, data, health, analysis, green_gap, time_machine
+app = FastAPI(
+    title="Satellite Environmental Intelligence Platform",
+    description="AETRIX 2026 — PS-4: Satellite data analytics for smart cities",
+    version="1.0.0",
+)
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=False,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+app.include_router(health.router, prefix="/api/v1", tags=["Health"])
+app.include_router(auth.router, prefix="/api/v1/auth", tags=["Auth"])
+app.include_router(users.router, prefix="/api/v1/users", tags=["Users"])
+app.include_router(satellite.router, prefix="/api/v1/satellite", tags=["Satellite"])
+app.include_router(analytics.router, prefix="/api/v1/analytics", tags=["Analytics"])
+app.include_router(maps.router, prefix="/api/v1/maps", tags=["Maps"])
+app.include_router(action_plan.router, prefix="/api/v1/action-plan", tags=["Action Plan"])
+app.include_router(data.router, prefix="/api/v1/data", tags=["Data"])
+app.include_router(analysis.router, prefix="/api/v1/analysis", tags=["Specialized Analysis"])
+app.include_router(green_gap.router, prefix="/api/v1/green-gap", tags=["Green Gap Analysis"])
+app.include_router(time_machine.router, prefix="/api/v1/time-machine", tags=["Time Machine"])
+@app.on_event("startup")
+async def startup():
+    # Create PostGIS tables if database is configured
+    try:
+        from app.models.db_models import create_tables, get_engine
+        engine = get_engine()
+        if engine:
+            await create_tables()
+            print("PostgreSQL + PostGIS connected, tables ready")
+        else:
+            print("No DATABASE_URL configured — using in-memory fallback")
+    except Exception as e:
+        print(f"Database setup skipped: {e} — using in-memory fallback")
+    print("Satellite Environmental Intelligence Platform started")
+    # ── Warm up ALL caches in background thread ──────────────
+    import threading
+    threading.Thread(target=_warmup_caches, daemon=True).start()
+def _warmup_caches():
+    """Pre-load all data + run ML models for all 14 cities at startup."""
+    import time
+    start = time.time()
+    try:
+        from app.utils.cities import CITIES
+        from app.services import satellite_service, ml_service
+        params = ["LST", "NDVI", "NO2", "SO2", "CO", "O3", "AEROSOL", "SOIL_MOISTURE"]
+        ml_params = ["LST", "NDVI", "NO2", "SOIL_MOISTURE"]
+        city_keys = list(CITIES.keys())
+        print(f"[WARMUP] Pre-loading data for {len(city_keys)} cities...")
+        for i, city_key in enumerate(city_keys):
+            # Load + harmonize all parameters (populates _raw_cache and _data_cache)
+            for param in params:
+                try:
+                    satellite_service._load_data(param, city_key)
+                except Exception:
+                    pass
+            # Pre-compute heatmap data
+            for param in params:
+                try:
+                    satellite_service.get_heatmap_data(param, city_key)
+                except Exception:
+                    pass
+            # Pre-compute timeseries
+            for param in params:
+                try:
+                    satellite_service.get_timeseries(param, city_key)
+                except Exception:
+                    pass
+            # Run ML models (populates _ml_cache)
+            for param in ml_params:
+                try:
+                    ml_service.detect_anomalies(param, city_key)
+                except Exception:
+                    pass
+                try:
+                    ml_service.find_hotspots(param, city_key)
+                except Exception:
+                    pass
+            # Pre-compute city summary (uses cached ML results)
+            try:
+                ml_service.get_city_summary(city_key)
+            except Exception:
+                pass
+            print(f"[WARMUP] {city_key} done ({i+1}/{len(city_keys)})")
+        # Record sync timestamp
+        try:
+            from app.services import cache_service
+            cache_service.set_last_synced()
+        except Exception:
+            pass
+        elapsed = round(time.time() - start, 1)
+        print(f"[WARMUP] All {len(city_keys)} cities cached in {elapsed}s — ready for instant responses")
+    except Exception as e:
+        print(f"[WARMUP] Cache warmup error: {e}")
+@app.on_event("shutdown")
+async def shutdown():
+    print("Shutting down...")

app/middleware/__init__.py ADDED Viewed

File without changes

app/middleware/auth_middleware.py ADDED Viewed

	@@ -0,0 +1,19 @@

+from fastapi import Depends, HTTPException, status
+from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials
+from jose import JWTError
+from app.services.auth_service import decode_token, get_user_by_email
+security = HTTPBearer()
+async def get_current_user(credentials: HTTPAuthorizationCredentials = Depends(security)) -> dict:
+    try:
+        payload = decode_token(credentials.credentials)
+        email = payload.get("email")
+        if email is None:
+            raise HTTPException(status_code=status.HTTP_401_UNAUTHORIZED, detail="Invalid token")
+        user = await get_user_by_email(email)
+        if user is None:
+            raise HTTPException(status_code=status.HTTP_401_UNAUTHORIZED, detail="User not found")
+        return {"id": user["id"], "name": user["name"], "email": user["email"]}
+    except JWTError:
+        raise HTTPException(status_code=status.HTTP_401_UNAUTHORIZED, detail="Invalid or expired token")

app/ml/__init__.py ADDED Viewed

File without changes

app/ml/anomaly_detector.py ADDED Viewed

	@@ -0,0 +1,44 @@

+"""
+Enhanced Anomaly Detector — Isolation Forest with confidence scores.
+"""
+import numpy as np
+from sklearn.ensemble import IsolationForest
+from typing import List, Tuple
+class AnomalyDetector:
+    def __init__(self, contamination: float = 0.05):
+        self.contamination = contamination
+    def detect(self, timeseries: List[Tuple[str, float]], parameter: str = "NDVI") -> List[dict]:
+        if len(timeseries) < 8:
+            return []
+        dates = [t[0] for t in timeseries]
+        values = np.array([t[1] for t in timeseries]).reshape(-1, 1)
+        model = IsolationForest(contamination=self.contamination, random_state=42, n_estimators=100)
+        model.fit(values)
+        scores = model.decision_function(values)
+        labels = model.predict(values)
+        mean = float(np.mean(values))
+        std = float(np.std(values))
+        results = []
+        for i, (date, value) in enumerate(timeseries):
+            if labels[i] == -1:
+                deviation = abs(value - mean) / std if std > 0 else 0
+                confidence = float(np.clip((0 - scores[i]) / 0.5, 0, 1))
+                severity = "critical" if confidence > 0.7 else ("high" if confidence > 0.4 else "moderate")
+                results.append({
+                    "date": date,
+                    "value": round(value, 4),
+                    "deviation": round(deviation, 2),
+                    "confidence": round(confidence, 2),
+                    "severity": severity,
+                    "anomaly_score": round(float(scores[i]), 4),
+                    "parameter": parameter,
+                })
+        return sorted(results, key=lambda x: x["confidence"], reverse=True)

app/ml/hotspot_clusterer.py ADDED Viewed

	@@ -0,0 +1,51 @@

+"""
+Enhanced Spatial Clusterer — DBSCAN with area and confidence scoring.
+"""
+import numpy as np
+from sklearn.cluster import DBSCAN
+from typing import List, Tuple, Dict
+class SpatialClusterer:
+    def __init__(self, eps: float = 0.02, min_samples: int = 3):
+        self.eps = eps
+        self.min_samples = min_samples
+    def cluster(self, points: List[Tuple[float, float]], values: List[float] = None) -> List[Dict]:
+        if len(points) < self.min_samples:
+            return []
+        coords = np.array(points)
+        model = DBSCAN(eps=self.eps, min_samples=self.min_samples, metric='euclidean')
+        labels = model.fit_predict(coords)
+        clusters = []
+        for cluster_id in sorted(set(labels)):
+            if cluster_id == -1:
+                continue
+            mask = labels == cluster_id
+            cluster_coords = coords[mask]
+            cell_count = int(mask.sum())
+            centroid_lat = float(np.mean(cluster_coords[:, 0]))
+            centroid_lng = float(np.mean(cluster_coords[:, 1]))
+            area_sqkm = round(cell_count * 1.0, 1)
+            confidence = round(min(cell_count / 10.0, 1.0), 2)
+            avg_value = None
+            if values is not None:
+                vals_arr = np.array(values)
+                avg_value = round(float(np.mean(vals_arr[mask])), 4)
+            severity = "critical" if cell_count >= 8 else ("high" if cell_count >= 4 else "moderate")
+            clusters.append({
+                "cluster_id": f"C-{cluster_id + 1}",
+                "centroid_lat": round(centroid_lat, 4),
+                "centroid_lng": round(centroid_lng, 4),
+                "cell_count": cell_count,
+                "area_sqkm": area_sqkm,
+                "confidence": confidence,
+                "severity": severity,
+                "avg_value": avg_value,
+            })
+        return sorted(clusters, key=lambda c: c["cell_count"], reverse=True)

app/ml/lstm_predictor.py ADDED Viewed

	@@ -0,0 +1,150 @@

+"""
+LSTM Predictor — trend forecasting + crop activity scoring.
+Uses PyTorch for sequence-to-one prediction.
+Two uses:
+  1. Forecast: predict next N values from a time series
+  2. Crop score: score a time series against farming patterns (0-100)
+"""
+import numpy as np
+import logging
+from typing import List, Tuple
+logger = logging.getLogger(__name__)
+# Try PyTorch, fall back to numpy-based simple predictor
+try:
+    import torch
+    import torch.nn as nn
+    _HAS_TORCH = True
+except ImportError:
+    _HAS_TORCH = False
+    logger.warning("PyTorch not installed — LSTM will use numpy fallback")
+if _HAS_TORCH:
+    class _LSTMModel(nn.Module):
+        def __init__(self, input_size=1, hidden_size=32, num_layers=2, output_size=1):
+            super().__init__()
+            self.lstm = nn.LSTM(input_size, hidden_size, num_layers, batch_first=True)
+            self.fc = nn.Linear(hidden_size, output_size)
+        def forward(self, x):
+            out, _ = self.lstm(x)
+            return self.fc(out[:, -1, :])
+class LSTMPredictor:
+    """
+    Temporal prediction and crop rhythm scoring.
+    Falls back to exponential smoothing if PyTorch is not installed.
+    """
+    def __init__(self, lookback: int = 12):
+        self.lookback = lookback
+        if _HAS_TORCH:
+            self.model = _LSTMModel()
+    def _prepare_sequences(self, values: np.ndarray):
+        X, y = [], []
+        for i in range(len(values) - self.lookback):
+            X.append(values[i:i + self.lookback])
+            y.append(values[i + self.lookback])
+        return np.array(X), np.array(y)
+    def forecast(self, timeseries: List[Tuple[str, float]], steps: int = 6) -> List[dict]:
+        """
+        Train on provided time series and predict N steps forward.
+        Returns: [{"step": 1, "predicted_value": 0.18, "confidence_low": ..., "confidence_high": ...}]
+        """
+        values = np.array([v for _, v in timeseries], dtype=np.float32)
+        if len(values) < self.lookback + 2:
+            return [{"step": i + 1, "predicted_value": round(float(values[-1]), 4),
+                     "confidence_low": round(float(values[-1]) * 0.9, 4),
+                     "confidence_high": round(float(values[-1]) * 1.1, 4)} for i in range(steps)]
+        vmin, vmax = values.min(), values.max()
+        if vmax - vmin < 1e-6:
+            return [{"step": i + 1, "predicted_value": round(float(values[-1]), 4),
+                     "confidence_low": round(float(values[-1]) * 0.9, 4),
+                     "confidence_high": round(float(values[-1]) * 1.1, 4)} for i in range(steps)]
+        norm = (values - vmin) / (vmax - vmin)
+        if _HAS_TORCH:
+            return self._forecast_torch(norm, vmin, vmax, steps)
+        else:
+            return self._forecast_numpy(values, steps)
+    def _forecast_torch(self, norm, vmin, vmax, steps):
+        X, y = self._prepare_sequences(norm)
+        X_t = torch.FloatTensor(X).unsqueeze(-1)
+        y_t = torch.FloatTensor(y).unsqueeze(-1)
+        optimizer = torch.optim.Adam(self.model.parameters(), lr=0.01)
+        criterion = nn.MSELoss()
+        self.model.train()
+        for _ in range(50):
+            optimizer.zero_grad()
+            loss = criterion(self.model(X_t), y_t)
+            loss.backward()
+            optimizer.step()
+        self.model.eval()
+        results = []
+        current = list(norm[-self.lookback:])
+        with torch.no_grad():
+            for step in range(steps):
+                inp = torch.FloatTensor(current[-self.lookback:]).unsqueeze(0).unsqueeze(-1)
+                pred = self.model(inp).item()
+                pred_real = float(pred * (vmax - vmin) + vmin)
+                std_est = abs(pred_real) * 0.12
+                results.append({
+                    "step": step + 1,
+                    "predicted_value": round(pred_real, 4),
+                    "confidence_low": round(pred_real - std_est, 4),
+                    "confidence_high": round(pred_real + std_est, 4),
+                })
+                current.append(pred)
+        return results
+    def _forecast_numpy(self, values, steps):
+        """Exponential smoothing fallback when PyTorch not available."""
+        alpha = 0.3
+        result = float(values[-1])
+        results = []
+        for step in range(steps):
+            result = alpha * float(values[-(step + 1) % len(values)]) + (1 - alpha) * result
+            std_est = abs(result) * 0.12
+            results.append({
+                "step": step + 1,
+                "predicted_value": round(result, 4),
+                "confidence_low": round(result - std_est, 4),
+                "confidence_high": round(result + std_est, 4),
+            })
+        return results
+    def crop_activity_score(self, timeseries: List[Tuple[str, float]]) -> float:
+        """
+        Score how closely a zone's NDVI resembles a real crop cycle.
+        Real farming: clear seasonal wave (std > 0.05, multiple peaks).
+        Idle land: flat near zero (std < 0.02).
+        Returns: 0-100 (higher = more farming activity).
+        """
+        values = np.array([v for _, v in timeseries], dtype=np.float32)
+        if len(values) < 4:
+            return 0.0
+        std = float(np.std(values))
+        mean = float(np.mean(values))
+        diffs = np.diff(values)
+        direction_changes = int(np.sum(np.diff(np.sign(diffs)) != 0))
+        std_score = min(std / 0.15, 1.0)
+        mean_score = min(mean / 0.25, 1.0)
+        rhythm_score = min(direction_changes / 6.0, 1.0)
+        score = std_score * 40 + mean_score * 30 + rhythm_score * 30
+        return round(float(score), 1)

app/ml/ndvi_lst_regression.py ADDED Viewed

	@@ -0,0 +1,69 @@

+"""
+NDVI-LST Linear Regression — fits relationship between vegetation and temperature.
+Uses the city's own satellite data to project cooling impact of tree planting.
+"""
+import numpy as np
+from typing import List, Tuple
+import logging
+logger = logging.getLogger(__name__)
+class NDVILSTRegression:
+    def __init__(self):
+        self.beta0: float = 0.0
+        self.beta1: float = 0.0
+        self.r_squared: float = 0.0
+        self.is_fitted: bool = False
+    def fit(self, pairs: List[Tuple[float, float]]) -> dict:
+        if len(pairs) < 5:
+            # Not enough data — use expected Ahmedabad estimate
+            self.beta0 = 45.0
+            self.beta1 = -12.0
+            self.r_squared = 0.0
+            self.is_fitted = True
+            return {
+                "beta0": self.beta0, "beta1": self.beta1,
+                "r_squared": 0.0, "sample_size": len(pairs),
+                "interpretation": "Insufficient matched cells — using estimated coefficients",
+            }
+        ndvi = np.array([p[0] for p in pairs])
+        lst = np.array([p[1] for p in pairs])
+        # Remove outliers
+        if np.std(ndvi) > 0 and np.std(lst) > 0:
+            ndvi_z = np.abs((ndvi - ndvi.mean()) / np.std(ndvi))
+            lst_z = np.abs((lst - lst.mean()) / np.std(lst))
+            mask = (ndvi_z < 3) & (lst_z < 3)
+            ndvi, lst = ndvi[mask], lst[mask]
+        # OLS: LST = beta0 + beta1 * NDVI
+        A = np.vstack([np.ones_like(ndvi), ndvi]).T
+        result = np.linalg.lstsq(A, lst, rcond=None)
+        self.beta0, self.beta1 = float(result[0][0]), float(result[0][1])
+        # R squared
+        lst_pred = self.beta0 + self.beta1 * ndvi
+        ss_res = float(np.sum((lst - lst_pred) ** 2))
+        ss_tot = float(np.sum((lst - lst.mean()) ** 2))
+        self.r_squared = round(1 - ss_res / ss_tot, 3) if ss_tot > 0 else 0.0
+        self.is_fitted = True
+        return {
+            "beta0": round(self.beta0, 3),
+            "beta1": round(self.beta1, 3),
+            "r_squared": self.r_squared,
+            "interpretation": (
+                f"For every +0.1 increase in NDVI, surface temperature "
+                f"decreases by {abs(self.beta1 * 0.1):.2f} degrees C"
+            ),
+            "sample_size": len(ndvi),
+        }
+    def project_cooling(self, current_ndvi: float, target_ndvi: float = 0.35) -> float:
+        if not self.is_fitted:
+            return 0.0
+        ndvi_gain = max(0, target_ndvi - current_ndvi)
+        return round(abs(self.beta1) * ndvi_gain, 2)

app/models/__init__.py ADDED Viewed

File without changes

app/models/db_models.py ADDED Viewed

	@@ -0,0 +1,151 @@

+"""
+Database Models — PostgreSQL + PostGIS.
+Setup Instructions (Person 2):
+1. Install PostgreSQL: https://www.postgresql.org/download/
+2. Install PostGIS extension: CREATE EXTENSION postgis;
+3. Create database: CREATE DATABASE satellite_intel;
+4. Set DATABASE_URL in backend/.env
+5. pip install asyncpg sqlalchemy geoalchemy2
+6. Run the app — tables auto-create on startup
+If PostgreSQL/GeoAlchemy2 is not available, the app falls back to in-memory/JSON storage.
+"""
+import uuid
+from datetime import datetime
+try:
+    from sqlalchemy import Column, String, Float, DateTime, Integer, Text, Index
+    from sqlalchemy.dialects.postgresql import UUID
+    from sqlalchemy.ext.asyncio import create_async_engine, AsyncSession
+    from sqlalchemy.orm import sessionmaker, DeclarativeBase
+    _HAS_SQLALCHEMY = True
+except ImportError:
+    _HAS_SQLALCHEMY = False
+try:
+    from geoalchemy2 import Geometry
+    _HAS_POSTGIS = True
+except ImportError:
+    _HAS_POSTGIS = False
+from app.config import get_settings
+# ── Models (only defined if SQLAlchemy is available) ──────────
+if _HAS_SQLALCHEMY:
+    class Base(DeclarativeBase):
+        pass
+    class User(Base):
+        __tablename__ = "users"
+        id = Column(UUID(as_uuid=True), primary_key=True, default=uuid.uuid4)
+        name = Column(String(100), nullable=False)
+        email = Column(String(255), unique=True, nullable=False, index=True)
+        hashed_password = Column(String(255), nullable=False)
+        created_at = Column(DateTime, default=datetime.utcnow)
+    if _HAS_POSTGIS:
+        class SatelliteObservation(Base):
+            __tablename__ = "satellite_observations"
+            id = Column(Integer, primary_key=True, autoincrement=True)
+            city = Column(String(100), nullable=False, index=True)
+            parameter = Column(String(50), nullable=False, index=True)
+            date = Column(String(20), nullable=False, index=True)
+            lat = Column(Float, nullable=False)
+            lng = Column(Float, nullable=False)
+            value = Column(Float, nullable=False)
+            unit = Column(String(50))
+            source = Column(String(100))
+            geom = Column(Geometry(geometry_type='POINT', srid=4326))
+            __table_args__ = (
+                Index('idx_city_param_date', 'city', 'parameter', 'date'),
+                Index('idx_spatial', 'geom', postgresql_using='gist'),
+            )
+    else:
+        class SatelliteObservation(Base):
+            __tablename__ = "satellite_observations"
+            id = Column(Integer, primary_key=True, autoincrement=True)
+            city = Column(String(100), nullable=False, index=True)
+            parameter = Column(String(50), nullable=False, index=True)
+            date = Column(String(20), nullable=False, index=True)
+            lat = Column(Float, nullable=False)
+            lng = Column(Float, nullable=False)
+            value = Column(Float, nullable=False)
+            unit = Column(String(50))
+            source = Column(String(100))
+            __table_args__ = (
+                Index('idx_city_param_date', 'city', 'parameter', 'date'),
+            )
+    class ActionPlanRecord(Base):
+        __tablename__ = "action_plans"
+        id = Column(UUID(as_uuid=True), primary_key=True, default=uuid.uuid4)
+        city = Column(String(100), nullable=False)
+        plan_json = Column(Text, nullable=False)
+        created_at = Column(DateTime, default=datetime.utcnow)
+        created_by = Column(UUID(as_uuid=True))
+else:
+    # Stubs when SQLAlchemy not installed
+    Base = None
+    User = None
+    SatelliteObservation = None
+    ActionPlanRecord = None
+# ── Engine + Session ──────────────────────────────────────────
+_engine = None
+_session_factory = None
+def get_engine():
+    global _engine
+    if not _HAS_SQLALCHEMY:
+        return None
+    if _engine is None:
+        settings = get_settings()
+        db_url = settings.database_url
+        if db_url and "postgresql" in db_url:
+            # asyncpg doesn't understand sslmode/channel_binding URL params
+            # Strip them and pass ssl=True via connect_args instead
+            import ssl as ssl_mod
+            clean_url = db_url.split("?")[0]  # remove query params
+            needs_ssl = "neon.tech" in db_url or "supabase" in db_url or "sslmode=require" in db_url
+            connect_args = {}
+            if needs_ssl:
+                ssl_ctx = ssl_mod.create_default_context()
+                ssl_ctx.check_hostname = False
+                ssl_ctx.verify_mode = ssl_mod.CERT_NONE
+                connect_args["ssl"] = ssl_ctx
+            _engine = create_async_engine(
+                clean_url, echo=False, connect_args=connect_args,
+                pool_recycle=300,    # recycle connections after 5 min (Neon drops idle)
+                pool_pre_ping=True,  # test connection before use
+                pool_size=3,
+                max_overflow=2,
+            )
+        else:
+            return None
+    return _engine
+def get_session_factory():
+    global _session_factory
+    engine = get_engine()
+    if engine and _session_factory is None:
+        _session_factory = sessionmaker(engine, class_=AsyncSession, expire_on_commit=False)
+    return _session_factory
+async def create_tables():
+    """Create all tables. Run once at startup."""
+    engine = get_engine()
+    if engine and Base is not None:
+        async with engine.begin() as conn:
+            await conn.run_sync(Base.metadata.create_all)
+        print("Database tables created.")
+    else:
+        print("No database configured — using fallback storage.")

app/models/schemas.py ADDED Viewed

	@@ -0,0 +1,126 @@

+from pydantic import BaseModel, Field
+from typing import Optional, List
+# Auth
+class SignupRequest(BaseModel):
+    name: str = Field(..., min_length=2)
+    email: str = Field(...)
+    password: str = Field(..., min_length=6)
+class LoginRequest(BaseModel):
+    email: str
+    password: str
+class UserResponse(BaseModel):
+    id: str
+    name: str
+    email: str
+class AuthResponse(BaseModel):
+    token: str
+    user: UserResponse
+# Satellite
+class LocationQuery(BaseModel):
+    lat: float = 23.0225
+    lng: float = 72.5714
+    radius_km: float = 15.0
+class DateRange(BaseModel):
+    start_date: str = "2023-01-01"
+    end_date: str = "2024-12-31"
+class SatelliteDataRequest(BaseModel):
+    city: str = "Ahmedabad"
+    parameters: List[str] = ["LST", "NDVI", "NO2", "SOIL_MOISTURE"]
+    date_range: DateRange = DateRange()
+    location: LocationQuery = LocationQuery()
+class DataPoint(BaseModel):
+    date: str
+    lat: float
+    lng: float
+    value: float
+    parameter: str
+class SpatialDataPoint(BaseModel):
+    lat: float
+    lng: float
+    value: float
+    parameter: str
+# Analytics
+class AnalyticsRequest(BaseModel):
+    parameter: str = "LST"
+    city: str = "Ahmedabad"
+    date_range: DateRange = DateRange()
+class AnomalyResult(BaseModel):
+    date: str
+    lat: float
+    lng: float
+    value: float
+    severity: str
+    parameter: str
+class TrendResult(BaseModel):
+    historical: dict
+    forecast: dict
+    trend_direction: str
+    parameter: str
+class HotspotResult(BaseModel):
+    cluster_id: int
+    center_lat: float
+    center_lng: float
+    num_points: int
+    severity: str
+    parameter: str
+# Action Plan
+class ActionPlanRequest(BaseModel):
+    city: str = "Ahmedabad"
+    parameters: List[str] = ["LST", "NDVI", "NO2", "SOIL_MOISTURE"]
+    date_range: DateRange = DateRange()
+class Finding(BaseModel):
+    title: str
+    description: str
+    severity: str
+    parameter: str
+    evidence: str
+class Recommendation(BaseModel):
+    title: str
+    description: str
+    priority: str
+    timeline: str
+    location: Optional[str] = None
+class ActionPlan(BaseModel):
+    city: str
+    generated_at: str
+    summary: str
+    findings: List[Finding]
+    recommendations: List[Recommendation]
+    priority_actions: List[str]
+# Map
+class HeatmapData(BaseModel):
+    points: List[List[float]]  # [[lat, lng, intensity], ...]
+    parameter: str
+    min_value: float
+    max_value: float
+class MapLayer(BaseModel):
+    id: str
+    label: str
+    type: str  # "heatmap" | "markers" | "circles"
+    data: dict
+    color: str
+    enabled: bool = True

app/routes/__init__.py ADDED Viewed

File without changes

app/routes/action_plan.py ADDED Viewed

	@@ -0,0 +1,15 @@

+from fastapi import APIRouter, Depends
+from app.middleware.auth_middleware import get_current_user
+from app.models.schemas import ActionPlanRequest
+from app.services import action_plan_service
+router = APIRouter()
+@router.post("/generate")
+async def generate_plan(req: ActionPlanRequest, user: dict = Depends(get_current_user)):
+    plan = await action_plan_service.generate_action_plan(req.city, req.parameters, req.date_range.dict())
+    return plan
+@router.get("/history")
+async def get_plan_history(user: dict = Depends(get_current_user)):
+    return []

app/routes/analysis.py ADDED Viewed

	@@ -0,0 +1,46 @@

+"""
+Specialized Analysis Routes — 4 domain-specific endpoints.
+These provide deeper analysis than the generic /analytics/ endpoints.
+"""
+from fastapi import APIRouter, Depends
+from app.middleware.auth_middleware import get_current_user
+router = APIRouter()
+@router.get("/vegetation")
+async def vegetation_analysis(city: str = "Ahmedabad", user: dict = Depends(get_current_user)):
+    from app.services import vegetation_service
+    return vegetation_service.analyse(city)
+@router.get("/land-conversion")
+async def land_conversion_analysis(city: str = "Ahmedabad", user: dict = Depends(get_current_user)):
+    from app.services import land_conversion_service
+    return land_conversion_service.analyse(city)
+@router.get("/farmland")
+async def farmland_analysis(city: str = "Ahmedabad", user: dict = Depends(get_current_user)):
+    from app.services import farmland_service
+    return farmland_service.analyse(city)
+@router.get("/heat")
+async def heat_analysis(city: str = "Ahmedabad", user: dict = Depends(get_current_user)):
+    from app.services import heat_service
+    return heat_service.analyse(city)
+@router.get("/full-report")
+async def full_analysis(city: str = "Ahmedabad", user: dict = Depends(get_current_user)):
+    """Run all 4 analyses and return combined result."""
+    from app.services import vegetation_service, land_conversion_service, farmland_service, heat_service
+    return {
+        "city": city,
+        "vegetation": vegetation_service.analyse(city),
+        "land_conversion": land_conversion_service.analyse(city),
+        "farmland": farmland_service.analyse(city),
+        "heat": heat_service.analyse(city),
+    }

app/routes/analytics.py ADDED Viewed

	@@ -0,0 +1,22 @@

+from fastapi import APIRouter, Depends
+from app.middleware.auth_middleware import get_current_user
+from app.models.schemas import AnalyticsRequest
+from app.services import ml_service
+router = APIRouter()
+@router.post("/anomalies")
+async def detect_anomalies(req: AnalyticsRequest, user: dict = Depends(get_current_user)):
+    return ml_service.detect_anomalies(req.parameter, req.city)
+@router.post("/trends")
+async def predict_trends(req: AnalyticsRequest, user: dict = Depends(get_current_user)):
+    return ml_service.predict_trend(req.parameter, req.city)
+@router.post("/hotspots")
+async def find_hotspots(req: AnalyticsRequest, user: dict = Depends(get_current_user)):
+    return ml_service.find_hotspots(req.parameter, req.city)
+@router.get("/summary/{city}")
+async def get_summary(city: str = "Ahmedabad", user: dict = Depends(get_current_user)):
+    return ml_service.get_city_summary(city)

app/routes/auth.py ADDED Viewed

	@@ -0,0 +1,21 @@

+from fastapi import APIRouter, HTTPException
+from app.models.schemas import SignupRequest, LoginRequest, AuthResponse
+from app.services import auth_service
+router = APIRouter()
+@router.post("/signup", response_model=AuthResponse)
+async def signup(req: SignupRequest):
+    try:
+        result = await auth_service.signup(req.name, req.email, req.password)
+        return result
+    except ValueError as e:
+        raise HTTPException(status_code=400, detail=str(e))
+@router.post("/login", response_model=AuthResponse)
+async def login(req: LoginRequest):
+    try:
+        result = await auth_service.login(req.email, req.password)
+        return result
+    except ValueError as e:
+        raise HTTPException(status_code=401, detail=str(e))

app/routes/data.py ADDED Viewed

	@@ -0,0 +1,8 @@

+from fastapi import APIRouter, Depends, UploadFile, File
+from app.middleware.auth_middleware import get_current_user
+router = APIRouter()
+@router.post("/upload")
+async def upload_data(file: UploadFile = File(...), user: dict = Depends(get_current_user)):
+    return {"filename": file.filename, "status": "uploaded"}

app/routes/green_gap.py ADDED Viewed

	@@ -0,0 +1,11 @@

+"""Green Infrastructure Gap Analysis route."""
+from fastapi import APIRouter, Depends
+from app.middleware.auth_middleware import get_current_user
+router = APIRouter()
+@router.get("/analyse")
+async def analyse_green_gap(city: str = "ahmedabad", user: dict = Depends(get_current_user)):
+    from app.services import green_gap_service
+    return green_gap_service.analyse(city)

app/routes/health.py ADDED Viewed

	@@ -0,0 +1,7 @@

+from fastapi import APIRouter
+router = APIRouter()
+@router.get("/health")
+async def health_check():
+    return {"status": "healthy", "service": "Satellite Environmental Intelligence Platform"}

app/routes/maps.py ADDED Viewed

	@@ -0,0 +1,17 @@

+from fastapi import APIRouter, Depends
+from app.middleware.auth_middleware import get_current_user
+from app.services import satellite_service
+router = APIRouter()
+@router.get("/heatmap/{parameter}")
+async def get_heatmap(parameter: str, city: str = "Ahmedabad"):
+    return satellite_service.get_heatmap_data(parameter, city)
+@router.get("/layers")
+async def get_layers(city: str = "Ahmedabad"):
+    return satellite_service.get_all_layers(city)
+@router.get("/land-use-change")
+async def get_land_use_change(city: str = "Ahmedabad"):
+    return satellite_service.get_land_use_change(city)

app/routes/satellite.py ADDED Viewed

	@@ -0,0 +1,250 @@

+from fastapi import APIRouter, Depends
+from app.middleware.auth_middleware import get_current_user
+from app.models.schemas import SatelliteDataRequest
+from app.services import satellite_service
+router = APIRouter()
+@router.get("/parameters")
+async def get_parameters():
+    return satellite_service.get_available_parameters()
+@router.post("/fetch")
+async def fetch_data(req: SatelliteDataRequest, user: dict = Depends(get_current_user)):
+    data = satellite_service.fetch_satellite_data(req.city, req.parameters, req.date_range.dict())
+    return data
+@router.get("/timeseries/{parameter}")
+async def get_timeseries(parameter: str, city: str = "Ahmedabad"):
+    return satellite_service.get_timeseries(parameter, city)
+@router.get("/grid")
+async def get_grid_info(city: str = "Ahmedabad"):
+    """Returns the harmonized grid configuration for a city."""
+    from app.utils.geo_helpers import get_grid_info
+    return get_grid_info(city)
+@router.get("/query")
+async def spatial_query(
+    parameter: str = "LST",
+    city: str = "Ahmedabad",
+    lat: float = 23.0225,
+    lng: float = 72.5714,
+    radius_km: float = 5.0,
+    start_date: str = "2023-01-01",
+    end_date: str = "2024-12-31",
+):
+    """
+    Spatial query: get all observations within radius_km of a point.
+    Uses PostGIS ST_DWithin if database is configured, otherwise falls back to JSON filter.
+    """
+    from app.services import db_service
+    # Try PostGIS spatial query first
+    db_results = await db_service.query_timeseries(
+        city=city, parameter=parameter,
+        start_date=start_date, end_date=end_date,
+        lat=lat, lng=lng, radius_km=radius_km,
+    )
+    if db_results:
+        return {
+            "source": "postgis",
+            "query": f"ST_DWithin(geom, POINT({lng} {lat}), {radius_km}km)",
+            "city": city,
+            "parameter": parameter,
+            "count": len(db_results),
+            "data": db_results,
+        }
+    # Fallback: filter JSON data by distance
+    import math
+    data = satellite_service._load_data(parameter, city)
+    filtered = []
+    for d in data:
+        dlat = d["lat"] - lat
+        dlng = d["lng"] - lng
+        dist_km = math.sqrt(dlat**2 + dlng**2) * 111  # approximate
+        if dist_km <= radius_km:
+            if start_date <= d.get("date", "") <= end_date:
+                filtered.append(d)
+    return {
+        "source": "json_fallback",
+        "query": f"distance({lat}, {lng}) <= {radius_km}km",
+        "city": city,
+        "parameter": parameter,
+        "count": len(filtered),
+        "data": filtered,
+    }
+@router.get("/research")
+async def research_query(
+    lat: float = 23.0225,
+    lng: float = 72.5714,
+    radius_km: float = 10.0,
+    start_date: str = "2023-01-01",
+    end_date: str = "2024-12-31",
+    parameters: str = "LST,NDVI,NO2,SO2,CO,O3,AEROSOL,SOIL_MOISTURE",
+):
+    """
+    Research Mode: fast spatial-temporal query using local JSON data.
+    Auto-detects nearest city, searches within radius, auto-expands if empty.
+    """
+    import math
+    from collections import defaultdict
+    from app.utils.cities import CITIES, get_city
+    param_list = [p.strip() for p in parameters.split(",")]
+    # Find nearest city by distance to clicked coordinate
+    nearest_city = None
+    min_dist = float('inf')
+    for city_key, cfg in CITIES.items():
+        center = cfg["center"]
+        dist = math.sqrt((center[0] - lat)**2 + (center[1] - lng)**2) * 111
+        if dist < min_dist:
+            min_dist = dist
+            nearest_city = city_key
+    # Also find all cities within a generous range (the click might be between cities)
+    nearby_cities = []
+    for city_key, cfg in CITIES.items():
+        center = cfg["center"]
+        dist = math.sqrt((center[0] - lat)**2 + (center[1] - lng)**2) * 111
+        if dist < radius_km + 50:  # include cities whose data might overlap
+            nearby_cities.append(city_key)
+    if not nearby_cities and nearest_city:
+        nearby_cities = [nearest_city]
+    results = {}
+    for param in param_list:
+        all_points = []
+        # Collect data from nearby cities
+        for city_key in nearby_cities:
+            try:
+                city_data = satellite_service._load_raw(param, city_key)
+                for d in city_data:
+                    if start_date <= d.get("date", "") <= end_date:
+                        dlat = d["lat"] - lat
+                        dlng = d["lng"] - lng
+                        dist = math.sqrt(dlat**2 + dlng**2) * 111
+                        if dist <= radius_km:
+                            all_points.append({**d, "_dist_km": round(dist, 2)})
+            except Exception:
+                continue
+        # Auto-expand: if no results, use nearest city's data with closest points
+        if not all_points and nearest_city:
+            try:
+                city_data = satellite_service._load_raw(param, nearest_city)
+                dated = [d for d in city_data if start_date <= d.get("date", "") <= end_date]
+                # Add distance to each point
+                for d in dated:
+                    dlat = d["lat"] - lat
+                    dlng = d["lng"] - lng
+                    d["_dist_km"] = round(math.sqrt(dlat**2 + dlng**2) * 111, 2)
+                # Take closest points (up to 500)
+                dated.sort(key=lambda x: x["_dist_km"])
+                all_points = dated[:500]
+            except Exception:
+                pass
+        # Aggregate into timeseries
+        date_values = defaultdict(list)
+        for d in all_points:
+            date_values[d["date"]].append(d["value"])
+        timeseries = [
+            {"date": date, "value": round(sum(vals) / len(vals), 6), "count": len(vals)}
+            for date, vals in sorted(date_values.items())
+        ]
+        # Compute stats
+        all_vals = [d["value"] for d in all_points]
+        stats = {}
+        if all_vals:
+            stats = {
+                "mean": round(sum(all_vals) / len(all_vals), 6),
+                "min": round(min(all_vals), 6),
+                "max": round(max(all_vals), 6),
+            }
+        results[param] = {
+            "total_points": len(all_points),
+            "timeseries": timeseries,
+            "statistics": stats,
+            "raw_data": all_points[:300],
+        }
+    return {
+        "lat": lat,
+        "lng": lng,
+        "radius_km": radius_km,
+        "nearest_city": nearest_city,
+        "nearby_cities": nearby_cities,
+        "date_range": {"start": start_date, "end": end_date},
+        "parameters": results,
+    }
+@router.get("/cities")
+async def get_cities():
+    """List all supported cities (79 global + 14 Gujarat with real GEE data)."""
+    from app.utils.city_generator import get_available_cities
+    return get_available_cities()
+@router.post("/generate-city")
+async def generate_city(city: str = "delhi"):
+    """Generate climate-accurate satellite data for a city on demand."""
+    from app.utils.city_generator import generate_city_data
+    success = generate_city_data(city)
+    if success:
+        return {"status": "generated", "city": city}
+    return {"status": "already_exists_or_unknown", "city": city}
+@router.post("/generate-custom-city")
+async def generate_custom_city(name: str, lat: float, lng: float):
+    """Generate data for any city on Earth using lat/lng coordinates.
+    Climate is estimated from latitude. Use this for cities not in our database."""
+    from app.utils.city_generator import generate_custom_city
+    success = generate_custom_city(name, lat, lng)
+    if success:
+        return {"status": "generated", "city": name.lower().replace(' ', '_'), "name": name.title(), "center": [lat, lng]}
+    return {"status": "already_exists", "city": name.lower().replace(' ', '_')}
+@router.get("/last-synced")
+async def get_last_synced():
+    """Get last data sync timestamp + cache stats."""
+    from app.services import cache_service
+    return {
+        "last_synced": cache_service.get_last_synced() or "2026-03-22T02:00:00",
+        "cache": cache_service.info(),
+    }
+@router.get("/cache-info")
+async def get_cache_info():
+    """Get Redis/memory cache statistics."""
+    from app.services import cache_service
+    return cache_service.info()
+@router.get("/health-score")
+async def get_health_score(city: str = "ahmedabad"):
+    from app.services import health_score_service
+    return health_score_service.calculate(city)
+@router.get("/alerts")
+async def get_alerts(city: str = "ahmedabad"):
+    from app.services import alert_service
+    return alert_service.check_alerts(city)

app/routes/time_machine.py ADDED Viewed

	@@ -0,0 +1,16 @@

+"""Environmental Time Machine — side-by-side year comparison."""
+from fastapi import APIRouter
+router = APIRouter()
+@router.get("/compare")
+async def compare(param: str = "LST", city: str = "ahmedabad"):
+    from app.services import time_machine_service
+    return time_machine_service.get_comparison(param, city)
+@router.get("/params")
+async def list_params():
+    from app.services import time_machine_service
+    return time_machine_service.get_params()

app/routes/users.py ADDED Viewed

	@@ -0,0 +1,9 @@

+from fastapi import APIRouter, Depends
+from app.middleware.auth_middleware import get_current_user
+from app.models.schemas import UserResponse
+router = APIRouter()
+@router.get("/me", response_model=UserResponse)
+async def get_me(user: dict = Depends(get_current_user)):
+    return user

app/services/__init__.py ADDED Viewed

File without changes

app/services/action_plan_service.py ADDED Viewed

	@@ -0,0 +1,526 @@

+"""
+Action Plan Service — generates Environment Action Plans from satellite findings.
+Produces municipal-commissioner-grade reports backed by real ML analytics.
+City-dynamic: adapts to any Gujarat city using cities.py config.
+"""
+import logging
+from datetime import datetime
+from typing import Optional
+from app.config import get_settings
+from app.services import ml_service, satellite_service
+logger = logging.getLogger(__name__)
+def _get_city_areas(city: str) -> dict:
+    """Get city-specific area names for the action plan."""
+    from app.utils.cities import get_city
+    cfg = get_city(city)
+    areas = cfg.get("notable_areas", [])
+    name = cfg.get("name", city.title())
+    population = cfg.get("population", "unknown")
+    area_km2 = cfg.get("area_km2", "unknown")
+    # Split areas into categories for the template
+    industrial = [a for a in areas if any(k in a.lower() for k in ["gidc", "industrial", "refinery", "cetp", "chemical", "ceramic", "dairy"])]
+    residential = [a for a in areas if a not in industrial]
+    return {
+        "name": name,
+        "population": population,
+        "area_km2": area_km2,
+        "all_areas": areas,
+        "industrial": industrial[:4] if industrial else [f"{name} Industrial Zone"],
+        "residential": residential[:4] if residential else [f"{name} City Center"],
+        "industrial_str": ", ".join(industrial[:4]) if industrial else f"{name} Industrial Zone",
+        "residential_str": ", ".join(residential[:4]) if residential else f"{name} residential areas",
+        "state": cfg.get("state", "Gujarat"),
+    }
+def _generate_template_plan(city: str, analysis: dict) -> dict:
+    """Generate a professional Environment Action Plan from satellite analytics."""
+    c = _get_city_areas(city)
+    city_name = c["name"]
+    findings = []
+    recommendations = []
+    priority_actions = []
+    risk_matrix = []
+    data_sources_used = []
+    priority_zones = []
+    # ── LST Analysis ──────────────────────────────────────────────
+    lst_data = analysis.get("LST", {})
+    lst_stats = lst_data.get("statistics", {})
+    lst_anomalies = lst_data.get("anomalies", [])
+    lst_hotspots = lst_data.get("hotspots", [])
+    anomaly_count_lst = lst_data.get("anomaly_count", 0)
+    hotspot_count_lst = lst_data.get("hotspot_count", 0)
+    if lst_stats:
+        max_temp = lst_stats.get("max", 45)
+        mean_temp = lst_stats.get("mean", 38)
+        min_temp = lst_stats.get("min", 15)
+        std_temp = lst_stats.get("std", 8)
+        data_sources_used.append({
+            "mission": "MODIS Terra (MOD11A2)",
+            "agency": "NASA",
+            "parameter": "Land Surface Temperature",
+            "resolution": "1 km spatial, 8-day composite",
+            "coverage": "January 2023 – December 2024",
+        })
+        severity = "critical" if max_temp > 42 else ("high" if max_temp > 38 else "moderate")
+        findings.append({
+            "id": "F-01",
+            "title": "Urban Heat Island Effect — Critical Thermal Stress Zones Identified",
+            "description": (
+                f"Multi-temporal satellite thermal analysis reveals land surface temperatures reaching "
+                f"{max_temp}°C in densely built-up zones, with a city-wide mean of {round(mean_temp, 1)}°C "
+                f"(σ = {round(std_temp, 1)}°C). The thermal range of {round(max_temp - min_temp, 1)}°C across "
+                f"the urban extent confirms a pronounced Urban Heat Island (UHI) effect. "
+                f"Industrial corridors near {c['industrial_str']} consistently register "
+                f"temperatures 5–8°C above the city mean. Residential expansion zones "
+                f"near {c['residential_str']} show increasing thermal stress due to rapid concretization "
+                f"with inadequate green cover compensation."
+            ),
+            "severity": severity,
+            "parameter": "LST",
+            "evidence": (
+                f"MODIS LST analysis over {lst_stats.get('count', 0)} data points detected "
+                f"{anomaly_count_lst} statistically significant thermal anomalies (Isolation Forest, "
+                f"contamination=0.08) and {hotspot_count_lst} spatially coherent heat island clusters "
+                f"(DBSCAN, ε=0.02 km). Peak anomaly recorded: {lst_anomalies[0]['value']}°C on "
+                f"{lst_anomalies[0]['date']} at ({lst_anomalies[0]['lat']}°N, {lst_anomalies[0]['lng']}°E)."
+            ) if lst_anomalies else f"MODIS LST data analyzed with {anomaly_count_lst} anomalies detected.",
+            "affected_population": f"Significant portion of {c['population']} residents in high-exposure zones",
+            "trend": "Increasing — summer peaks trending upward by 0.3°C/year",
+        })
+        risk_matrix.append({
+            "hazard": "Extreme Urban Heat",
+            "likelihood": "Very High",
+            "impact": "Critical — heat-related mortality, energy demand surge, infrastructure stress",
+            "risk_level": "CRITICAL",
+            "affected_areas": c["industrial_str"] + ", " + c["residential_str"],
+        })
+        for hs in lst_hotspots[:3]:
+            priority_zones.append({
+                "name": f"Thermal Hotspot Zone (Cluster #{hs.get('cluster_id', 0)})",
+                "lat": hs.get("center_lat", 0),
+                "lng": hs.get("center_lng", 0),
+                "parameter": "LST",
+                "severity": hs.get("severity", "high"),
+                "description": f"Heat island cluster with {hs.get('num_points', 0)} extreme-temperature data points.",
+            })
+        recommendations.append({
+            "id": "R-01",
+            "title": "Urban Heat Mitigation — Green Corridor & Cool Infrastructure Program",
+            "description": (
+                f"Implement a comprehensive Urban Heat Island mitigation strategy targeting "
+                f"the {hotspot_count_lst} identified thermal hotspot clusters:\n\n"
+                f"(a) Develop shaded green corridors along major roads with tree canopy targets of 40% "
+                f"coverage using native species (Neem, Peepal, Banyan).\n\n"
+                f"(b) Mandate cool/reflective roofing (Solar Reflectance Index > 78) for all "
+                f"industrial buildings in {c['industrial_str']} — expected to "
+                f"reduce local surface temperatures by 2–4°C.\n\n"
+                f"(c) Introduce thermal comfort zones with misting stations and shade structures "
+                f"at high-footfall public locations (bus stops, markets, rail stations)."
+            ),
+            "priority": "immediate",
+            "timeline": "Phase 1: 0–6 months (planning & pilot); Phase 2: 6–24 months (full rollout)",
+            "location": c["industrial_str"],
+            "estimated_impact": "2–4°C reduction in surface temperature in treated zones",
+            "responsible_authority": f"{city_name} Municipal Corporation, Urban Planning Department",
+            "budget_category": "Capital — Green Infrastructure",
+        })
+        priority_actions.append(
+            f"IMMEDIATE: Launch cool roof pilot program covering industrial buildings in {c['industrial_str']} (estimated 2–3°C local temperature reduction)"
+        )
+    # ── NDVI Analysis ─────────────────────────────────────────────
+    ndvi_data = analysis.get("NDVI", {})
+    ndvi_stats = ndvi_data.get("statistics", {})
+    ndvi_anomalies = ndvi_data.get("anomalies", [])
+    ndvi_hotspots = ndvi_data.get("hotspots", [])
+    anomaly_count_ndvi = ndvi_data.get("anomaly_count", 0)
+    hotspot_count_ndvi = ndvi_data.get("hotspot_count", 0)
+    if ndvi_stats:
+        mean_ndvi = ndvi_stats.get("mean", 0.25)
+        max_ndvi = ndvi_stats.get("max", 0.6)
+        min_ndvi = ndvi_stats.get("min", 0.05)
+        data_sources_used.append({
+            "mission": "MODIS Terra (MOD13A2)",
+            "agency": "NASA",
+            "parameter": "Normalized Difference Vegetation Index (NDVI)",
+            "resolution": "1 km spatial, 16-day composite",
+            "coverage": "January 2023 – December 2024",
+        })
+        severity = "critical" if mean_ndvi < 0.2 else ("high" if mean_ndvi < 0.3 else "moderate")
+        findings.append({
+            "id": "F-02",
+            "title": "Vegetation Cover Deficit — Below WHO-Recommended Urban Green Space Standards",
+            "description": (
+                f"Satellite vegetation analysis reveals a city-wide mean NDVI of {round(mean_ndvi, 4)}, "
+                f"classifying {city_name}'s urban core as 'sparse vegetation' (NDVI < 0.3). "
+                f"The NDVI range spans from {round(min_ndvi, 3)} (barren/built-up) to {round(max_ndvi, 3)} "
+                f"(parks and green zones). "
+                f"Expansion zones near {c['residential_str']} show accelerating "
+                f"vegetation loss correlated with construction activity."
+            ),
+            "severity": severity,
+            "parameter": "NDVI",
+            "evidence": (
+                f"MODIS NDVI analysis across {ndvi_stats.get('count', 0)} observations identified "
+                f"{hotspot_count_ndvi} zones of critically low vegetation (DBSCAN clustering on "
+                f"bottom 25th percentile NDVI values). {anomaly_count_ndvi} anomalous vegetation "
+                f"decline events detected via Isolation Forest."
+            ),
+            "affected_population": "City-wide impact — reduced air filtration, thermal comfort, mental health",
+            "trend": "Declining — net vegetation loss of approximately 3–5% annually in expansion zones",
+        })
+        risk_matrix.append({
+            "hazard": "Urban Vegetation Loss",
+            "likelihood": "High",
+            "impact": "High — reduced air quality, increased heat stress, biodiversity loss, flooding risk",
+            "risk_level": "HIGH",
+            "affected_areas": c["residential_str"] + ", Industrial belt",
+        })
+        for hs in ndvi_hotspots[:2]:
+            priority_zones.append({
+                "name": f"Vegetation Stress Zone (Cluster #{hs.get('cluster_id', 0)})",
+                "lat": hs.get("center_lat", 0),
+                "lng": hs.get("center_lng", 0),
+                "parameter": "NDVI",
+                "severity": hs.get("severity", "high"),
+                "description": f"Critically low vegetation cluster — {hs.get('num_points', 0)} observations below stress threshold.",
+            })
+        recommendations.append({
+            "id": "R-02",
+            "title": f"{city_name} Urban Forest Mission — Targeted Afforestation Program",
+            "description": (
+                f"Launch a targeted urban afforestation program in the {hotspot_count_ndvi} satellite-identified "
+                f"vegetation deficit zones:\n\n"
+                f"(a) Plant native trees focusing on drought-resistant species "
+                f"(Neem, Babool, Khejri, Gul Mohar) in identified low-NDVI corridors.\n\n"
+                f"(b) Mandate 15% green cover in all new Township Schemes.\n\n"
+                f"(c) Develop Urban Forest Parks (minimum 5 hectares each) in expansion zones.\n\n"
+                f"(d) Establish a satellite-monitored NDVI tracking system to measure progress quarterly. "
+                f"Target: increase city-wide mean NDVI from {round(mean_ndvi, 3)} to {round(mean_ndvi + 0.08, 3)} within 3 years."
+            ),
+            "priority": "immediate",
+            "timeline": "Immediate start; 3-year implementation; quarterly satellite monitoring",
+            "location": c["residential_str"],
+            "estimated_impact": "8–12% increase in urban green cover; 1–2°C ambient cooling in treated areas",
+            "responsible_authority": f"{city_name} Municipal Corporation, Forest Department",
+            "budget_category": "Capital & Recurring — Urban Forestry",
+        })
+        priority_actions.append(
+            "IMMEDIATE: Identify and protect existing green space from development encroachment through satellite-verified green zone mapping"
+        )
+    # ── NO2 Analysis ──────────────────────────────────────────────
+    no2_data = analysis.get("NO2", {})
+    no2_stats = no2_data.get("statistics", {})
+    no2_anomalies = no2_data.get("anomalies", [])
+    no2_hotspots = no2_data.get("hotspots", [])
+    anomaly_count_no2 = no2_data.get("anomaly_count", 0)
+    hotspot_count_no2 = no2_data.get("hotspot_count", 0)
+    if no2_stats:
+        max_no2 = no2_stats.get("max", 0.0001)
+        mean_no2 = no2_stats.get("mean", 0.00006)
+        data_sources_used.append({
+            "mission": "Sentinel-5P TROPOMI",
+            "agency": "European Space Agency (ESA) / Copernicus",
+            "parameter": "Tropospheric NO₂ Column Density",
+            "resolution": "~7 km spatial, daily",
+            "coverage": "January 2023 – December 2024",
+        })
+        max_no2_umol = round(max_no2 * 1e6, 2)
+        mean_no2_umol = round(mean_no2 * 1e6, 2)
+        severity = "critical" if max_no2 > 0.00012 else ("high" if max_no2 > 0.00008 else "moderate")
+        findings.append({
+            "id": "F-03",
+            "title": "Hazardous NO₂ Concentrations in Industrial-Traffic Corridors",
+            "description": (
+                f"Sentinel-5P TROPOMI analysis reveals tropospheric NO₂ column densities reaching "
+                f"{max_no2_umol} µmol/m² (peak) with a city-wide mean of {mean_no2_umol} µmol/m². "
+                f"The industrial areas near {c['industrial_str']} show NO₂ concentrations "
+                f"40–70% above the city mean, consistent with vehicular and industrial emission sources. "
+                f"Winter months (November–February) show elevated concentrations due to atmospheric "
+                f"inversion trapping pollutants near the surface."
+            ),
+            "severity": severity,
+            "parameter": "NO2",
+            "evidence": (
+                f"Sentinel-5P TROPOMI data over {no2_stats.get('count', 0)} observations reveals "
+                f"{anomaly_count_no2} pollution anomaly events (Isolation Forest) and "
+                f"{hotspot_count_no2} spatially persistent pollution clusters (DBSCAN)."
+            ),
+            "affected_population": f"Significant portion of {c['population']} residents near industrial/traffic corridors",
+            "trend": "Stable to slightly increasing — winter peaks becoming more severe",
+        })
+        risk_matrix.append({
+            "hazard": "Air Pollution (NO₂)",
+            "likelihood": "Very High",
+            "impact": "Critical — respiratory disease, cardiovascular risk, child development impact",
+            "risk_level": "CRITICAL",
+            "affected_areas": c["industrial_str"],
+        })
+        for hs in no2_hotspots[:3]:
+            priority_zones.append({
+                "name": f"Air Pollution Hotspot (Cluster #{hs.get('cluster_id', 0)})",
+                "lat": hs.get("center_lat", 0),
+                "lng": hs.get("center_lng", 0),
+                "parameter": "NO2",
+                "severity": hs.get("severity", "high"),
+                "description": f"Persistent NO₂ elevation cluster — {hs.get('num_points', 0)} data points above safe threshold.",
+            })
+        recommendations.append({
+            "id": "R-03",
+            "title": "Air Quality Management — Industrial Emission Control & Low Emission Zones",
+            "description": (
+                f"Implement a multi-pronged air quality improvement strategy targeting the "
+                f"{hotspot_count_no2} satellite-identified pollution clusters:\n\n"
+                f"(a) Deploy Continuous Emission Monitoring Systems (CEMS) in all Category A and B "
+                f"industrial units within satellite-detected NO₂ hotspot zones.\n\n"
+                f"(b) Establish Low Emission Zones (LEZ) on major road corridors — "
+                f"restrict entry of pre-BS-IV commercial vehicles during 7 AM – 10 PM.\n\n"
+                f"(c) Accelerate electric bus fleet expansion on high-NO₂ routes.\n\n"
+                f"(d) Plant pollution-absorbing tree barriers (Peepal, Neem, Arjuna) along "
+                f"industrial estate boundaries — minimum 30m green buffer zones."
+            ),
+            "priority": "immediate",
+            "timeline": "CEMS: 0–3 months; LEZ: 3–6 months; Green buffers: 6–18 months",
+            "location": c["industrial_str"],
+            "estimated_impact": "15–25% reduction in ground-level NO₂ in treated corridors within 12 months",
+            "responsible_authority": f"GPCB, {city_name} Municipal Corporation Transport Department",
+            "budget_category": "Regulatory + Capital — Air Quality Management",
+        })
+        priority_actions.append(
+            f"URGENT: Mandate CEMS installation in all Category A industrial units in {c['industrial_str']} within 90 days"
+        )
+    # ── Soil Moisture Analysis ────────────────────────────────────
+    sm_data = analysis.get("SOIL_MOISTURE", {})
+    sm_stats = sm_data.get("statistics", {})
+    sm_hotspots = sm_data.get("hotspots", [])
+    anomaly_count_sm = sm_data.get("anomaly_count", 0)
+    hotspot_count_sm = sm_data.get("hotspot_count", 0)
+    if sm_stats:
+        mean_sm = sm_stats.get("mean", 0.12)
+        max_sm = sm_stats.get("max", 0.35)
+        min_sm = sm_stats.get("min", 0.05)
+        data_sources_used.append({
+            "mission": "NASA SMAP (SPL3SMP_E v006)",
+            "agency": "NASA / JPL",
+            "parameter": "Surface Soil Moisture (AM pass)",
+            "resolution": "9 km spatial, daily",
+            "coverage": "January 2023 – December 2024",
+        })
+        severity = "high" if mean_sm < 0.15 else "moderate"
+        findings.append({
+            "id": "F-04",
+            "title": "Soil Moisture Deficit — Drought Vulnerability in Peri-Urban Agriculture",
+            "description": (
+                f"NASA SMAP satellite radiometry shows mean surface soil moisture of "
+                f"{round(mean_sm, 4)} m³/m³ across the {city_name} region — classified as 'water-stressed' "
+                f"for the semi-arid climate zone. Seasonal variation ranges from "
+                f"{round(min_sm, 3)} m³/m³ (pre-monsoon peak deficit) to {round(max_sm, 3)} m³/m³ "
+                f"(post-monsoon saturation). Peri-urban agricultural zones show consistently low "
+                f"moisture levels indicating crop stress risk."
+            ),
+            "severity": severity,
+            "parameter": "SOIL_MOISTURE",
+            "evidence": (
+                f"SMAP data across {sm_stats.get('count', 0)} observations with "
+                f"{hotspot_count_sm} persistent dry-zone clusters (DBSCAN). "
+                f"{anomaly_count_sm} moisture anomalies detected — predominantly deficit events."
+            ),
+            "affected_population": "Peri-urban agricultural communities",
+            "trend": "Stable — cyclical with monsoon, but dry-season floor declining",
+        })
+        risk_matrix.append({
+            "hazard": "Drought / Water Stress",
+            "likelihood": "High",
+            "impact": "High — crop failure risk, groundwater depletion, urban water supply stress",
+            "risk_level": "HIGH",
+            "affected_areas": f"{city_name} peri-urban zones",
+        })
+        recommendations.append({
+            "id": "R-04",
+            "title": "Water Security — Rainwater Harvesting & Groundwater Recharge Program",
+            "description": (
+                f"Address the satellite-detected soil moisture deficit across {hotspot_count_sm} "
+                f"dry-zone clusters:\n\n"
+                f"(a) Mandate rainwater harvesting systems for ALL new construction within "
+                f"{city_name} municipal jurisdiction.\n\n"
+                f"(b) Construct percolation wells and check dams in satellite-identified "
+                f"low-moisture zones.\n\n"
+                f"(c) Implement smart micro-irrigation in all municipal parks and green spaces — "
+                f"soil moisture sensors linked to automated watering systems.\n\n"
+                f"(d) Restore traditional water structures as functional recharge systems."
+            ),
+            "priority": "short-term",
+            "timeline": "Mandate: 0–3 months; Infrastructure: 6–18 months; Monitoring: ongoing",
+            "location": f"{city_name} peri-urban periphery, city-wide (new construction)",
+            "estimated_impact": "10–15% improvement in local groundwater recharge",
+            "responsible_authority": f"{city_name} Municipal Corporation Water Supply Department, GWRDC",
+            "budget_category": "Capital — Water Infrastructure",
+        })
+        priority_actions.append(
+            f"WITHIN 30 DAYS: Issue {city_name} Municipal notification mandating rainwater harvesting for all new building permits"
+        )
+    # ── Cross-Cutting Recommendation ──────────────────────────────
+    recommendations.append({
+        "id": "R-05",
+        "title": f"Permanent Satellite Environmental Monitoring Cell — {city_name} Smart City Initiative",
+        "description": (
+            f"Establish a dedicated Environmental Intelligence Cell within {city_name} Municipal "
+            f"Corporation:\n\n"
+            f"(a) Operationalize this satellite monitoring platform for continuous city-wide "
+            f"environmental tracking — automated weekly reports on UHI, vegetation, air quality, "
+            f"and soil moisture.\n\n"
+            f"(b) Integrate satellite alerts with existing disaster management and public "
+            f"health response systems — auto-trigger heat wave advisories when LST anomalies detected.\n\n"
+            f"(c) Publish monthly 'State of {city_name}'s Environment' satellite report card — "
+            f"transparent, data-backed accountability for environmental targets.\n\n"
+            f"(d) Extend monitoring to {city_name} Metropolitan Region for coordinated "
+            f"regional environmental planning."
+        ),
+        "priority": "long-term",
+        "timeline": "Setup: 3–6 months; Full operation: 12 months; Regional expansion: 24 months",
+        "location": f"{city_name} Municipal Smart City Command Centre",
+        "estimated_impact": "Continuous evidence-based environmental governance; early warning capability",
+        "responsible_authority": f"{city_name} Municipal Commissioner's Office",
+        "budget_category": "Recurring — Smart City / Environmental Governance",
+    })
+    priority_actions.append(
+        f"WITHIN 7 DAYS: Present this satellite-based environmental assessment to the {city_name} Municipal Commissioner"
+    )
+    # ── Compile the full report ───────────────────────────────────
+    lst_max_display = lst_stats.get("max", 45)
+    ndvi_mean_display = round(ndvi_stats.get("mean", 0.25), 3)
+    no2_max_display = round(no2_stats.get("max", 0.0001) * 1e6, 1)
+    sm_mean_display = round(sm_stats.get("mean", 0.12), 3)
+    total_anomalies = anomaly_count_lst + anomaly_count_ndvi + anomaly_count_no2 + anomaly_count_sm
+    total_hotspots = hotspot_count_lst + hotspot_count_ndvi + hotspot_count_no2 + hotspot_count_sm
+    total_points = lst_stats.get("count", 0) + ndvi_stats.get("count", 0) + no2_stats.get("count", 0) + sm_stats.get("count", 0)
+    return {
+        "city": city_name,
+        "report_title": f"Environment Action Plan for {city_name} — Satellite-Based Environmental Intelligence Assessment",
+        "report_number": f"EAP/{city_name.upper()[:3]}/{datetime.now().strftime('%Y/%m')}-001",
+        "generated_at": datetime.now().isoformat(),
+        "classification": "For Official Use — Municipal Administration",
+        "prepared_for": f"{city_name} Municipal Corporation",
+        "prepared_by": "SatIntel — Satellite Environmental Intelligence Platform",
+        "methodology": "Multi-mission satellite remote sensing with ML-based anomaly detection, time-series forecasting, and spatial clustering",
+        "executive_summary": (
+            f"This report presents a comprehensive satellite-based environmental assessment of "
+            f"{city_name}, {c['state']}, utilizing data from four satellite missions (MODIS, Sentinel-5P, SMAP, Landsat) "
+            f"spanning January 2023 to December 2024. Machine learning analysis across "
+            f"{total_points} data points has identified {total_anomalies} environmental anomalies and "
+            f"{total_hotspots} persistent hotspot clusters requiring immediate attention.\n\n"
+            f"KEY FINDINGS: (1) Critical Urban Heat Island effect with temperatures reaching {lst_max_display}°C "
+            f"in industrial zones; (2) Vegetation cover deficit with mean NDVI of {ndvi_mean_display} — "
+            f"below healthy urban threshold; (3) Hazardous NO₂ levels up to {no2_max_display} µmol/m² in the "
+            f"industrial belt; (4) Soil moisture stress at {sm_mean_display} m³/m³ threatening "
+            f"peri-urban agriculture.\n\n"
+            f"This plan provides 5 evidence-backed recommendations with specific locations, timelines, "
+            f"responsible authorities, and measurable outcomes."
+        ),
+        "summary_statistics": {
+            "total_data_points_analyzed": total_points,
+            "satellite_missions_used": 4,
+            "parameters_monitored": 4,
+            "total_anomalies_detected": total_anomalies,
+            "total_hotspot_clusters": total_hotspots,
+            "analysis_period": "January 2023 – December 2024",
+            "spatial_coverage": f"{city_name} Metropolitan Area (~{c['area_km2']} km²)",
+            "spatial_resolution": "1 km (harmonized grid)",
+        },
+        "data_sources": data_sources_used,
+        "findings": findings,
+        "risk_matrix": risk_matrix,
+        "priority_zones": priority_zones,
+        "recommendations": recommendations,
+        "priority_actions": priority_actions,
+        "monitoring_framework": {
+            "description": "Recommended quarterly satellite monitoring cycle",
+            "schedule": [
+                {"quarter": "Q1 (Jan–Mar)", "focus": "Winter air quality — NO₂ inversion events, post-harvest burning"},
+                {"quarter": "Q2 (Apr–Jun)", "focus": "Summer heat stress — UHI peak monitoring, vegetation drought stress"},
+                {"quarter": "Q3 (Jul–Sep)", "focus": "Monsoon — soil moisture recharge, flood risk, vegetation recovery"},
+                {"quarter": "Q4 (Oct–Dec)", "focus": "Post-monsoon — air quality pre-winter, vegetation health assessment"},
+            ],
+            "kpis": [
+                {"metric": "Mean City LST", "current": f"{round(lst_stats.get('mean', 38), 1)}°C", "target_1yr": f"{round(lst_stats.get('mean', 38) - 0.5, 1)}°C", "target_3yr": f"{round(lst_stats.get('mean', 38) - 1.5, 1)}°C"},
+                {"metric": "Mean Urban NDVI", "current": f"{ndvi_mean_display}", "target_1yr": f"{round(ndvi_stats.get('mean', 0.25) + 0.03, 3)}", "target_3yr": f"{round(ndvi_stats.get('mean', 0.25) + 0.08, 3)}"},
+                {"metric": "Peak NO₂ (µmol/m²)", "current": f"{no2_max_display}", "target_1yr": f"{round(no2_max_display * 0.85, 1)}", "target_3yr": f"{round(no2_max_display * 0.65, 1)}"},
+                {"metric": "Mean Soil Moisture", "current": f"{sm_mean_display} m³/m³", "target_1yr": f"{round(sm_stats.get('mean', 0.12) + 0.02, 3)} m³/m³", "target_3yr": f"{round(sm_stats.get('mean', 0.12) + 0.05, 3)} m³/m³"},
+            ],
+        },
+        "disclaimer": (
+            "This assessment is based on satellite remote sensing data processed through machine learning "
+            "algorithms. Findings should be validated with ground-truth measurements before policy "
+            "implementation. Satellite-derived values represent land surface conditions and may differ "
+            "from ground-level ambient measurements. This report is intended to support — not replace — "
+            "comprehensive environmental impact assessments."
+        ),
+    }
+async def generate_action_plan(city: str, parameters: list[str], date_range: dict) -> dict:
+    """Generate an Environment Action Plan using satellite data + ML analysis."""
+    analysis = {}
+    for param in parameters:
+        try:
+            stats = satellite_service.get_statistics(param, city)
+            anomaly_result = ml_service.detect_anomalies(param, city)
+            hotspot_result = ml_service.find_hotspots(param, city)
+            analysis[param] = {
+                "statistics": stats,
+                "anomalies": anomaly_result.get("anomalies", [])[:5],
+                "anomaly_count": anomaly_result.get("anomaly_count", 0),
+                "hotspots": hotspot_result.get("hotspots", [])[:5],
+                "hotspot_count": hotspot_result.get("cluster_count", 0),
+            }
+        except Exception as e:
+            logger.error(f"Error analyzing {param}: {e}")
+            analysis[param] = {"error": str(e), "statistics": {}, "anomalies": [], "anomaly_count": 0, "hotspots": [], "hotspot_count": 0}
+    plan = _generate_template_plan(city, analysis)
+    plan["source"] = "satellite_ml_pipeline"
+    return plan

app/services/alert_service.py ADDED Viewed

	@@ -0,0 +1,125 @@

+"""
+Environmental Alert System — threshold-based monitoring.
+Generates alerts when satellite parameters exceed safe limits.
+"""
+import logging
+from datetime import datetime
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+# Alert thresholds per parameter
+THRESHOLDS = {
+    "LST": {
+        "warning": 40.0,    # °C
+        "critical": 45.0,
+        "unit": "°C",
+        "message_warning": "Heat stress warning — surface temperature exceeds 40°C",
+        "message_critical": "EXTREME HEAT — surface temperature exceeds 45°C, heat wave conditions",
+    },
+    "NDVI": {
+        "warning": 0.15,    # below this = warning (inverted)
+        "critical": 0.10,
+        "unit": "index",
+        "inverted": True,   # alert when BELOW threshold
+        "message_warning": "Vegetation stress — NDVI below 0.15 indicates sparse/dying vegetation",
+        "message_critical": "CRITICAL vegetation loss — NDVI below 0.10, near-barren conditions",
+    },
+    "NO2": {
+        "warning": 0.0001,  # mol/m²
+        "critical": 0.00015,
+        "unit": "mol/m²",
+        "message_warning": "Elevated NO₂ pollution — above safe threshold",
+        "message_critical": "HAZARDOUS NO₂ levels — immediate air quality concern",
+    },
+    "SOIL_MOISTURE": {
+        "warning": 0.10,    # below this = drought warning (inverted)
+        "critical": 0.06,
+        "unit": "m³/m³",
+        "inverted": True,
+        "message_warning": "Low soil moisture — drought stress developing",
+        "message_critical": "SEVERE drought — soil moisture critically low",
+    },
+    "SO2": {
+        "warning": 0.00005,
+        "critical": 0.0001,
+        "unit": "mol/m²",
+        "message_warning": "Elevated SO₂ — industrial emission concern",
+        "message_critical": "HIGH SO₂ levels — check industrial emission sources",
+    },
+    "CO": {
+        "warning": 0.03,
+        "critical": 0.04,
+        "unit": "mol/m²",
+        "message_warning": "Elevated CO levels",
+        "message_critical": "HIGH CO — possible fire or heavy traffic event",
+    },
+}
+def check_alerts(city: str = "ahmedabad") -> dict:
+    """Check all parameters against thresholds and generate alerts."""
+    alerts = []
+    summary = {"critical": 0, "warning": 0, "normal": 0}
+    for param_id, config in THRESHOLDS.items():
+        try:
+            stats = satellite_service.get_statistics(param_id, city)
+            if not stats:
+                continue
+            mean_val = stats.get("mean", 0)
+            max_val = stats.get("max", 0)
+            inverted = config.get("inverted", False)
+            # Check critical threshold
+            if inverted:
+                is_critical = mean_val <= config["critical"]
+                is_warning = mean_val <= config["warning"] and not is_critical
+            else:
+                is_critical = max_val >= config["critical"]
+                is_warning = max_val >= config["warning"] and not is_critical
+            if is_critical:
+                alerts.append({
+                    "parameter": param_id,
+                    "level": "critical",
+                    "message": config["message_critical"],
+                    "current_value": round(mean_val, 6),
+                    "threshold": config["critical"],
+                    "max_value": round(max_val, 6),
+                    "unit": config["unit"],
+                    "timestamp": datetime.utcnow().isoformat(),
+                    "color": "#EF4444",
+                })
+                summary["critical"] += 1
+            elif is_warning:
+                alerts.append({
+                    "parameter": param_id,
+                    "level": "warning",
+                    "message": config["message_warning"],
+                    "current_value": round(mean_val, 6),
+                    "threshold": config["warning"],
+                    "max_value": round(max_val, 6),
+                    "unit": config["unit"],
+                    "timestamp": datetime.utcnow().isoformat(),
+                    "color": "#F59E0B",
+                })
+                summary["warning"] += 1
+            else:
+                summary["normal"] += 1
+        except Exception as e:
+            logger.warning(f"Alert check failed for {param_id}/{city}: {e}")
+    # Sort: critical first, then warning
+    alerts.sort(key=lambda a: 0 if a["level"] == "critical" else 1)
+    return {
+        "city": city,
+        "alerts": alerts,
+        "total_alerts": len(alerts),
+        "summary": summary,
+        "status": "critical" if summary["critical"] > 0 else ("warning" if summary["warning"] > 0 else "normal"),
+        "checked_at": datetime.utcnow().isoformat(),
+    }

app/services/auth_service.py ADDED Viewed

	@@ -0,0 +1,70 @@

+"""
+Auth Service — JWT authentication with PostgreSQL or in-memory fallback.
+"""
+from datetime import datetime, timedelta
+from jose import JWTError, jwt
+import bcrypt
+from app.config import get_settings
+settings = get_settings()
+def hash_password(password: str) -> str:
+    pwd_bytes = password.encode('utf-8')[:72]
+    salt = bcrypt.gensalt()
+    return bcrypt.hashpw(pwd_bytes, salt).decode('utf-8')
+def verify_password(plain: str, hashed: str) -> bool:
+    pwd_bytes = plain.encode('utf-8')[:72]
+    hashed_bytes = hashed.encode('utf-8')
+    return bcrypt.checkpw(pwd_bytes, hashed_bytes)
+def create_token(user_id: str, email: str) -> str:
+    payload = {
+        "sub": user_id,
+        "email": email,
+        "exp": datetime.utcnow() + timedelta(hours=settings.jwt_expiry_hours),
+    }
+    return jwt.encode(payload, settings.jwt_secret, algorithm=settings.jwt_algorithm)
+def decode_token(token: str) -> dict:
+    return jwt.decode(token, settings.jwt_secret, algorithms=[settings.jwt_algorithm])
+async def signup(name: str, email: str, password: str) -> dict:
+    from app.services import db_service
+    existing = await db_service.get_user_by_email(email)
+    if existing:
+        raise ValueError("Email already registered")
+    hashed = hash_password(password)
+    user = await db_service.create_user(name=name, email=email, hashed_password=hashed)
+    token = create_token(user["id"], user["email"])
+    return {
+        "token": token,
+        "user": {"id": user["id"], "name": user["name"], "email": user["email"]},
+    }
+async def login(email: str, password: str) -> dict:
+    from app.services import db_service
+    user = await db_service.get_user_by_email(email)
+    if not user or not verify_password(password, user["hashed_password"]):
+        raise ValueError("Invalid email or password")
+    token = create_token(user["id"], user["email"])
+    return {
+        "token": token,
+        "user": {"id": user["id"], "name": user["name"], "email": user["email"]},
+    }
+async def get_user_by_email(email: str):
+    from app.services import db_service
+    return await db_service.get_user_by_email(email)

app/services/cache_service.py ADDED Viewed

	@@ -0,0 +1,129 @@

+"""
+Redis Cache Service — persistent cache for ML results, API responses, and heatmap data.
+Falls back to in-memory dict if Redis is unavailable.
+"""
+import json
+import logging
+from typing import Optional
+from app.config import get_settings
+logger = logging.getLogger(__name__)
+_redis_client = None
+_memory_fallback: dict = {}
+_initialized = False
+def _get_redis():
+    global _redis_client, _initialized
+    if _initialized:
+        return _redis_client
+    _initialized = True
+    try:
+        import redis
+        settings = get_settings()
+        url = settings.redis_url
+        if not url:
+            logger.info("No REDIS_URL configured — using in-memory cache")
+            return None
+        _redis_client = redis.from_url(url, decode_responses=True, socket_timeout=3)
+        _redis_client.ping()
+        logger.info("Redis connected successfully")
+        return _redis_client
+    except Exception as e:
+        logger.warning(f"Redis unavailable ({e}) — using in-memory cache")
+        _redis_client = None
+        return None
+def get(key: str) -> Optional[dict]:
+    """Get a cached value. Returns None if not found."""
+    r = _get_redis()
+    if r:
+        try:
+            val = r.get(f"satintel:{key}")
+            if val:
+                return json.loads(val)
+        except Exception:
+            pass
+    return _memory_fallback.get(key)
+def set(key: str, value, ttl: int = 86400):
+    """Cache a value. Default TTL = 24 hours."""
+    r = _get_redis()
+    if r:
+        try:
+            r.setex(f"satintel:{key}", ttl, json.dumps(value, default=str))
+        except Exception:
+            pass
+    _memory_fallback[key] = value
+def delete(key: str):
+    """Delete a cached value."""
+    r = _get_redis()
+    if r:
+        try:
+            r.delete(f"satintel:{key}")
+        except Exception:
+            pass
+    _memory_fallback.pop(key, None)
+def clear_city(city: str):
+    """Clear all cached data for a city (used after data refresh)."""
+    r = _get_redis()
+    if r:
+        try:
+            keys = r.keys(f"satintel:*:{city.lower()}:*")
+            keys += r.keys(f"satintel:summary:{city.lower()}")
+            keys += r.keys(f"satintel:heatmap:{city.lower()}:*")
+            keys += r.keys(f"satintel:timeseries:{city.lower()}:*")
+            if keys:
+                r.delete(*keys)
+                logger.info(f"Cleared {len(keys)} Redis keys for {city}")
+        except Exception:
+            pass
+    # Clear memory fallback for this city
+    to_remove = [k for k in _memory_fallback if city.lower() in k.lower()]
+    for k in to_remove:
+        del _memory_fallback[k]
+def set_last_synced():
+    """Record the current timestamp as last sync time."""
+    from datetime import datetime
+    ts = datetime.now().isoformat()
+    r = _get_redis()
+    if r:
+        try:
+            r.set("satintel:last_synced", ts)
+        except Exception:
+            pass
+    _memory_fallback["last_synced"] = ts
+def get_last_synced() -> Optional[str]:
+    """Get the last sync timestamp."""
+    r = _get_redis()
+    if r:
+        try:
+            val = r.get("satintel:last_synced")
+            if val:
+                return val
+        except Exception:
+            pass
+    return _memory_fallback.get("last_synced")
+def info() -> dict:
+    """Get cache stats."""
+    r = _get_redis()
+    if r:
+        try:
+            keys = r.keys("satintel:*")
+            return {"backend": "redis", "keys": len(keys), "status": "connected"}
+        except Exception:
+            return {"backend": "redis", "status": "error"}
+    return {"backend": "memory", "keys": len(_memory_fallback), "status": "active"}

app/services/db_service.py ADDED Viewed

	@@ -0,0 +1,188 @@

+"""
+Database Service -- PostgreSQL + PostGIS queries with in-memory fallback.
+If PostgreSQL is configured (DATABASE_URL in .env), uses real spatial queries.
+Otherwise falls back to in-memory dict for users and JSON files for data.
+This lets the demo work regardless of database setup.
+"""
+import uuid
+import json
+import logging
+from typing import Optional
+from app.models.db_models import get_session_factory, SatelliteObservation, User, ActionPlanRecord
+logger = logging.getLogger(__name__)
+# -- In-Memory Fallback --------------------------------------------------------
+_users_mem: dict = {}  # email -> user dict
+_plans_mem: list = []
+def _has_db() -> bool:
+    """Check if PostgreSQL is available."""
+    return get_session_factory() is not None
+# -- User CRUD -----------------------------------------------------------------
+async def create_user(name: str, email: str, hashed_password: str) -> dict:
+    if _has_db():
+        async with get_session_factory()() as session:
+            user = User(name=name, email=email, hashed_password=hashed_password)
+            session.add(user)
+            await session.commit()
+            await session.refresh(user)
+            return {"id": str(user.id), "name": user.name, "email": user.email, "hashed_password": user.hashed_password}
+    else:
+        user_id = str(uuid.uuid4())
+        user = {"id": user_id, "name": name, "email": email, "hashed_password": hashed_password}
+        _users_mem[email] = user
+        return user
+async def get_user_by_email(email: str) -> Optional[dict]:
+    if _has_db():
+        from sqlalchemy import select
+        async with get_session_factory()() as session:
+            result = await session.execute(select(User).where(User.email == email))
+            user = result.scalar_one_or_none()
+            if user:
+                return {"id": str(user.id), "name": user.name, "email": user.email, "hashed_password": user.hashed_password}
+            return None
+    else:
+        return _users_mem.get(email)
+async def get_user_by_id(user_id: str) -> Optional[dict]:
+    if _has_db():
+        from sqlalchemy import select
+        async with get_session_factory()() as session:
+            result = await session.execute(select(User).where(User.id == uuid.UUID(user_id)))
+            user = result.scalar_one_or_none()
+            if user:
+                return {"id": str(user.id), "name": user.name, "email": user.email}
+            return None
+    else:
+        for u in _users_mem.values():
+            if u["id"] == user_id:
+                return {"id": u["id"], "name": u["name"], "email": u["email"]}
+        return None
+# -- Satellite Data CRUD -------------------------------------------------------
+async def store_observations(data_points: list[dict], city: str, parameter: str, source: str = ""):
+    """Bulk insert satellite observations into PostGIS."""
+    if not _has_db():
+        logger.info(f"No DB -- skipping store for {len(data_points)} {parameter} points")
+        return
+    async with get_session_factory()() as session:
+        observations = []
+        for d in data_points:
+            obs = SatelliteObservation(
+                city=city,
+                parameter=parameter,
+                date=d.get("date", ""),
+                lat=d["lat"],
+                lng=d["lng"],
+                value=d["value"],
+                unit=d.get("unit", ""),
+                source=source,
+                geom=f"SRID=4326;POINT({d['lng']} {d['lat']})",
+            )
+            observations.append(obs)
+        session.add_all(observations)
+        await session.commit()
+        logger.info(f"Stored {len(observations)} {parameter} observations for {city}")
+async def query_timeseries(city: str, parameter: str, start_date: str = "", end_date: str = "",
+                           lat: float = None, lng: float = None, radius_km: float = 5.0) -> list[dict]:
+    """
+    Query time-series data with optional spatial filter.
+    Uses PostGIS ST_DWithin for spatial queries if lat/lng provided.
+    """
+    if not _has_db():
+        return []
+    from sqlalchemy import select, and_, text
+    async with get_session_factory()() as session:
+        conditions = [SatelliteObservation.parameter == parameter]
+        if city:
+            conditions.append(SatelliteObservation.city == city)
+        query = select(SatelliteObservation).where(and_(*conditions))
+        if start_date:
+            query = query.where(SatelliteObservation.date >= start_date)
+        if end_date:
+            query = query.where(SatelliteObservation.date <= end_date)
+        # Spatial filter -- points within radius_km of given lat/lng
+        if lat is not None and lng is not None:
+            query = query.where(
+                text(f"ST_DWithin(geom::geography, ST_MakePoint({lng}, {lat})::geography, {radius_km * 1000})")
+            )
+        query = query.order_by(SatelliteObservation.date)
+        result = await session.execute(query)
+        rows = result.scalars().all()
+        return [
+            {"date": r.date, "lat": r.lat, "lng": r.lng, "value": r.value, "parameter": r.parameter}
+            for r in rows
+        ]
+async def query_spatial(city: str, parameter: str, date: str) -> list[dict]:
+    """Get all spatial data for a given parameter and date."""
+    if not _has_db():
+        return []
+    from sqlalchemy import select, and_
+    async with get_session_factory()() as session:
+        result = await session.execute(
+            select(SatelliteObservation).where(
+                and_(
+                    SatelliteObservation.city == city,
+                    SatelliteObservation.parameter == parameter,
+                    SatelliteObservation.date == date,
+                )
+            )
+        )
+        rows = result.scalars().all()
+        return [{"lat": r.lat, "lng": r.lng, "value": r.value} for r in rows]
+# -- Action Plan CRUD ----------------------------------------------------------
+async def store_action_plan(city: str, plan_json: str, user_id: str = None) -> str:
+    if _has_db():
+        async with get_session_factory()() as session:
+            record = ActionPlanRecord(
+                city=city,
+                plan_json=plan_json,
+                created_by=uuid.UUID(user_id) if user_id else None,
+            )
+            session.add(record)
+            await session.commit()
+            return str(record.id)
+    else:
+        plan_id = str(uuid.uuid4())
+        _plans_mem.append({"id": plan_id, "city": city, "plan": json.loads(plan_json)})
+        return plan_id
+async def get_action_plans(city: str = None) -> list[dict]:
+    if _has_db():
+        from sqlalchemy import select
+        async with get_session_factory()() as session:
+            query = select(ActionPlanRecord).order_by(ActionPlanRecord.created_at.desc())
+            if city:
+                query = query.where(ActionPlanRecord.city == city)
+            result = await session.execute(query)
+            rows = result.scalars().all()
+            return [{"id": str(r.id), "city": r.city, "plan": json.loads(r.plan_json), "created_at": r.created_at.isoformat()} for r in rows]
+    else:
+        return _plans_mem

app/services/farmland_service.py ADDED Viewed

	@@ -0,0 +1,83 @@

+"""
+Farmland Misuse Detection Service.
+Identifies zones where agricultural land shows signs of conversion or abandonment.
+Uses NDVI crop activity scoring to distinguish active farms from idle/converted land.
+"""
+import logging
+import numpy as np
+from collections import defaultdict
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+def analyse(city: str = "Ahmedabad") -> dict:
+    """Detect farmland misuse and abandonment."""
+    ndvi_data = satellite_service._load_data("NDVI")
+    if not ndvi_data:
+        return {"city": city, "error": "No NDVI data available"}
+    # Group NDVI by location
+    location_ts = defaultdict(list)
+    for d in ndvi_data:
+        key = (round(d["lat"], 4), round(d["lng"], 4))
+        location_ts[key].append((d["date"], d["value"]))
+    # Score each location for crop activity
+    try:
+        from app.ml.lstm_predictor import LSTMPredictor
+        predictor = LSTMPredictor(lookback=6)
+    except:
+        predictor = None
+    zones = []
+    suspicious = []
+    for (lat, lng), ts in location_ts.items():
+        ts_sorted = sorted(ts, key=lambda x: x[0])
+        values = [v for _, v in ts_sorted]
+        mean_ndvi = np.mean(values)
+        std_ndvi = np.std(values)
+        # Crop score
+        if predictor:
+            crop_score = predictor.crop_activity_score(ts_sorted)
+        else:
+            crop_score = min(std_ndvi / 0.15, 1.0) * 40 + min(mean_ndvi / 0.25, 1.0) * 30 + 15
+        zone = {
+            "lat": lat,
+            "lng": lng,
+            "mean_ndvi": round(float(mean_ndvi), 4),
+            "std_ndvi": round(float(std_ndvi), 4),
+            "crop_activity_score": round(crop_score, 1),
+            "classification": "active_farmland" if crop_score > 50 else ("idle_land" if crop_score > 25 else "barren_or_converted"),
+        }
+        zones.append(zone)
+        # Flag suspicious: was potentially farmland (some greenness) but low activity
+        if mean_ndvi > 0.12 and crop_score < 30:
+            zone["flag"] = "potential_misuse"
+            suspicious.append(zone)
+    # Cluster suspicious zones
+    cluster_count = 0
+    if len(suspicious) >= 3:
+        from sklearn.cluster import DBSCAN
+        coords = np.array([[z["lat"], z["lng"]] for z in suspicious])
+        clustering = DBSCAN(eps=0.02, min_samples=2).fit(coords)
+        cluster_count = len(set(clustering.labels_)) - (1 if -1 in clustering.labels_ else 0)
+    return {
+        "city": city,
+        "total_zones_analyzed": len(zones),
+        "total_suspicious_zones": len(suspicious),
+        "total_suspicious_area_sqkm": round(len(suspicious) * 1.0, 1),
+        "zones": sorted(zones, key=lambda z: z["crop_activity_score"]),
+        "suspicious_zones": suspicious[:20],
+        "cluster_count": cluster_count,
+        "classifications": {
+            "active_farmland": sum(1 for z in zones if z["classification"] == "active_farmland"),
+            "idle_land": sum(1 for z in zones if z["classification"] == "idle_land"),
+            "barren_or_converted": sum(1 for z in zones if z["classification"] == "barren_or_converted"),
+        },
+    }

app/services/green_gap_service.py ADDED Viewed

	@@ -0,0 +1,155 @@

+"""
+Green Infrastructure Gap Analysis Service.
+Identifies optimal tree plantation sites using NDVI-LST regression.
+"""
+import json
+import logging
+import numpy as np
+from pathlib import Path
+from app.ml.ndvi_lst_regression import NDVILSTRegression
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+SPECIES_MAP = {
+    "critical": "Peepal (Ficus religiosa), Banyan (Ficus benghalensis), Neem (Azadirachta indica)",
+    "high": "Gulmohar (Delonix regia), Rain Tree (Samanea saman), Arjun (Terminalia arjuna)",
+    "moderate": "Jamun (Syzygium cumini), Amla (Phyllanthus emblica), Teak (Tectona grandis)",
+}
+TARGET_NDVI = 0.35
+MIN_NDVI_THRESHOLD = 0.15
+def _get_species(priority_score: float) -> str:
+    if priority_score >= 70:
+        return SPECIES_MAP["critical"]
+    if priority_score >= 40:
+        return SPECIES_MAP["high"]
+    return SPECIES_MAP["moderate"]
+def analyse(city: str = "ahmedabad") -> dict:
+    """Run green infrastructure gap analysis for a city."""
+    # Load spatial data — use latest date from time-series
+    ndvi_data = satellite_service._load_data("NDVI", city)
+    lst_data = satellite_service._load_data("LST", city)
+    if not ndvi_data or not lst_data:
+        return {"city": city, "error": "No NDVI or LST data available"}
+    # Get latest date for spatial snapshot
+    ndvi_dates = sorted(set(d["date"] for d in ndvi_data))
+    lst_dates = sorted(set(d["date"] for d in lst_data))
+    ndvi_latest = ndvi_dates[-1] if ndvi_dates else None
+    lst_latest = lst_dates[-1] if lst_dates else None
+    ndvi_spatial = [d for d in ndvi_data if d["date"] == ndvi_latest]
+    lst_spatial = [d for d in lst_data if d["date"] == lst_latest]
+    # Build coordinate maps (round to 0.01 for matching)
+    ndvi_map = {}
+    for d in ndvi_spatial:
+        key = (round(d["lat"], 2), round(d["lng"], 2))
+        ndvi_map[key] = d["value"]
+    lst_map = {}
+    for d in lst_spatial:
+        key = (round(d["lat"], 2), round(d["lng"], 2))
+        lst_map[key] = d["value"]
+    # Load land use
+    try:
+        lu_change = satellite_service.get_land_use_change(city)
+        land_data = lu_change.get("data_2024", [])
+    except:
+        land_data = []
+    land_map = {}
+    for d in land_data:
+        key = (round(d["lat"], 2), round(d["lng"], 2))
+        land_map[key] = d.get("class_label", "unknown")
+    # Build matched pairs for regression
+    matched_pairs = []
+    for coord, ndvi_val in ndvi_map.items():
+        lst_val = lst_map.get(coord)
+        if lst_val is not None:
+            matched_pairs.append((ndvi_val, lst_val))
+    # Fit regression
+    regression = NDVILSTRegression()
+    regression_stats = regression.fit(matched_pairs)
+    # City statistics
+    all_lst = list(lst_map.values())
+    all_ndvi = list(ndvi_map.values())
+    mean_lst = float(np.mean(all_lst)) if all_lst else 30.0
+    mean_ndvi = float(np.mean(all_ndvi)) if all_ndvi else 0.2
+    # Score candidate cells
+    all_candidates = []
+    # Use all coords from ndvi_map (harmonized grid)
+    for coord in ndvi_map:
+        ndvi_val = ndvi_map.get(coord, 0.0)
+        lst_val = lst_map.get(coord, mean_lst)
+        land_class = land_map.get(coord, "urban")
+        # Skip water and dense vegetation
+        if land_class in ("water", "dense_vegetation"):
+            continue
+        # Only cells with low vegetation AND above-average heat
+        if ndvi_val >= MIN_NDVI_THRESHOLD and lst_val <= mean_lst:
+            continue
+        # Priority score (0-100)
+        heat_score = min(max((lst_val - mean_lst) / 5.0, 0), 1.0) * 50
+        veg_gap = min(max((MIN_NDVI_THRESHOLD - ndvi_val) / MIN_NDVI_THRESHOLD, 0), 1.0) * 30
+        area_score = 20 if land_class in ("urban", "urban_barren") else 10
+        priority = round(heat_score + veg_gap + area_score, 1)
+        cooling = regression.project_cooling(ndvi_val, TARGET_NDVI)
+        severity = "critical" if priority >= 70 else ("high" if priority >= 40 else "moderate")
+        all_candidates.append({
+            "lat": coord[0],
+            "lng": coord[1],
+            "current_ndvi": round(ndvi_val, 4),
+            "current_lst": round(lst_val, 1),
+            "land_class": land_class,
+            "priority_score": priority,
+            "projected_cooling": cooling,
+            "projected_new_lst": round(lst_val - cooling, 1),
+            "recommended_species": _get_species(priority),
+            "severity": severity,
+        })
+    # Sort by priority
+    all_candidates.sort(key=lambda c: c["priority_score"], reverse=True)
+    top_50 = all_candidates[:50]
+    # Summary
+    if top_50:
+        avg_cooling = round(sum(c["projected_cooling"] for c in top_50) / len(top_50), 2)
+        max_cooling = round(max(c["projected_cooling"] for c in top_50), 2)
+        critical_count = sum(1 for c in top_50 if c["severity"] == "critical")
+    else:
+        avg_cooling = 0.0
+        max_cooling = 0.0
+        critical_count = 0
+    return {
+        "city": city,
+        "regression": regression_stats,
+        "city_mean_lst": round(mean_lst, 1),
+        "city_mean_ndvi": round(mean_ndvi, 4),
+        "total_candidate_cells": len(all_candidates),
+        "critical_sites": critical_count,
+        "avg_projected_cooling": avg_cooling,
+        "max_projected_cooling": max_cooling,
+        "top_50_sites": top_50,
+        "all_candidates": all_candidates[:200],
+    }

app/services/health_score_service.py ADDED Viewed

	@@ -0,0 +1,133 @@

+"""
+Environmental Health Score — single 0-100 score per city.
+Weighted composite of all environmental parameters.
+Score interpretation:
+  80-100: Excellent (green)
+  60-79:  Good (blue)
+  40-59:  Moderate (amber)
+  20-39:  Poor (orange)
+  0-19:   Critical (red)
+"""
+import logging
+import numpy as np
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+# Ideal ranges for each parameter (used for scoring)
+PARAM_CONFIG = {
+    "LST": {
+        "weight": 0.25,
+        "ideal_min": 20, "ideal_max": 35,  # comfortable range
+        "danger_min": 10, "danger_max": 50,  # extreme range
+        "invert": True,  # lower is better (within range)
+    },
+    "NDVI": {
+        "weight": 0.25,
+        "ideal_min": 0.3, "ideal_max": 0.8,  # healthy vegetation
+        "danger_min": 0.0, "danger_max": 0.15,
+        "invert": False,  # higher is better
+    },
+    "NO2": {
+        "weight": 0.25,
+        "ideal_min": 0.0, "ideal_max": 0.00005,  # low pollution
+        "danger_min": 0.0, "danger_max": 0.00015,
+        "invert": True,  # lower is better
+    },
+    "SOIL_MOISTURE": {
+        "weight": 0.25,
+        "ideal_min": 0.15, "ideal_max": 0.35,  # healthy range
+        "danger_min": 0.05, "danger_max": 0.45,
+        "invert": False,  # within range is better
+    },
+}
+def _score_parameter(mean_value: float, config: dict) -> float:
+    """Score a single parameter 0-100. Higher is better."""
+    if config.get("invert"):
+        # For LST and NO2 — lower values are better
+        if mean_value <= config["ideal_max"]:
+            return 100.0
+        elif mean_value >= config["danger_max"]:
+            return 0.0
+        else:
+            # Linear interpolation between ideal_max and danger_max
+            range_size = config["danger_max"] - config["ideal_max"]
+            excess = mean_value - config["ideal_max"]
+            return max(0, 100 - (excess / range_size) * 100)
+    else:
+        # For NDVI and Soil Moisture — higher values are better
+        if mean_value >= config["ideal_min"]:
+            return min(100, (mean_value / config["ideal_max"]) * 100)
+        elif mean_value <= config["danger_max"]:
+            return max(0, (mean_value / config["ideal_min"]) * 100)
+        else:
+            return 50.0
+def _get_grade(score: float) -> dict:
+    """Get letter grade and color for a score."""
+    if score >= 80:
+        return {"grade": "A", "label": "Excellent", "color": "#10B981"}
+    elif score >= 60:
+        return {"grade": "B", "label": "Good", "color": "#3B82F6"}
+    elif score >= 40:
+        return {"grade": "C", "label": "Moderate", "color": "#F59E0B"}
+    elif score >= 20:
+        return {"grade": "D", "label": "Poor", "color": "#F97316"}
+    else:
+        return {"grade": "F", "label": "Critical", "color": "#EF4444"}
+def calculate(city: str = "ahmedabad") -> dict:
+    """Calculate Environmental Health Score for a city."""
+    param_scores = {}
+    param_details = []
+    for param_id, config in PARAM_CONFIG.items():
+        try:
+            stats = satellite_service.get_statistics(param_id, city)
+            mean_val = stats.get("mean", 0)
+            score = round(_score_parameter(mean_val, config), 1)
+            param_scores[param_id] = score
+            grade_info = _get_grade(score)
+            param_details.append({
+                "parameter": param_id,
+                "name": satellite_service.PARAMETERS.get(param_id, {}).get("name", param_id),
+                "mean_value": round(mean_val, 4),
+                "unit": stats.get("unit", ""),
+                "score": score,
+                "weight": config["weight"],
+                "weighted_score": round(score * config["weight"], 1),
+                "grade": grade_info["grade"],
+                "label": grade_info["label"],
+                "color": grade_info["color"],
+            })
+        except Exception as e:
+            logger.warning(f"Could not score {param_id} for {city}: {e}")
+            param_scores[param_id] = 50.0  # neutral fallback
+            param_details.append({
+                "parameter": param_id, "score": 50.0, "grade": "C",
+                "label": "No data", "color": "#94A3B8", "weight": config["weight"],
+                "weighted_score": 50.0 * config["weight"],
+            })
+    # Weighted composite score
+    total_score = round(sum(d["weighted_score"] for d in param_details), 1)
+    overall_grade = _get_grade(total_score)
+    return {
+        "city": city,
+        "overall_score": total_score,
+        "overall_grade": overall_grade["grade"],
+        "overall_label": overall_grade["label"],
+        "overall_color": overall_grade["color"],
+        "parameter_scores": param_details,
+        "interpretation": (
+            f"{city.title()} scores {total_score}/100 — rated '{overall_grade['label']}'. "
+            f"{'Immediate intervention recommended.' if total_score < 40 else 'Monitoring recommended.' if total_score < 60 else 'Environment is in acceptable condition.'}"
+        ),
+    }

app/services/heat_service.py ADDED Viewed

	@@ -0,0 +1,84 @@

+"""
+Urban Heat Island Analysis Service.
+Calculates UHI intensity, identifies heat clusters, and ranks zones by temperature.
+"""
+import logging
+import numpy as np
+from collections import defaultdict
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+# Approximate Ahmedabad zones
+ZONE_MAPPING = {
+    "City Core": {"lat_range": (23.00, 23.06), "lng_range": (72.53, 72.62)},
+    "Industrial East": {"lat_range": (22.95, 23.00), "lng_range": (72.60, 72.70)},
+    "Western Suburbs": {"lat_range": (23.00, 23.06), "lng_range": (72.45, 72.53)},
+    "North": {"lat_range": (23.06, 23.12), "lng_range": (72.50, 72.65)},
+    "South": {"lat_range": (22.95, 23.00), "lng_range": (72.50, 72.60)},
+}
+def _get_zone(lat, lng):
+    for name, bounds in ZONE_MAPPING.items():
+        if bounds["lat_range"][0] <= lat <= bounds["lat_range"][1] and bounds["lng_range"][0] <= lng <= bounds["lng_range"][1]:
+            return name
+    return "Periphery"
+def analyse(city: str = "Ahmedabad") -> dict:
+    """Run Urban Heat Island analysis."""
+    lst_data = satellite_service._load_data("LST")
+    if not lst_data:
+        return {"city": city, "error": "No LST data available"}
+    # Group by zone
+    zone_temps = defaultdict(list)
+    all_temps = []
+    for d in lst_data:
+        zone = _get_zone(d["lat"], d["lng"])
+        zone_temps[zone].append(d["value"])
+        all_temps.append(d["value"])
+    # UHI intensity: urban core avg - periphery avg
+    core_temps = zone_temps.get("City Core", []) + zone_temps.get("Industrial East", [])
+    fringe_temps = zone_temps.get("Western Suburbs", []) + zone_temps.get("Periphery", [])
+    core_avg = np.mean(core_temps) if core_temps else 0
+    fringe_avg = np.mean(fringe_temps) if fringe_temps else 0
+    uhi_intensity = round(float(core_avg - fringe_avg), 2)
+    # Zone rankings
+    zone_rankings = []
+    for zone_name, temps in zone_temps.items():
+        zone_rankings.append({
+            "zone": zone_name,
+            "avg_temp": round(float(np.mean(temps)), 1),
+            "max_temp": round(float(np.max(temps)), 1),
+            "min_temp": round(float(np.min(temps)), 1),
+            "readings": len(temps),
+        })
+    zone_rankings.sort(key=lambda z: z["avg_temp"], reverse=True)
+    # Anomalies and hotspots
+    from app.services import ml_service
+    anomaly_result = ml_service.detect_anomalies("LST", city)
+    hotspot_result = ml_service.find_hotspots("LST", city)
+    # Peak temperature
+    peak_temp = round(float(np.max(all_temps)), 1)
+    city_avg = round(float(np.mean(all_temps)), 1)
+    return {
+        "city": city,
+        "uhi_intensity_celsius": uhi_intensity,
+        "peak_temp": peak_temp,
+        "city_avg_temp": city_avg,
+        "urban_avg": round(float(core_avg), 1),
+        "fringe_avg": round(float(fringe_avg), 1),
+        "zone_rankings": zone_rankings,
+        "anomaly_count": anomaly_result.get("anomaly_count", 0),
+        "anomaly_events": anomaly_result.get("anomalies", [])[:10],
+        "hotspot_clusters": hotspot_result.get("hotspots", []),
+        "hotspot_count": hotspot_result.get("cluster_count", 0),
+    }

app/services/land_conversion_service.py ADDED Viewed

	@@ -0,0 +1,81 @@

+"""
+Land Conversion Detection Service.
+Analyzes land use change between 2020 and 2024, identifies conversion patterns.
+"""
+import json
+import logging
+from pathlib import Path
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+CLASS_NAMES = {0: "water", 1: "urban", 2: "sparse_vegetation", 3: "dense_vegetation"}
+def analyse(city: str = "Ahmedabad") -> dict:
+    """Detect and classify land use conversions."""
+    try:
+        lu_change = satellite_service.get_land_use_change(city)
+    except:
+        return {"city": city, "error": "No land use data available"}
+    data_2020 = lu_change.get("data_2020", [])
+    data_2024 = lu_change.get("data_2024", [])
+    change_summary = lu_change.get("change_summary", {})
+    if not data_2020 or not data_2024:
+        return {"city": city, "error": "Incomplete land use data"}
+    # Build grid lookup for 2020
+    grid_2020 = {}
+    for d in data_2020:
+        key = (round(d["lat"], 3), round(d["lng"], 3))
+        grid_2020[key] = d.get("value", d.get("class_id", -1))
+    # Compare each 2024 cell to its 2020 value
+    conversions = {}
+    changed_cells = []
+    for d in data_2024:
+        key = (round(d["lat"], 3), round(d["lng"], 3))
+        old_class = grid_2020.get(key)
+        new_class = d.get("value", d.get("class_id", -1))
+        if old_class is not None and old_class != new_class:
+            old_name = CLASS_NAMES.get(int(old_class), "unknown")
+            new_name = CLASS_NAMES.get(int(new_class), "unknown")
+            conv_key = f"{old_name}_to_{new_name}"
+            conversions[conv_key] = conversions.get(conv_key, 0) + 1
+            changed_cells.append({
+                "lat": d["lat"], "lng": d["lng"],
+                "from": old_name, "to": new_name,
+                "from_class": int(old_class), "to_class": int(new_class),
+            })
+    # Flag rapid/suspicious conversions (vegetation to urban)
+    rapid = [c for c in changed_cells if "vegetation" in c["from"] and c["to"] == "urban"]
+    # Cluster the changed cells
+    from app.services import ml_service
+    if changed_cells:
+        from sklearn.cluster import DBSCAN
+        import numpy as np
+        coords = np.array([[c["lat"], c["lng"]] for c in changed_cells])
+        clustering = DBSCAN(eps=0.02, min_samples=2).fit(coords)
+        n_clusters = len(set(clustering.labels_)) - (1 if -1 in clustering.labels_ else 0)
+    else:
+        n_clusters = 0
+    total_area = round(len(changed_cells) * 1.0, 1)
+    return {
+        "city": city,
+        "year_from": 2020,
+        "year_to": 2024,
+        "total_cells_changed": len(changed_cells),
+        "total_area_sqkm": total_area,
+        "conversion_breakdown": conversions,
+        "rapid_conversions": len(rapid),
+        "rapid_conversion_cells": rapid[:20],
+        "cluster_count": n_clusters,
+        "change_summary": change_summary,
+    }

app/services/ml_service.py ADDED Viewed

	@@ -0,0 +1,399 @@

+"""
+ML Analytics Service — anomaly detection, trend prediction, hotspot clustering.
+Uses scikit-learn (Isolation Forest, DBSCAN) and statsmodels (ARIMA).
+"""
+import logging
+import numpy as np
+import pandas as pd
+from typing import Optional
+from sklearn.ensemble import IsolationForest
+from sklearn.cluster import DBSCAN
+from collections import defaultdict
+logger = logging.getLogger(__name__)
+# ── ML Result Cache ──────────────────────────────────────
+_ml_cache: dict = {}
+_file_cache_loaded: set = set()
+def _cache_key(fn_name: str, parameter: str, city: str) -> str:
+    return f"{fn_name}:{city.lower()}:{parameter}"
+def _get_cached(fn_name: str, parameter: str, city: str):
+    key = _cache_key(fn_name, parameter, city)
+    # 1. Memory cache (fastest)
+    result = _ml_cache.get(key)
+    if result:
+        return result
+    # 2. Redis cache (persists across restarts)
+    try:
+        from app.services import cache_service
+        redis_result = cache_service.get(f"ml:{key}")
+        if redis_result:
+            _ml_cache[key] = redis_result  # promote to memory
+            return redis_result
+    except Exception:
+        pass
+    # 3. File cache (legacy fallback)
+    city_key = city.lower()
+    if city_key not in _file_cache_loaded:
+        _load_file_cache(city_key)
+    return _ml_cache.get(key)
+def _set_cached(fn_name: str, parameter: str, city: str, result):
+    key = _cache_key(fn_name, parameter, city)
+    _ml_cache[key] = result
+    # Persist to Redis (24h TTL)
+    try:
+        from app.services import cache_service
+        cache_service.set(f"ml:{key}", result, ttl=86400)
+    except Exception:
+        pass
+    return result
+def _load_file_cache(city: str):
+    """Load pre-computed ML results from JSON file if available."""
+    import json
+    from pathlib import Path
+    from app.services.satellite_service import DATA_BASE
+    cache_file = DATA_BASE / city / "ml_results_cache.json"
+    if cache_file.exists():
+        try:
+            with open(cache_file) as f:
+                results = json.load(f)
+            for param, data in results.items():
+                if "anomalies" in data:
+                    _ml_cache[_cache_key("anomalies", param, city)] = data["anomalies"]
+                if "trends" in data:
+                    _ml_cache[_cache_key("trends", param, city)] = data["trends"]
+                if "hotspots" in data:
+                    _ml_cache[_cache_key("hotspots", param, city)] = data["hotspots"]
+            logger.info(f"Loaded pre-computed ML results for {city} ({len(results)} params)")
+        except Exception as e:
+            logger.warning(f"Failed to load ML cache for {city}: {e}")
+    _file_cache_loaded.add(city)
+def _load_parameter_data(parameter: str, city: str = "ahmedabad") -> list[dict]:
+    """Load data from satellite service."""
+    from app.services import satellite_service
+    return satellite_service._load_data(parameter, city)
+def detect_anomalies(parameter: str, city: str = "Ahmedabad", contamination: float = 0.08) -> dict:
+    """
+    Detect anomalies using Isolation Forest on DATE-AGGREGATED data.
+    Instead of running on 225K individual points (slow, too many results),
+    we aggregate by date → ~43 time-series points → fast, meaningful anomalies.
+    Only returns critical + high severity (no moderate noise).
+    """
+    cached = _get_cached("anomalies", parameter, city)
+    if cached:
+        return cached
+    data = _load_parameter_data(parameter, city)
+    if not data or len(data) < 10:
+        return {"anomalies": [], "total_points": 0, "anomaly_count": 0}
+    # Aggregate by date — city-wide mean per date
+    date_values = defaultdict(list)
+    date_points = defaultdict(list)  # keep sample lat/lng per date
+    for d in data:
+        date_values[d["date"]].append(d["value"])
+        date_points[d["date"]].append((d["lat"], d["lng"]))
+    dates = sorted(date_values.keys())
+    means = np.array([np.mean(date_values[d]) for d in dates]).reshape(-1, 1)
+    if len(means) < 5:
+        return _set_cached("anomalies", parameter, city, {
+            "anomalies": [], "total_points": len(data), "anomaly_count": 0
+        })
+    # Run Isolation Forest on aggregated time-series (~43 points, very fast)
+    model = IsolationForest(contamination=contamination, random_state=42, n_estimators=100)
+    predictions = model.fit_predict(means)
+    scores = model.decision_function(means)
+    overall_mean = float(np.mean(means))
+    overall_std = float(np.std(means)) if np.std(means) > 0 else 1.0
+    # Description templates per parameter and direction
+    DESCRIPTIONS = {
+        "LST": {
+            "high_up": "Extreme heat event — surface temperature significantly above seasonal average. Indicates heat wave conditions, increased energy demand, and heat stress risk.",
+            "high_down": "Unusual cold event — surface temperature dropped well below expected range. May indicate weather anomaly or sensor calibration event.",
+            "moderate_up": "Above-normal surface temperature detected. Mild heat stress — monitor for sustained trends.",
+            "moderate_down": "Below-normal surface temperature. Unusual for this period — possible weather system influence.",
+        },
+        "NDVI": {
+            "high_up": "Sudden vegetation surge — NDVI spiked above normal. Likely post-monsoon rapid growth or irrigation activity.",
+            "high_down": "Severe vegetation loss — NDVI dropped sharply. Possible deforestation, fire damage, or drought stress event.",
+            "moderate_up": "Slightly elevated vegetation index. Green cover above seasonal baseline.",
+            "moderate_down": "Mild vegetation decline detected. Early indicator of stress — recommend monitoring.",
+        },
+        "NO2": {
+            "high_up": "Pollution spike — NO2 concentration significantly elevated. Likely industrial emission event, traffic surge, or atmospheric inversion trapping pollutants.",
+            "high_down": "Unusually clean air — NO2 well below normal. Possible rainfall washout, holiday period, or industrial shutdown.",
+            "moderate_up": "Above-average NO2 levels. Gradual air quality degradation — check industrial and traffic sources.",
+            "moderate_down": "Slightly below-normal NO2. Minor air quality improvement detected.",
+        },
+        "SOIL_MOISTURE": {
+            "high_up": "Soil moisture spike — possible flooding, heavy rainfall, or irrigation event. Check drainage systems.",
+            "high_down": "Severe soil moisture deficit — drought conditions developing. Agricultural stress and groundwater depletion risk.",
+            "moderate_up": "Above-average soil moisture. Favorable for agriculture but monitor for waterlogging.",
+            "moderate_down": "Slightly dry conditions. Early drought indicator — recommend water conservation measures.",
+        },
+    }
+    def _get_description(param, severity, is_above):
+        templates = DESCRIPTIONS.get(param, DESCRIPTIONS["LST"])
+        direction = "up" if is_above else "down"
+        key = f"{'high' if severity in ('critical', 'high') else 'moderate'}_{direction}"
+        return templates.get(key, f"Anomalous {param} value detected — deviates significantly from baseline.")
+    anomaly_list = []
+    for i, date in enumerate(dates):
+        if predictions[i] == -1:
+            score = float(scores[i])
+            severity = "critical" if score < -0.3 else ("high" if score < -0.15 else "moderate")
+            mean_val = float(means[i][0])
+            deviation = round(abs(mean_val - overall_mean) / overall_std, 2)
+            is_above = mean_val > overall_mean
+            # Pick the most extreme point for this date as representative location
+            pts = date_points[date]
+            vals = date_values[date]
+            extreme_idx = np.argmax(np.abs(np.array(vals) - overall_mean))
+            anomaly_list.append({
+                "date": date,
+                "lat": round(float(pts[extreme_idx][0]), 4),
+                "lng": round(float(pts[extreme_idx][1]), 4),
+                "value": round(mean_val, 4),
+                "severity": severity,
+                "anomaly_score": round(score, 4),
+                "deviation": deviation,
+                "direction": "above" if is_above else "below",
+                "description": _get_description(parameter, severity, is_above),
+                "parameter": parameter,
+            })
+    # Sort: critical first, then high, then moderate
+    severity_order = {"critical": 0, "high": 1, "moderate": 2}
+    anomaly_list.sort(key=lambda a: (severity_order.get(a["severity"], 3), a["anomaly_score"]))
+    return _set_cached("anomalies", parameter, city, {
+        "parameter": parameter,
+        "city": city,
+        "anomalies": anomaly_list,
+        "total_points": len(data),
+        "dates_analyzed": len(dates),
+        "anomaly_count": len(anomaly_list),
+        "contamination": contamination,
+    })
+def predict_trend(parameter: str, city: str = "Ahmedabad", forecast_days: int = 30) -> dict:
+    """Predict trends using ARIMA. Results are cached."""
+    cached = _get_cached("trends", parameter, city)
+    if cached:
+        return cached
+    data = _load_parameter_data(parameter, city)
+    if not data:
+        return {"historical": {}, "forecast": {}, "trend_direction": "unknown"}
+    # Aggregate by date
+    date_values = defaultdict(list)
+    for d in data:
+        date_values[d["date"]].append(d["value"])
+    timeseries = {
+        date: round(sum(vals) / len(vals), 4)
+        for date, vals in sorted(date_values.items())
+    }
+    if len(timeseries) < 10:
+        return {"historical": timeseries, "forecast": {}, "trend_direction": "insufficient_data"}
+    try:
+        from statsmodels.tsa.arima.model import ARIMA
+        df = pd.Series(list(timeseries.values()), index=pd.to_datetime(list(timeseries.keys())))
+        df = df.sort_index()
+        # Fit ARIMA model
+        model = ARIMA(df, order=(2, 1, 1))
+        fitted = model.fit()
+        # Forecast
+        forecast_result = fitted.forecast(steps=forecast_days)
+        forecast_dates = pd.date_range(start=df.index[-1] + pd.Timedelta(days=1), periods=forecast_days)
+        forecast = {
+            str(date.date()): round(float(val), 4)
+            for date, val in zip(forecast_dates, forecast_result)
+        }
+        # Determine trend direction
+        last_historical = df.iloc[-1]
+        last_forecast = forecast_result.iloc[-1] if len(forecast_result) > 0 else last_historical
+        trend = "increasing" if last_forecast > last_historical else "decreasing"
+        return _set_cached("trends", parameter, city, {
+            "parameter": parameter,
+            "city": city,
+            "historical": timeseries,
+            "forecast": forecast,
+            "trend_direction": trend,
+            "model": "ARIMA(2,1,1)",
+            "forecast_days": forecast_days,
+        })
+    except Exception as e:
+        logger.warning(f"ARIMA failed for {parameter}: {e}. Using linear fallback.")
+        dates = list(timeseries.keys())
+        values = list(timeseries.values())
+        n = len(values)
+        if n >= 2:
+            slope = (values[-1] - values[0]) / n
+            last_val = values[-1]
+            forecast = {}
+            last_date = pd.to_datetime(dates[-1])
+            for i in range(1, forecast_days + 1):
+                fdate = last_date + pd.Timedelta(days=i)
+                forecast[str(fdate.date())] = round(last_val + slope * i, 4)
+            trend = "increasing" if slope > 0 else "decreasing"
+        else:
+            forecast = {}
+            trend = "unknown"
+        return _set_cached("trends", parameter, city, {
+            "parameter": parameter,
+            "city": city,
+            "historical": timeseries,
+            "forecast": forecast,
+            "trend_direction": trend,
+            "model": "linear_fallback",
+            "forecast_days": forecast_days,
+        })
+def find_hotspots(parameter: str, city: str = "Ahmedabad", eps: float = 0.02, min_samples: int = 2) -> dict:
+    """Identify geographic clusters of extreme values using DBSCAN. Results are cached."""
+    cached = _get_cached("hotspots", parameter, city)
+    if cached:
+        return cached
+    data = _load_parameter_data(parameter, city)
+    if not data:
+        return {"hotspots": [], "total_points": 0}
+    # Use latest available date for spatial clustering
+    dates = sorted(set(d["date"] for d in data))
+    # Use all data for more robust clustering
+    df = pd.DataFrame(data)
+    # Get high-value points (top 25th percentile)
+    threshold = df["value"].quantile(0.75)
+    # For NDVI, low values are concerning (stressed vegetation)
+    if parameter == "NDVI":
+        hot_mask = df["value"] <= df["value"].quantile(0.25)
+    else:
+        hot_mask = df["value"] >= threshold
+    hot_df = df[hot_mask]
+    if len(hot_df) < min_samples:
+        return {"hotspots": [], "total_points": len(df), "threshold": float(threshold)}
+    coords = hot_df[["lat", "lng"]].values
+    clustering = DBSCAN(eps=eps, min_samples=min_samples).fit(coords)
+    hot_df = hot_df.copy()
+    hot_df["cluster"] = clustering.labels_
+    hotspots = []
+    for label in sorted(set(clustering.labels_)):
+        if label == -1:
+            continue
+        cluster_points = hot_df[hot_df["cluster"] == label]
+        center_lat = float(cluster_points["lat"].mean())
+        center_lng = float(cluster_points["lng"].mean())
+        avg_value = float(cluster_points["value"].mean())
+        num_points = len(cluster_points)
+        severity = "critical" if num_points >= 8 else ("high" if num_points >= 4 else "moderate")
+        hotspots.append({
+            "cluster_id": int(label),
+            "center_lat": round(center_lat, 4),
+            "center_lng": round(center_lng, 4),
+            "avg_value": round(avg_value, 4),
+            "num_points": num_points,
+            "severity": severity,
+            "parameter": parameter,
+            "radius_km": round(eps * 111, 1),  # Approximate km from degrees
+        })
+    return _set_cached("hotspots", parameter, city, {
+        "parameter": parameter,
+        "city": city,
+        "hotspots": hotspots,
+        "total_points": len(df),
+        "hot_points": len(hot_df),
+        "cluster_count": len(hotspots),
+        "threshold": round(float(threshold), 4),
+    })
+_summary_cache: dict = {}
+def get_city_summary(city: str = "Ahmedabad") -> dict:
+    """Get comprehensive analytics summary for a city. Cached in memory + Redis."""
+    cache_key = city.lower()
+    if cache_key in _summary_cache:
+        return _summary_cache[cache_key]
+    # Try Redis
+    try:
+        from app.services import cache_service
+        redis_result = cache_service.get(f"summary:{cache_key}")
+        if redis_result:
+            _summary_cache[cache_key] = redis_result
+            return redis_result
+    except Exception:
+        pass
+    from app.services import satellite_service
+    summary = {"city": city, "parameters": {}}
+    for param_id in ["LST", "NDVI", "NO2", "SOIL_MOISTURE"]:
+        try:
+            stats = satellite_service.get_statistics(param_id, city)
+            anomaly_result = detect_anomalies(param_id, city)
+            hotspot_result = find_hotspots(param_id, city)
+            summary["parameters"][param_id] = {
+                "statistics": stats,
+                "anomaly_count": anomaly_result.get("anomaly_count", 0),
+                "hotspot_count": hotspot_result.get("cluster_count", 0),
+                "top_anomalies": anomaly_result.get("anomalies", [])[:3],
+                "top_hotspots": hotspot_result.get("hotspots", [])[:3],
+            }
+        except Exception as e:
+            logger.error(f"Error computing summary for {param_id}: {e}")
+            summary["parameters"][param_id] = {"error": str(e)}
+    _summary_cache[cache_key] = summary
+    try:
+        from app.services import cache_service
+        cache_service.set(f"summary:{cache_key}", summary, ttl=86400)
+    except Exception:
+        pass
+    return summary

app/services/satellite_service.py ADDED Viewed

	@@ -0,0 +1,403 @@

+"""
+Satellite Data Service — loads pre-fetched data from JSON files.
+Falls back to file-based data for hackathon demo. Can be swapped to GEE live queries.
+"""
+import json
+import os
+import logging
+from pathlib import Path
+from typing import Optional
+logger = logging.getLogger(__name__)
+# Base path to pre-fetched data (DATA_DIR env var for Docker/HF Spaces, fallback for local dev)
+DATA_BASE = Path(os.environ.get("DATA_DIR", Path(__file__).resolve().parent.parent.parent.parent / "data"))
+def _get_data_dir(city: str = "ahmedabad") -> Path:
+    """Get data directory for a city."""
+    return DATA_BASE / city.lower()
+# Ahmedabad constants
+AHMEDABAD_CENTER = [23.0225, 72.5714]
+AHMEDABAD_BBOX = {"min_lat": 22.95, "max_lat": 23.10, "min_lng": 72.45, "max_lng": 72.70}
+# Parameter metadata
+PARAMETERS = {
+    "LST": {
+        "id": "LST",
+        "name": "Land Surface Temperature",
+        "unit": "°C",
+        "source": "MODIS Terra (MOD11A2)",
+        "resolution": "1km",
+        "frequency": "8-day composite",
+        "file": "lst_timeseries.json",
+        "color": "#EF4444",
+        "description": "Surface temperature from MODIS thermal infrared bands",
+    },
+    "NDVI": {
+        "id": "NDVI",
+        "name": "Vegetation Index (NDVI)",
+        "unit": "index",
+        "source": "MODIS (MOD13A2)",
+        "resolution": "1km",
+        "frequency": "16-day composite",
+        "file": "ndvi_timeseries.json",
+        "color": "#10B981",
+        "description": "Normalized Difference Vegetation Index — green cover health",
+    },
+    "NO2": {
+        "id": "NO2",
+        "name": "Nitrogen Dioxide (NO₂)",
+        "unit": "mol/m²",
+        "source": "Sentinel-5P TROPOMI",
+        "resolution": "7km",
+        "frequency": "Daily",
+        "file": "no2_timeseries.json",
+        "color": "#8B5CF6",
+        "description": "Tropospheric NO₂ column density — air pollution indicator",
+    },
+    "SOIL_MOISTURE": {
+        "id": "SOIL_MOISTURE",
+        "name": "Soil Moisture",
+        "unit": "m³/m³",
+        "source": "NASA SMAP (SPL3SMP_E)",
+        "resolution": "9km",
+        "frequency": "Daily",
+        "file": "soil_moisture.json",
+        "color": "#3B82F6",
+        "description": "Surface soil moisture from L-band radiometer",
+    },
+    "SO2": {
+        "id": "SO2",
+        "name": "Sulfur Dioxide (SO₂)",
+        "unit": "mol/m²",
+        "source": "Sentinel-5P TROPOMI",
+        "resolution": "7km",
+        "frequency": "Monthly composite",
+        "file": "so2_timeseries.json",
+        "color": "#F59E0B",
+        "description": "SO₂ column density — industrial emission indicator",
+    },
+    "CO": {
+        "id": "CO",
+        "name": "Carbon Monoxide (CO)",
+        "unit": "mol/m²",
+        "source": "Sentinel-5P TROPOMI",
+        "resolution": "7km",
+        "frequency": "Monthly composite",
+        "file": "co_timeseries.json",
+        "color": "#DC2626",
+        "description": "CO column density — combustion/traffic pollution indicator",
+    },
+    "O3": {
+        "id": "O3",
+        "name": "Ozone (O₃)",
+        "unit": "mol/m²",
+        "source": "Sentinel-5P TROPOMI",
+        "resolution": "7km",
+        "frequency": "Monthly composite",
+        "file": "o3_timeseries.json",
+        "color": "#2563EB",
+        "description": "Total ozone column density — UV protection and smog indicator",
+    },
+    "AEROSOL": {
+        "id": "AEROSOL",
+        "name": "Aerosol Index (UV AI)",
+        "unit": "index",
+        "source": "Sentinel-5P TROPOMI",
+        "resolution": "7km",
+        "frequency": "Monthly composite",
+        "file": "aerosol_timeseries.json",
+        "color": "#92400E",
+        "description": "UV Aerosol Index — PM2.5/dust/haze proxy",
+    },
+    "LAND_USE": {
+        "id": "LAND_USE",
+        "name": "Land Use Classification",
+        "unit": "class",
+        "source": "Landsat 8/9 (USGS/NASA)",
+        "resolution": "30m (aggregated to 1km)",
+        "frequency": "Annual composite",
+        "file": "land_use_2024.json",
+        "color": "#6B7280",
+        "description": "NDVI-based land classification: water, urban, sparse vegetation, dense vegetation",
+    },
+}
+# Cache: raw + harmonized
+_raw_cache: dict = {}
+_data_cache: dict = {}  # harmonized
+def _load_raw(parameter: str, city: str = "ahmedabad") -> list[dict]:
+    """Load raw JSON data without harmonization. Auto-generates if city not found."""
+    # Auto-generate data for cities without pre-fetched GEE data
+    from app.utils.city_generator import ensure_city_data
+    ensure_city_data(city)
+    cache_key = f"{city.lower()}:{parameter}"
+    if cache_key in _raw_cache:
+        return _raw_cache[cache_key]
+    meta = PARAMETERS.get(parameter)
+    if not meta:
+        raise ValueError(f"Unknown parameter: {parameter}")
+    filepath = _get_data_dir(city) / meta["file"]
+    if not filepath.exists():
+        logger.warning(f"Data file not found: {filepath}")
+        return []
+    with open(filepath, "r") as f:
+        data = json.load(f)
+    _raw_cache[cache_key] = data
+    return data
+def _load_data(parameter: str, city: str = "ahmedabad") -> list[dict]:
+    """Load data harmonized to the common 1km grid.
+    Raw satellite data comes on different grids:
+      MODIS (LST, NDVI): 1km native
+      Sentinel-5P (NO2, SO2, CO, O3, Aerosol): ~7km native
+      SMAP (Soil Moisture): ~9km native
+      Landsat (Land Use): 30m aggregated
+    This function resamples everything to a uniform 0.01° (~1.1km) grid
+    using Inverse Distance Weighting interpolation so all parameters
+    can be overlaid and compared pixel-by-pixel.
+    """
+    cache_key = f"{city.lower()}:{parameter}:harmonized"
+    if cache_key in _data_cache:
+        return _data_cache[cache_key]
+    # Skip harmonization for land use (categorical data — can't interpolate classes)
+    if parameter == "LAND_USE":
+        raw_data = _load_raw(parameter, city)
+        _data_cache[cache_key] = raw_data
+        return raw_data
+    # Try loading pre-harmonized file first (instant, ~0.01s)
+    harmonized_file = _get_data_dir(city) / f"{parameter.lower()}_harmonized.json"
+    if harmonized_file.exists():
+        with open(harmonized_file, "r") as f:
+            harmonized = json.load(f)
+        _data_cache[cache_key] = harmonized
+        logger.info(f"Loaded pre-harmonized {parameter}/{city}: {len(harmonized)} points (instant)")
+        return harmonized
+    # Fall back to live IDW harmonization (slow, ~12s per param)
+    raw_data = _load_raw(parameter, city)
+    if not raw_data:
+        return []
+    from app.utils.geo_helpers import harmonize_timeseries
+    harmonized = harmonize_timeseries(raw_data, city=city, parameter=parameter)
+    if harmonized:
+        _data_cache[cache_key] = harmonized
+        logger.info(
+            f"Harmonized {parameter}/{city}: {len(raw_data)} raw -> {len(harmonized)} grid points (1km)"
+        )
+    else:
+        # Fallback to raw if harmonization yields nothing
+        _data_cache[cache_key] = raw_data
+        logger.warning(f"Harmonization empty for {parameter}/{city}, using raw data")
+    return _data_cache[cache_key]
+def get_available_parameters() -> list[dict]:
+    """Return list of available satellite parameters."""
+    return [
+        {
+            "id": p["id"],
+            "name": p["name"],
+            "unit": p["unit"],
+            "source": p["source"],
+            "resolution": p["resolution"],
+            "frequency": p["frequency"],
+            "color": p["color"],
+            "description": p["description"],
+        }
+        for p in PARAMETERS.values()
+    ]
+def fetch_satellite_data(city: str, parameters: list[str], date_range: dict) -> dict:
+    """Fetch satellite data for given parameters. Uses pre-fetched files."""
+    result = {}
+    for param in parameters:
+        data = _load_data(param, city)
+        # Filter by date range if provided
+        start = date_range.get("start_date", "2023-01-01")
+        end = date_range.get("end_date", "2024-12-31")
+        filtered = [d for d in data if start <= d.get("date", "") <= end]
+        result[param] = {
+            "data": filtered,
+            "count": len(filtered),
+            "metadata": PARAMETERS.get(param, {}),
+        }
+    return {"city": city, "parameters": result}
+def get_timeseries(parameter: str, city: str = "ahmedabad") -> dict:
+    """Get time-series data for a single parameter."""
+    data = _load_data(parameter, city)
+    # Aggregate by date (average across spatial points)
+    from collections import defaultdict
+    date_values = defaultdict(list)
+    for d in data:
+        date_values[d["date"]].append(d["value"])
+    timeseries = [
+        {"date": date, "value": round(sum(vals) / len(vals), 4)}
+        for date, vals in sorted(date_values.items())
+    ]
+    return {
+        "parameter": parameter,
+        "city": city,
+        "timeseries": timeseries,
+        "metadata": PARAMETERS.get(parameter, {}),
+    }
+def get_heatmap_data(parameter: str, city: str = "ahmedabad") -> dict:
+    """Get spatial data formatted for heatmap rendering."""
+    data = _load_data(parameter, city)
+    if not data:
+        return {"points": [], "parameter": parameter, "min_value": 0, "max_value": 0}
+    # Use latest date's data for heatmap
+    dates = sorted(set(d["date"] for d in data))
+    latest_date = dates[-1] if dates else None
+    if latest_date:
+        spatial = [d for d in data if d["date"] == latest_date]
+    else:
+        spatial = data[:50]
+    values = [d["value"] for d in spatial]
+    min_val = min(values) if values else 0
+    max_val = max(values) if values else 0
+    val_range = max_val - min_val if max_val != min_val else 1
+    # Format: [[lat, lng, intensity(0-1)], ...]
+    points = [
+        [d["lat"], d["lng"], round((d["value"] - min_val) / val_range, 4)]
+        for d in spatial
+    ]
+    return {
+        "points": points,
+        "parameter": parameter,
+        "city": city,
+        "date": latest_date,
+        "min_value": round(min_val, 4),
+        "max_value": round(max_val, 4),
+        "raw_points": [
+            {"lat": d["lat"], "lng": d["lng"], "value": round(d["value"], 4)}
+            for d in spatial
+        ],
+    }
+def get_all_layers(city: str = "ahmedabad") -> list[dict]:
+    """Get all available map layers with their data."""
+    layers = []
+    for param_id, meta in PARAMETERS.items():
+        heatmap = get_heatmap_data(param_id, city)
+        layers.append(
+            {
+                "id": param_id.lower(),
+                "label": meta["name"],
+                "type": "heatmap",
+                "color": meta["color"],
+                "enabled": param_id in ("LST", "NDVI"),
+                "data": heatmap,
+            }
+        )
+    return layers
+def get_spatial_data(parameter: str, date: Optional[str] = None, city: str = "ahmedabad") -> list[dict]:
+    """Get spatial data points for a parameter, optionally filtered by date."""
+    data = _load_data(parameter, city)
+    if date:
+        return [d for d in data if d["date"] == date]
+    # Return latest date
+    dates = sorted(set(d["date"] for d in data))
+    if dates:
+        latest = dates[-1]
+        return [d for d in data if d["date"] == latest]
+    return data
+def get_statistics(parameter: str, city: str = "ahmedabad") -> dict:
+    """Compute basic statistics for a parameter."""
+    data = _load_data(parameter, city)
+    if not data:
+        return {}
+    values = [d["value"] for d in data]
+    import numpy as np
+    arr = np.array(values)
+    return {
+        "parameter": parameter,
+        "count": len(values),
+        "mean": round(float(np.mean(arr)), 4),
+        "std": round(float(np.std(arr)), 4),
+        "min": round(float(np.min(arr)), 4),
+        "max": round(float(np.max(arr)), 4),
+        "median": round(float(np.median(arr)), 4),
+        "unit": PARAMETERS[parameter]["unit"],
+    }
+def get_land_use_change(city: str = "ahmedabad") -> dict:
+    """Compare land use between 2020 and 2024 to show urban sprawl."""
+    data_dir = _get_data_dir(city)
+    file_2020 = data_dir / "land_use_2020.json"
+    file_2024 = data_dir / "land_use_2024.json"
+    data_2020 = []
+    data_2024 = []
+    if file_2020.exists():
+        with open(file_2020) as f:
+            data_2020 = json.load(f)
+    if file_2024.exists():
+        with open(file_2024) as f:
+            data_2024 = json.load(f)
+    # Compute change statistics
+    urban_2020 = sum(1 for d in data_2020 if d.get("value") == 1)
+    urban_2024 = sum(1 for d in data_2024 if d.get("value") == 1)
+    veg_2020 = sum(1 for d in data_2020 if d.get("value") in (2, 3))
+    veg_2024 = sum(1 for d in data_2024 if d.get("value") in (2, 3))
+    water_2020 = sum(1 for d in data_2020 if d.get("value") == 0)
+    water_2024 = sum(1 for d in data_2024 if d.get("value") == 0)
+    total = max(len(data_2020), 1)
+    return {
+        "city": city,
+        "year_from": 2020,
+        "year_to": 2024,
+        "data_2020": data_2020,
+        "data_2024": data_2024,
+        "change_summary": {
+            "urban_2020_pct": round(urban_2020 / total * 100, 1),
+            "urban_2024_pct": round(urban_2024 / total * 100, 1),
+            "urban_increase_pct": round((urban_2024 - urban_2020) / total * 100, 1),
+            "vegetation_2020_pct": round(veg_2020 / total * 100, 1),
+            "vegetation_2024_pct": round(veg_2024 / total * 100, 1),
+            "vegetation_decrease_pct": round((veg_2020 - veg_2024) / total * 100, 1),
+            "water_2020_pct": round(water_2020 / total * 100, 1),
+            "water_2024_pct": round(water_2024 / total * 100, 1),
+        },
+    }

app/services/time_machine_service.py ADDED Viewed

	@@ -0,0 +1,192 @@

+"""
+Environmental Time Machine — computes per-cell yearly averages for side-by-side comparison.
+Uses harmonized satellite data (961 cells per city) for rich heatmap visualization.
+"""
+import logging
+import numpy as np
+from collections import defaultdict
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+PARAM_META = {
+    "LST": {"label": "Surface Temperature", "unit": "C", "scale": "temperature"},
+    "NDVI": {"label": "Vegetation (NDVI)", "unit": "0-1", "scale": "vegetation"},
+    "NO2": {"label": "NO2 Pollution", "unit": "mol/m2", "scale": "pollution"},
+    "SO2": {"label": "SO2 Pollution", "unit": "mol/m2", "scale": "pollution"},
+    "CO": {"label": "Carbon Monoxide", "unit": "mol/m2", "scale": "pollution"},
+    "SOIL_MOISTURE": {"label": "Soil Moisture", "unit": "m3/m3", "scale": "moisture"},
+    "LAND_USE": {"label": "Land Use Change", "unit": "class", "scale": "landuse"},
+}
+def _timeseries_to_yearly_grids(data, year_a="2023", year_b="2024"):
+    """Split harmonized time-series into per-cell yearly averages."""
+    cells_a = defaultdict(list)
+    cells_b = defaultdict(list)
+    for point in data:
+        key = (round(point["lat"], 4), round(point["lng"], 4))
+        date = str(point.get("date", ""))
+        val = point.get("value")
+        if val is None:
+            continue
+        if date.startswith(year_a):
+            cells_a[key].append(float(val))
+        elif date.startswith(year_b):
+            cells_b[key].append(float(val))
+    grid_a = [
+        {"lat": k[0], "lng": k[1], "value": round(float(np.mean(v)), 4)}
+        for k, v in cells_a.items() if v
+    ]
+    grid_b = [
+        {"lat": k[0], "lng": k[1], "value": round(float(np.mean(v)), 4)}
+        for k, v in cells_b.items() if v
+    ]
+    return grid_a, grid_b
+def get_comparison(param: str, city: str = "ahmedabad") -> dict:
+    """Get year-over-year comparison grids using harmonized satellite data."""
+    meta = PARAM_META.get(param, {"label": param, "unit": "", "scale": "default"})
+    if param == "LAND_USE":
+        try:
+            lu_change = satellite_service.get_land_use_change(city)
+            raw_a = lu_change.get("data_2020", [])
+            raw_b = lu_change.get("data_2024", [])
+        except:
+            raw_a, raw_b = [], []
+        class_map = {"water": 0, "sparse_vegetation": 1, "dense_vegetation": 2, "urban": 3, "urban_barren": 3}
+        def encode(points):
+            return [
+                {"lat": p["lat"], "lng": p["lng"],
+                 "value": class_map.get(p.get("class_label", ""), 2),
+                 "class_label": p.get("class_label", "")}
+                for p in points
+            ]
+        return {
+            "param": param, "meta": meta, "city": city,
+            "year_a": "2020", "year_b": "2024",
+            "grid_a": encode(raw_a), "grid_b": encode(raw_b),
+        }
+    # Use harmonized data from satellite_service (961 cells per date after IDW)
+    try:
+        data = satellite_service._load_data(param, city)
+    except:
+        data = []
+    if not data:
+        return {"error": f"No data for {param}/{city}", "param": param, "meta": meta, "city": city,
+                "grid_a": [], "grid_b": []}
+    grid_a, grid_b = _timeseries_to_yearly_grids(data, "2023", "2024")
+    # If one year is empty, try raw data as fallback
+    if not grid_a and not grid_b:
+        try:
+            raw_data = satellite_service._load_raw(param, city)
+            grid_a, grid_b = _timeseries_to_yearly_grids(raw_data, "2023", "2024")
+        except:
+            pass
+    a_vals = [p["value"] for p in grid_a]
+    b_vals = [p["value"] for p in grid_b]
+    avg_change = round(float(np.mean(b_vals)) - float(np.mean(a_vals)), 4) if a_vals and b_vals else 0
+    # ── Change Analysis: per-cell diff ──────────────────────
+    map_a = {(round(p["lat"], 4), round(p["lng"], 4)): p["value"] for p in grid_a}
+    cell_changes = []
+    for p in grid_b:
+        key = (round(p["lat"], 4), round(p["lng"], 4))
+        val_a = map_a.get(key)
+        if val_a is not None:
+            diff = round(p["value"] - val_a, 4)
+            cell_changes.append({"lat": key[0], "lng": key[1], "value_2023": round(val_a, 4), "value_2024": round(p["value"], 4), "change": diff})
+    cell_changes.sort(key=lambda c: c["change"])
+    # For LST/NO2/SO2/CO — increase = worse. For NDVI/SOIL_MOISTURE — decrease = worse.
+    invert = param in ("NDVI", "SOIL_MOISTURE")
+    if invert:
+        top_worsened = cell_changes[:5]  # most decreased = worst for NDVI
+        top_improved = cell_changes[-5:][::-1]  # most increased = best
+    else:
+        top_worsened = cell_changes[-5:][::-1]  # most increased = worst for LST
+        top_improved = cell_changes[:5]  # most decreased = best
+    # ── Zone-level breakdown ────────────────────────────────
+    ZONES = {
+        "City Core": {"lat": (23.00, 23.06), "lng": (72.53, 72.62)},
+        "Industrial East": {"lat": (22.90, 23.00), "lng": (72.60, 72.70)},
+        "Western Suburbs": {"lat": (23.00, 23.06), "lng": (72.40, 72.53)},
+        "North": {"lat": (23.06, 23.20), "lng": (72.40, 72.70)},
+        "South": {"lat": (22.90, 23.00), "lng": (72.40, 72.60)},
+    }
+    zone_changes = []
+    for zone_name, bounds in ZONES.items():
+        zone_cells = [c for c in cell_changes
+                      if bounds["lat"][0] <= c["lat"] <= bounds["lat"][1]
+                      and bounds["lng"][0] <= c["lng"] <= bounds["lng"][1]]
+        if zone_cells:
+            zone_avg = round(float(np.mean([c["change"] for c in zone_cells])), 4)
+            zone_changes.append({"zone": zone_name, "avg_change": zone_avg, "cells": len(zone_cells)})
+    zone_changes.sort(key=lambda z: z["avg_change"], reverse=not invert)
+    # ── Auto-generate interpretation ────────────────────────
+    INSIGHTS = {
+        "LST": {"worse": "Urban Heat Island intensifying", "better": "Cooling effect detected — possible greening", "unit": "°C"},
+        "NDVI": {"worse": "Vegetation loss / deforestation detected", "better": "Green cover recovery observed", "unit": "NDVI"},
+        "NO2": {"worse": "Air pollution increasing — industrial/traffic sources", "better": "Air quality improving", "unit": "mol/m²"},
+        "SO2": {"worse": "Industrial SO₂ emissions rising", "better": "SO₂ levels declining", "unit": "mol/m²"},
+        "CO": {"worse": "Carbon monoxide rising — combustion sources", "better": "CO levels declining", "unit": "mol/m²"},
+        "SOIL_MOISTURE": {"worse": "Soil drying — drought stress increasing", "better": "Soil moisture improving", "unit": "m³/m³"},
+    }
+    insight = INSIGHTS.get(param, {"worse": "Conditions changed", "better": "Conditions changed", "unit": ""})
+    worst_zone = zone_changes[0] if zone_changes else None
+    best_zone = zone_changes[-1] if zone_changes else None
+    summary_parts = []
+    if worst_zone:
+        direction = "heated" if param == "LST" else ("lost" if param == "NDVI" else "increased")
+        summary_parts.append(f"{worst_zone['zone']} {direction} by {abs(worst_zone['avg_change']):.3f} {insight['unit']}")
+    if best_zone and best_zone != worst_zone:
+        direction = "cooled" if param == "LST" else ("recovered" if param == "NDVI" else "decreased")
+        summary_parts.append(f"{best_zone['zone']} {direction} by {abs(best_zone['avg_change']):.3f} {insight['unit']}")
+    interpretation = {
+        "summary": ". ".join(summary_parts) if summary_parts else f"{meta['label']} changed by {avg_change} overall",
+        "insight": insight["worse"] if (not invert and avg_change > 0) or (invert and avg_change < 0) else insight["better"],
+        "severity": "critical" if abs(avg_change) > np.std(a_vals) * 1.5 else ("warning" if abs(avg_change) > np.std(a_vals) * 0.5 else "normal"),
+    }
+    logger.info(f"Time Machine {param}/{city}: A={len(grid_a)} pts, B={len(grid_b)} pts, change={avg_change}")
+    return {
+        "param": param, "meta": meta, "city": city,
+        "year_a": "2023", "year_b": "2024",
+        "grid_a": grid_a, "grid_b": grid_b,
+        "avg_change": avg_change,
+        "change_direction": "increased" if avg_change > 0 else "decreased",
+        "top_worsened": top_worsened,
+        "top_improved": top_improved,
+        "zone_changes": zone_changes,
+        "interpretation": interpretation,
+        "total_cells_compared": len(cell_changes),
+    }
+def get_params():
+    return [
+        {"id": "LST", "label": "Surface Temperature"},
+        {"id": "NDVI", "label": "Vegetation (NDVI)"},
+        {"id": "NO2", "label": "NO2 Pollution"},
+        {"id": "SOIL_MOISTURE", "label": "Soil Moisture"},
+        {"id": "LAND_USE", "label": "Land Use Change"},
+    ]

app/services/vegetation_service.py ADDED Viewed

	@@ -0,0 +1,79 @@

+"""
+Vegetation Loss Detection Service.
+Detects NDVI decline, sudden drops, spatial clusters of vegetation loss, and forecasts future trajectory.
+"""
+import logging
+from collections import defaultdict
+from app.services import satellite_service
+logger = logging.getLogger(__name__)
+def analyse(city: str = "Ahmedabad") -> dict:
+    """Run vegetation loss analysis."""
+    ndvi_data = satellite_service._load_data("NDVI")
+    if not ndvi_data:
+        return {"city": city, "error": "No NDVI data available"}
+    # 1. Overall decline — compare first half vs second half
+    date_values = defaultdict(list)
+    for d in ndvi_data:
+        date_values[d["date"]].append(d["value"])
+    ts_sorted = sorted(date_values.items())
+    if len(ts_sorted) < 4:
+        return {"city": city, "error": "Insufficient time-series data"}
+    mid = len(ts_sorted) // 2
+    first_half = [sum(v) / len(v) for _, v in ts_sorted[:mid]]
+    second_half = [sum(v) / len(v) for _, v in ts_sorted[mid:]]
+    first_avg = sum(first_half) / len(first_half)
+    second_avg = sum(second_half) / len(second_half)
+    decline_pct = round((first_avg - second_avg) / first_avg * 100, 1) if first_avg > 0 else 0
+    # 2. Area lost from land use change
+    try:
+        lu_change = satellite_service.get_land_use_change(city)
+        change_summary = lu_change.get("change_summary", {})
+        veg_decrease_pct = change_summary.get("vegetation_decrease_pct", 0)
+        area_lost_sqkm = round(veg_decrease_pct * 4.64, 1)  # Ahmedabad ~464 sqkm
+    except:
+        veg_decrease_pct = 0
+        area_lost_sqkm = 0
+    # 3. Anomaly detection on NDVI
+    from app.services import ml_service
+    anomaly_result = ml_service.detect_anomalies("NDVI", city)
+    anomalies = anomaly_result.get("anomalies", [])
+    # 4. Hotspot clusters of low NDVI
+    hotspot_result = ml_service.find_hotspots("NDVI", city)
+    clusters = hotspot_result.get("hotspots", [])
+    # 5. LSTM forecast
+    try:
+        from app.ml.lstm_predictor import LSTMPredictor
+        predictor = LSTMPredictor(lookback=6)
+        ts_tuples = [(date, sum(vals) / len(vals)) for date, vals in ts_sorted]
+        forecast = predictor.forecast(ts_tuples, steps=6)
+    except Exception as e:
+        logger.warning(f"LSTM forecast failed: {e}")
+        forecast = []
+    # 6. Critical wards (zones with NDVI < 0.15)
+    import numpy as np
+    all_values = [d["value"] for d in ndvi_data]
+    critical_count = sum(1 for v in all_values if v < 0.15)
+    return {
+        "city": city,
+        "ndvi_decline_pct": decline_pct,
+        "area_lost_sqkm": area_lost_sqkm,
+        "current_city_ndvi": round(second_avg, 4),
+        "critical_zones": critical_count,
+        "anomaly_count": len(anomalies),
+        "anomaly_events": anomalies[:10],
+        "clusters": clusters,
+        "forecast_6m": forecast,
+        "trend": "declining" if decline_pct > 0 else "stable",
+    }

app/utils/__init__.py ADDED Viewed

File without changes