Spaces:

W1nd5pac
/

microclimate-x-demo

Paused

App Files Files Community

W1nd5pac committed about 19 hours ago

Commit

a8358d8

verified ·

1 Parent(s): cbd64ba

Deploy 2026-05-20T07:09:24Z — 11e81c5 (code)

Browse files

Files changed (46) hide show

.dockerignore +29 -0
.gitignore +75 -0
.pre-commit-config.yaml +22 -0
CHANGELOG.md +139 -0
CONTRIBUTING.md +63 -0
Dockerfile +60 -0
LICENSE +28 -0
Makefile +78 -0
README.md +272 -5
backend/__init__.py +3 -0
backend/cache.py +190 -0
backend/config.py +208 -0
backend/errors.py +26 -0
backend/main.py +455 -0
backend/ml_engine.py +126 -0
backend/rule_engine.py +480 -0
backend/schemas.py +72 -0
backend/terrain.py +151 -0
docker-compose.yml +26 -0
docs/DEPLOY_HF.md +143 -0
docs/MEETING_CHEAT_SHEET.html +644 -0
docs/MEETING_CHEAT_SHEET.md +372 -0
docs/architecture.md +116 -0
docs/dataset.md +111 -0
docs/pipeline_order.md +109 -0
docs/progress_update_brief.html +619 -0
docs/progress_update_brief.md +235 -0
docs/supervisor_meeting_brief.md +161 -0
docs/thresholds.md +150 -0
docs/项目大白话讲解.html +883 -0
docs/项目大白话讲解.md +383 -0
frontend/index.html +579 -0
models/.gitkeep +0 -0
models/MODEL_CARD.md +133 -0
models/feature_columns.json +20 -0
models/training_report.json +82 -0
pyproject.toml +45 -0
requirements-dev.txt +14 -0
requirements.txt +17 -0
scripts/1_download_dataset.py +138 -0
scripts/1b_synth_dataset.py +168 -0
scripts/2_preprocess.py +160 -0
scripts/3_train_model.py +183 -0
scripts/4_evaluate_model.py +272 -0
scripts/deploy_hf.sh +135 -0
scripts/start_demo.sh +86 -0

.dockerignore ADDED Viewed

	@@ -0,0 +1,29 @@

+.git/
+.github/
+.venv/
+.pytest_cache/
+__pycache__/
+*.pyc
+*.pyo
+# Local databases — must NOT bake into the image
+cache.sqlite3
+cache.sqlite3-*
+*.sqlite
+*.sqlite3*
+# Large dataset artefacts — re-download or regenerate inside the image
+data/
+figures/
+# Dev / IDE
+.idea/
+.vscode/
+*.iml
+.DS_Store
+# Docs not needed at runtime
+docs/
+*.docx
+*.md
+!README.md

.gitignore ADDED Viewed

	@@ -0,0 +1,75 @@

+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+.venv/
+venv/
+env/
+ENV/
+.pytest_cache/
+.mypy_cache/
+.ruff_cache/
+*.egg-info/
+build/
+dist/
+# Data & Models — big binaries stay local
+data/*.csv
+data/*.parquet
+models/*.pkl
+models/*.joblib
+models/*.onnx
+*.db
+*.sqlite
+*.sqlite3
+*.sqlite3-shm
+*.sqlite3-wal
+# Coverage + test artefacts
+.coverage
+coverage.xml
+htmlcov/
+# Generated figures — re-create with `make evaluate`
+# (we keep evaluation_summary.json + threshold_sweep.csv as audit trail)
+figures/*.png
+!figures/.gitkeep
+*.db-journal
+*.db-wal
+*.db-shm
+# …but keep small JSON artefacts that document the training run.
+!models/training_report.json
+!models/feature_columns.json
+# Notebooks
+.ipynb_checkpoints/
+*.ipynb
+# IDE
+.vscode/
+.idea/
+*.swp
+*.swo
+.DS_Store
+Thumbs.db
+# OS
+.DS_Store?
+._*
+.Spotlight-V100
+.Trashes
+ehthumbs.db
+# Logs
+*.log
+logs/
+# Env
+.env
+.env.local
+# Keep directory placeholders
+!data/.gitkeep
+!models/.gitkeep

.pre-commit-config.yaml ADDED Viewed

	@@ -0,0 +1,22 @@

+# Pre-commit hooks — see https://pre-commit.com/
+# Install: pip install pre-commit && pre-commit install
+repos:
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v5.0.0
+    hooks:
+      - id: trailing-whitespace
+      - id: end-of-file-fixer
+      - id: check-yaml
+      - id: check-json
+      - id: check-toml
+      - id: check-merge-conflict
+      - id: check-added-large-files
+        args: [--maxkb=2048]
+  - repo: https://github.com/astral-sh/ruff-pre-commit
+    rev: v0.6.9
+    hooks:
+      - id: ruff
+        args: [--fix]
+      - id: ruff-format

CHANGELOG.md ADDED Viewed

	@@ -0,0 +1,139 @@

+# Changelog
+All notable changes to this project will be documented in this file.
+Format follows [Keep a Changelog](https://keepachangelog.com/en/1.1.0/);
+versioning follows [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
+---
+## [1.0.0] — 2026-05-11
+The first complete release. Engineering-grade hardening across backend,
+ML pipeline, frontend, and DevOps; the rule engine is fully aligned with
+the D5 thesis proposal §3.7 / P4.
+### Added — Backend
+- **Request-ID middleware** that stamps every response with `X-Request-ID`
+  and `X-Response-Time-ms`. Incoming `X-Request-ID` headers propagate end
+  to end, enabling cross-service tracing.
+- **Centralised error contract** (`backend/errors.py`) — every non-2xx
+  response is a typed `ErrorResponse { error, detail, request_id, context }`
+  JSON document; no bare 500-HTML responses leak.
+- **Structured logging** with per-request log records (`request_id` field
+  on every line, ISO-8601 timestamps).
+- **Enriched `/api/health`** reporting uptime, cache row counts (live /
+  expired / total), DB size, and inference-log size.
+- **`/api/version`** endpoint returning version + git short SHA + ML
+  feature schema.
+- **Cache hygiene** — `prune_expired()` runs on startup, sweeps inference-log
+  rows older than 7 days, and `cache_stats()` is exposed via `/api/health`.
+- **Fire-and-forget cache writes** with the task reference retained
+  (`asyncio.create_task` lint compliance).
+- **Defensive ML engine** — `predict_rain_probability` always returns
+  `float ∈ [0, 1]`; NaN/Inf/wrong-type feature values gracefully degrade;
+  model-load failures fall through to the heuristic instead of crashing.
+- **Improved heuristic fallback** — now also responds to
+  `pressure_change_3h` so the "no model yet" demo still behaves sensibly.
+- **Terrain edge cases** — antimeridian wrap, polar clamp, ocean / no-data
+  DEM cells handled instead of raising obscure type errors.
+### Added — Rule Engine (already shipped, now fully tested)
+- 4 sub-hazard scorers — rainfall / fog / wind gust / thunderstorm.
+- D5 §3.7.2 R1-R4 Decision Table.
+- Activity-aware weighted composite (`hiker | driver | construction | general`).
+- Dominant-hazard composite formula: `0.80·max + 0.20·mean(rest)`.
+### Added — ML pipeline
+- **`scripts/4_evaluate_model.py`** generating publication-quality figures
+  (ROC + AUC, PR + AP, calibration / Brier, threshold sweep, top-20
+  feature importance, confusion matrix at F2-optimal threshold).
+- **`figures/evaluation_summary.json`** machine-readable evaluation blob
+  for the thesis appendix.
+- **`figures/threshold_sweep.csv`** for full reproducibility of the
+  precision-recall trade-off table.
+- **`models/MODEL_CARD.md`** — HuggingFace-style model card with intended
+  use, training data, evaluation, limitations, and ethical considerations.
+### Added — Tests
+- HTTP integration tests with `respx`-mocked external APIs
+  (`tests/test_api.py`): happy path, cache hit, distinct cache slot per
+  activity, invalid input → 422, upstream failure → 502, CORS, OpenAPI
+  schema.
+- Cache layer tests (`tests/test_cache.py`): TTL, expiry, prune, stats.
+- Terrain edge-case tests (`tests/test_terrain_edge.py`): antimeridian,
+  polar clamp, malformed DEM.
+- ML engine tests (`tests/test_ml_engine.py`): unloaded behaviour,
+  heuristic monotonicity, NaN/None resilience.
+- Session-scoped `conftest.py` sets an isolated `MICROCLIMATEX_DB` for
+  every test run (no clobbering the dev cache).
+- **Total: 70 tests; backend coverage 97 %.**
+### Added — Frontend
+- Activity selector (Hiker / Driver / Construction / General) with
+  `localStorage` persistence and keyboard accessibility (`aria-pressed`
+  + `focus-visible`).
+- 4 mini-gauges for the per-hazard sub-scores, each with a tooltip
+  explaining what drives it.
+- D5 §3.7.2 R1-R4 indicator badges (highlight when fired).
+- Demo scenarios dropdown (Genting · Cameron · Kinabalu · Everest · Singapore).
+- **Loading spinner** during in-flight requests.
+- **Toast notification** for errors and "no model loaded" warnings.
+- **Map layer switcher** — Dark base + Topographic option.
+- Bilingual EN/ZH UI persisted across reloads.
+### Added — DevOps / Reproducibility
+- **GitHub Actions CI** (`.github/workflows/ci.yml`) — pytest matrix on
+  Python 3.9 / 3.11 / 3.12, ruff lint, coverage XML artefact, plus a
+  Docker image-build smoke test with Buildx + GHA cache.
+- **Multi-stage Dockerfile** — builder stage for wheels, slim runtime
+  with a non-root `mcx` user, baked-in HEALTHCHECK against `/api/health`.
+- **`docker-compose.yml`** with a named data volume.
+- **`Makefile`** — single-word recipes for `install`, `test`, `lint`,
+  `run`, `synth`, `preprocess`, `train`, `evaluate`, `docker`, `clean`.
+- **`requirements-dev.txt`** — split dev tooling (pytest-cov, ruff,
+  respx, matplotlib) from runtime requirements.
+- **`pyproject.toml`** — ruff configuration + pytest config.
+- **`.pre-commit-config.yaml`** — trailing-whitespace, end-of-file,
+  YAML/JSON/TOML checks, large-file guard, ruff lint + format.
+- **`.dockerignore`** keeping the image lean.
+### Added — Documentation
+- `docs/architecture.md` — P4.1 → P4.6 internal flow + dominant-hazard
+  formula rationale.
+- `docs/thresholds.md` — every threshold cited; new §8-§12 for the four
+  hazard categories, R1-R4 table, and activity-weight matrix.
+- `docs/dataset.md` — formal target definition (`is_rain_event`) and
+  train/test split rationale.
+### Changed
+- Rainfall sub-scorer calibration — 45 % macro probability now lands at
+  ~ 40 (Caution band), matching the proposal's intent.
+- Composite-score formula switched from naive arithmetic mean to
+  **dominant-hazard + secondary** to avoid mean dilution.
+- Cache key now incorporates `activity` — different weights → different
+  composite → must not share a slot.
+### Fixed
+- `tenacity.RetryError` from the retry decorator was not caught by the
+  `except httpx.HTTPError` clause, producing a misleading 500. Now caught
+  alongside `httpx.HTTPError` and `ValueError`, returning a clean 502.
+---
+## [0.2.0] — 2026-05-11
+Initial D5-alignment pass — see commit `55fd759`.
+## [0.1.0] — 2026-05-11
+Project scaffolding and Hybrid Engine v1 — see commits `b218f5b`
+through `4639890`.

CONTRIBUTING.md ADDED Viewed

	@@ -0,0 +1,63 @@

+# Contributing to MicroClimate-X
+Thanks for your interest! This is a Final Year Project (UKM) and we
+welcome both academic feedback and code contributions.
+## Quick setup
+```bash
+git clone https://github.com/KyoukoLi/microclimate-x
+cd microclimate-x
+make install-dev          # creates ./.venv, installs runtime + dev deps
+make test                 # runs the full suite; should be 70+ passes
+make lint                 # ruff check
+make run                  # uvicorn dev server on http://localhost:8000
+```
+The full developer toolbox is in the [Makefile](./Makefile) — `make help`
+lists every target.
+## Project rhythm
+| Layer | Source of truth |
+|---|---|
+| Engineering thresholds & academic citations | `backend/config.py` + `docs/thresholds.md` |
+| Hybrid engine flow & section mapping | `backend/rule_engine.py` + `docs/architecture.md` |
+| ML pipeline (features ↔ training ↔ evaluation) | `scripts/2_preprocess.py` ↔ `scripts/3_train_model.py` ↔ `scripts/4_evaluate_model.py` |
+| Frontend contract | `backend/schemas.py` (Pydantic) is consumed verbatim by `frontend/index.html` |
+If you change one artefact in a row, please update the other artefact(s)
+in that same row so they stay in sync.
+## Pull-request checklist
+1. **All tests pass**: `make test` — 70 / 70.
+2. **Linter is clean**: `make lint` — 0 ruff errors.
+3. **New behaviour is tested.** Add a unit test or an HTTP integration
+   test that fails *without* your change.
+4. **Public APIs documented.** Update `docs/` and the OpenAPI docstrings
+   if you change request / response shapes.
+5. **Thresholds are cited.** Any new numeric threshold in `config.py`
+   needs an `# Citation:` block referencing peer-reviewed literature or
+   an authoritative regulation.
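+6. **No secrets, no large binaries.** Pre-commit hooks (`make install-dev`
+   then `pre-commit install`) reject added files larger than 2 MB; the
+   current hook set has no secret scanner, so check for credentials
+   manually before pushing.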
+## Safety-critical code review
+This is decision-support software for outdoor activity. Reviewers should
+specifically check:
+* **Does this change weaken the Veto cascade?** If a behavioural change
+  could let a "Safe" verdict fire in a situation that previously fired
+  Danger, the PR needs an explicit test demonstrating the new threshold
+  is still life-safety-compliant.
+* **Does this change leak temporal autocorrelation?** Random train/test
+  splits on time-series data are *forbidden*; always use the time-based
+  split in `scripts/3_train_model.py`.
+## Reporting issues
+Bugs, academic critique, or threshold disputes — please open an issue
+with the **scenario**, the **expected verdict**, and the **observed
+verdict**. Citations to the relevant safety literature are very welcome.

Dockerfile ADDED Viewed

	@@ -0,0 +1,60 @@

+# syntax=docker/dockerfile:1.7
+# ─────────────────────────────────────────────────────────────────
+# Stage 1 — builder: install Python deps into a self-contained venv
+# ─────────────────────────────────────────────────────────────────
+FROM python:3.12-slim AS builder
+ENV PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1 \
+    PIP_NO_CACHE_DIR=1 \
+    PIP_DISABLE_PIP_VERSION_CHECK=1
+WORKDIR /build
+# Build deps for any C-extension wheels that need compilation
+# (scikit-learn / numpy ship wheels for linux/amd64+arm64 so this is usually a no-op).
+RUN apt-get update && apt-get install -y --no-install-recommends \
+        build-essential \
+    && rm -rf /var/lib/apt/lists/*
+COPY requirements.txt .
+RUN python -m venv /opt/venv \
+    && /opt/venv/bin/pip install --upgrade pip \
+    && /opt/venv/bin/pip install -r requirements.txt
+# ─────────────────────────────────────────────────────────────────
+# Stage 2 — runtime: minimal image with only the venv + app code
+# ─────────────────────────────────────────────────────────────────
+FROM python:3.12-slim AS runtime
+ENV PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1 \
+    PATH="/opt/venv/bin:$PATH" \
+    MICROCLIMATEX_DB=/tmp/cache.sqlite3
+# Non-root user for least-privilege execution.
+RUN useradd --create-home --shell /bin/bash --uid 10001 mcx \
+    && mkdir -p /app /data \
+    && chown -R mcx:mcx /app /data
+COPY --from=builder /opt/venv /opt/venv
+WORKDIR /app
+COPY --chown=mcx:mcx backend/   backend/
+COPY --chown=mcx:mcx frontend/  frontend/
+COPY --chown=mcx:mcx scripts/   scripts/
+COPY --chown=mcx:mcx models/    models/
+COPY --chown=mcx:mcx README.md LICENSE ./
+USER mcx
+EXPOSE 8000
+VOLUME ["/data"]
+# Container-aware health check — uses the same /api/health endpoint as humans.
+HEALTHCHECK --interval=30s --timeout=5s --start-period=10s --retries=3 \
+    CMD python -c "import urllib.request, sys; \
+sys.exit(0) if urllib.request.urlopen('http://localhost:8000/api/health', timeout=2).status == 200 else sys.exit(1)" || exit 1
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]

LICENSE ADDED Viewed

	@@ -0,0 +1,28 @@

+MIT License
+Copyright (c) 2026 L.ZH (Universiti Kebangsaan Malaysia)
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.
+DISCLAIMER FOR SAFETY-CRITICAL USE:
+This software is intended as a decision-support tool only. It does NOT
+replace official meteorological forecasts issued by national weather services.
+The authors accept no liability for decisions made based on this software's
+output. Users — particularly hikers, climbers, and outdoor workers — should
+always consult official weather warnings and exercise their own judgment.

Makefile ADDED Viewed

	@@ -0,0 +1,78 @@

+# MicroClimate-X — common dev tasks. Run `make help` for a full list.
+#
+# Conventions:
+#   * `make <target>` is the single source of truth for a workflow step.
+#   * Targets are idempotent; running twice should not break anything.
+#   * Heavy tasks (train, eval) write into git-ignored directories.
+PYTHON  ?= ./.venv/bin/python
+PIP     ?= ./.venv/bin/pip
+UVICORN ?= ./.venv/bin/uvicorn
+PYTEST  ?= ./.venv/bin/pytest
+RUFF    ?= ./.venv/bin/ruff
+.DEFAULT_GOAL := help
+.PHONY: help venv install install-dev test test-fast lint format coverage \
+        synth preprocess train evaluate run clean docker docker-run
+help:                          ## Show this help.
+	@awk 'BEGIN{FS=":.*##";print "MicroClimate-X — available targets:"} /^[a-zA-Z_-]+:.*?##/{printf "  \033[36m%-15s\033[0m %s\n",$$1,$$2}' $(MAKEFILE_LIST)
+venv:                          ## Create a Python 3.10+ venv at ./.venv
+	python3 -m venv .venv
+	$(PIP) install --upgrade pip
+install: venv                  ## Install runtime dependencies.
+	$(PIP) install -r requirements.txt
+install-dev: install           ## Install runtime + dev dependencies.
+	$(PIP) install -r requirements-dev.txt
+# ── Quality ────────────────────────────────────────────────────────────
+lint:                          ## Run ruff lint check.
+	$(RUFF) check backend/ scripts/ tests/
+format:                        ## Format code with ruff.
+	$(RUFF) format backend/ scripts/ tests/
+	$(RUFF) check --fix backend/ scripts/ tests/
+test:                          ## Run the full test suite with coverage.
+	$(PYTEST) tests/ --cov=backend --cov-report=term-missing
+test-fast:                     ## Run tests quietly, no coverage.
+	$(PYTEST) tests/ -q
+coverage:                      ## Generate an HTML coverage report.
+	$(PYTEST) tests/ --cov=backend --cov-report=html
+	@echo "Open htmlcov/index.html in your browser."
+# ── ML pipeline ────────────────────────────────────────────────────────
+synth:                         ## Generate synthetic dataset (no network).
+	$(PYTHON) scripts/1b_synth_dataset.py
+preprocess:                    ## Build features + target (data/processed.csv).
+	$(PYTHON) scripts/2_preprocess.py
+train:                         ## Train the Random Forest model.
+	$(PYTHON) scripts/3_train_model.py
+evaluate:                      ## Generate publication figures + threshold sweep.
+	$(PYTHON) scripts/4_evaluate_model.py
+# ── Local run ──────────────────────────────────────────────────────────
+run:                           ## Start the FastAPI dev server with auto-reload.
+	$(UVICORN) backend.main:app --reload --host 127.0.0.1 --port 8000
+# ── Docker ─────────────────────────────────────────────────────────────
+docker:                        ## Build the Docker image.
+	docker build -t microclimate-x:latest .
+docker-run: docker             ## Build then run the container on port 8000.
+	docker compose up --build
+# ── Housekeeping ───────────────────────────────────────────────────────
+clean:                         ## Remove caches, coverage, and SQLite WAL files.
+	rm -rf .pytest_cache htmlcov .coverage coverage.xml
+	rm -f  cache.sqlite3 cache.sqlite3-*
+	find . -name __pycache__ -type d -prune -exec rm -rf {} +

README.md CHANGED Viewed

@@ -1,10 +1,277 @@
 ---
-title: Microclimate X Demo
-emoji: 🐨
-colorFrom: indigo
-colorTo: purple
 sdk: docker
 pinned: false
 ---
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

 ---
+title: MicroClimate-X
+emoji: 🌧️
+colorFrom: blue
+colorTo: green
 sdk: docker
+app_port: 8000
 pinned: false
+license: mit
+short_description: Hybrid microclimate risk for complex terrain (FYP demo)
 ---
+# MicroClimate-X
+> Intelligent Meteorological Analysis System for Complex Terrain
+> 面向复杂地形的智能气象分析系统
+> **Live demo / 在线演示**: <https://huggingface.co/spaces/W1nd5pac/microclimate-x-demo>
+> (Deployed as a Hugging Face Space — Docker SDK. See [`docs/DEPLOY_HF.md`](docs/DEPLOY_HF.md) for the deployment recipe.)
+![CI](https://github.com/KyoukoLi/microclimate-x/actions/workflows/ci.yml/badge.svg)
+![Python](https://img.shields.io/badge/Python-3.9%20%7C%203.11%20%7C%203.12-blue)
+![FastAPI](https://img.shields.io/badge/FastAPI-0.110%2B-009688)
+![Vue3](https://img.shields.io/badge/Vue.js-3-4FC08D)
+![ML](https://img.shields.io/badge/ML-RandomForest-orange)
+![Coverage](https://img.shields.io/badge/coverage-97%25-brightgreen)
+![Tests](https://img.shields.io/badge/tests-70%20passing-success)
+![Docker](https://img.shields.io/badge/Docker-multi--stage-2496ED?logo=docker&logoColor=white)
+![License](https://img.shields.io/badge/License-MIT-green)
+A Final Year Project at **Universiti Kebangsaan Malaysia (UKM)** — Faculty of Information Science & Technology.
+### For thesis supervisors / 导师阅读路径
+| Step | Document | What it shows |
+|---|---|---|
+| 1. Dataset | [`docs/dataset.md`](docs/dataset.md) | Source · schema · **Y derivation** · train/test split |
+| 2. Model   | [`models/MODEL_CARD.md`](models/MODEL_CARD.md) | Intended use · metrics · limitations · ethics |
+| 3. Evaluation | [`figures/`](figures/) + [`figures/evaluation_summary.json`](figures/evaluation_summary.json) | 6 publication figures, all reproducible via `make evaluate` |
+| 4. Architecture | [`docs/architecture.md`](docs/architecture.md) + [`docs/thresholds.md`](docs/thresholds.md) | Hybrid engine, every threshold cited |
+| 5. Pipeline order | [`docs/pipeline_order.md`](docs/pipeline_order.md) | Explicit "dataset → model → app" sequence |
+| 6. Meeting brief | [`docs/supervisor_meeting_brief.md`](docs/supervisor_meeting_brief.md) | Detailed bilingual EN/ZH script |
+| 7. **Cheat sheet** | [`docs/MEETING_CHEAT_SHEET.md`](docs/MEETING_CHEAT_SHEET.md) · [HTML](docs/MEETING_CHEAT_SHEET.html) | **Open on screen during the meeting** — tab-order · demo script · Q&A · checklist |
+---
+## 1. Problem Statement / 痛点
+Traditional weather forecasting relies on **macro-scale grids (20 km × 20 km)** that fail catastrophically in complex terrain. A single forecast cell may cover a mountain peak, a valley floor, and a windward slope — all of which have vastly different microclimates.
+传统天气预报使用 **20 km × 20 km 宏观网格**，在山区会严重失真。同一网格内可能同时包含山顶、谷底和迎风坡，但它们的微气候完全不同。
+## 2. Solution: The Hybrid Engine / 解决方案
+MicroClimate-X uses a **dual-engine hybrid architecture** combining a Machine Learning predictor with a topographic Rule-Based Expert System.
+```
+            ┌──────────────────────────────────────────────────┐
+            │  User clicks a coordinate on the map (lat, lon)  │
+            └────────────────────┬─────────────────────────────┘
+                                 │
+            ┌────────────────────▼─────────────────────────────┐
+            │   Open-Meteo (weather) + Open Topo Data (DEM)    │
+            └────────────────────┬─────────────────────────────┘
+                                 │
+              ┌──────────────────┴───────────────────┐
+              │                                      │
+   ┌──────────▼──────────┐              ┌────────────▼───────────┐
+   │  Engine A           │              │  Engine B              │
+   │  Random Forest      │   probability│  Topographic Rules     │
+   │  (in-distribution   ├─────────────►│  + Veto Triggers       │
+   │   rain probability) │              │  (safety-critical)     │
+   └─────────────────────┘              └────────────┬───────────┘
+                                                     │
+                                        ┌────────────▼───────────┐
+                                        │  Risk Score 0-100      │
+                                        │  + Bilingual Advice    │
+                                        │  + XAI Inference Log   │
+                                        └────────────────────────┘
+```
+### Why Hybrid? / 为什么混合？
+Pure ML can fail catastrophically out-of-distribution. Example: feed Mount Everest coordinates → ML predicts 0% rain → returns "Safe" — ignoring -30°C, hypoxia, gale-force winds.
+**Engine B's Veto mechanism** provides bounded safety guarantees by overriding the ML score when physical thresholds are breached. This follows the **Neuro-Symbolic AI** paradigm (Garcez & Lamb, 2020).
+### Engine B internals — one-to-one with D5 proposal §3.7 / P4
+The rule engine is decomposed exactly along the lines of the thesis proposal so every line of code maps to a section number:
+| Proposal step | Code | Output |
+|---|---|---|
+| **P4.1** Load Dynamic Risk Rules | `backend/config.py` | All thresholds, weights, and the R1-R4 decision table, each annotated with its academic citation |
+| **P4.2** Fetch User Context | `?activity=hiker\|driver\|construction\|general` | Activity is plumbed into the request flow |
+| **P4.3** Evaluate Environmental Risks | Four `score_*_risk()` functions in `rule_engine.py` | Rainfall / Fog / Wind-gust / Thunderstorm sub-scores (each 0-100) |
+| **§3.7.2 Table 4.2** Decision Table | `apply_decision_table_3_7_2()` | Which of R1-R4 fired (hidden rain / no amplification / heavy downpour / standard rain) |
+| Veto cascade | `_collect_veto_triggers()` | Life-safety overrides (Mt-Everest type) — capped at 100 |
+| **P4.4** Activity weighting | `apply_activity_weighting()` | (activity × hazard) weight matrix |
+| **P4.5** Composite score | Same | `0.80 · max(weighted) + 0.20 · mean(rest)` — dominant hazard wins |
+| **P4.6** Actionable advice | `_normal_advice()` / `_veto_advice()` | Bilingual EN/ZH paragraph that names the dominant hazard |
+Four hazard categories surfaced in the UI as four mini-gauges; the four R1-R4 indicators light up beside the score card whenever a rule fires.
+## 3. Tech Stack / 技术栈
+| Layer | Technology |
+|---|---|
+| Frontend | Vue 3 (CDN) + Tailwind CSS + Leaflet.js + ECharts |
+| Backend | Python 3.10+, FastAPI, Uvicorn |
+| ML | Scikit-Learn (Random Forest), Pandas, NumPy |
+| Storage | SQLite 3 (WAL mode, risk-adaptive TTL cache) |
+| External | Open-Meteo Historical Archive (ERA5), Open Topo Data (SRTM DEM) |
+## 4. Dataset / 数据集
+- **Source**: [Open-Meteo Historical Weather API](https://open-meteo.com/en/docs/historical-weather-api) (ERA5 reanalysis)
+- **Region**: Malaysian mountain areas (Genting Highlands, Cameron Highlands, Fraser's Hill, Klang Valley, Mount Kinabalu region)
+- **Time Range**: 2020-01-01 to 2023-12-31 (hourly resolution, 5 sites × ~35 000 hours each)
+- **Features (X)**: `elevation_m`, `temperature_c`, `humidity_pct`, `wind_speed_kmh`, `wind_direction_deg`, `surface_pressure_hpa`
+- **Target (Y)**: `is_rain_event` — binary, 1 if `precipitation(t+1h) > 0.1 mm` else 0 (per WMO trace-precipitation definition)
+## 5. Quick Start / 快速开始
+```bash
+git clone https://github.com/KyoukoLi/microclimate-x.git
+cd microclimate-x
+# Fast path — everything via the Makefile
+make install-dev         # 1. create venv + install runtime + dev deps
+make synth               # 2. generate synthetic dataset (offline)
+#  …or skip `make synth` and run `python scripts/1_download_dataset.py`
+#     instead to fetch real ERA5 data when a network connection is available.
+make preprocess          # 3. feature engineering + Y derivation
+make train               # 4. RF training + time-based CV
+make evaluate            # 5. ROC / PR / calibration / threshold-sweep figures
+make run                 # 6. uvicorn dev server on http://localhost:8000
+# Then open frontend/index.html (or browse to http://localhost:8000/app/)
+```
+### Docker one-liner
+```bash
+docker compose up --build
+# API lives on http://localhost:8000  ·  frontend on http://localhost:8000/app/
+```
+### Test it
+```bash
+make test         # 70 tests, ~12 s
+make lint         # ruff — zero errors expected
+```
+### Training results on real ERA5 data / 真实 ERA5 数据训练结果
+Trained on **175 315 hourly samples** from Open-Meteo Historical Archive
+(ECMWF ERA5 reanalysis) covering five Malaysian mountain sites,
+2020-01-01 → 2023-12-31. Time-based split: last 20 % per site held out
+(n = 35 063 test samples). See [`models/MODEL_CARD.md`](models/MODEL_CARD.md)
+for the full evaluation card and `figures/` for publication-ready plots.
+| Metric | Value | Source |
+|---|---|---|
+| Test ROC AUC | **0.871** | `figures/01_roc_curve.png` |
+| Test PR Average Precision | **0.750** | `figures/02_pr_curve.png` |
+| Brier score (calibration) | **0.138** | `figures/03_calibration_curve.png` |
+| Best F2 @ τ = 0.20 | **0.778** | `figures/04_threshold_sweep.png` |
+| Recall (at chosen τ = 0.20) | **0.934** — safety-critical recall |
+| Class balance | 29.2 % positive (Malaysian mountain climatology) |
+We deliberately operate at **τ = 0.20**, not the default 0.50, because
+in safety-critical settings a missed rain event (false negative) on a
+windward slope is dramatically worse than a false positive. The F2 score
+(F-beta with β = 2) treats recall as twice as important as precision and
+is the principled metric for this regime.
+**5-fold time-series CV** on the training fold gives AUC ranging
+0.828-0.908 (mean ≈ 0.858), confirming the model is not over-fitting a
+single temporal slice.
+#### Feature importance — what the model actually learned
+| Rank | Feature | Importance | Interpretation |
+|---|---|---|---|
+| 1 | `precipitation_lag_1h` | 37.1 % | Rain autocorrelation — the well-documented "rain begets rain" persistence signal in short-term nowcasting (Wilson et al., 2010). |
+| 2-3 | `hour_cos`, `hour_sin` | 18.6 % | Diurnal convective cycle — Malaysian mountain rainfall peaks in late afternoon. |
+| 4 | `pressure_change_3h` | 4.7 % | Falling pressure precedes incoming storms — the classical synoptic-scale precursor. |
+| 5-6 | `wind_v`, `dew_point_c` | 8.1 % | Moisture transport + saturation potential. |
+| 7-14 | other meteorological X | 22 % | T, humidity, cloud cover, wind, dew-point depression, pressure. |
+| 15-17 | `month_*`, `elevation_m` | 4 % | Low because the time-of-day and lag features already absorb most of the seasonal/static signal. |
+| 18 | `cape_jkg` | **0.0 %** | ⚠️ ERA5 archive CAPE values for these coordinates are predominantly zero — a known coverage gap. The Veto-rule engine still uses CAPE thresholds directly from the live Open-Meteo forecast at inference time. |
+#### Why F2 instead of accuracy?
+Accuracy is misleading on imbalanced safety-critical classification.
+A model that predicts "no rain" 100 % of the time achieves
+**69.2 % accuracy** here while being completely useless. F2 weights
+recall twice as heavily as precision, which is correct for a
+hiker-safety app where missing a real rain event (False Negative) is
+far worse than a false alarm (False Positive).
+See `models/training_report.json` for the full 5-fold CV report.
+## 6. Project Structure / 项目结构
+```
+microclimate-x/
+├── backend/
+│   ├── main.py           # FastAPI app + lifespan
+│   ├── ml_engine.py      # Loads RF model, predict_proba
+│   ├── rule_engine.py    # Veto rules + risk scoring + bilingual advice
+│   ├── terrain.py        # DEM-based Valley/Slope/Flat classification
+│   ├── cache.py          # SQLite WAL cache, risk-adaptive TTL
+│   ├── schemas.py        # Pydantic request/response models
+│   └── config.py         # Thresholds + academic citations
+├── scripts/
+│   ├── 1_download_dataset.py    # Open-Meteo + Open-Topo-Data (real ERA5)
+│   ├── 1b_synth_dataset.py      # physically-plausible offline fallback
+│   ├── 2_preprocess.py
+│   ├── 3_train_model.py
+│   └── 4_evaluate_model.py      # figures + threshold sweep (`make evaluate`)
+├── frontend/
+│   └── index.html        # Single-file Vue3 SPA
+├── docs/
+│   ├── architecture.md
+│   └── thresholds.md     # Veto thresholds with academic citations
+├── tests/
+│   └── test_rule_engine.py
+├── data/                 # raw/processed CSVs (gitignored)
+├── models/               # trained .pkl artifacts (gitignored)
+└── requirements.txt
+```
+## 7. Key Design Decisions / 关键设计
+| Decision | Rationale |
+|---|---|
+| **Random Forest over SVM / Deep Learning** | Handles non-linear weather-terrain interactions; outputs interpretable feature importance; no GPU needed; robust on tabular data |
+| **Binary classification (`is_rain_event`)** | One-hour-ahead nowcasting matches the use case (hikers' immediate decisions) |
+| **Time-based train/test split** | Random split would leak temporal correlation → inflated metrics |
+| **Class-weight balanced** | Rain is the minority class (~25% in Malaysian mountains) |
+| **Wind direction as u/v components** | Raw degrees treat 0° and 360° as far apart — mathematically incorrect |
+| **Risk-adaptive cache TTL** | High-risk scenarios refresh faster (60 s) than safe ones (600 s) |
+| **SQLite WAL mode** | Allows concurrent reads during writes — critical for FastAPI async |
+## 8. Academic References / 学术参考
+1. **Bhuiyan, M. A. E., et al.** (2020). *Improving satellite-based precipitation estimates over complex terrain using machine learning algorithms*. **Journal of Hydrology**.
+2. **Maclean, I. M., et al.** (2018). *Microclima: An R package for modelling meso- and microclimate*. **Methods in Ecology and Evolution**.
+3. **Garcez, A. d., & Lamb, L. C.** (2020). *Neurosymbolic AI: The 3rd Wave*. arXiv:2012.05876.
+4. **Luks, A. M., et al.** (2019). *Wilderness Medical Society Practice Guidelines for the Prevention and Treatment of Acute Altitude Illness*.
+5. **Vandal, T., et al.** (2017). *DeepSD: Generating high-resolution climate change projections through single image super-resolution*. **KDD**.
+See `docs/thresholds.md` for the full citation table per Veto threshold.
+## 9. Roadmap
+- [x] Frontend dashboard with XAI inference log
+- [x] SQLite caching with WAL + risk-adaptive TTL
+- [x] Terrain detection engine (Valley / Slope / Flat)
+- [x] Rule-based Veto + 0-100 scoring engine (19/19 unit tests passing)
+- [x] Bilingual (EN/ZH) advice generation
+- [x] Dataset download script (Open-Meteo + Open Topo Data) + offline synthetic fallback
+- [x] Preprocessing pipeline (feature engineering + label `is_rain_event`)
+- [x] Random Forest training with time-based CV — **trained on real ERA5 data, test AUC = 0.871**
+- [ ] Model comparison (RFC vs LogReg vs XGBoost) — thesis Chapter 5
+- [ ] Hindcast validation against real Malaysian flood events
+- [ ] PWA offline mode for low-network mountain use
+## 10. License
+MIT — see `LICENSE`.
+---
+*Developed by L.ZH @ Universiti Kebangsaan Malaysia (UKM) for the Final Year Project (FYP).*

backend/__init__.py ADDED Viewed

	@@ -0,0 +1,3 @@


1	+ """MicroClimate-X backend package."""
2	+
3	+ __version__ = "0.1.0"

backend/cache.py ADDED Viewed

	@@ -0,0 +1,190 @@

+"""
+SQLite-backed grid cache with risk-adaptive TTL.
+Design notes
+------------
+* WAL journal mode lets concurrent reads proceed during writes — critical
+  for FastAPI's async I/O. Default rollback-journal mode would serialise
+  every reader behind a writer.
+* All blocking sqlite3 calls are wrapped in `asyncio.to_thread` so they
+  never stall the event loop.
+* Cache key quantises (lat, lon) to a fixed grid resolution (~1.1 km).
+  Without quantisation, floating-point jitter destroys hit rate.
+"""
+from __future__ import annotations
+import asyncio
+import json
+import sqlite3
+import time
+from pathlib import Path
+from typing import Any
+from . import config
+_INIT_SQL = """
+CREATE TABLE IF NOT EXISTS grid_cache (
+    grid_key   TEXT PRIMARY KEY,
+    payload    TEXT NOT NULL,
+    expires_at INTEGER NOT NULL
+);
+CREATE INDEX IF NOT EXISTS idx_expires ON grid_cache(expires_at);
+CREATE TABLE IF NOT EXISTS inference_log (
+    id        INTEGER PRIMARY KEY AUTOINCREMENT,
+    ts        INTEGER NOT NULL,
+    lat       REAL NOT NULL,
+    lon       REAL NOT NULL,
+    risk      INTEGER NOT NULL,
+    veto      INTEGER NOT NULL,
+    summary   TEXT NOT NULL
+);
+CREATE INDEX IF NOT EXISTS idx_log_ts ON inference_log(ts);
+"""
+# Inference-log retention — older rows are pruned on startup.
+INFERENCE_LOG_RETENTION_DAYS = 7
+def _grid_key(lat: float, lon: float, activity: str = "general") -> str:
+    res = config.GRID_RESOLUTION_DEG
+    return f"{round(lat / res)}:{round(lon / res)}:{activity}"
+def _connect(db_path: Path) -> sqlite3.Connection:
+    conn = sqlite3.connect(db_path, timeout=5.0, isolation_level=None)
+    conn.execute("PRAGMA journal_mode=WAL;")
+    conn.execute("PRAGMA synchronous=NORMAL;")
+    conn.execute("PRAGMA busy_timeout=5000;")
+    return conn
+def _init_blocking(db_path: Path) -> None:
+    conn = _connect(db_path)
+    try:
+        conn.executescript(_INIT_SQL)
+    finally:
+        conn.close()
+async def init_db(db_path: Path = config.DB_PATH) -> None:
+    """Create tables and switch to WAL. Idempotent."""
+    await asyncio.to_thread(_init_blocking, db_path)
+def _get_blocking(db_path: Path, key: str) -> tuple[dict[str, Any], int] | None:
+    conn = _connect(db_path)
+    try:
+        row = conn.execute(
+            "SELECT payload, expires_at FROM grid_cache WHERE grid_key=?",
+            (key,),
+        ).fetchone()
+        if row is None:
+            return None
+        payload, expires_at = row
+        if expires_at <= int(time.time()):
+            return None
+        ttl_remaining = expires_at - int(time.time())
+        return json.loads(payload), ttl_remaining
+    finally:
+        conn.close()
+async def get(lat: float, lon: float, *, activity: str = "general") -> tuple[dict[str, Any], int] | None:
+    return await asyncio.to_thread(_get_blocking, config.DB_PATH, _grid_key(lat, lon, activity))
+def _set_blocking(db_path: Path, key: str, payload: dict[str, Any], ttl_sec: int) -> None:
+    conn = _connect(db_path)
+    try:
+        conn.execute(
+            "INSERT OR REPLACE INTO grid_cache(grid_key, payload, expires_at) "
+            "VALUES (?, ?, ?)",
+            (key, json.dumps(payload), int(time.time()) + ttl_sec),
+        )
+    finally:
+        conn.close()
+async def set(lat: float, lon: float, payload: dict[str, Any], ttl_sec: int,
+              *, activity: str = "general") -> None:
+    await asyncio.to_thread(_set_blocking, config.DB_PATH, _grid_key(lat, lon, activity),
+                            payload, ttl_sec)
+def adaptive_ttl(risk_score: int, has_veto: bool) -> int:
+    """Higher risk → shorter TTL. We must not serve stale 'Safe' results
+    while severe weather is developing."""
+    if has_veto or risk_score >= 70:
+        return config.TTL_HIGH_RISK_SEC
+    if risk_score >= 40:
+        return config.TTL_MID_RISK_SEC
+    return config.TTL_LOW_RISK_SEC
+def _log_blocking(db_path: Path, lat: float, lon: float, risk: int,
+                  veto: bool, summary: str) -> None:
+    conn = _connect(db_path)
+    try:
+        conn.execute(
+            "INSERT INTO inference_log(ts, lat, lon, risk, veto, summary) "
+            "VALUES (?, ?, ?, ?, ?, ?)",
+            (int(time.time()), lat, lon, risk, int(veto), summary),
+        )
+    finally:
+        conn.close()
+async def log_inference(lat: float, lon: float, risk: int,
+                        veto: bool, summary: str) -> None:
+    await asyncio.to_thread(_log_blocking, config.DB_PATH, lat, lon,
+                            risk, veto, summary)
+# ──────────────────────────────────────────────────────────────────────────
+# GC / introspection
+# ──────────────────────────────────────────────────────────────────────────
+def _prune_blocking(db_path: Path) -> int:
+    """Delete expired cache rows + old inference_log rows. Returns total deleted."""
+    now = int(time.time())
+    log_cutoff = now - INFERENCE_LOG_RETENTION_DAYS * 86_400
+    conn = _connect(db_path)
+    try:
+        c1 = conn.execute("DELETE FROM grid_cache WHERE expires_at <= ?", (now,)).rowcount
+        c2 = conn.execute("DELETE FROM inference_log WHERE ts < ?",       (log_cutoff,)).rowcount
+        return int(c1 or 0) + int(c2 or 0)
+    finally:
+        conn.close()
+async def prune_expired(db_path: Path = config.DB_PATH) -> int:
+    """Run cache GC. Returns number of rows removed across both tables."""
+    return await asyncio.to_thread(_prune_blocking, db_path)
+def _stats_blocking(db_path: Path) -> dict[str, Any]:
+    now = int(time.time())
+    conn = _connect(db_path)
+    try:
+        total  = conn.execute("SELECT COUNT(*) FROM grid_cache").fetchone()[0]
+        live   = conn.execute(
+            "SELECT COUNT(*) FROM grid_cache WHERE expires_at > ?",
+            (now,),
+        ).fetchone()[0]
+        logged = conn.execute("SELECT COUNT(*) FROM inference_log").fetchone()[0]
+        page_size = conn.execute("PRAGMA page_size").fetchone()[0]
+        page_count = conn.execute("PRAGMA page_count").fetchone()[0]
+        return {
+            "rows_total":        int(total),
+            "rows_live":         int(live),
+            "rows_expired":      int(total) - int(live),
+            "inference_log_rows": int(logged),
+            "db_bytes":           int(page_size) * int(page_count),
+        }
+    finally:
+        conn.close()
+async def cache_stats(db_path: Path = config.DB_PATH) -> dict[str, Any]:
+    return await asyncio.to_thread(_stats_blocking, db_path)

backend/config.py ADDED Viewed

	@@ -0,0 +1,208 @@

+"""
+Central configuration for MicroClimate-X.
+EVERY Veto threshold below has an academic / regulatory citation.
+This is intentional — at thesis defence the panel WILL ask
+"why 3500 m, why -5 °C, why 40 km/h?". Be ready to point to this file.
+"""
+from __future__ import annotations
+import os
+import subprocess
+from pathlib import Path
+ROOT = Path(__file__).resolve().parent.parent
+MODEL_DIR = ROOT / "models"
+DATA_DIR  = ROOT / "data"
+DB_PATH   = Path(os.environ.get("MICROCLIMATEX_DB", str(ROOT / "cache.sqlite3")))
+def _detect_git_revision() -> str:
+    """Best-effort short SHA. Returns "unknown" if git is not available
+    or this directory isn't a checkout (e.g. inside a Docker image)."""
+    env = os.environ.get("MICROCLIMATEX_GIT_REV")
+    if env:
+        return env
+    try:
+        out = subprocess.run(
+            ["git", "rev-parse", "--short", "HEAD"],
+            cwd=ROOT, capture_output=True, text=True, timeout=2.0,
+        )
+        if out.returncode == 0:
+            return out.stdout.strip()
+    except (FileNotFoundError, subprocess.SubprocessError):    # pragma: no cover
+        pass
+    return "unknown"
+GIT_REVISION = _detect_git_revision()
+# ──────────────────────────────────────────────────────────────────────────
+# Veto thresholds — one-vote rejection rules
+# ──────────────────────────────────────────────────────────────────────────
+# Citation: Luks et al. (2019) "Wilderness Medical Society Practice
+#           Guidelines for the Prevention and Treatment of Acute Altitude
+#           Illness." High altitude (>2500 m) carries clinical risk; severe
+#           hypoxia onset is well-documented above ~3500 m.
+ALTITUDE_HYPOXIA_M = 3500.0
+# Citation: WMO Beaufort scale — Force 6 "Strong breeze" ≈ 39-49 km/h,
+#           the threshold above which outdoor activity becomes hazardous.
+GALE_WIND_KMH = 40.0
+# Citation: UIAA Medical Commission frostbite risk guidance — exposed skin
+#           freezes rapidly below approximately -5 °C with wind chill.
+EXTREME_COLD_C = -5.0
+# Citation: U.S. NWS convective forecasting handbook — CAPE > 1000 J/kg
+#           indicates moderate-to-strong instability suitable for
+#           thunderstorm development.
+HIGH_CAPE_JKG = 1000.0
+# Citation: FAA AIM 7-1-12 — visibility below 100 m is classified as
+#           Category III instrument-only conditions. Used here as an extreme
+#           low-visibility threshold (whiteout / dense fog).
+LOW_VISIBILITY_M = 100.0
+# Wind alignment with slope normal vector (orographic uplift). The
+# threshold 0.7 corresponds to ~45 degrees of slope-facing wind.
+OROGRAPHIC_DOT_THRESHOLD = 0.7
+# Wet-flood trigger in a valley basin: high probability of localised rain
+# combined with valley-floor topography.
+VALLEY_FLOOD_PROB = 0.80
+# ──────────────────────────────────────────────────────────────────────────
+# Risk scoring (additive penalties when no Veto fires)
+# ──────────────────────────────────────────────────────────────────────────
+PENALTY = {
+    "ml_high_rain_prob": 35,   # ML predicts >= 70 % rain probability
+    "ml_mid_rain_prob":  15,   # ML predicts 40-70 % rain probability
+    "valley_floor":      10,
+    "windward_slope":    20,
+    "orographic_lift":   25,
+    "altitude_high":     15,   # 2500-3500 m, sub-Veto altitude band
+    "wind_strong":       10,   # 25-40 km/h
+}
+# ──────────────────────────────────────────────────────────────────────────
+# Four hazard categories — matches D5 proposal §3.7 / P4.3
+# ──────────────────────────────────────────────────────────────────────────
+# Fog risk:
+#   WMO surface synoptic code: fog ≈ visibility < 1 km, RH typically > 95 %,
+#   dew-point depression < ~2 °C. Valley/Slope basins trap radiation fog.
+FOG_HUMIDITY_PCT      = 95.0
+FOG_DEW_DEP_MAX_C     = 2.0
+FOG_CLOUD_BASE_MAX_M  = 800.0    # from D5 §3.7.2 decision table
+# Wind gust risk:
+#   On exposed ridges and mountain passes, sustained 25 km/h winds with
+#   topographic acceleration commonly gust to Beaufort F6 levels.
+GUST_WIND_MIN_KMH     = 25.0     # below GALE_WIND_KMH but still risky
+# Thunderstorm risk:
+#   NWS "moderate instability" begins at CAPE 500 J/kg; sharp pressure drop
+#   often precedes convective initiation.
+THUNDER_CAPE_MIN_JKG  = 500.0
+THUNDER_PRESSURE_DROP = -2.0     # hPa over past 3 h (matches D5 §1.3 example)
+# ──────────────────────────────────────────────────────────────────────────
+# Decision Table — D5 §3.7.2 / Table 4.2  (one-to-one with the thesis)
+# ──────────────────────────────────────────────────────────────────────────
+# Each rule fires when ALL of its non-None conditions hold. The thesis
+# narrative motivates this table as: "macro forecast says no rain, but
+# the local terrain conditions imply hidden risk".
+DECISION_TABLE_3_7_2 = {
+    "R1": {
+        "description":            "Hidden rain risk — macro says no, terrain says yes",
+        "macro_rain_prob_max":    0.30,
+        "macro_rain_prob_min":    None,
+        "humidity_min_pct":       85.0,
+        "wind_into_slope":        True,
+        "terrain":                "WindwardSlope",
+        "pressure_change_3h_max": -1.5,
+        "cloud_base_max_m":       FOG_CLOUD_BASE_MAX_M,
+        "conclusion_en":          "Hidden rain risk: terrain analysis indicates orographic precipitation despite low macro probability.",
+        "conclusion_zh":          "隐藏降雨风险：宏观预报概率低，但地形分析表明存在地形抬升降水。",
+    },
+    "R2": {
+        "description":            "No significant risk — terrain not aligned",
+        "macro_rain_prob_max":    0.30,
+        "macro_rain_prob_min":    None,
+        "humidity_min_pct":       85.0,
+        "wind_into_slope":        False,
+        "terrain":                "LeewardOrValley",
+        "pressure_change_3h_max": -1.5,
+        "cloud_base_max_m":       FOG_CLOUD_BASE_MAX_M,
+        "conclusion_en":          "No significant rainfall danger at this spot in this period.",
+        "conclusion_zh":          "此地此时无显著降雨危险。",
+    },
+    "R3": {
+        "description":            "Heavy downpour incoming — avoid exposure",
+        "macro_rain_prob_max":    None,
+        "macro_rain_prob_min":    0.70,
+        "humidity_min_pct":       None,
+        "wind_into_slope":        True,
+        "terrain":                "WindwardSlope",
+        "pressure_change_3h_max": None,
+        "cloud_base_max_m":       None,
+        "conclusion_en":          "Heavy downpour incoming. Avoid mountains and valleys.",
+        "conclusion_zh":          "强降雨即将到来。请避开山区与峡谷。",
+    },
+    "R4": {
+        "description":            "Normal rain — no terrain amplification",
+        "macro_rain_prob_max":    None,
+        "macro_rain_prob_min":    0.70,
+        "humidity_min_pct":       None,
+        "wind_into_slope":        None,
+        "terrain":                None,
+        "pressure_change_3h_max": None,
+        "cloud_base_max_m":       None,
+        "conclusion_en":          "Rain expected, but no terrain-induced amplification. Standard rain precautions apply.",
+        "conclusion_zh":          "预计有雨，但无地形抬升放大。按一般雨天措施应对即可。",
+    },
+}
+# ──────────────────────────────────────────────────────────────────────────
+# Activity-aware weighting — D5 §3.7 / P4.4
+# ──────────────────────────────────────────────────────────────────────────
+# Composite = Σ w_i · subscore_i, then renormalised to 0-100.
+# Rows: activity. Cols: rainfall, fog, wind_gust, thunderstorm.
+ACTIVITY_WEIGHTS = {
+    "hiker":        {"rainfall": 1.0, "fog": 1.3, "wind_gust": 1.0, "thunderstorm": 1.4},
+    "driver":       {"rainfall": 0.8, "fog": 1.5, "wind_gust": 1.3, "thunderstorm": 0.9},
+    "construction": {"rainfall": 1.0, "fog": 0.8, "wind_gust": 1.5, "thunderstorm": 1.4},
+    "general":      {"rainfall": 1.0, "fog": 1.0, "wind_gust": 1.0, "thunderstorm": 1.0},
+}
+# ──────────────────────────────────────────────────────────────────────────
+# Cache TTL (risk-adaptive)
+# ──────────────────────────────────────────────────────────────────────────
+# Safety-critical apps must not serve stale "Safe" verdicts during developing
+# storms. Bucket TTL by risk band.
+TTL_HIGH_RISK_SEC = 60      # any Veto fired OR risk >= 70
+TTL_MID_RISK_SEC  = 300     # risk 40-69 (40 <= risk < 70)
+TTL_LOW_RISK_SEC  = 600     # risk < 40
+# Grid resolution used as cache key (0.01° ≈ 1.1 km at the equator).
+GRID_RESOLUTION_DEG = 0.01
+# ──────────────────────────────────────────────────────────────────────────
+# External API endpoints
+# ──────────────────────────────────────────────────────────────────────────
+OPEN_METEO_FORECAST_URL = "https://api.open-meteo.com/v1/forecast"
+OPEN_TOPO_URL           = "https://api.opentopodata.org/v1/srtm30m"
+# ──────────────────────────────────────────────────────────────────────────
+# Domain constants
+# ──────────────────────────────────────────────────────────────────────────
+# WMO definition of trace precipitation.
+RAIN_THRESHOLD_MM = 0.1

backend/errors.py ADDED Viewed

	@@ -0,0 +1,26 @@

+"""
+Centralised error contract.
+Every non-2xx response from the API has the same JSON shape so a
+client (Vue SPA, curl, Postman, future mobile app) can rely on it.
+"""
+from __future__ import annotations
+from typing import Any
+from pydantic import BaseModel
+# Shared JSON body for API error responses. `request_id` and `context` are
+# optional and default to None. Documented with `#` comments rather than a
+# docstring so the generated schema description is left untouched.
+class ErrorResponse(BaseModel):
+    error:      str          # short, stable identifier (snake_case)
+    detail:     str          # human readable
+    request_id: str | None = None   # correlation ID of the failing request, when known
+    context:    dict[str, Any] | None = None   # optional structured extras (e.g. validation errors)
+# Canonical error identifiers — used as the `error` field. Adding new ones
+# requires updating the OpenAPI docstring on the predict() endpoint too.
+ERR_UPSTREAM_FAILURE = "upstream_failure"
+ERR_INVALID_INPUT    = "invalid_input"
+ERR_MODEL_ERROR      = "model_error"
+ERR_INTERNAL         = "internal_error"

backend/main.py ADDED Viewed

	@@ -0,0 +1,455 @@

+"""
+FastAPI entry point for MicroClimate-X.
+Endpoints
+---------
+GET  /                 — name / version / banner
+GET  /api/predict      — main prediction endpoint (?lat=&lon=&activity=)
+GET  /api/health       — JSON health + cache stats + DB latency
+GET  /api/version      — version metadata for clients
+Lifespan
+--------
+* On startup: WAL-mode SQLite init, prune expired cache rows, load ML model.
+* On shutdown: dispose of the shared httpx.AsyncClient.
+Resilience
+----------
+* `RequestIDMiddleware` stamps every request with `X-Request-ID` for log
+  correlation (taken from incoming header if present, otherwise generated).
+* All exceptions surface as an `errors.ErrorResponse` JSON document — no
+  bare 500 HTML responses leak.
+"""
+from __future__ import annotations
+import asyncio
+import datetime as _dt
+import logging
+import math
+import time
+import uuid
+from contextlib import asynccontextmanager
+from typing import Any
+import httpx
+from fastapi import FastAPI, HTTPException, Query, Request
+from fastapi.exceptions import RequestValidationError
+from fastapi.middleware.cors import CORSMiddleware
+from fastapi.responses import JSONResponse
+from fastapi.staticfiles import StaticFiles
+from starlette.middleware.base import BaseHTTPMiddleware
+from tenacity import RetryError, retry, stop_after_attempt, wait_exponential
+from . import cache, config, rule_engine, terrain
+from .errors import (
+    ERR_INTERNAL,
+    ERR_INVALID_INPUT,
+    ERR_UPSTREAM_FAILURE,
+    ErrorResponse,
+)
+from .ml_engine import MLEngine
+from .schemas import ActivityType, PredictionResponse
+__version__ = "1.0.0"
+# ──────────────────────────────────────────────────────────────────────────
+# Logging — structured records: ts | level | request_id | message
+# ──────────────────────────────────────────────────────────────────────────
+class _RequestIDFilter(logging.Filter):
+    def filter(self, record: logging.LogRecord) -> bool:
+        if not hasattr(record, "request_id"):
+            record.request_id = "-"
+        return True
+_handler = logging.StreamHandler()
+_handler.setFormatter(logging.Formatter(
+    "%(asctime)s | %(levelname)-7s | %(request_id)s | %(name)s | %(message)s",
+    datefmt="%Y-%m-%dT%H:%M:%S",
+))
+_handler.addFilter(_RequestIDFilter())
+logging.basicConfig(level=logging.INFO, handlers=[_handler], force=True)
+log = logging.getLogger("microclimate-x")
+# ──────────────────────────────────────────────────────────────────────────
+# Lifespan: model + DB + HTTP client
+# ──────────────────────────────────────────────────────────────────────────
+@asynccontextmanager
+async def lifespan(app: FastAPI):
+    """Application lifespan: prepare shared resources, yield, then clean up.
+    Startup: initialise the SQLite cache, run cache GC, load the ML engine and
+    create the shared ``httpx.AsyncClient``. The engine, client and start
+    timestamp are stored on ``app.state`` for the request handlers.
+    Shutdown: close the shared HTTP client.
+    """
+    log.info("Starting MicroClimate-X backend (v%s)…", __version__)
+    # The schema must exist before the GC pass touches the tables.
+    await cache.init_db()
+    pruned = await cache.prune_expired()
+    if pruned:
+        # NOTE: the count also includes pruned inference_log rows.
+        log.info("Cache GC removed %d expired rows on startup.", pruned)
+    engine = MLEngine()
+    engine.load()
+    if engine.is_loaded:
+        log.info("ML model loaded from %s", engine.loaded_from)
+    else:
+        # Not fatal: the app still starts, only a warning is logged.
+        log.warning(
+            "No trained model found — falling back to heuristic predictor. "
+            "Run scripts/3_train_model.py to enable Random Forest."
+        )
+    app.state.ml = engine
+    # One client for the whole process; closed in the `finally` below.
+    app.state.http = httpx.AsyncClient(timeout=15.0, http2=False)
+    app.state.start_ts = time.time()
+    try:
+        yield
+    finally:
+        await app.state.http.aclose()
+        log.info("Shutdown complete.")
+app = FastAPI(
+    title="MicroClimate-X API",
+    version=__version__,
+    description=(
+        "Hybrid microclimate risk assessment for complex terrain. "
+        "Combines a Random Forest macro-rain predictor with a topographic "
+        "rule-based expert system (Veto cascade + R1-R4 decision table "
+        "+ activity-aware composite). "
+        "Implements proposal §3.7 — sub-process P4.1 through P4.6."
+    ),
+    lifespan=lifespan,
+)
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_methods=["GET"],
+    allow_headers=["*"],
+    expose_headers=["X-Request-ID", "X-Response-Time-ms"],
+)
+# ──────────────────────────────────────────────────────────────────────────
+# Request-ID + timing middleware
+# ──────────────────────────────────────────────────────────────────────────
+class RequestIDMiddleware(BaseHTTPMiddleware):
+    """Tag every request with `X-Request-ID` and measure latency.
+    The ID propagates from incoming headers (so a load-balancer / front-end
+    can supply one) and falls back to a new UUID4 prefix.
+    """
+    async def dispatch(self, request: Request, call_next):
+        req_id = request.headers.get("x-request-id") or uuid.uuid4().hex[:12]
+        # Stash on request state so handlers can read it.
+        request.state.request_id = req_id
+        start = time.perf_counter()
+        try:
+            response = await call_next(request)
+        except Exception:                                    # pragma: no cover
+            elapsed_ms = int((time.perf_counter() - start) * 1000)
+            log.exception(
+                "unhandled exception",
+                extra={"request_id": req_id, "path": request.url.path,
+                        "elapsed_ms": elapsed_ms},
+            )
+            return _json_error(
+                req_id, 500, ERR_INTERNAL,
+                "Internal server error — please retry.",
+            )
+        elapsed_ms = int((time.perf_counter() - start) * 1000)
+        response.headers["X-Request-ID"]       = req_id
+        response.headers["X-Response-Time-ms"] = str(elapsed_ms)
+        # Only log non-static-asset, non-OPTIONS for noise control.
+        if request.url.path.startswith("/api/") or request.url.path in {"/"}:
+            log.info(
+                "%s %s -> %d (%d ms)",
+                request.method, request.url.path, response.status_code, elapsed_ms,
+                extra={"request_id": req_id},
+            )
+        return response
+app.add_middleware(RequestIDMiddleware)
+# ──────────────────────────────────────────────────────────────────────────
+# Exception handlers — every error follows the ErrorResponse schema
+# ──────────────────────────────────────────────────────────────────────────
+def _json_error(req_id: str | None, status: int, code: str, detail: str,
+                ctx: dict[str, Any] | None = None) -> JSONResponse:
+    payload = ErrorResponse(error=code, detail=detail, request_id=req_id, context=ctx)
+    return JSONResponse(status_code=status, content=payload.model_dump(exclude_none=True))
+@app.exception_handler(RequestValidationError)
+async def _on_validation_error(request: Request, exc: RequestValidationError):
+    req_id = getattr(request.state, "request_id", None)
+    return _json_error(
+        req_id, 422, ERR_INVALID_INPUT,
+        "One or more query parameters failed validation.",
+        ctx={"errors": exc.errors()[:5]},
+    )
+@app.exception_handler(HTTPException)
+async def _on_http_exception(request: Request, exc: HTTPException):
+    req_id = getattr(request.state, "request_id", None)
+    code = (
+        ERR_UPSTREAM_FAILURE if exc.status_code in {502, 503, 504}
+        else ERR_INVALID_INPUT if exc.status_code in {400, 422}
+        else ERR_INTERNAL
+    )
+    return _json_error(req_id, exc.status_code, code, str(exc.detail))
+@app.exception_handler(Exception)
+async def _on_unhandled(request: Request, exc: Exception):     # pragma: no cover
+    req_id = getattr(request.state, "request_id", None)
+    log.exception("unhandled top-level exception",
+                  extra={"request_id": req_id or "-"})
+    return _json_error(
+        req_id, 500, ERR_INTERNAL,
+        "Internal server error — please retry. If the problem persists, file an issue.",
+    )
+# ──────────────────────────────────────────────────────────────────────────
+# Frontend static files (optional — only if /frontend exists alongside backend)
+# ──────────────────────────────────────────────────────────────────────────
+FRONTEND_DIR = config.ROOT / "frontend"
+if FRONTEND_DIR.exists():
+    app.mount("/app", StaticFiles(directory=FRONTEND_DIR, html=True), name="frontend")
+# ──────────────────────────────────────────────────────────────────────────
+# Health & version & root
+# ──────────────────────────────────────────────────────────────────────────
+@app.get("/")
+async def root() -> dict[str, Any]:
+    return {
+        "name":         "MicroClimate-X",
+        "version":      __version__,
+        "ml_loaded":    app.state.ml.is_loaded,
+        "frontend_url": "/app/",
+        "docs_url":     "/docs",
+        "openapi_url":  "/openapi.json",
+    }
+@app.get("/api/version")
+async def version() -> dict[str, Any]:
+    return {
+        "version":        __version__,
+        "git_revision":   config.GIT_REVISION,
+        "ml_loaded":      app.state.ml.is_loaded,
+        "ml_loaded_from": app.state.ml.loaded_from,
+        "ml_features":    [*app.state.ml.feature_columns[:5], "…"]
+                          if len(app.state.ml.feature_columns) > 5
+                          else app.state.ml.feature_columns,
+    }
+@app.get("/api/health")
+async def health() -> dict[str, Any]:
+    stats = await cache.cache_stats()
+    return {
+        "status":          "ok",
+        "uptime_sec":      int(time.time() - app.state.start_ts),
+        "ml_loaded":       app.state.ml.is_loaded,
+        "cache":           stats,
+        "db_path":         str(config.DB_PATH),
+        "version":         __version__,
+    }
+# ──────────────────────────────────────────────────────────────────────────
+# External fetching helpers
+# ──────────────────────────────────────────────────────────────────────────
+@retry(stop=stop_after_attempt(3), wait=wait_exponential(min=1, max=8))
+async def _fetch_current_weather(client: httpx.AsyncClient, lat: float, lon: float) -> dict[str, Any]:
+    resp = await client.get(
+        config.OPEN_METEO_FORECAST_URL,
+        params={
+            "latitude":  lat,
+            "longitude": lon,
+            "current":   ",".join([
+                "temperature_2m", "relative_humidity_2m", "precipitation",
+                "wind_speed_10m", "wind_direction_10m", "surface_pressure",
+                "dew_point_2m", "cloud_cover", "cape", "visibility",
+            ]),
+            "windspeed_unit": "kmh",
+            "timezone": "auto",
+        },
+        timeout=15.0,
+    )
+    resp.raise_for_status()
+    raw = resp.json().get("current", {})
+    return {
+        "temperature_c":         raw.get("temperature_2m"),
+        "humidity_pct":          raw.get("relative_humidity_2m"),
+        "precipitation_mm":      raw.get("precipitation", 0.0),
+        "wind_speed_kmh":        raw.get("wind_speed_10m", 0.0),
+        "wind_direction_deg":    raw.get("wind_direction_10m", 0.0),
+        "pressure_hpa":          raw.get("surface_pressure"),
+        "dew_point_c":           raw.get("dew_point_2m"),
+        "cloud_cover_pct":       raw.get("cloud_cover", 0.0),
+        "cape_jkg":              raw.get("cape", 0.0),
+        "visibility_m":          raw.get("visibility", 10000.0),
+    }
+# ──────────────────────────────────────────────────────────────────────────
+# Main endpoint
+# ──────────────────────────────────────────────────────────────────────────
+# GET /api/predict — one hybrid (ML + rule engine) risk assessment per
+# (lat, lon, activity).
+# Pipeline: cache lookup → concurrent DEM + weather fetch → terrain
+# classification → ML rain probability → rule engine → response assembly →
+# background cache write and audit log.
+@app.get(
+    "/api/predict",
+    response_model=PredictionResponse,
+    responses={
+        422: {"model": ErrorResponse, "description": "Invalid query parameters."},
+        502: {"model": ErrorResponse, "description": "Upstream weather/DEM service failed."},
+        500: {"model": ErrorResponse, "description": "Unexpected server error."},
+    },
+)
+async def predict(
+    request: Request,
+    lat: float = Query(..., ge=-90.0,  le=90.0,  description="Latitude (WGS84)"),
+    lon: float = Query(..., ge=-180.0, le=180.0, description="Longitude (WGS84)"),
+    activity: ActivityType = Query(
+        "general",
+        description="User activity context — affects composite score weighting (D5 §3.7 / P4.4).",
+    ),
+) -> PredictionResponse:
+    # Falls back to "-" when request.state carries no request_id
+    # (presumably set by a middleware — not visible in this handler).
+    req_id = getattr(request.state, "request_id", "-")
+    # ── Cache lookup first (per-coordinate + per-activity) ──
+    hit = await cache.get(lat, lon, activity=activity)
+    if hit is not None:
+        # A hit is a (payload dict, remaining TTL) pair; the payload is stamped
+        # as cached and returned without touching upstream services.
+        # NOTE(review): this mutates the dict handed out by cache.get in place —
+        # confirm the cache returns a private copy.
+        payload, ttl_remaining = hit
+        payload["cached"] = True
+        payload["cache_ttl"] = ttl_remaining
+        log.info("cache hit (ttl_remaining=%ds)", ttl_remaining, extra={"request_id": req_id})
+        return PredictionResponse(**payload)
+    client: httpx.AsyncClient = app.state.http
+    # ── Fetch DEM (terrain) and weather in parallel ──
+    try:
+        dem9, weather = await asyncio.gather(
+            terrain.fetch_dem_3x3(lat, lon, client),
+            _fetch_current_weather(client, lat, lon),
+        )
+    except (httpx.HTTPError, RetryError, ValueError) as exc:
+        # Only the exception class name is logged and returned to the client;
+        # the exception message itself is not exposed.
+        log.warning(
+            "upstream API failure: %s",
+            type(exc).__name__,
+            extra={"request_id": req_id},
+        )
+        raise HTTPException(
+            status_code=502,
+            detail=f"Upstream weather/DEM service unavailable ({type(exc).__name__}). "
+                   f"Please retry shortly.",
+        ) from exc
+    tinfo = terrain.classify_terrain(dem9)
+    # The orographic term is only computed for "Slope" terrain; every other
+    # terrain class uses 0.0.
+    orographic_dot = (
+        terrain.orographic_lift_dot(
+            weather.get("wind_direction_deg", 0.0),
+            tinfo.aspect_deg,
+            tinfo.slope_deg,
+        )
+        if tinfo.terrain == "Slope" else 0.0
+    )
+    # ── Build ML feature dict ──
+    feats = _build_ml_features(weather, tinfo.elevation_m)
+    try:
+        ml_prob = app.state.ml.predict_rain_probability(feats)
+    except Exception as exc:                                  # pragma: no cover
+        # Any inference exception becomes a 500.
+        # NOTE(review): the detail embeds repr(exc), which is sent to the client.
+        log.exception("ML inference failed", extra={"request_id": req_id})
+        raise HTTPException(
+            status_code=500,
+            detail=f"Model inference failed: {exc!r}",
+        ) from exc
+    # ── Apply Rule Engine ──
+    rule_result = rule_engine.evaluate(
+        lat=lat,
+        lon=lon,
+        elevation_m=tinfo.elevation_m,
+        terrain=tinfo.terrain,
+        weather=weather,
+        ml_rain_prob=ml_prob,
+        slope_deg=tinfo.slope_deg,
+        aspect_deg=tinfo.aspect_deg,
+        orographic_dot=orographic_dot,
+        activity=activity,
+    )
+    # ── Assemble response ──
+    # The cache lifetime is derived from the final score and the veto flag.
+    ttl = cache.adaptive_ttl(rule_result.risk_score, rule_result.has_veto)
+    response = PredictionResponse(
+        latitude=lat,
+        longitude=lon,
+        elevation_m=tinfo.elevation_m,
+        terrain=tinfo.terrain,
+        ml_rain_probability=ml_prob,
+        hazard_subscores=rule_result.hazard_subscores,
+        decision_table_matches=rule_result.decision_table_matches,
+        activity=rule_result.activity,
+        risk_score=rule_result.risk_score,
+        risk_level=rule_result.risk_level,
+        veto_triggers=rule_result.veto_triggers,
+        inference_log=rule_result.inference_log,
+        advice_en=rule_result.advice_en,
+        advice_zh=rule_result.advice_zh,
+        cached=False,
+        cache_ttl=ttl,
+    )
+    # ── Cache + audit-log (fire-and-forget — never blocks the response) ──
+    payload_dump = response.model_dump(mode="json")
+    # Each task is parked in a set on app.state so a reference to it stays alive
+    # until it finishes; the done-callback removes it again.
+    # NOTE(review): `or set()` also swaps an existing *empty* set for a new one —
+    # harmless, but confirm that is intended.
+    _bg_tasks: set[asyncio.Task[Any]] = getattr(request.app.state, "bg_tasks", None) or set()
+    request.app.state.bg_tasks = _bg_tasks
+    for coro in (
+        cache.set(lat, lon, payload_dump, ttl, activity=activity),
+        cache.log_inference(
+            lat, lon, rule_result.risk_score, rule_result.has_veto,
+            rule_result.advice_en,
+        ),
+    ):
+        task = asyncio.create_task(coro)
+        _bg_tasks.add(task)
+        task.add_done_callback(_bg_tasks.discard)
+    return response
+# ──────────────────────────────────────────────────────────────────────────
+# Helpers
+# ──────────────────────────────────────────────────────────────────────────
+def _build_ml_features(weather: dict[str, Any], elevation_m: float) -> dict[str, float]:
+    """Mirror of `scripts/2_preprocess.py` — keep features in sync with training."""
+    now = _dt.datetime.now()
+    feats = dict(weather)
+    feats["elevation_m"] = elevation_m
+    wind_kmh = weather.get("wind_speed_kmh", 0.0) or 0.0
+    wind_dir = weather.get("wind_direction_deg", 0.0) or 0.0
+    feats["wind_u"]    = wind_kmh * math.sin(math.radians(wind_dir))
+    feats["wind_v"]    = wind_kmh * math.cos(math.radians(wind_dir))
+    feats["hour_sin"]  = math.sin(2 * math.pi * now.hour  / 24.0)
+    feats["hour_cos"]  = math.cos(2 * math.pi * now.hour  / 24.0)
+    feats["month_sin"] = math.sin(2 * math.pi * now.month / 12.0)
+    feats["month_cos"] = math.cos(2 * math.pi * now.month / 12.0)
+    temp = weather.get("temperature_c") or 25.0
+    dew  = weather.get("dew_point_c")   or temp
+    feats["dew_point_depression"] = temp - dew
+    feats["pressure_change_3h"]   = 0.0     # set by historical training; 0 at inference
+    feats["precipitation_lag_1h"] = weather.get("precipitation_mm", 0.0) or 0.0
+    return feats

backend/ml_engine.py ADDED Viewed

	@@ -0,0 +1,126 @@

+"""
+ML Predictor wrapper.
+The trained Random Forest is loaded ONCE at FastAPI startup (lifespan)
+and held in memory — never reload inside a request handler.
+When the model artefact is missing we fall back to a physically-motivated
+heuristic so the API still runs end-to-end before `scripts/3_train_model.py`
+has been executed. The heuristic deliberately uses the same feature names
+as the trained model so swapping between them is transparent to callers.
+"""
+from __future__ import annotations
+import json
+import logging
+import math
+from pathlib import Path
+from typing import Any
+import joblib
+from . import config
+log = logging.getLogger("microclimate-x.ml")
+class MLEngine:
+    """Thin, defensive wrapper around the joblibbed RandomForestClassifier.
+    Invariant: ``predict_rain_probability`` ALWAYS returns a float in [0, 1].
+    Any internal failure logs and falls through to the heuristic.
+    """
+    def __init__(self) -> None:
+        self.model: Any | None = None
+        self.feature_columns: list[str] = []
+        self.loaded_from: str | None = None
+        self.training_report: dict[str, Any] | None = None
+    # ── Load --------------------------------------------------------
+    def load(self) -> None:
+        model_path    = config.MODEL_DIR / "rf_model.pkl"
+        features_path = config.MODEL_DIR / "feature_columns.json"
+        report_path   = config.MODEL_DIR / "training_report.json"
+        if not (model_path.exists() and features_path.exists()):
+            self.model = None
+            self.loaded_from = None
+            return
+        try:
+            self.model = joblib.load(model_path)
+            self.feature_columns = json.loads(features_path.read_text())
+            self.loaded_from = str(model_path)
+            if report_path.exists():
+                self.training_report = json.loads(report_path.read_text())
+            log.info(
+                "loaded RF model with %d features (%s)",
+                len(self.feature_columns), Path(model_path).name,
+            )
+        except Exception as exc:   # pragma: no cover — defensive
+            log.exception("Failed to load trained model: %s", exc)
+            self.model = None
+            self.loaded_from = None
+    @property
+    def is_loaded(self) -> bool:
+        return self.model is not None
+    # ── Predict -----------------------------------------------------
+    def predict_rain_probability(self, feats: dict[str, float]) -> float:
+        """Return P(rain in next hour) ∈ [0, 1]."""
+        if self.is_loaded:
+            try:
+                X = [[self._safe_feat(feats, col) for col in self.feature_columns]]
+                p = float(self.model.predict_proba(X)[0, 1])
+                return min(1.0, max(0.0, p))
+            except Exception as exc:                          # pragma: no cover
+                log.exception("RF inference failed (%s) — falling back to heuristic.", exc)
+        return self._fallback_heuristic(feats)
+    # ── Helpers -----------------------------------------------------
+    @staticmethod
+    def _safe_feat(feats: dict[str, float], col: str) -> float:
+        v = feats.get(col, 0.0)
+        if v is None:
+            return 0.0
+        try:
+            f = float(v)
+        except (TypeError, ValueError):
+            return 0.0
+        if math.isnan(f) or math.isinf(f):
+            return 0.0
+        return f
+    @staticmethod
+    def _fallback_heuristic(f: dict[str, float]) -> float:
+        """Smooth, physically-motivated proxy used when no trained model
+        exists yet. Uses the same feature inputs as the trained model so the
+        downstream rule engine sees no behaviour change."""
+        humidity = MLEngine._safe_get(f, "humidity_pct", 60.0)
+        dew_dep  = MLEngine._safe_get(f, "dew_point_depression", 5.0)
+        cloud    = MLEngine._safe_get(f, "cloud_cover_pct", 50.0)
+        cape     = MLEngine._safe_get(f, "cape_jkg", 0.0)
+        prev     = MLEngine._safe_get(f, "precipitation_lag_1h", 0.0)
+        pres_dp  = MLEngine._safe_get(f, "pressure_change_3h", 0.0)
+        z = (
+            0.05 * (humidity - 70.0)
+            - 0.22 * dew_dep
+            + 0.02 * (cloud - 50.0)
+            + 0.0015 * cape
+            + 1.50 * (1.0 if prev > 0.1 else 0.0)
+            - 0.30 * pres_dp               # falling pressure → more rain
+        )
+        return 1.0 / (1.0 + math.exp(-z))
+    @staticmethod
+    def _safe_get(d: dict[str, float], k: str, default: float) -> float:
+        v = d.get(k, default)
+        if v is None or (isinstance(v, float) and (math.isnan(v) or math.isinf(v))):
+            return default
+        try:
+            return float(v)
+        except (TypeError, ValueError):
+            return default

backend/rule_engine.py ADDED Viewed

	@@ -0,0 +1,480 @@

+"""
+Topographic Rule-Based Expert System — Engine B of the hybrid architecture.
+This module is structured to mirror D5 proposal §3.7 / P4 so it is auditable
+against the thesis section by section:
+    P4.1  Load Dynamic Risk Rules          → constants in backend/config.py
+    P4.2  Fetch User Context (activity)    → `evaluate(activity=…)` parameter
+    P4.3  Evaluate Environmental Risks     → four `score_*_risk()` functions
+                                              (rainfall / fog / wind_gust / thunderstorm)
+    P4.4  Apply Activity-Specific Weight   → `apply_activity_weighting()`
+    P4.5  Calculate Composite Risk Score   → weighted sum + Veto cap
+    P4.6  Generate Actionable Advice       → bilingual advice helpers
+In parallel, the Veto cascade (life-safety overrides) and the D5 §3.7.2
+Table 4.2 Decision Table run alongside the composite score.
+"""
+from __future__ import annotations
+from dataclasses import dataclass, field
+from typing import Any
+from . import config
+from .schemas import (
+    ActivityType,
+    DecisionTableMatch,
+    HazardSubscores,
+    InferenceStep,
+    RiskLevel,
+    VetoTrigger,
+)
+@dataclass
+class RuleResult:
+    risk_score: int = 0
+    risk_level: RiskLevel = "Safe"
+    veto_triggers:        list[VetoTrigger] = field(default_factory=list)
+    inference_log:        list[InferenceStep] = field(default_factory=list)
+    advice_en: str = ""
+    advice_zh: str = ""
+    hazard_subscores:     HazardSubscores = field(
+        default_factory=lambda: HazardSubscores(rainfall=0, fog=0, wind_gust=0, thunderstorm=0)
+    )
+    decision_table_matches: list[DecisionTableMatch] = field(default_factory=list)
+    activity: ActivityType = "general"
+    @property
+    def has_veto(self) -> bool:
+        return len(self.veto_triggers) > 0
+def _bin_level(score: int) -> RiskLevel:
+    if score >= 80:
+        return "Danger"
+    if score >= 55:
+        return "Warning"
+    if score >= 30:
+        return "Caution"
+    return "Safe"
+def _clip(x: float) -> int:
+    return max(0, min(100, round(x)))
+# ════════════════════════════════════════════════════════════════════════
+# P4.3 — Four Hazard Sub-Scorers (each returns 0-100)
+# ════════════════════════════════════════════════════════════════════════
+def score_rainfall_risk(
+    *, ml_rain_prob: float, terrain: str, orographic_dot: float,
+    pressure_change_3h: float, humidity_pct: float,
+) -> int:
+    """Rainfall sub-score. Backbone is ML probability; terrain amplifies.
+    Calibration: ml_rain_prob 0.45 on flat terrain should yield ~40
+    (matching the proposal's intuition that 45 % probability already warrants
+    a 'Caution' verdict)."""
+    s = ml_rain_prob * 55.0                   # baseline 0-55 from ML
+    if ml_rain_prob >= 0.70:
+        s += 20.0                              # high-confidence rain bonus
+    elif ml_rain_prob >= 0.40:
+        s += 12.0
+    if terrain == "Valley":
+        s += 8.0
+    elif terrain == "Slope":
+        s += orographic_dot * 25.0             # up to +25 on a windward slope
+    if pressure_change_3h <= -1.5:             # storm-precursor pressure fall
+        s += 8.0
+    if humidity_pct >= 90.0:
+        s += 6.0
+    return _clip(s)
+def score_fog_risk(
+    *, humidity_pct: float, dew_point_depression: float,
+    cloud_cover_pct: float, terrain: str, elevation_m: float,
+) -> int:
+    """Fog sub-score. Saturated boundary layer + heavy low cloud + a basin
+    or slope that traps the radiation/advection fog."""
+    if dew_point_depression > 5.0:
+        return _clip(humidity_pct - 80.0)    # near-zero unless very humid
+    s = 0.0
+    # Humidity → saturation contribution.
+    if humidity_pct >= config.FOG_HUMIDITY_PCT:
+        s += 55.0
+    elif humidity_pct >= 90.0:
+        s += 25.0
+    elif humidity_pct >= 85.0:
+        s += 10.0
+    # Dew-point depression: smaller = closer to saturation.
+    if dew_point_depression <= config.FOG_DEW_DEP_MAX_C:
+        s += 25.0
+    elif dew_point_depression <= 3.5:
+        s += 12.0
+    # Low cloud cover suggests a low-lying cloud deck = potential fog when
+    # cloud base meets terrain.
+    if cloud_cover_pct >= 90.0:
+        s += 10.0
+    elif cloud_cover_pct >= 70.0:
+        s += 5.0
+    # Terrain modifier: valleys trap radiation fog; high peaks intersect cloud base.
+    if terrain == "Valley":
+        s += 10.0
+    elif terrain == "Peak" and elevation_m >= 1500.0:
+        s += 8.0
+    return _clip(s)
+def score_wind_gust_risk(
+    *, wind_speed_kmh: float, terrain: str, slope_deg: float,
+    orographic_dot: float,
+) -> int:
+    """Wind gust sub-score. Sustained wind × topographic acceleration."""
+    if wind_speed_kmh < config.GUST_WIND_MIN_KMH * 0.6:
+        # Calm conditions — even ridges won't produce dangerous gusts.
+        return _clip(wind_speed_kmh)
+    # Baseline: linear in sustained wind, saturating at the gale Veto level.
+    s = (wind_speed_kmh / config.GALE_WIND_KMH) * 55.0
+    # Topographic acceleration on ridges and exposed slopes.
+    if terrain in {"Peak", "Slope"}:
+        s += min(slope_deg, 30.0)         # up to +30 for very steep slopes
+    if terrain == "Slope" and abs(orographic_dot) >= 0.5:
+        s += 8.0                            # pass / saddle wind funnel
+    return _clip(s)
+def score_thunderstorm_risk(
+    *, cape_jkg: float, pressure_change_3h: float, humidity_pct: float,
+) -> int:
+    """Thunderstorm sub-score. Atmospheric instability + storm precursors."""
+    s = 0.0
+    # CAPE — primary indicator. Linear up to NWS "strong instability" 2500 J/kg.
+    if cape_jkg >= config.HIGH_CAPE_JKG:
+        s += 60.0
+    elif cape_jkg >= config.THUNDER_CAPE_MIN_JKG:
+        s += 35.0 + (cape_jkg - config.THUNDER_CAPE_MIN_JKG) / 20.0
+    elif cape_jkg >= 200.0:
+        s += 12.0
+    # Falling pressure precedes convective initiation.
+    if pressure_change_3h <= config.THUNDER_PRESSURE_DROP:
+        s += 20.0
+    elif pressure_change_3h <= -1.0:
+        s += 8.0
+    # Humidity gates whether instability can actually produce a thunderstorm.
+    if humidity_pct >= 80.0:
+        s += 10.0
+    return _clip(s)
+# ════════════════════════════════════════════════════════════════════════
+# D5 §3.7.2 / Table 4.2 — Decision Table R1-R4
+# ════════════════════════════════════════════════════════════════════════
+def apply_decision_table_3_7_2(
+    *,
+    macro_rain_prob:    float,
+    humidity_pct:       float,
+    wind_into_slope:    bool,
+    terrain:            str,
+    pressure_change_3h: float,
+    cloud_base_m:       float | None,
+) -> list[DecisionTableMatch]:
+    """Returns the list of decision-table rules (R1-R4) that fired.
+    One-to-one match against D5 §3.7.2 Table 4.2."""
+    terrain_kind = "WindwardSlope" if (terrain == "Slope" and wind_into_slope) else \
+                   "LeewardOrValley" if terrain in {"Valley"} or (terrain == "Slope" and not wind_into_slope) else \
+                   terrain
+    matches: list[DecisionTableMatch] = []
+    for rule_id, rule in config.DECISION_TABLE_3_7_2.items():
+        ok = True
+        if rule["macro_rain_prob_max"] is not None and macro_rain_prob > rule["macro_rain_prob_max"]:
+            ok = False
+        if rule["macro_rain_prob_min"] is not None and macro_rain_prob < rule["macro_rain_prob_min"]:
+            ok = False
+        if rule["humidity_min_pct"] is not None and humidity_pct < rule["humidity_min_pct"]:
+            ok = False
+        if rule["wind_into_slope"] is not None and wind_into_slope != rule["wind_into_slope"]:
+            ok = False
+        if rule["terrain"] is not None and terrain_kind != rule["terrain"]:
+            ok = False
+        if rule["pressure_change_3h_max"] is not None and pressure_change_3h > rule["pressure_change_3h_max"]:
+            ok = False
+        if rule["cloud_base_max_m"] is not None and (cloud_base_m is None or cloud_base_m > rule["cloud_base_max_m"]):
+            ok = False
+        if ok:
+            matches.append(DecisionTableMatch(
+                rule=rule_id,
+                description=rule["description"],
+                conclusion_en=rule["conclusion_en"],
+                conclusion_zh=rule["conclusion_zh"],
+            ))
+    return matches
+# ════════════════════════════════════════════════════════════════════════
+# P4.4 — Activity-aware composite scoring
+# ════════════════════════════════════════════════════════════════════════
+def apply_activity_weighting(
+    subs: HazardSubscores, activity: ActivityType,
+) -> int:
+    """Composite 0-100 score.
+    Design rationale: a naive mean dilutes the dominant hazard — e.g. an
+    extreme thunderstorm risk (90) averaged with three safe (10) values
+    would yield 30, which understates the actual danger. We therefore use
+    a **dominant-hazard + secondary-contribution** formulation:
+        composite = 0.80 · max(weighted sub-scores)
+                  + 0.20 · mean(weighted sub-scores excluding max)
+    This ensures the worst hazard for the user's activity drives the score,
+    while still allowing multiple moderate hazards to push the score up.
+    """
+    w = config.ACTIVITY_WEIGHTS[activity]
+    weighted = [
+        min(100.0, w["rainfall"]     * subs.rainfall),
+        min(100.0, w["fog"]          * subs.fog),
+        min(100.0, w["wind_gust"]    * subs.wind_gust),
+        min(100.0, w["thunderstorm"] * subs.thunderstorm),
+    ]
+    top  = max(weighted)
+    rest = sum(weighted) - top
+    others_mean = rest / 3.0
+    return _clip(top * 0.80 + others_mean * 0.20)
+# ════════════════════════════════════════════════════════════════════════
+# Veto cascade (life-safety overrides) — same as before, unchanged behaviour
+# ════════════════════════════════════════════════════════════════════════
+def _collect_veto_triggers(
+    *, elevation_m: float, terrain: str, weather: dict[str, Any],
+    ml_rain_prob: float, orographic_dot: float,
+) -> list[VetoTrigger]:
+    temp_c     = weather.get("temperature_c", 25.0)
+    wind_kmh   = weather.get("wind_speed_kmh", 0.0)
+    cape       = weather.get("cape_jkg", 0.0)
+    visibility = weather.get("visibility_m", 10000.0)
+    out: list[VetoTrigger] = []
+    if elevation_m > config.ALTITUDE_HYPOXIA_M:
+        out.append(VetoTrigger(
+            rule="altitude_hypoxia", value=elevation_m,
+            message_en=f"Altitude {elevation_m:.0f} m exceeds {config.ALTITUDE_HYPOXIA_M:.0f} m — severe hypoxia risk.",
+            message_zh=f"海拔 {elevation_m:.0f} m 超过 {config.ALTITUDE_HYPOXIA_M:.0f} m，存在严重缺氧风险。",
+        ))
+    if temp_c <= config.EXTREME_COLD_C:
+        out.append(VetoTrigger(
+            rule="extreme_cold", value=temp_c,
+            message_en=f"Temperature {temp_c:.1f}°C — frostbite risk per UIAA guidance.",
+            message_zh=f"温度 {temp_c:.1f}°C，UIAA 指南判定为冻伤风险。",
+        ))
+    if wind_kmh >= config.GALE_WIND_KMH:
+        out.append(VetoTrigger(
+            rule="gale_wind", value=wind_kmh,
+            message_en=f"Wind speed {wind_kmh:.0f} km/h ≥ Beaufort Force 6 — hazardous.",
+            message_zh=f"风速 {wind_kmh:.0f} km/h 达到蒲福风级 6 级以上，存在危险。",
+        ))
+    if cape >= config.HIGH_CAPE_JKG:
+        out.append(VetoTrigger(
+            rule="high_cape_lightning", value=cape,
+            message_en=f"CAPE {cape:.0f} J/kg — significant thunderstorm potential.",
+            message_zh=f"CAPE {cape:.0f} J/kg，存在显著雷暴风险。",
+        ))
+    if visibility < config.LOW_VISIBILITY_M:
+        out.append(VetoTrigger(
+            rule="low_visibility", value=visibility,
+            message_en=f"Visibility {visibility:.0f} m — whiteout / dense fog.",
+            message_zh=f"能见度 {visibility:.0f} m，白毛风或浓雾。",
+        ))
+    if (terrain == "Slope" and orographic_dot >= config.OROGRAPHIC_DOT_THRESHOLD
+            and ml_rain_prob >= 0.50):
+        out.append(VetoTrigger(
+            rule="orographic_lift_storm", value=orographic_dot,
+            message_en="Wind impinging on windward slope with high rain probability — enhanced orographic precipitation.",
+            message_zh="风向正对迎风坡，叠加高降雨概率，地形抬升强化降水。",
+        ))
+    if terrain == "Valley" and ml_rain_prob >= config.VALLEY_FLOOD_PROB:
+        out.append(VetoTrigger(
+            rule="valley_flash_flood", value=ml_rain_prob,
+            message_en="Valley basin with very high rain probability — flash-flood risk.",
+            message_zh="处于山谷盆地且降雨概率极高，存在山洪暴发风险。",
+        ))
+    return out
+# ════════════════════════════════════════════════════════════════════════
+# Top-level entry point — orchestrates P4.2 → P4.3 → P4.4 → P4.5 → P4.6
+# ════════════════════════════════════════════════════════════════════════
+def evaluate(
+    *,
+    lat: float,
+    lon: float,
+    elevation_m: float,
+    terrain: str,
+    weather: dict[str, Any],
+    ml_rain_prob: float,
+    slope_deg: float,
+    aspect_deg: float,
+    orographic_dot: float,
+    activity: ActivityType = "general",
+) -> RuleResult:
+    """Apply the full Hybrid scoring + Veto cascade + D5 §3.7 pipeline."""
+    result = RuleResult(activity=activity)
+    log = result.inference_log
+    log.append(InferenceStep(
+        kind="info",
+        text_en=f"Inference @ ({lat:.4f}, {lon:.4f})  elev={elevation_m:.0f} m  terrain={terrain}  activity={activity}",
+        text_zh=f"推理位置 ({lat:.4f}, {lon:.4f})  海拔 {elevation_m:.0f} m  地形 {terrain}  活动���型 {activity}",
+    ))
+    log.append(InferenceStep(
+        kind="ml",
+        text_en=f"Engine A (Random Forest) — rain probability next hour = {ml_rain_prob:.1%}",
+        text_zh=f"引擎 A（随机森林）下一小时降雨概率 = {ml_rain_prob:.1%}",
+    ))
+    # ── P4.3: Four hazard sub-scores ──
+    humidity = weather.get("humidity_pct", 60.0)
+    dew_dep  = weather.get("dew_point_depression",
+                            weather.get("temperature_c", 25.0) - weather.get("dew_point_c",
+                                weather.get("temperature_c", 25.0)))
+    pres_dp  = weather.get("pressure_change_3h", 0.0)
+    cloud    = weather.get("cloud_cover_pct", 50.0)
+    cape     = weather.get("cape_jkg", 0.0)
+    wind_kmh = weather.get("wind_speed_kmh", 0.0)
+    subs = HazardSubscores(
+        rainfall    = score_rainfall_risk(
+            ml_rain_prob=ml_rain_prob, terrain=terrain, orographic_dot=orographic_dot,
+            pressure_change_3h=pres_dp, humidity_pct=humidity),
+        fog         = score_fog_risk(
+            humidity_pct=humidity, dew_point_depression=dew_dep,
+            cloud_cover_pct=cloud, terrain=terrain, elevation_m=elevation_m),
+        wind_gust   = score_wind_gust_risk(
+            wind_speed_kmh=wind_kmh, terrain=terrain,
+            slope_deg=slope_deg, orographic_dot=orographic_dot),
+        thunderstorm= score_thunderstorm_risk(
+            cape_jkg=cape, pressure_change_3h=pres_dp, humidity_pct=humidity),
+    )
+    result.hazard_subscores = subs
+    log.append(InferenceStep(
+        kind="hazard",
+        text_en=f"Sub-scores — Rainfall={subs.rainfall}  Fog={subs.fog}  Gust={subs.wind_gust}  Thunder={subs.thunderstorm}",
+        text_zh=f"分项评分 — 降雨={subs.rainfall}  雾={subs.fog}  阵风={subs.wind_gust}  雷暴={subs.thunderstorm}",
+    ))
+    # ── D5 §3.7.2 Decision Table R1-R4 (informational, not score-changing) ──
+    wind_into_slope = (terrain == "Slope" and orographic_dot >= 0.3)
+    cloud_base_m   = weather.get("cloud_base_m")
+    if cloud_base_m is None and cloud >= 90.0 and dew_dep <= 2.0:
+        cloud_base_m = 600.0   # crude proxy when API doesn't provide cloud base
+    result.decision_table_matches = apply_decision_table_3_7_2(
+        macro_rain_prob=ml_rain_prob,
+        humidity_pct=humidity,
+        wind_into_slope=wind_into_slope,
+        terrain=terrain,
+        pressure_change_3h=pres_dp,
+        cloud_base_m=cloud_base_m,
+    )
+    for m in result.decision_table_matches:
+        log.append(InferenceStep(
+            kind="table",
+            text_en=f"D5 §3.7.2 {m.rule} fired — {m.conclusion_en}",
+            text_zh=f"D5 §3.7.2 {m.rule} 触发 —— {m.conclusion_zh}",
+        ))
+    # ── Veto cascade (life-safety overrides) ──
+    result.veto_triggers = _collect_veto_triggers(
+        elevation_m=elevation_m, terrain=terrain, weather=weather,
+        ml_rain_prob=ml_rain_prob, orographic_dot=orographic_dot,
+    )
+    if result.has_veto:
+        for v in result.veto_triggers:
+            log.append(InferenceStep(kind="veto", text_en=f"VETO: {v.message_en}",
+                                      text_zh=f"否决触发：{v.message_zh}"))
+        result.risk_score = 100
+        result.risk_level = "Danger"
+        result.advice_en, result.advice_zh = _veto_advice(result.veto_triggers)
+        log.append(InferenceStep(kind="score",
+            text_en="Final risk = 100 (Veto cascade; ML probability overridden).",
+            text_zh="最终风险 = 100（一票否决；ML 概率被覆盖）。"))
+        return result
+    # ── P4.4 + P4.5: activity-weighted composite score ──
+    composite = apply_activity_weighting(subs, activity)
+    result.risk_score = composite
+    result.risk_level = _bin_level(composite)
+    log.append(InferenceStep(
+        kind="activity",
+        text_en=f"Activity={activity}: weighted composite score = {composite}.",
+        text_zh=f"活动类型 {activity}：加权综合评分 = {composite}。",
+    ))
+    # ── P4.6: bilingual advice ──
+    result.advice_en, result.advice_zh = _normal_advice(
+        composite, terrain, ml_rain_prob, subs, activity)
+    log.append(InferenceStep(kind="score",
+        text_en=f"Final risk score = {composite} → {result.risk_level}.",
+        text_zh=f"最终风险评分 = {composite} → {result.risk_level}。"))
+    return result
+# ════════════════════════════════════════════════════════════════════════
+# P4.6 — Bilingual advice generation
+# ════════════════════════════════════════════════════════════════════════
+def _veto_advice(triggers: list[VetoTrigger]) -> tuple[str, str]:
+    en = "DANGER — do not proceed. " + " ".join(t.message_en for t in triggers)
+    zh = "危险 —— 请勿前往。" + " ".join(t.message_zh for t in triggers)
+    return en, zh
+def _normal_advice(score: int, terrain: str, ml_prob: float,
+                   subs: HazardSubscores, activity: ActivityType) -> tuple[str, str]:
+    # Pick the dominant hazard to mention specifically.
+    by_score = sorted(
+        [("Rainfall", "降雨", subs.rainfall),
+         ("Fog",      "雾",   subs.fog),
+         ("Wind gust","阵风", subs.wind_gust),
+         ("Thunderstorm","雷暴", subs.thunderstorm)],
+        key=lambda x: -x[2],
+    )
+    top_en, top_zh, top_score = by_score[0]
+    if score >= 80:
+        en = f"Danger ({top_en} dominant, {top_score}/100): cancel outdoor activity; seek shelter immediately."
+        zh = f"危险（主要风险 {top_zh} {top_score}/100）：立即取消户外活动，寻找避难所。"
+    elif score >= 55:
+        en = (f"Warning ({top_en} dominant, {top_score}/100) in {terrain.lower()} terrain "
+              f"for activity={activity}. Postpone non-essential travel.")
+        zh = f"警告（主要风险 {top_zh} {top_score}/100）：{terrain}地形下 {activity} 活动，建议推迟非必要出行。"
+    elif score >= 30:
+        en = (f"Caution ({top_en} dominant, {top_score}/100): monitor weather closely; "
+              f"carry appropriate gear (rain prob {ml_prob:.0%}).")
+        zh = f"注意（主要风险 {top_zh} {top_score}/100）：密切关注天气，携带适当装备（降雨概率 {ml_prob:.0%}）。"
+    else:
+        en = "Safe: conditions favourable for outdoor activity. Stay aware."
+        zh = "安全：当前条件适合户外活动，仍请保持警觉。"
+    return en, zh

backend/schemas.py ADDED Viewed

	@@ -0,0 +1,72 @@

+"""Pydantic request / response schemas — the contract between FE and BE."""
+from __future__ import annotations
+from typing import Literal
+from pydantic import BaseModel, Field
+TerrainType = Literal["Valley", "Slope", "Flat", "Peak", "Unknown"]
+RiskLevel   = Literal["Safe", "Caution", "Warning", "Danger"]
+ActivityType = Literal["hiker", "driver", "construction", "general"]
+# Request contract: a WGS84 coordinate plus the activity context.
+# NOTE(review): the /api/predict handler takes the same three values as query
+# parameters with identical bounds; confirm whether this model is still used.
+class PredictionRequest(BaseModel):
+    latitude:  float = Field(..., ge=-90.0,  le=90.0,  description="WGS84 latitude")
+    longitude: float = Field(..., ge=-180.0, le=180.0, description="WGS84 longitude")
+    activity:  ActivityType = "general"   # defaults to the generic profile
+# One life-safety override that fired during rule evaluation.
+class VetoTrigger(BaseModel):
+    rule:    str            # machine-readable rule id, e.g. "gale_wind"
+    value:   float | None   # the reading that tripped the rule
+    message_en: str         # human-readable explanation (English)
+    message_zh: str         # human-readable explanation (Chinese)
+class InferenceStep(BaseModel):
+    """One line of the XAI (explainable AI) inference log."""
+    # Category of the log line; restricted to the literals below.
+    kind: Literal["info", "ml", "rule", "veto", "score", "hazard", "table", "activity"]
+    text_en: str   # log text (English)
+    text_zh: str   # log text (Chinese)
+class HazardSubscores(BaseModel):
+    """Per-category risk score 0-100. Matches the four hazard types
+    enumerated in the D5 proposal §3.7 (P4.3)."""
+    # All four fields are required integers validated to lie in [0, 100].
+    rainfall:     int = Field(..., ge=0, le=100)
+    fog:          int = Field(..., ge=0, le=100)
+    wind_gust:    int = Field(..., ge=0, le=100)
+    thunderstorm: int = Field(..., ge=0, le=100)
+class DecisionTableMatch(BaseModel):
+    """A row of D5 §3.7.2 / Table 4.2 that has fired for this request."""
+    rule:           str           # 'R1' | 'R2' | 'R3' | 'R4'
+    description:    str           # the row's condition summary
+    conclusion_en:  str           # the row's conclusion (English)
+    conclusion_zh:  str           # the row's conclusion (Chinese)
+# Full response body of the prediction endpoint.
+class PredictionResponse(BaseModel):
+    # ── Location and terrain ──
+    latitude:  float
+    longitude: float
+    elevation_m: float
+    terrain: TerrainType
+    # ── Engine outputs ──
+    ml_rain_probability: float = Field(..., ge=0.0, le=1.0)
+    hazard_subscores: HazardSubscores
+    decision_table_matches: list[DecisionTableMatch]
+    activity: ActivityType
+    # ── Final verdict ──
+    risk_score: int = Field(..., ge=0, le=100)
+    risk_level: RiskLevel
+    veto_triggers: list[VetoTrigger]
+    inference_log: list[InferenceStep]
+    advice_en: str
+    advice_zh: str
+    # ── Cache metadata ──
+    cached:    bool = False   # True when the body was served from the cache
+    cache_ttl: int  = 0       # cache lifetime, or remaining lifetime on a cache hit

backend/terrain.py ADDED Viewed

	@@ -0,0 +1,151 @@

+"""
+DEM-based terrain classification.
+Given a 3×3 elevation matrix centred on the query point, we classify the
+terrain as Valley / Slope / Flat / Peak and compute the slope vector
+needed for orographic-uplift detection.
+The classification heuristic follows the **Topographic Position Index
+(TPI)** approach from Weiss (2001) and is the same technique used in the
+microclimate-modelling literature (e.g. Maclean et al., 2018, "Microclima").
+"""
+from __future__ import annotations
+import math
+from dataclasses import dataclass
+import httpx
+from . import config
+@dataclass
+class TerrainInfo:
+    """Terrain classification result for one query point."""
+    elevation_m: float
+    terrain:    str          # "Valley" | "Slope" | "Flat" | "Peak" | "Unknown"
+    slope_deg:  float        # 0-90
+    aspect_deg: float        # 0-360, direction the slope faces (downhill)
+    tpi:        float        # signed, positive = ridge, negative = valley
+# ────────────────────────────────────────────────────────────────────────
+# DEM fetching
+# ────────────────────────────────────────────────────────────────────────
+def _build_3x3_grid(lat: float, lon: float, step_deg: float = 0.01) -> list[tuple[float, float]]:
+    """Eight neighbours + centre, ordered row-major (NW, N, NE, W, C, E, SW, S, SE).
+    Handles the antimeridian (lon ∈ [-180, 180]) and clips latitudes that
+    would walk off the poles. Without this, querying e.g. (89.999, 179.999)
+    would produce DEM coordinates that the upstream API rejects.
+    """
+    points = []
+    for dlat in (+step_deg, 0.0, -step_deg):       # north → south
+        for dlon in (-step_deg, 0.0, +step_deg):   # west  → east
+            new_lat = max(-90.0, min(90.0, lat + dlat))
+            new_lon = lon + dlon
+            # Wrap longitudes back into the [-180, 180] range (exactly ±180 is left as-is).
+            if new_lon > 180.0:
+                new_lon -= 360.0
+            elif new_lon < -180.0:
+                new_lon += 360.0
+            points.append((new_lat, new_lon))
+    return points
+async def fetch_dem_3x3(lat: float, lon: float, client: httpx.AsyncClient,
+                       step_deg: float = 0.01) -> list[float]:
+    """Returns 9 elevation values for the 3×3 grid around (lat, lon)."""
+    pts = _build_3x3_grid(lat, lon, step_deg)
+    locations = "|".join(f"{p[0]},{p[1]}" for p in pts)
+    resp = await client.get(
+        config.OPEN_TOPO_URL,
+        params={"locations": locations},
+        timeout=15.0,
+    )
+    resp.raise_for_status()
+    data = resp.json()
+    elevations = []
+    for r in data.get("results", []):
+        e = r.get("elevation")
+        # Open-Topo returns None for ocean points and other no-data tiles.
+        elevations.append(float(e) if e is not None else 0.0)
+    if len(elevations) != 9:
+        raise ValueError(
+            f"DEM API returned {len(elevations)} cells, expected 9. "
+            "Coordinates may be over ocean or outside coverage."
+        )
+    return elevations
+# ────────────────────────────────────────────────────────────────────────
+# Classification
+# ────────────────────────────────────────────────────────────────────────
+def classify_terrain(dem9: list[float], cell_size_m: float = 1100.0) -> TerrainInfo:
+    """
+    Indices for the 3x3 matrix:
+        0 1 2          (NW, N,  NE)
+        3 4 5          (W,  C,  E )
+        6 7 8          (SW, S,  SE)
+    """
+    if len(dem9) != 9:
+        raise ValueError(f"DEM matrix must be 3x3, got {len(dem9)} cells")
+    nw, n, ne, w, c, e, sw, s, se = dem9
+    # Horn's algorithm — surface derivatives.
+    dzdx = ((ne + 2 * e + se) - (nw + 2 * w + sw)) / (8 * cell_size_m)
+    dzdy = ((sw + 2 * s + se) - (nw + 2 * n + ne)) / (8 * cell_size_m)
+    slope_rad = math.atan(math.hypot(dzdx, dzdy))
+    slope_deg = math.degrees(slope_rad)
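+    # Aspect: intended as the compass bearing pointing DOWNHILL (0=N, 90=E, 180=S, 270=W).
+    # NOTE(review): atan2(dzdy, -dzdx) yields a math-convention angle (0=E, counter-clockwise);
+    # the compass bearing would be (90° - angle) mod 360, and no such conversion is applied
+    # here — confirm what downstream consumers of aspect_deg expect.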
+    aspect_rad = math.atan2(dzdy, -dzdx)  # math convention
+    aspect_deg = (math.degrees(aspect_rad) + 360.0) % 360.0
+    # Topographic Position Index (TPI): centre cell minus mean of neighbours.
+    neighbours = [nw, n, ne, w, e, sw, s, se]
+    tpi = c - sum(neighbours) / 8.0
+    if abs(tpi) < 5 and slope_deg < 5:
+        terrain = "Flat"
+    elif tpi < -10:
+        terrain = "Valley"
+    elif tpi > 20:
+        terrain = "Peak"
+    else:
+        terrain = "Slope"
+    return TerrainInfo(
+        elevation_m=c,
+        terrain=terrain,
+        slope_deg=slope_deg,
+        aspect_deg=aspect_deg,
+        tpi=tpi,
+    )
+def orographic_lift_dot(wind_dir_deg: float, slope_aspect_deg: float,
+                        slope_deg: float) -> float:
+    """
+    Returns a unitless 'orographic uplift' index in [-1, +1].
+    Aspect points DOWNHILL — the slope NORMAL (uphill direction) is the
+    opposite bearing. If wind blows opposite to aspect (i.e. into the slope),
+    the dot product approaches +1, scaled by slope steepness.
+    A high positive value means wind is being forced upward → enhanced rain
+    on the windward face.
+    """
+    wind_rad   = math.radians(wind_dir_deg)
+    uphill_rad = math.radians((slope_aspect_deg + 180.0) % 360.0)
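+    # Wind direction in meteorology = direction FROM which wind blows, so
+    # the wind-vector pointing direction is (wind_dir + 180°). For the dot
+    # product we just need the cosine of the angle between (wind FROM) and
+    # (uphill direction).
+    # NOTE(review): with this formula, wind arriving FROM the downhill side
+    # (wind_dir == slope_aspect, i.e. blowing up the slope) gives cos = -1,
+    # which looks opposite to the docstring's "+1 when wind blows into the
+    # slope" — confirm the intended sign against the callers.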
+    cos_angle = math.cos(wind_rad - uphill_rad)
+    # Scale by slope steepness — a 1° slope barely matters.
+    return cos_angle * math.sin(math.radians(min(slope_deg, 60.0)))

docker-compose.yml ADDED Viewed

	@@ -0,0 +1,26 @@

+services:
+  api:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    image: microclimate-x:latest
+    container_name: microclimate-x
+    restart: unless-stopped
+    ports:
+      - "8000:8000"
+    environment:
+      # Override Dockerfile default (/tmp, HF-Spaces-friendly) with the named
+      # volume so cache.sqlite3 survives container restarts on self-hosting.
+      - MICROCLIMATEX_DB=/data/cache.sqlite3
+      - MICROCLIMATEX_GIT_REV=${MICROCLIMATEX_GIT_REV:-docker}
+    volumes:
+      - mcx-data:/data
+    healthcheck:
+      test: ["CMD", "python", "-c", "import urllib.request,sys; sys.exit(0) if urllib.request.urlopen('http://localhost:8000/api/health',timeout=2).status==200 else sys.exit(1)"]
+      interval: 30s
+      timeout: 5s
+      retries: 3
+      start_period: 10s
+volumes:
+  mcx-data:

docs/DEPLOY_HF.md ADDED Viewed

	@@ -0,0 +1,143 @@

+# Deploying MicroClimate-X to Hugging Face Spaces
+> 一次部署，永久公网 URL，导师随时可看，不用挂笔记本。
+> One-time deploy → permanent public URL your supervisor can open any time, no laptop required.
+---
+## Why Hugging Face Spaces?
+* **Free** persistent hosting for ML demos (CPU tier is enough for this project).
+* **Docker SDK** — reuses the existing `Dockerfile` 1:1, no platform-specific build hacks.
+* **Server-side Git LFS** — the 217 MB `rf_model.pkl` uploads through `huggingface-cli`
+  without needing local `git-lfs` installed.
+* The HF Space URL (`https://huggingface.co/spaces/<user>/microclimate-x`) is *the*
+  canonical demo URL for ML thesis projects in 2026.
+---
+## Architecture on HF Spaces
+```
+┌──────────────────────────────────────────────────────────────┐
+│  https://huggingface.co/spaces/<user>/microclimate-x         │
+│                                                              │
+│  Docker image (this repo's Dockerfile)                       │
+│   ├─ FastAPI @ :8000   (declared via README.md `app_port`)   │
+│   ├─ /app/frontend/  ── mounted at /app/                     │
+│   ├─ /app/models/    ── rf_model.pkl baked in                │
+│   └─ /tmp/cache.sqlite3 (ephemeral — fine for demo)          │
+│                                                              │
+│  ↓ outbound HTTP                                             │
+│  ├─ api.open-meteo.com           (weather, ERA5)             │
+│  └─ api.opentopodata.org/srtm30m (DEM)                       │
+└──────────────────────────────────────────────────────────────┘
+```
+The frontend talks to its own origin via relative `/api/…` URLs, so no CORS
+fiddling and no front-end edits are needed.
+---
+## 3-step deploy
+### Step 1 — Create the Space (web UI, one minute)
+1. Go to <https://huggingface.co/new-space>
+2. Fill in:
+   * **Owner**: your HF account
+   * **Space name**: `microclimate-x`
+   * **License**: MIT
+   * **Space SDK**: **Docker** → "Blank" template
+   * **Hardware**: CPU basic (free)
+   * **Visibility**: Public
+3. Click **Create Space**. You'll land on an empty repo page.
+### Step 2 — Authenticate the CLI (one minute)
+```bash
+# Install once
+pip install -U "huggingface_hub[cli]"
+# Get a token at https://huggingface.co/settings/tokens
+#   - Type: Write
+#   - Scope: read + write to the new Space
+huggingface-cli login
+# (paste the token when prompted)
+```
+### Step 3 — Push (one command)
+From the repo root:
+```bash
+./scripts/deploy_hf.sh <hf-username>/microclimate-x
+# e.g.
+./scripts/deploy_hf.sh KyoukoLi/microclimate-x
+```
+The script uploads:
+* `backend/`, `frontend/`, `scripts/`, `models/`, `docs/`
+* `Dockerfile`, `requirements.txt`, `README.md`, `LICENSE`, `pyproject.toml`
+and skips local-only junk (`data/`, `figures/`, `tests/`, `.venv/`, SQLite caches, …).
+HF then runs the same `Dockerfile` you use locally. Build takes ≈ 3–5 min the first time
+(the 217 MB model upload dominates) and < 1 min for subsequent deploys.
+When the Space's status badge turns green ("Running"), the URL
+`https://huggingface.co/spaces/<user>/microclimate-x` is live. Send that to your supervisor.
+---
+## Updating the demo after code changes
+```bash
+git commit -am "fix: …"
+./scripts/deploy_hf.sh KyoukoLi/microclimate-x
+```
+The script diffs against the remote, so only changed files are re-uploaded.
+A code-only change (no model retrain) is a < 10 s push.
+---
+## Troubleshooting
+| Symptom | Likely cause | Fix |
+|---|---|---|
+| Build log: `unable to open database file` | `MICROCLIMATEX_DB` points to a read-only path on HF | Dockerfile already sets it to `/tmp/cache.sqlite3`. Make sure your Space doesn't override it under **Settings → Variables and secrets**. |
+| Build log: `port 7860 expected, got 8000` | HF didn't parse the `app_port` frontmatter | Confirm `README.md` starts with the YAML block including `app_port: 8000`. |
+| App loads but every request → 502 | Outbound calls to Open-Meteo / Open Topo Data hit HF's egress timeout | Increase `httpx.AsyncClient(timeout=…)` in `backend/main.py` (currently 15 s). |
+| ML predictor banner says "heuristic" | `models/rf_model.pkl` wasn't uploaded | Re-run `./scripts/deploy_hf.sh`; the script prompts before continuing without the model. |
+| LFS quota exceeded | Free HF accounts get 5 GB LFS — we use ~220 MB | Delete old commits' LFS objects under **Files & versions → Settings**. |
+---
+## Optional: GitHub Actions auto-sync
+If you'd rather have `git push origin main` auto-deploy to HF, add this workflow:
+```yaml
+# .github/workflows/sync-to-hf.yml
+name: Sync to Hugging Face Space
+on:
+  push:
+    branches: [main]
+jobs:
+  sync:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+        with: { fetch-depth: 0 }
+      - uses: actions/setup-python@v5
+        with: { python-version: "3.12" }
+      - run: pip install -U "huggingface_hub[cli]"
+      - run: |
+          echo "${{ secrets.HF_TOKEN }}" | huggingface-cli login --token "$(cat -)"
+          ./scripts/deploy_hf.sh KyoukoLi/microclimate-x
+```
+Add `HF_TOKEN` to the GitHub repo's secrets. Now every push to `main`
+re-deploys the Space.

docs/MEETING_CHEAT_SHEET.html ADDED Viewed

	@@ -0,0 +1,644 @@

+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<title>Supervisor Meeting Cheat Sheet — MicroClimate-X</title>
+<style>
+  /* ============================================================
+     Print-optimised A4 cheat sheet — open in browser, ⌘+P → PDF
+     ============================================================ */
+  :root {
+    --ink:           #0b0d12;
+    --ink-soft:      #353a44;
+    --muted:         #6b7280;
+    --brand:         #2563eb;
+    --brand-soft:    #dbeafe;
+    --accent:        #b91c1c;
+    --accent-soft:   #fee2e2;
+    --ok:            #166534;
+    --ok-soft:       #dcfce7;
+    --warn:          #b45309;
+    --warn-soft:     #fef3c7;
+    --grid:          #e5e7eb;
+    --bg:            #ffffff;
+    --code-bg:       #f3f4f6;
+  }
+  * { box-sizing: border-box; }
+  html, body { margin: 0; padding: 0; background: var(--bg); color: var(--ink); }
+  body {
+    font-family: -apple-system, BlinkMacSystemFont, "SF Pro Text",
+                 "PingFang SC", "Hiragino Sans GB", "Microsoft YaHei",
+                 system-ui, sans-serif;
+    font-size: 11pt;
+    line-height: 1.45;
+  }
+  /* A4 page sizing */
+  @page { size: A4; margin: 12mm 14mm; }
+  main { max-width: 200mm; margin: 0 auto; padding: 14mm 14mm; }
+  /* Headings */
+  h1 {
+    font-size: 22pt; margin: 0 0 4mm 0;
+    border-bottom: 3px solid var(--brand); padding-bottom: 3mm;
+    page-break-after: avoid;
+  }
+  h1 .zh { display: block; font-size: 13pt; color: var(--muted); font-weight: 500; margin-top: 1mm; }
+  h2 {
+    font-size: 14pt; margin: 9mm 0 3mm 0;
+    color: var(--brand);
+    border-left: 4px solid var(--brand); padding: 1mm 0 1mm 3mm;
+    page-break-after: avoid;
+  }
+  h2 .zh { display: block; font-size: 10pt; color: var(--muted); margin-top: 0.5mm; font-weight: 500; }
+  h3 {
+    font-size: 11.5pt; margin: 5mm 0 2mm 0; color: var(--ink-soft);
+    page-break-after: avoid;
+  }
+  h4 { font-size: 10.5pt; margin: 3mm 0 1mm 0; color: var(--accent); }
+  /* Paragraphs / lists */
+  p, li { margin: 1mm 0; }
+  ul, ol { padding-left: 5mm; }
+  ul li { margin-bottom: 1mm; }
+  /* Quote / supervisor verbatim */
+  .quote {
+    background: var(--warn-soft);
+    border-left: 3px solid var(--warn);
+    padding: 2mm 3mm; margin: 2mm 0;
+    font-style: italic; font-size: 10pt;
+  }
+  .quote::before { content: "🎙️ "; font-style: normal; }
+  /* Bilingual two-column table */
+  table.bilingual, table.steps, table.tabs, table {
+    border-collapse: collapse; width: 100%; margin: 2mm 0 3mm 0;
+    font-size: 10pt;
+  }
+  table.bilingual td, table.steps td, table.tabs td, table th, table td {
+    padding: 1.5mm 2.5mm; vertical-align: top;
+    border: 1px solid var(--grid);
+  }
+  table th {
+    background: #f9fafb; font-weight: 600; text-align: left;
+    color: var(--ink-soft);
+  }
+  table.bilingual td.en { width: 50%; }
+  table.bilingual td.zh { width: 50%; background: #fafbfc; }
+  /* Inline callouts */
+  .callout {
+    margin: 2mm 0; padding: 2mm 3mm;
+    border-left: 3px solid; border-radius: 1mm;
+    font-size: 10pt;
+  }
+  .callout.warn { background: var(--accent-soft); border-color: var(--accent); }
+  .callout.ok   { background: var(--ok-soft); border-color: var(--ok); }
+  .callout.tip  { background: var(--brand-soft); border-color: var(--brand); }
+  .callout-title { font-weight: 700; margin-bottom: 1mm; }
+  /* Code */
+  code, pre, kbd {
+    font-family: "SF Mono", "JetBrains Mono", Menlo, Consolas, monospace;
+    font-size: 9.5pt;
+  }
+  code { background: var(--code-bg); padding: 0.3mm 1mm; border-radius: 1mm; }
+  pre {
+    background: var(--code-bg); padding: 3mm; border-radius: 2mm;
+    overflow-x: auto; margin: 2mm 0;
+    border: 1px solid var(--grid);
+  }
+  pre code { background: transparent; padding: 0; }
+  /* Step grids */
+  .step {
+    display: flex; gap: 3mm;
+    margin: 2mm 0;
+    align-items: flex-start;
+  }
+  .step .num {
+    flex: 0 0 8mm; width: 8mm; height: 8mm; border-radius: 50%;
+    background: var(--brand); color: white; font-weight: 700;
+    display: flex; align-items: center; justify-content: center;
+    font-size: 11pt;
+  }
+  .step .body { flex: 1; }
+  /* Demo blocks */
+  .demo {
+    background: #f0f9ff;
+    border: 1px solid #bae6fd;
+    border-radius: 2mm;
+    padding: 3mm;
+    margin: 3mm 0;
+  }
+  .demo .demo-title { font-weight: 700; color: #075985; margin-bottom: 1mm; }
+  /* Checklist */
+  .check { font-family: "SF Mono", Menlo, monospace; font-size: 9.5pt; line-height: 1.7; }
+  .check .box { display: inline-block; width: 4mm; }
+  /* Page break helpers */
+  .pb { page-break-before: always; }
+  .nobreak { page-break-inside: avoid; }
+  /* Footer */
+  footer {
+    margin-top: 12mm; padding-top: 4mm;
+    border-top: 1px solid var(--grid);
+    color: var(--muted); font-size: 9pt; text-align: center;
+  }
+  /* Print refinements */
+  @media print {
+    body { font-size: 10pt; }
+    h2 { font-size: 13pt; }
+    .no-print { display: none; }
+    a { color: var(--ink); text-decoration: none; }
+  }
+  /* Toolbar (screen only) */
+  .toolbar {
+    position: sticky; top: 0; z-index: 100;
+    background: var(--brand); color: white;
+    padding: 2mm 4mm; display: flex; justify-content: space-between;
+    align-items: center; font-size: 10pt;
+  }
+  .toolbar button {
+    background: white; color: var(--brand); border: 0;
+    padding: 1.5mm 4mm; border-radius: 1mm; font-weight: 600;
+    cursor: pointer; font-size: 10pt;
+  }
+  .toolbar button:hover { background: #f3f4f6; }
+  /* Section spacing on cover */
+  .cover-meta {
+    display: flex; gap: 4mm; flex-wrap: wrap;
+    margin: 3mm 0;
+    color: var(--muted); font-size: 9.5pt;
+  }
+  .cover-meta span {
+    background: var(--code-bg); padding: 0.5mm 2mm; border-radius: 1mm;
+  }
+</style>
+</head>
+<body>
+<div class="toolbar no-print">
+  <strong>Supervisor Meeting Cheat Sheet · MicroClimate-X</strong>
+  <button onclick="window.print()">🖨 Print / Save as PDF</button>
+</div>
+<main>
+<h1>Supervisor Meeting Cheat Sheet
+  <span class="zh">导师开会一页通 — MicroClimate-X 答辩准备</span>
+</h1>
+<div class="cover-meta">
+  <span>📅 2026-05-11</span>
+  <span>🎓 UKM FYP</span>
+  <span>🏛️ KyoukoLi/microclimate-x</span>
+  <span>✅ CI passing · 97% coverage · 70 tests</span>
+</div>
+<div class="callout tip">
+  <div class="callout-title">How to use this cheat sheet · 怎么用这份小抄</div>
+  Keep this open on screen during the meeting. Don't read it aloud — glance at the relevant section when needed. Every key sentence is provided in both English and Chinese so you can default to whichever the supervisor speaks at that moment.
+  <br><br>
+  开会时打开在屏幕上做兜底。<strong>不要照念</strong>——需要时扫一眼对应小节。所有关键句子都给了中英对照，老师用什么语言你就用什么语言。
+</div>
+<!-- ===== Section 0: pre-meeting prep ===== -->
+<h2>0 · Before the meeting (10 min before)
+  <span class="zh">会前 10 分钟准备</span>
+</h2>
+<p>Run these in a terminal, in order. <strong>Do not skip any.</strong><br>
+在终端按顺序执行，<strong>一条都不能少</strong>：</p>
+<pre><code>cd ~/Projects/microclimate-x
+# 1. Pull latest + verify clean working tree
+git pull &amp;&amp; git status        # should print "working tree clean"
+# 2. Start the backend (leave running)
+make run                      # uvicorn boots on http://localhost:8000
+# 3. In a NEW terminal: verify API is alive + model is loaded
+curl -s http://localhost:8000/api/health | python3 -m json.tool
+# expect: "status": "ok", "ml_loaded": true</code></pre>
+<h3>Browser tabs — open in this exact order / 浏览器按顺序开标签页</h3>
+<table class="tabs">
+  <tr><th>#</th><th>URL</th><th>Purpose</th></tr>
+  <tr><td>1</td><td><code>file:///…/docs/MEETING_CHEAT_SHEET.html</code></td><td>This cheat sheet (safety net)</td></tr>
+  <tr><td>2</td><td><code>github.com/KyoukoLi/microclimate-x</code></td><td>Green CI badge</td></tr>
+  <tr><td>3</td><td><code>docs/dataset.md</code></td><td>For Concern #1 + #2</td></tr>
+  <tr><td>4</td><td><code>figures/01_roc_curve.png</code></td><td>Concern #4 — ML metrics</td></tr>
+  <tr><td>5</td><td><code>figures/03_calibration_curve.png</code></td><td>Calibration</td></tr>
+  <tr><td>6</td><td><code>figures/04_threshold_sweep.png</code></td><td>F2 threshold</td></tr>
+  <tr><td>7</td><td><code>figures/05_feature_importance.png</code></td><td>What model learned</td></tr>
+  <tr><td>8</td><td><code>docs/architecture.md</code></td><td>Rule engine deep-dive</td></tr>
+  <tr><td>9</td><td><code>http://localhost:8000/app/</code></td><td><strong>THE APP — OPEN LAST</strong></td></tr>
+  <tr><td>10</td><td><code>models/MODEL_CARD.md</code></td><td>Q&amp;A backup</td></tr>
+</table>
+<div class="callout warn">
+  <strong>🚨 Tab 9 must be opened LAST.</strong> If you accidentally show the app first, the supervisor will instantly remember last meeting's complaint ("app is last") and you lose credibility before you've said a word.<br>
+  <strong>🚨 标签 9（app）一定要最后打开。</strong>不小心先打开 app，老师会立刻想起上次 "app is last" 的批评——还没开口就掉分。
+</div>
+<!-- ===== Section 1: Opening ===== -->
+<h2>1 · Opening (30 seconds)
+  <span class="zh">开场 30 秒</span>
+</h2>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, since our last meeting I have addressed every point of your feedback. May I walk you through them in the correct order — <strong>dataset first, then model, then app</strong> — as you instructed?"</td>
+    <td class="zh">"老师，按您上次反馈，我已经把每一条都改了。我按您要求的顺序——<strong>先 dataset，再 model，最后才是 app</strong>——给您过一遍可以吗？"</td>
+  </tr>
+</table>
+<div class="callout ok">
+  <strong>Why this works · 为什么有效</strong>: it directly quotes his words back to him. Watch him relax immediately.<br>
+  直接复述了他自己的话——看着他立刻放松。
+</div>
+<!-- ===== Section 2: Concern #1 ===== -->
+<h2 class="pb">2 · Concern #1 — "Y is missing"
+  <span class="zh">反馈一 · Y 列缺失</span>
+</h2>
+<div class="quote">"Y is missing. I don't have the output variable. If you don't have target, you cannot train a machine learning model."</div>
+<h3>On screen → Tab 3 (<code>docs/dataset.md</code>) → §5 Target label derivation</h3>
+<pre><code class="python">df['is_rain_event'] = (df['precipitation'].shift(-1) &gt; 0.1).astype(int)</code></pre>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, you were right — the raw Open-Meteo CSV has no Y column. I have engineered the target explicitly. The variable is <code>is_rain_event</code>: <strong>1 if precipitation in the next hour exceeds 0.1 mm, else 0</strong>."</td>
+    <td class="zh">"老师您说得对，原始 CSV 没有 Y 列。我现在显式构造了目标变量 <code>is_rain_event</code>——<strong>下一小时降雨量 &gt; 0.1 mm 则为 1，否则为 0</strong>。"</td>
+  </tr>
+  <tr>
+    <td class="en">"Three things: <strong>(1)</strong> <code>.shift(-1)</code> uses <strong>future</strong> rain as label — features at hour t predict outcome at t+1h, so no temporal data leakage."</td>
+    <td class="zh">"三个要点：<strong>(1)</strong> <code>.shift(-1)</code> 表示用<strong>下一小时</strong>的降雨作标签，特征是 t 时刻、预测 t+1 小时——<strong>无时间泄漏</strong>。"</td>
+  </tr>
+  <tr>
+    <td class="en"><strong>(2)</strong> "0.1 mm matches the <strong>WMO definition of trace precipitation</strong> — not an arbitrary choice."</td>
+    <td class="zh"><strong>(2)</strong> "0.1 mm 这个阈值不是我随便定的，对应 <strong>WMO 微量降水标准</strong>。"</td>
+  </tr>
+  <tr>
+    <td class="en"><strong>(3)</strong> "It is <strong>binary classification</strong>, not regression, because the downstream user decision is binary — go or no-go."</td>
+    <td class="zh"><strong>(3)</strong> "是<strong>二分类</strong>不是回归，因为下游用户决策本身就是二元的——去 / 不去。"</td>
+  </tr>
+</table>
+<!-- ===== Section 3: Concern #2 ===== -->
+<h2>3 · Concern #2 — "Features don't match Excel"
+  <span class="zh">反馈二 · 文档特征和 CSV 列名对不上</span>
+</h2>
+<div class="quote">"The features that you presented here, not... not mentioned in the Excel. So, it must be matched."</div>
+<h3>On screen → stay on Tab 3 → scroll <em>up</em> to §4 Schema</h3>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, that was also fair. I have rewritten the dataset specification so the documentation lists <strong>exactly the same column names</strong> as the CSV. One-to-one mapping in §4."</td>
+    <td class="zh">"老师，这条您也说得对。我已经重写了数据集文档——文档列出的就是 CSV 里的<strong>真实列名</strong>，一一对应，就在第 4 节。"</td>
+  </tr>
+  <tr>
+    <td class="en">"Every row is one CSV column. The 'role' column says whether it is a feature (<strong>X</strong>), the target (<strong>Y</strong>), or metadata."</td>
+    <td class="zh">"表里每一行就是 CSV 一列，role 列写明它是 feature（<strong>X</strong>）、target（<strong>Y</strong>）还是 metadata。"</td>
+  </tr>
+</table>
+<!-- ===== Section 4: Concern #3 ===== -->
+<h2>4 · Concern #3 — "Study the data source"
+  <span class="zh">反馈三 · 研究数据源本身</span>
+</h2>
+<div class="quote">"Please study the link. What is the purpose of the dataset? What is design for? What is the output variable?"</div>
+<h3>On screen → stay on Tab 3 → scroll up to §1-3</h3>
+<table class="bilingual">
+  <tr>
+    <td class="en">"I read Open-Meteo's documentation carefully. The dataset is the <strong>ERA5 reanalysis archive</strong> — ECMWF's gold-standard hourly reanalysis."</td>
+    <td class="zh">"我把 Open-Meteo 文档仔细读了。我用的是 <strong>ERA5 再分析数据</strong>，ECMWF 出的金标准同化产品。"</td>
+  </tr>
+  <tr>
+    <td class="en">"It is <strong>not a forecast</strong> — it is a physically-consistent reconstruction of past weather. ECMWF themselves use ERA5 to <strong>validate other forecast models</strong>. That makes it the right dataset for ML training: <strong>reliable ground-truth labels</strong>."</td>
+    <td class="zh">"它<strong>不是</strong>预报，是对过去天气的物理一致重建。ECMWF 自己拿 ERA5 去<strong>校验别的预报模型</strong>——所以训练 ML 是合适的，<strong>标签是可靠的 ground truth</strong>。"</td>
+  </tr>
+  <tr>
+    <td class="en"><strong>Spatial</strong>: 5 Malaysian mountain sites — Genting, Cameron, Fraser's Hill, Klang Valley, Kinabalu — elevations 100 m to 1865 m, terrain from valley to slope.</td>
+    <td class="zh"><strong>空间</strong>：5 个马来西亚山地点位——云顶、金马仑、福隆港、巴生谷、神山——海拔 100 m – 1865 m，地形从山谷到山坡。</td>
+  </tr>
+  <tr>
+    <td class="en"><strong>Temporal</strong>: 5 years, hourly, 175 315 rows total.</td>
+    <td class="zh"><strong>时间</strong>：5 年，每小时一行，总共 175 315 行。</td>
+  </tr>
+</table>
+<!-- ===== Section 5: Concern #4 ===== -->
+<h2 class="pb">5 · Concern #4 — "App is the last"
+  <span class="zh">反馈四 · App 最后做（最重要！）</span>
+</h2>
+<div class="quote">"First identify a dataset. And then train the model. And then predict it. Once everything is finished, you can develop the app. <strong>App is the last.</strong>"</div>
+<div class="callout warn">
+  <strong>🚨 This is the most important section.</strong> Pace yourself — 2-3 min total. <strong>Don't open the app until the end.</strong><br>
+  <strong>🚨 这是最重要的一节。</strong>控制节奏，总共 2-3 分钟。<strong>不要提前打开 app。</strong>
+</div>
+<div class="step">
+  <div class="num">2a</div>
+  <div class="body">
+    <strong>→ Tab 4 (<code>figures/01_roc_curve.png</code>)</strong>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"Step 2, model training. Test ROC AUC is <strong>0.871</strong> on 35 063 held-out hourly samples. Hold-out is the <strong>last 20 % chronologically</strong>, not random — random splits leak temporal autocorrelation and inflate accuracy by 5-15 pp."</td>
+        <td class="zh">"第二步，模型训练。测试集 35 063 行，<strong>ROC AUC = 0.871</strong>。划分用<strong>按时间排序的最后 20%</strong>，不是随机——随机划分会泄漏时间自相关，把准确率虚高 5-15 个百分点。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<div class="step">
+  <div class="num">2b</div>
+  <div class="body">
+    <strong>→ Tab 5 (<code>figures/03_calibration_curve.png</code>)</strong>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"Brier score <strong>0.138</strong> — predicted probabilities are well-calibrated. When the model says 70 %, the actual rate is close to 70 %. No need for Platt scaling or isotonic post-hoc."</td>
+        <td class="zh">"Brier 分数 = <strong>0.138</strong>，预测概率<strong>校准良好</strong>——模型说 70% 时实际频率接近 70%。<strong>不需要</strong> Platt scaling 或 isotonic 校准。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<div class="step">
+  <div class="num">2c</div>
+  <div class="body">
+    <strong>→ Tab 6 (<code>figures/04_threshold_sweep.png</code>)</strong>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"I optimised for <strong>F2 score</strong>, not F1 — this is safety-critical, a missed rain event on a windward slope can cause flash flooding. False negatives are far worse than false positives. F2 treats recall as twice as important as precision (β = 2, i.e. a β² = 4 weight in the formula). Optimal τ = <strong>0.20</strong>, F2 = 0.778, <strong>recall 93.4 %</strong>."</td>
+        <td class="zh">"我用 <strong>F2 分数</strong>而不是 F1——安全关键场景，<strong>漏报</strong>比误报严重得多。F2 把召回的重要性设为精度的 2 倍（β = 2，公式中对应 β² = 4 的权重）。最优阈值 τ = <strong>0.20</strong>，F2 = 0.778，<strong>召回率 93.4%</strong>。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<div class="step">
+  <div class="num">2d</div>
+  <div class="body">
+    <strong>→ Tab 7 (<code>figures/05_feature_importance.png</code>)</strong>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"Top 3 features: previous-hour rain, time-of-day cyclic encoding, 3-hour pressure tendency. These match the meteorology literature — autocorrelation, diurnal cycle, storm precursor. <strong>The model learned physically meaningful signal</strong>."</td>
+        <td class="zh">"最重要的 3 个特征：上一小时降水、时间周期编码、3 小时气压变化——<strong>跟气象文献吻合</strong>：自相关、日变化、风暴前兆。<strong>模型学到的是物理上有意义的信号</strong>。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<div class="step">
+  <div class="num">3</div>
+  <div class="body">
+    <strong>→ Tab 9 (<code>http://localhost:8000/app/</code>) — FINALLY the app</strong>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"<strong>Now</strong>, Step 3, the app. FastAPI + Vue using the trained model from Step 2 — not a separate model, not a placeholder. Click any coordinate, the system returns the probability and four hazard sub-scores per proposal §3.7."</td>
+        <td class="zh">"<strong>现在</strong>第三步，app。FastAPI + Vue 调用刚才<strong>第二步训好的模型</strong>——不是另一个模型、不是占位符。点地图任意一点，系统返回概率和四个分项灾害评分（按开题 §3.7）。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<div class="demo">
+  <div class="demo-title">🇲🇾 Demo A — Genting Highlands (in-distribution)</div>
+  <ol>
+    <li>Click <strong>🇲🇾 Genting Highlands · slope</strong> in the scenario dropdown (top right)</li>
+    <li>Wait ~1 second for the loading spinner</li>
+    <li>Point to the <strong>risk gauge</strong> (the main number)</li>
+    <li>Point to the <strong>4 mini-gauges</strong> below (rainfall / fog / wind / thunderstorm)</li>
+  </ol>
+  <table class="bilingual">
+    <tr>
+      <td class="en">"Genting is 1865 m slope. Model gives moderate rain probability, rule engine detects orographic lift on the windward side, composite reflects both. The 4 mini-gauges decompose risk by hazard type — user knows whether to worry about rain, fog, wind, or thunder specifically."</td>
+      <td class="zh">"云顶 1865 m 山坡。模型给出中等降雨概率，规则引擎检测到迎风坡地形抬升，最终评分综合两者。4 个 mini-gauge 把风险按类型拆解——用户清楚该担心降雨、雾、风、还是雷暴。"</td>
+    </tr>
+  </table>
+</div>
+<div class="demo">
+  <div class="demo-title">🏔️ Demo B — Mt Everest (OUT-OF-DISTRIBUTION STRESS TEST)</div>
+  <ol>
+    <li>Click <strong>🏔️ Mt Everest · 8 848 m (OOD)</strong> in the dropdown</li>
+    <li>Wait for the result</li>
+    <li>Point to the <strong>Veto triggers</strong> section (red box)</li>
+  </ol>
+  <table class="bilingual">
+    <tr>
+      <td class="en">"<strong>This is the critical test.</strong> The model was trained only on Malaysian mountains — it has never seen anything above 2000 m. A pure ML system would give a low probability here and falsely return 'safe'. <strong>A hiker could die.</strong>"</td>
+      <td class="zh">"<strong>这是关键测试</strong>。模型只在马来西亚山地训练过——从未见过 2000 m 以上的地点。<strong>纯 ML 系统</strong>会给出低概率然后错误地返回"安全"——<strong>登山者可能因此遇难</strong>。"</td>
+    </tr>
+    <tr>
+      <td class="en">"But the hybrid architecture intervenes: the Veto cascade fires three overrides — altitude &gt; 3500 m triggers hypoxia veto, temperature ≤ −5 °C triggers frostbite veto, wind ≥ 40 km/h triggers gale veto. Composite is <strong>forced to 100 = Danger</strong>, regardless of the ML output. <strong>This is exactly the OOD safety net the rule engine provides.</strong>"</td>
+      <td class="zh">"但混合架构介入了：<strong>Veto 级联触发了三个否决</strong>——海拔 &gt; 3500 m（缺氧）、温度 ≤ −5°C（冻伤）、风速 ≥ 40 km/h（大风）。无论 ML 输出什么，综合评分<strong>被强制设为 100 = Danger</strong>。<strong>这就是规则引擎对 OOD 输入的安全网作用</strong>。"</td>
+    </tr>
+  </table>
+  <div class="callout ok" style="margin-top: 2mm;">
+    🎯 <strong>The Everest demo is your strongest defensive argument.</strong> Pre-tested in <code>tests/test_rule_engine.py::test_mt_everest_veto_hypoxia</code>.<br>
+    🎯 <strong>珠峰演示是你最强的辩护点</strong>。有单元测试覆盖（<code>test_mt_everest_veto_hypoxia</code>）。
+  </div>
+</div>
+<!-- ===== Section 6: Concern #5 ===== -->
+<h2 class="pb">6 · Concern #5 — "Regression or classification?"
+  <span class="zh">反馈五 · 回归还是分类</span>
+</h2>
+<div class="quote">"I don't think this is a classification problem because there is no class label. So I think this is a regression problem."</div>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, when you first looked at the raw CSV, no class label existed — regression seemed the only option. I considered both. I chose <strong>binary classification</strong> for three reasons:"</td>
+    <td class="zh">"老师，您当时看 CSV 没有 class label，看上去像 regression。我两个都考虑过，最后选了<strong>二分类</strong>，三个理由："</td>
+  </tr>
+  <tr>
+    <td class="en"><strong>(1)</strong> "Downstream decision is binary — go outside or don't. Regressing mm of rain would still need a threshold to convert to go/no-go — I would have to pick the threshold anyway."</td>
+    <td class="zh"><strong>(1)</strong> "下游决策本身就是二元——出门 vs 不出门。即使回归预测毫米数，最后也要拿阈值转成 go/no-go——<strong>那个阈值反正要选</strong>。"</td>
+  </tr>
+  <tr>
+    <td class="en"><strong>(2)</strong> "Classification lets me optimise <strong>F2 score</strong> directly — the right metric for safety-critical recall. I cannot directly optimise F2 on a regression target."</td>
+    <td class="zh"><strong>(2)</strong> "做分类才能直接优化 <strong>F2 分数</strong>——安全关键场景下召回比精度更重要，<strong>这个指标只在分类任务下有意义</strong>。"</td>
+  </tr>
+  <tr>
+    <td class="en"><strong>(3)</strong> "But I still expose the <strong>raw probability</strong> in the API response — any downstream component that needs a continuous score (e.g. the rule engine's rainfall sub-scorer) can still use it. <strong>Best of both worlds.</strong>"</td>
+    <td class="zh"><strong>(3)</strong> "但 API 还是把<strong>原始概率</strong>暴露出来——下游需要连续分数的组件（例如规则引擎的降雨子评分器）照样能用。<strong>两全其美。</strong>"</td>
+  </tr>
+</table>
+<!-- ===== Section 7: Q&A ===== -->
+<h2>7 · Anticipated Q&amp;A
+  <span class="zh">老师可能追问</span>
+</h2>
+<h3>Q1 — "Why Random Forest and not deep learning / LSTM?" / 为什么不是深度学习？</h3>
+<table class="bilingual">
+  <tr><td class="en">"Three reasons. <strong>(1)</strong> Interpretability — feature importance lets me defend predictions. Essential for safety-critical. Neural net is a black box."</td><td class="zh">"三个理由：<strong>(1)</strong> <strong>可解释性</strong>——feature importance 让我能为每个预测辩护，安全关键应用必须，神经网络是黑盒。"</td></tr>
+  <tr><td class="en"><strong>(2)</strong> "Data efficiency — with 175 K samples, RF reaches state-of-the-art. LSTM would need an order of magnitude more data to outperform it."</td><td class="zh"><strong>(2)</strong> "<strong>数据效率</strong>——17 万样本下 RF 已经 SOTA，LSTM 需要至少 10 倍数据才能超过它。"</td></tr>
+  <tr><td class="en"><strong>(3)</strong> "Inference latency — RF inference is sub-millisecond, our FastAPI+cache architecture depends on it. LSTM would be 10× slower and need GPU at inference."</td><td class="zh"><strong>(3)</strong> "<strong>推理延迟</strong>——RF 推理 &lt; 1 ms，FastAPI+缓存架构依赖这一点；LSTM 至少慢 10 倍且推理时需要 GPU。"</td></tr>
+</table>
+<h3>Q2 — "How do you handle out-of-distribution input?" / 分布外输入怎么处理？</h3>
+<div class="callout tip"><strong>→ Just show the Mt Everest demo from §5.</strong> That IS the answer. Don't theorise — let the system speak.<br>
+<strong>→ 直接展示第 5 节的珠峰 demo</strong>。那就是答案。不要讲理论——让系统说话。</div>
+<h3>Q3 — "What is the rule engine's contribution? Could you just use ML alone?" / 规则引擎的贡献？只用 ML 不行吗？</h3>
+<table class="bilingual">
+  <tr><td class="en">"Pure ML is statistical — learns averages. But terrain in complex mountains amplifies precipitation locally by <strong>orders of magnitude</strong> (Roe 2005, Annual Rev Earth &amp; Planetary Sciences)."</td><td class="zh">"纯 ML 是统计性的——学的是平均值。但复杂山地的地形把降水<strong>局部放大几个数量级</strong>（Roe 2005, Annual Rev Earth &amp; Planetary Sciences）。"</td></tr>
+  <tr><td class="en">"R1 in our decision table captures exactly this: when macro rain probability is low <strong>but</strong> wind impinges on a windward slope with falling pressure, hidden rain risk emerges. ML would say 'safe'; rule engine fires R1 and warns."</td><td class="zh">"决策表 R1 抓的就是这点：宏观降雨概率低、<strong>但</strong>风正对迎风坡且气压下降时——<strong>存在隐藏的降雨风险</strong>。ML 会说"安全"；规则引擎触发 R1 警告。"</td></tr>
+  <tr><td class="en">"This is the <strong>Neuro-Symbolic AI</strong> paradigm — learn what is learnable, hand-code what is physical."</td><td class="zh">"这就是 <strong>Neuro-Symbolic AI</strong> 范式——能学的让 ML 学，物理规律手工编码。"</td></tr>
+</table>
+<h3>Q4 — "Cross-validation? Overfitting check?" / 交叉验证？过拟合？</h3>
+<table class="bilingual">
+  <tr><td class="en">"Yes, Sir. <strong>Time-series 5-fold CV</strong> on the training portion — not random K-fold (would leak temporal info)."</td><td class="zh">"做了老师，<strong>时间序列 5 折交叉验证</strong>——不是随机 K 折（会泄漏时间信息）。"</td></tr>
+  <tr><td class="en">"Fold AUCs range 0.828 to 0.908, mean ≈ 0.858 — close to held-out test AUC 0.871. <strong>Confirms no overfitting to a single temporal slice.</strong>"</td><td class="zh">"各折 AUC 0.828–0.908，均值约 0.858——跟独立测试集 AUC 0.871 非常接近。<strong>没有对某个时间段过拟合</strong>。"</td></tr>
+  <tr><td class="en">"All in <code>models/training_report.json</code> and the model card."</td><td class="zh">"全部在 <code>models/training_report.json</code> 和 model card 里。"</td></tr>
+</table>
+<h3>Q5 — "Real-world validation plan?" / 真实世界怎么验证？</h3>
+<table class="bilingual">
+  <tr><td class="en">"Chapter 5: two-pronged. <strong>(1) Hindcast validation</strong> — replay against publicly documented Malaysian floods/landslides from NaDMA archives; check if system would have produced Warning/Danger at the right time."</td><td class="zh">"Chapter 5 两条腿走路：<strong>(1) 历史事件回放</strong>——用 NaDMA 公开的马来西亚洪水/滑坡事件，看系统在事件发生时是否会给出 Warning 或 Danger。"</td></tr>
+  <tr><td class="en"><strong>(2) User study</strong> — small panel of mountain hikers compare system's recommendations to their own field judgment over one month. <strong>Both are standard practice in operational meteorology.</strong></td><td class="zh"><strong>(2) 用户研究</strong>——找一小批登山者，一个月内对比系统建议和他们自己的判断。<strong>两种方法都是业务气象学界标准做法</strong>。</td></tr>
+</table>
+<h3>Q6 — "Risk levels Safe/Caution/Warning/Danger?" / 四个等级怎么定？</h3>
+<table class="bilingual">
+  <tr><td class="en">"Thresholds 30 / 55 / 80 on 0-100 composite. Calibrated so the <strong>mean output across training data</strong> falls in mid-Caution — system uses full dynamic range. Each level maps to a different recommended action in bilingual advice."</td><td class="zh">"阈值 0-100 综合分上的 30 / 55 / 80。校准依据：<strong>训练集平均输出</strong>正好落在 Caution 区间中部——系统能用满整个动态范围。每个等级对应不同的双语建议行动。"</td></tr>
+</table>
+<h3>Q7 — "What if model or API fails in production?" / 生产环境挂了怎么办？</h3>
+<table class="bilingual">
+  <tr><td class="en">"<strong>Three layers of graceful degradation.</strong> (1) Model load fails → physics-motivated heuristic. (2) Internal exception → typed <code>ErrorResponse</code> JSON. (3) Rule engine's Veto cascade runs <strong>independently</strong> of ML — even if ML returns garbage, safety thresholds still fire."</td><td class="zh">"<strong>三层降级：</strong>(1) 模型加载失败→<strong>物理启发式</strong>。(2) 内部异常→<strong>类型化的 <code>ErrorResponse</code> JSON</strong>。(3) <strong>规则引擎 Veto 级联独立于 ML</strong>——即使 ML 返回乱码，安全阈值仍触发。"</td></tr>
+</table>
+<!-- ===== Section 8: Closing ===== -->
+<h2 class="pb">8 · Closing (30 seconds)
+  <span class="zh">收尾 30 秒</span>
+</h2>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, to summarise: I have addressed every point of your feedback. The missing Y is now derived. Documentation matches the data. Model is trained and evaluated <strong>before</strong> the app. Choice of classification over regression is justified by the safety-critical nature of the application."</td>
+    <td class="zh">"老师，总结一下：您每条反馈我都已经回应——Y 已经构造好、文档跟数据完全对齐、模型在 app <strong>之前</strong>就训好并评估过、分类而不是回归是因为应用本身就是安全关键。"</td>
+  </tr>
+  <tr>
+    <td class="en">"Code is on GitHub at <code>KyoukoLi/microclimate-x</code>, CI passing, 97 % test coverage, published model card. <strong>May I have your guidance on the next priorities for Chapter 5?</strong>"</td>
+    <td class="zh">"代码在 GitHub <code>KyoukoLi/microclimate-x</code>，CI 全过、测试覆盖率 97%、有完整的 model card。<strong>请问 Chapter 5 接下来您建议我重点做哪部分？</strong>"</td>
+  </tr>
+</table>
+<!-- ===== Section 9: Psychology ===== -->
+<h2>9 · Psychological reminders
+  <span class="zh">心理建设 · 老师真正在意什么</span>
+</h2>
+<div class="step">
+  <div class="num">1</div>
+  <div class="body">
+    <strong>Did you LISTEN to him? / 你听进去他的话了吗？</strong><br>
+    He asked "Do you understand my English?" multiple times. Reassure him by <strong>quoting his exact words back</strong> ("as you instructed: dataset first, then model, then app").<br>
+    他反复问 "Understand my English?"，用<strong>复述他原话</strong>让他放心。
+  </div>
+</div>
+<div class="step">
+  <div class="num">2</div>
+  <div class="body">
+    <strong>Do you understand basic ML? / 你懂 ML 基础吗？</strong><br>
+    He explained X/Y, rows/columns, "if-then is the target" — patiently, like a tutor. <strong>Don't open with hybrid / neuro-symbolic / TPI / CAPE.</strong> Start with: dataset, target, feature, train, predict. <strong>Earn the right</strong> to use fancy vocabulary by first speaking his language.<br>
+    <strong>不要上来就抛 hybrid、neuro-symbolic、TPI、CAPE。</strong>先用他的词汇：dataset、target、feature、train、predict。<strong>先证明你懂基础</strong>再升级。
+  </div>
+</div>
+<div class="step">
+  <div class="num">3</div>
+  <div class="body">
+    <strong>Did you follow his process? / 你按他的流程做了吗？</strong><br>
+    "App is the last" — he said it <strong>three times</strong>. The visual order in which you open tabs IS the answer. <strong>No app until the very end.</strong><br>
+    "app is the last" 他说了三次。<strong>你打开标签页的顺序就是答案</strong>。<strong>绝对不要提前打开 app。</strong>
+  </div>
+</div>
+<h3>Defensive lines if you get stuck / 答不出来时的兜底话术</h3>
+<table>
+  <tr><th>Situation</th><th>EN</th><th>ZH</th></tr>
+  <tr>
+    <td>Don't know answer</td>
+    <td>"That is a good question, Sir. I haven't fully worked out the answer yet — may I prepare a written response by next meeting?"</td>
+    <td>"老师这是个好问题，我还没完全想清楚——能否下次开会前给您一份书面回复？"</td>
+  </tr>
+  <tr>
+    <td>He challenges a threshold</td>
+    <td>"Sir, the threshold is documented in <code>docs/thresholds.md</code> with the academic citation. Let me open it."</td>
+    <td>"老师，这个阈值的学术引用在 <code>docs/thresholds.md</code> 里，我打开给您看。"</td>
+  </tr>
+  <tr>
+    <td>"This doesn't match what I expected"</td>
+    <td>"Yes Sir — that is exactly what I want to confirm with you. Could you describe what you expected, so I can align?"</td>
+    <td>"老师<strong>这正是我想跟您确认的点</strong>——能否说说您预期的样子？我好对齐。"</td>
+  </tr>
+</table>
+<!-- ===== Section 10: Backup ===== -->
+<h2>10 · Backup plan / 设备出问题的备份方案</h2>
+<table>
+  <tr><th>Problem</th><th>Fallback</th><th>中文</th></tr>
+  <tr><td>WiFi down</td><td>Synthetic dataset works offline — <code>make synth</code> already ran</td><td>合成数据集已经跑过，本地能演</td></tr>
+  <tr><td><code>make run</code> fails</td><td>Show GitHub repo with green CI badge — same artefacts visible there</td><td>直接给 GitHub repo 看 CI 绿勾，artefact 一样能看</td></tr>
+  <tr><td>Demo doesn't load</td><td>Use cached responses — recent results in <code>cache.sqlite3</code></td><td>用缓存的结果——最近查询都在 <code>cache.sqlite3</code> 里</td></tr>
+  <tr><td>Browser crashes</td><td>Open this cheat sheet on your phone — every key number is here</td><td>手机打开这份 cheat sheet——所有关键数字都在</td></tr>
+</table>
+<!-- ===== Section 11: Pre-flight ===== -->
+<h2>11 · Pre-flight checklist (60 seconds before)
+  <span class="zh">起飞前最后 60 秒自检</span>
+</h2>
+<div class="check">
+  <div><span class="box">☐</span> Laptop ≥ 80 % battery, charger in bag / 笔记本电池 ≥ 80%，充电器在包里</div>
+  <div><span class="box">☐</span> <code>make run</code> is running in a terminal (don't close it!) / <code>make run</code> 在另一个终端跑着（不要关！）</div>
+  <div><span class="box">☐</span> <code>/api/health</code> returns <code>ml_loaded: true</code> / <code>/api/health</code> 返回 <code>ml_loaded: true</code></div>
+  <div><span class="box">☐</span> All 10 browser tabs open in correct order (app is LAST) / 10 个标签页按顺序开好（app 在最后）</div>
+  <div><span class="box">☐</span> This cheat sheet open on screen — but NOT to be read word-for-word / 这份 cheat sheet 开着，但不要照念</div>
+  <div><span class="box">☐</span> Phone on silent / 手机静音</div>
+  <div><span class="box">☐</span> Deep breath. You have done the work. / 深呼吸。你已经做完了所有该做的工作。</div>
+</div>
+<footer>
+  Generated 2026-05-11 · MicroClimate-X · KyoukoLi/microclimate-x ·
+  CI passing · 97 % coverage · 70 tests
+  <br>
+  此页为 2026-05-11 UKM 毕业设计 MicroClimate-X 导师答辩准备文档
+</footer>
+</main>
+</body>
+</html>

docs/MEETING_CHEAT_SHEET.md ADDED Viewed

	@@ -0,0 +1,372 @@

+# 📋 Supervisor Meeting Cheat Sheet
+# 📋 导师开会一页通
+> **Open this on your laptop during the meeting.** Print it if you prefer paper.
+> Everything you need is in this single document.
+>
+> **开会时电脑屏幕开着这一页就够。** 想要纸质版直接打印。
+> 所有内容都在这一份文档里。
+---
+## 🔧 0. Before the meeting (10 minutes before)
+## 🔧 0. 会前 10 分钟准备
+Run these in a terminal, in order. **Do not skip any.**
+在终端按顺序执行，**一条都不能少**：
+```bash
+cd ~/Projects/microclimate-x
+# 1. Pull latest + verify clean working tree
+git pull && git status        # should print "working tree clean"
+# 2. Start the backend (leave running in this terminal)
+make run                      # uvicorn boots on http://localhost:8000
+# 3. In a NEW terminal: verify the API is alive + model is loaded
+curl -s http://localhost:8000/api/health | python3 -m json.tool
+# expect: "status": "ok", "ml_loaded": true
+```
+If `ml_loaded` is **false**, run `make train` first — but this should already be done.
+如果 `ml_loaded` 显示 **false**，先跑 `make train` —— 但理论上之前已经训好了。
+### Browser tabs to open in this exact order / 浏览器按顺序开好这几个标签页
+| # | URL | Purpose |
+|---|---|---|
+| 1 | `file:///…/microclimate-x/docs/MEETING_CHEAT_SHEET.md` (this file) | Your safety net |
+| 2 | `https://github.com/KyoukoLi/microclimate-x` | Show CI green badge |
+| 3 | `file:///…/microclimate-x/docs/dataset.md` | For Concern #1 + #2 |
+| 4 | `file:///…/microclimate-x/figures/01_roc_curve.png` | For Concern #4 step 2 |
+| 5 | `file:///…/microclimate-x/figures/03_calibration_curve.png` | |
+| 6 | `file:///…/microclimate-x/figures/04_threshold_sweep.png` | |
+| 7 | `file:///…/microclimate-x/figures/05_feature_importance.png` | |
+| 8 | `file:///…/microclimate-x/docs/architecture.md` | For rule engine section |
+| 9 | `http://localhost:8000/app/` | **The actual app — OPEN LAST** |
+| 10 | `file:///…/microclimate-x/models/MODEL_CARD.md` | Q&A backup |
+🚨 **Tab 9 (the app) MUST be shown LAST during the walkthrough** (Tab 10 is only a Q&A backup). If you accidentally show the app first, the supervisor will remember last meeting's complaint ("app is last") and you lose credibility.
+🚨 **标签 9（app）一定要最后展示**（标签 10 只是 Q&A 备用）。不小心先打开 app 老师就会立刻想起上次 "app is last" 的批评。
+---
+## 🎬 1. Opening (30 seconds)
+## 🎬 1. 开场（30 秒）
+> **EN**: "Sir, since our last meeting I have addressed every point of your feedback. May I walk you through them in the correct order — **dataset first, then model, then app** — as you instructed?"
+>
+> **ZH**: "老师，按您上次反馈，我已经把每一条都改了。我按您要求的顺序——**先 dataset，再 model，最后才是 app**——给您过一遍可以吗？"
+**Why this works**: directly quotes his words back to him. He relaxes immediately.
+**为什么有效**：直接复述了他自己的话，他会立刻放松。
+---
+## 📊 2. Concern #1 — "Y is missing"
+## 📊 2. 反馈一 —— Y 列缺失
+**His original words / 老师原话**: *"Y is missing. I don't have the output variable. If you don't have target, you cannot train a machine learning model."*
+### What to do on screen / 屏幕操作
+1. Switch to Tab 3 (`docs/dataset.md`)
+2. Scroll to **§5 Target label derivation**
+3. Point to the highlighted code line:
+```python
+df['is_rain_event'] = (df['precipitation'].shift(-1) > 0.1).astype(int)
+```
+### What to say / 怎么说
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Sir, you were right — the raw Open-Meteo CSV has no Y column. I have engineered the target explicitly. The variable is called `is_rain_event` and it is defined as **1 if the precipitation in the next hour is greater than 0.1 mm, else 0**." | "老师您说得对，原始 CSV 没有 Y 列。我现在已经显式构造了目标变量 **`is_rain_event`**——**下一小时降雨量 > 0.1 mm 则为 1，否则为 0**。" |
+| "Three things to notice. First, `.shift(-1)` means I use **future** rain as the label — features at hour t predict outcome at t+1h, so there is no temporal data leakage." | "三个要点：(1) `.shift(-1)` 表示用**下一小时**的降雨作标签，特征是 t 时刻、预测的是 t+1 小时——**无时间泄漏**。" |
+| "Second, the 0.1 mm threshold matches the **WMO definition of trace precipitation** — it is not an arbitrary choice." | "(2) 0.1 mm 这个阈值不是我随便定的，对应 **WMO 微量降水标准**。" |
+| "Third, it is **binary classification**, not regression, because the downstream user decision is binary — go or no-go." | "(3) 是**二分类**不是回归，因为下游用户决策本身就是二元的——去 / 不去。" |
+---
+## 📊 3. Concern #2 — "Features in document don't match Excel"
+## 📊 3. 反馈二 —— 文档里的特征和 CSV 列名对不上
+**His original words / 老师原话**: *"The features that you presented here, not... not mentioned in the Excel. So, it must be matched."*
+### What to do on screen / 屏幕操作
+Stay on Tab 3 (`docs/dataset.md`). Scroll **up** to **§4 Schema**. Show the column table.
+### What to say / 怎么说
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Sir, that was also a fair point. I have rewritten the dataset specification so the documentation lists **exactly the same column names** that appear in the CSV. There is a one-to-one mapping right here in §4." | "老师，这条您也说得对。我已经重写了数据集文档，文档里列出的就是 CSV 里的**真实列名**，一一对应，就在第 4 节这里。" |
+| "Every row in this table is one column in the actual CSV. The 'role' column says whether it is a feature (**X**), the target (**Y**), or just metadata." | "表里每一行就是 CSV 里的一列，role 列写明了它是 feature（**X**）、target（**Y**）还是 metadata。" |
+---
+## 📊 4. Concern #3 — "Study the data source"
+## 📊 4. 反馈三 —— 研究数据源本身
+**His original words / 老师原话**: *"Please study the link. What is the purpose of the dataset? What is design for? What is the output variable?"*
+### What to do on screen / 屏幕操作
+Stay on Tab 3 (`docs/dataset.md`). Scroll back **up** to **§1-3** (Source / Spatial coverage / Temporal coverage).
+### What to say / 怎么说
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "I read the Open-Meteo API documentation carefully. The dataset I use is the **ERA5 reanalysis archive**, which is ECMWF's gold-standard hourly reanalysis." | "我把 Open-Meteo 文档仔细读了。我用的是 **ERA5 再分析数据**，是 ECMWF 出的金标准同化产品。" |
+| "It is *not* a forecast — it is a physically-consistent reconstruction of past weather. ECMWF themselves use ERA5 to **validate other forecast models**. That is why it is the right dataset for training ML: the labels are reliable ground truth." | "它**不是**预报，是对过去天气的物理一致的重建。ECMWF 自己用 ERA5 去**校验别的预报模型**——所以拿来训练 ML 是合适的，**标签是可靠的 ground truth**。" |
+| "Spatial coverage: 5 Malaysian mountain sites — Genting, Cameron, Fraser's Hill, Klang Valley, Kinabalu — chosen to span elevations from 100 m to 1865 m and terrain from valley to slope." | "空间覆盖 5 个马来西亚山地点位——云顶、金马仑、福隆港、巴生谷、神山——海拔 100 m 到 1865 m，地形从山谷到山坡都有。" |
+| "Temporal coverage: 5 years, hourly, 175 315 rows total." | "时间范围 5 年，每小时一行，总共 175 315 行。" |
+---
+## 📊 5. Concern #4 — "App is the last"
+## 📊 5. 反馈四 —— App 放在最后做
+**His original words / 老师原话**: *"First, identify a dataset. And then train the model. And then predict it. Once everything is finished, you can develop the app. App is the last."*
+🚨 **This is the most important section.** Pace yourself — about 2-3 minutes total. **Don't open the app until the very end.**
+🚨 **这是最重要的一节。** 控制节奏，总共大约 2-3 分钟。**不要提前打开 app。**
+### Step-by-step on-screen demo / 逐步演示
+#### Step 2a — ROC curve / 第二步 a：ROC 曲线
+→ Switch to **Tab 4** (`figures/01_roc_curve.png`)
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Step 2, model training. Test ROC AUC is **0.871** on 35 063 held-out hourly samples. The hold-out is the **last 20 % chronologically**, not a random split — random splits leak temporal autocorrelation and would inflate accuracy unrealistically by 5-15 percentage points." | "第二步，模型训练。测试集 35 063 行，**ROC AUC = 0.871**。划分用的是**按时间排序的最后 20%**，不是随机划分——随机划分会泄漏时间自相关，把准确率虚高 5-15 个百分点。" |
+#### Step 2b — Calibration / 第二步 b：校准度
+→ Switch to **Tab 5** (`figures/03_calibration_curve.png`)
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Brier score is **0.138**, which means the predicted probabilities are well-calibrated — when the model says 70 % chance of rain, the actual rate is close to 70 %. So I do not need post-hoc calibration like Platt scaling or isotonic regression." | "Brier 分数 = **0.138**，说明预测概率**校准良好**——模型说 70% 概率时，实际频率接近 70%。**不需要额外做** Platt scaling 或 isotonic 校准。" |
+#### Step 2c — Threshold choice / 第二步 c：阈值选择
+→ Switch to **Tab 6** (`figures/04_threshold_sweep.png`)
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "I optimised the decision threshold for **F2 score**, not F1, because in this safety-critical application a missed rain event on a windward slope can lead to flash flooding — false negatives are much worse than false positives." | "我用 **F2 分数**而不是 F1 来选最优阈值——因为这是安全关键应用，**漏报**比误报严重得多。" |
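+| "F2 treats recall as twice as important as precision (β = 2, which appears as a β² = 4 weighting in the F-beta formula). The optimal threshold is τ = **0.20**, giving F2 = 0.778 and **93.4 % recall**." | "F2 把召回率的重要性视为精度的 2 倍（β = 2，在 F-beta 公式里体现为 β² = 4 的权重）。最优阈值是 τ = **0.20**，F2 = 0.778，**召回率 93.4%**。" |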
+#### Step 2d — What the model learned / 第二步 d：模型学到了什么
+→ Switch to **Tab 7** (`figures/05_feature_importance.png`)
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Top three features: previous hour's rain, time-of-day cyclic encoding, and 3-hour pressure tendency. These match the meteorological literature — autocorrelation, diurnal cycle, and storm precursor. So the model has learned something physically meaningful." | "模型最看重的 3 个特征：上一小时降水、时间周期编码、3 小时气压变化。**跟气象文献吻合**——自相关、日变化、风暴前兆。模型学到的是**物理上有意义的信号**。" |
+#### Step 3 — The app (last) / 第三步：App（最后）
+→ Switch to **Tab 9** (`http://localhost:8000/app/`)
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "**Now**, Step 3, the app. This is FastAPI plus Vue using the trained model from Step 2 — not a separate model, not a placeholder. When I click any coordinate, the system returns the probability and the four hazard sub-scores per proposal §3.7." | "**现在**第三步，app。这是 FastAPI + Vue 调用刚才**第二步训好的模型**——不是另一个模型、也不是占位符。点地图任意一点，系统返回概率和四个分项灾害评分（按开题 §3.7）。" |
+### Demo scenario A — Genting Highlands (familiar territory)
+### Demo 场景 A —— 云顶高原（训练数据内）
+1. Click the **🇲🇾 Genting Highlands · slope** option in the scenario dropdown (top right)
+2. Wait ~1 second for the loading spinner to finish
+3. Point to the **risk gauge** (main number)
+4. Point to the **4 mini-gauges** below (rainfall / fog / wind / thunderstorm)
+| Say in EN | 用中文说 |
+|---|---|
+| "Genting is a slope at 1865 m. The model gives a moderate rain probability, the rule engine picks up orographic lift on the windward side, and the composite score reflects both. The 4 mini-gauges decompose the risk by hazard type so the user knows whether to worry about rain, fog, wind, or thunder specifically." | "云顶是 1865 m 的山坡，模型给出中等降雨概率，规则引擎检测到迎风坡的地形抬升，最终评分综合两者。4 个 mini-gauge 把风险按类型拆解——用户能看出该担心降雨、雾、风、还是雷暴。" |
+### Demo scenario B — Mt Everest (out-of-distribution stress test)
+### Demo 场景 B —— 珠穆朗玛峰（分布外压力测试）
+1. Click the **🏔️ Mt Everest · 8 848 m (OOD)** option in the dropdown
+2. Wait for the result
+3. Point to the **Veto triggers** section (blinking red box)
+| Say in EN | 用中文说 |
+|---|---|
+| "This is the critical test. The model was trained only on Malaysian mountains — it has never seen anything above 2000 m. A pure ML system would give a low probability here and falsely return 'safe', and a hiker could die." | "**这是关键测试**。模型只在马来西亚山地训练过——从未见过 2000 m 以上的地点。**纯 ML 系统**会给出低概率然后错误地返回"安全"——登山者可能因此遇难。" |
+| "But the hybrid architecture intervenes: the Veto cascade fires three independent overrides — altitude > 3500 m triggers hypoxia veto, temperature ≤ −5 °C triggers frostbite veto, wind ≥ 40 km/h triggers gale veto. The composite is forced to 100 = Danger, regardless of the ML output. This is exactly the OOD safety net the rule engine provides." | "但混合架构介入了：**Veto 级联触发了三个独立否决**——海拔 > 3500 m（缺氧）、温度 ≤ −5°C（冻伤）、风速 ≥ 40 km/h（大风）。无论 ML 输出什么，综合评分被强制设为 100 = Danger。**这就是规则引擎对 OOD 输入的安全网作用**。" |
+🎯 **The Mt Everest demo is your strongest defensive argument.** It's also pre-tested — see `tests/test_rule_engine.py::test_mt_everest_veto_hypoxia`.
+🎯 **珠峰演示是你最强的辩护点**。也是有单元测试覆盖的——见 `test_mt_everest_veto_hypoxia`。
+---
+## 📊 6. Concern #5 — "Regression or classification?"
+## 📊 6. 反馈五 —— 回归还是分类？
+**His original words / 老师原话**: *"I don't think this is a classification problem because there is no class label. So I think this is a regression problem."*
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Sir, when you first looked at the raw CSV, there was no class label, so regression looked like the only option. I considered both. I chose **binary classification** for three reasons:" | "老师，您当时看 CSV 没有 class label，所以看上去像 regression。我两个都考虑过，最后选了**二分类**，三个理由：" |
+| **(1)** "The downstream decision is binary — go outside or don't. Regressing on mm of rain would still need a threshold to convert to a go/no-go output, so I would have to pick the threshold anyway." | **(1)** "下游决策本身就是二元的——出门 vs 不出门。即使做回归预测降雨毫米数，最后也要拿一个阈值转成 go/no-go，**那个阈值反正要选**。" |
+| **(2)** "Classification lets me optimise **F2 score** directly, which is the right metric for safety-critical recall. I cannot directly optimise F2 on a regression target." | **(2)** "做分类才能直接优化 **F2 分数**——安全关键场景下召回比精度更重要，**这个指标只在分类任务下有意义**。" |
+| **(3)** "But I still expose the **raw probability** in the API response, so any downstream component that needs a continuous score — for example the rule engine's rainfall sub-scorer — can still use it. So I keep the best of both worlds." | **(3)** "但 API 还是把**原始概率**暴露出来了，下游需要连续分数的组件（比如规则引擎的降雨子评分器）照样能用。**两全其美**。" |
+---
+## 🛡️ 7. Anticipated follow-up Q&A
+## 🛡️ 7. 老师可能追问的问题
+### Q1 — "Why Random Forest and not deep learning / LSTM?"
+### Q1 ——为什么选 Random Forest 而不是深度学习 / LSTM？
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Three reasons. First, **interpretability** — feature importance lets me defend why the model predicts what it predicts. Essential for safety-critical applications. A neural net is a black box." | "三个理由：(1) **可解释性**——feature importance 让我能为每个预测**辩护**，安全关键应用必须有这一点，神经网络是黑盒。" |
+| "Second, **data efficiency** — with 175 K samples, Random Forest reaches state-of-the-art performance. LSTM would need an order of magnitude more data to outperform it." | "(2) **数据效率**——17 万样本下 RF 已经达到 SOTA，LSTM 需要至少 10 倍数据才能超过它。" |
+| "Third, **inference latency** — RF inference is sub-millisecond, which the FastAPI plus cache architecture depends on. LSTM would be at least 10× slower and require GPU at inference time." | "(3) **推理延迟**——RF 推理 < 1 ms，FastAPI + 缓存架构依赖这一点；LSTM 至少慢 10 倍且推理时需要 GPU。" |
+### Q2 — "How do you handle out-of-distribution input?"
+### Q2 ——分布外输入怎么处理？
+**Just show the Mt Everest demo from Section 5 — that IS the answer.**
+**直接展示第 5 节的珠峰 demo —— 那就是答案。**
+### Q3 — "What is the contribution of the topographic rule engine? Could you just use ML alone?"
+### Q3 ——地形规则引擎的贡献是什么？只用 ML 不行吗？
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Pure ML is statistical — it learns averages. But terrain in complex mountainous regions amplifies precipitation locally by **orders of magnitude**, see Roe 2005, *Annual Review of Earth & Planetary Sciences*." | "纯 ML 是统计性的——它学的是平均值。但复杂山地的地形会把降水**局部放大几个数量级**（Roe 2005, Annual Review of Earth & Planetary Sciences）。" |
+| "The R1 rule in our decision table captures exactly this: when macro rain probability is low **but** the wind impinges on a windward slope with falling pressure, hidden rain risk emerges. The ML model would say 'safe' here; the rule engine fires R1 and warns the user." | "我们决策表的 R1 规则抓住的正是这一点：宏观降雨概率低、但风正对迎风坡且气压下降时——**存在隐藏的降雨风险**。ML 在这种情况下会说"安全"；规则引擎会触发 R1 警告用户。" |
+| "This is the **Neuro-Symbolic AI** paradigm — learn what is learnable, hand-code what is physical." | "这就是 **Neuro-Symbolic AI** 范式——能学的让 ML 学，物理规律手工编码。" |
+### Q4 — "Did you do cross-validation? Did you check for overfitting?"
+### Q4 ——做过交叉验证吗？检查过过拟合吗？
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Yes Sir, **time-series cross-validation** with 5 folds on the training portion — not random K-fold, which would leak temporal information." | "做了老师，**时间序列交叉验证**，5 折，**不是**随机 K 折——随机划分会泄漏时间信息。" |
+| "The fold AUCs range from 0.828 to 0.908, mean approximately 0.858 — very close to the held-out test AUC of 0.871. This consistency confirms the model is not overfitting to a single temporal slice." | "各折 AUC 在 0.828 到 0.908 之间，均值约 0.858——跟独立测试集 AUC 0.871 非常接近。**说明模型没有对某个时间段过拟合**。" |
+| "All fold metrics are in `models/training_report.json` and the model card." | "所有指标都在 `models/training_report.json` 和 model card 里。" |
+### Q5 — "How will you validate this in the real world?"
+### Q5 ——你怎么在真实世界验证这套系统？
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Two-pronged plan for Chapter 5 evaluation. First, **hindcast validation** — I will replay the system against publicly documented Malaysian flood and landslide events from NaDMA archives and check whether the system would have produced a Warning or Danger verdict at the right time." | "Chapter 5 评估两条腿走路：(1) **历史事件回放**——用 NaDMA 公开记录的马来西亚洪水/滑坡事件，看系统在事件发生时是否会给出 Warning 或 Danger。" |
+| "Second, **user study** — a small panel of mountain hikers will compare the system's recommendations against their own field judgment over a one-month period. Both methodologies follow standard practice in operational meteorology." | "(2) **用户研究**——找一小批登山者，一个月内对比系统建议和他们自己的判断。**两种方法都是业务气象学界的标准做法**。" |
+### Q6 — "What about the four risk levels — Safe, Caution, Warning, Danger?"
+### Q6 ——四个风险等级（Safe / Caution / Warning / Danger）是怎么定的？
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "The thresholds are 30 / 55 / 80 on the 0-100 composite score. They are calibrated so that the **mean output across all training data** falls in the middle of the Caution band — that way the system uses its full dynamic range. Each level maps to a different recommended action in the bilingual advice." | "阈值是 0-100 综合分上的 30 / 55 / 80。校准依据：**训练集平均输出**正好落在 Caution 区间中部——这样系统能用满整个动态范围。每个等级对应不同的双语建议行动。" |
+### Q7 — "What if the API or model fails in production?"
+### Q7 ——生产环境 API 或模型挂了怎么办？
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Three layers of graceful degradation. First, if the trained model fails to load, the engine falls back to a physics-motivated heuristic. Second, every internal exception is caught and surfaced as a typed `ErrorResponse` JSON document. Third, the rule engine's Veto cascade runs **independently** of the ML model — even if ML returns garbage, the safety thresholds still fire." | "三层降级：(1) 模型加载失败时回退到**物理启发式**。(2) 所有内部异常被捕获并返回**类型化的 `ErrorResponse` JSON**。(3) **规则引擎的 Veto 级联独立于 ML 模型**——即使 ML 返回乱码，安全阈值仍然会触发。" |
+---
+## 🎬 8. Closing (30 seconds)
+## 🎬 8. 收尾（30 秒）
+| 🇬🇧 EN | 🇨🇳 ZH |
+|---|---|
+| "Sir, to summarise: I have addressed every point of your feedback. The missing Y is now derived. The documentation matches the data. The model is trained and evaluated **before** the app. And the choice of classification over regression is justified by the safety-critical nature of the application." | "老师，总结一下：您每条反馈我都已经回应——Y 已经构造好、文档跟数据完全对齐、模型在 app **之前**就训好并评估过、分类而不是回归是因为应用本身就是安全关键。" |
+| "The code is on GitHub at `KyoukoLi/microclimate-x` with CI passing, 97 % test coverage, and a published model card. May I have your guidance on the next priorities for Chapter 5?" | "代码在 GitHub `KyoukoLi/microclimate-x`，CI 全过、测试覆盖率 97%、有完整的 model card。请问 **Chapter 5 接下来您建议我重点做哪部分**？" |
+---
+## 🧠 9. Psychological reminders
+## 🧠 9. 心理建设
+From the meeting recordings, the supervisor cares about three things above all else:
+从录音里可以听出来，老师**最在意三件事**：
+1. **Did you LISTEN to him?** — He asked "Do you understand my English?" multiple times. Reassure him by **quoting his exact words back** ("as you instructed: dataset first, then model, then app").
+   **你听进去他的话了吗？** —— 他反复问 "Understand my English?"，用**复述他原话**让他放心。
+2. **Do you understand basic ML?** — He explained X/Y, rows/columns, "if-then is the target" — patiently, like a tutor. Don't open with hybrid / neuro-symbolic / TPI / CAPE. Start with: dataset, target, feature, train, predict. **Earn the right** to use fancier vocabulary by first speaking his language.
+   **你懂 ML 基础吗？** —— 不要上来就抛 hybrid、neuro-symbolic、TPI、CAPE。**先用他的词汇**：dataset、target、feature、train、predict。**先证明你懂基础**再升级。
+3. **Did you follow his process?** — "App is the last" three times. The visual order in which you open tabs IS the answer. **No app until the very end.**
+   **你按他的流程做了吗？** —— "app is the last" 他说了三次。**你打开标签页的顺序就是答案**。**绝对不要提前打开 app**。
+### Defensive lines if you get stuck / 答不出来时的兜底话术
+| Situation | Say (EN) | 说（ZH） |
+|---|---|---|
+| Don't know the answer | "That is a good question, Sir. I haven't fully worked out the answer yet — may I prepare a written response by next meeting?" | "老师这是个好问题，我还没完全想清楚——能否下次开会前给您一份书面回复？" |
+| He challenges a threshold | "Sir, the threshold is documented in `docs/thresholds.md` with the academic citation. Let me open it." | "老师，这个阈值的学术引用在 `docs/thresholds.md` 里，我打开给您看。" |
+| He says "this doesn't match what I expected" | "Yes Sir — that is exactly what I want to confirm with you. Could you describe what you expected so I can align?" | "老师**这正是我想跟您确认的点**——能否说说您预期的样子？我好对齐。" |
+---
+## ⚙️ 10. Backup plan if technical issues
+## ⚙️ 10. 设备出问题的备份方案
+| Problem | Fallback |
+|---|---|
+| WiFi / network down | The synthetic dataset works offline — `make synth` already ran |
+| `make run` fails | Show the GitHub repo with CI green badge instead — the same artefacts are visible there |
+| Demo doesn't load (open-meteo / open-topo-data API blocked) | Use the cached responses — recent results survive in `cache.sqlite3` |
+| Browser crashes | Open this cheat sheet on your phone — every key number / sentence is here |
+| 网络挂了 | 合成数据集已经跑过，本地能演 |
+| `make run` 起不来 | 直接给 GitHub repo 看 CI 绿勾，artefact 一样能看到 |
+| Demo 加载失败 | 用缓存的结果——最近查询都在 `cache.sqlite3` 里 |
+| 浏览器崩了 | 手机打开这份 cheat sheet —— 所有关键数字和句子都在里面 |
+---
+## 📐 11. Final pre-flight checklist (do this 60 seconds before walking in)
+## 📐 11. 起飞前最后 60 秒自检
+```
+☐ Laptop ≥ 80% battery, charger in bag
+☐ make run is running in a terminal (don't close it!)
+☐ http://localhost:8000/api/health returns ml_loaded: true
+☐ All 10 browser tabs open in the order above (#9 — the app — is LAST in the tab bar)
+☐ This cheat sheet open on screen, but NOT to be read word-for-word
+☐ Phone on silent
+☐ Deep breath. You have done the work.
+```
+```
+☐ 笔记本电池 ≥ 80%，充电器在包里
+☐ make run 在另一个终端跑着（不要关掉！）
+☐ http://localhost:8000/api/health 返回 ml_loaded: true
+☐ 10 个浏览器标签页按上面顺序开好（第 9 个 app 在标签栏最后）
+☐ 这份 cheat sheet 开着，但不要照念
+☐ 手机静音
+☐ 深呼吸。你已经做完了所有该做的工作。
+```
+---
+## 📎 Cross-references / 相关文档索引
+| Topic | File |
+|---|---|
+| Detailed dataset spec | [`docs/dataset.md`](dataset.md) |
+| Architecture deep-dive | [`docs/architecture.md`](architecture.md) |
+| Threshold citations | [`docs/thresholds.md`](thresholds.md) |
+| Pipeline order ASCII chart | [`docs/pipeline_order.md`](pipeline_order.md) |
+| Model card | [`../models/MODEL_CARD.md`](../models/MODEL_CARD.md) |
+| Full thesis-defence brief | [`supervisor_meeting_brief.md`](supervisor_meeting_brief.md) |
+| Evaluation summary JSON | [`../figures/evaluation_summary.json`](../figures/evaluation_summary.json) |
+---
+> *Generated 2026-05-11 for the MicroClimate-X final-year-project supervisor meeting at UKM.
+> 此页为 2026-05-11 UKM 毕业设计 MicroClimate-X 导师答辩准备文档。*

docs/architecture.md ADDED Viewed

	@@ -0,0 +1,116 @@

+# Architecture / 架构
+## Request flow / 请求流程
+```
+┌──────────────┐ 1. click(lat,lon)  ┌──────────────────────────────┐
+│   Browser    │ ─────────────────► │  FastAPI  /api/predict        │
+│  Vue3 + Map  │                    │                               │
+└──────────────┘ ◄───────────────── │  ┌─────────────────────────┐  │
+                  6. JSON response  │  │  Cache lookup           │  │
+                                    │  │  (WAL SQLite, 60-600s)  │  │
+                                    │  └────────┬────────────────┘  │
+                                    │           │ miss              │
+                                    │           ▼                   │
+                                    │  ┌─────────────────────────┐  │
+                                    │  │ 2. Parallel fetch       │  │
+                                    │  │  - Open-Meteo (weather) │  │
+                                    │  │  - Open-Topo-Data (DEM) │  │
+                                    │  └────────┬────────────────┘  │
+                                    │           ▼                   │
+                                    │  ┌─────────────────────────┐  │
+                                    │  │ 3. Engine A — RandomFor │  │
+                                    │  │    predict_proba → P    │  │
+                                    │  └────────┬────────────────┘  │
+                                    │           ▼                   │
+                                    │  ┌─────────────────────────┐  │
+                                    │  │ 4. Engine B — Rules     │  │
+                                    │  │  ┌───────────────────┐  │  │
+                                    │  │  │ P4.3 four hazard  │  │  │
+                                    │  │  │  sub-scorers      │  │  │
+                                    │  │  └─────────┬─────────┘  │  │
+                                    │  │  ┌───────────────────┐  │  │
+                                    │  │  │ §3.7.2 decision   │  │  │
+                                    │  │  │  table R1-R4      │  │  │
+                                    │  │  └─────────┬─────────┘  │  │
+                                    │  │  ┌───────────────────┐  │  │
+                                    │  │  │ Veto cascade      │  │  │
+                                    │  │  └─────────┬─────────┘  │  │
+                                    │  │  ┌───────────────────┐  │  │
+                                    │  │  │ P4.4 activity-    │  │  │
+                                    │  │  │ weighted composite│  │  │
+                                    │  │  └─────────┬─────────┘  │  │
+                                    │  │    Bilingual advice     │  │
+                                    │  └────────┬────────────────┘  │
+                                    │           ▼                   │
+                                    │  ┌─────────────────────────┐  │
+                                    │  │ 5. Cache + audit log    │  │
+                                    │  │    risk-adaptive TTL    │  │
+                                    │  └────────┬────────────────┘  │
+                                    │           ▼                   │
+                                    │      response JSON            │
+                                    └──────────────────────────────┘
+```
+## Why "Hybrid"? / 为什么是混合架构？
+**Failure mode of pure ML**: feed Mt Everest coordinates → trained on tropical Malaysian mountains → predicts ~0 % rain → ignores -30 °C, 80 km/h winds, 8800 m hypoxia → returns "Safe". A hiker dies.
+**Mitigation**: the Rule Engine is the **safety net**. It encodes physical / medical thresholds that are *true everywhere*, not learned from data. ML provides nuanced in-distribution probability; rules provide bounded out-of-distribution guarantees.
+This split — learnable component + symbolic component — is the **Neuro-Symbolic AI** paradigm (Garcez & Lamb, 2020).
+## Engine B internals (D5 proposal §3.7 — P4)
+Engine B is structured in **one-to-one correspondence** with sub-process §3.7 of the proposal so the thesis chapter can quote line numbers directly:
+| Proposal section | Code artefact | What it does |
+|---|---|---|
+| **P4.1** Load Dynamic Risk Rules | `backend/config.py` — `DECISION_TABLE_3_7_2`, `ACTIVITY_WEIGHTS`, all `PENALTY_*` / threshold constants | Single source of truth for every threshold, weight, and rule, each annotated with the citation it is derived from. |
+| **P4.2** Fetch User Context | `?activity={hiker,driver,construction,general}` query parameter, plumbed to `evaluate(activity=…)` | Captures who the user is so weights can be applied later. |
+| **P4.3** Evaluate Environmental Risks | Four `score_*_risk()` functions in `rule_engine.py`: rainfall, fog, wind gust, thunderstorm | Each returns a 0-100 sub-score using ML probability + weather + terrain inputs. |
+| **§3.7.2 Table 4.2** Decision Table | `apply_decision_table_3_7_2()` | Returns which of R1-R4 fire (hidden rain on windward slope; no amplification on leeward; heavy downpour incoming; normal rain). Emits a `[table]` line in the XAI log per match. |
+| **Veto cascade** | `_collect_veto_triggers()` | Life-safety overrides (altitude hypoxia, extreme cold, gale wind, high CAPE, low visibility, valley flash-flood, orographic-lift storm). When any fires, composite is capped at 100 and a `Danger` verdict is returned regardless of ML probability. |
+| **P4.4** Activity-Specific Weighting | `apply_activity_weighting()` + `ACTIVITY_WEIGHTS` matrix | Weights per (activity × hazard) pair (e.g. driver weights fog 1.5×, construction weights wind 1.5×). |
+| **P4.5** Composite Risk Score | Same function | Composite = 0.80 · max(weighted sub-scores) + 0.20 · mean(rest). Dominant hazard wins; secondary hazards lift the score modestly. |
+| **P4.6** Actionable Advice | `_normal_advice()` / `_veto_advice()` | Bilingual EN/ZH narrative mentioning the dominant hazard, the terrain, and the activity. |
+### Why "dominant-hazard composite" instead of a plain weighted sum?
+A naive arithmetic mean dilutes the dominant hazard — a thunderstorm sub-score of 90 averaged with three sub-scores of 10 would yield only 30, which understates real danger. The dominant-hazard formula gives the **single worst hazard for that user** 80 % of the weight; the remaining 20 % captures the compounding effect when multiple hazards are simultaneously elevated. Per-hazard scores are clipped to 100 before aggregation so a weight > 1 cannot push a single sub-score past saturation.
+## Module responsibilities
+| Module | Responsibility |
+|---|---|
+| `backend/main.py` | FastAPI app + lifespan (model load, DB init, HTTP client) |
+| `backend/ml_engine.py` | Load joblib RF, run `predict_proba`; heuristic fallback when no model artefact |
+| `backend/rule_engine.py` | Veto cascade + additive scoring + bilingual advice + XAI log |
+| `backend/terrain.py` | 3×3 DEM fetch, slope/aspect/TPI, orographic-uplift dot product |
+| `backend/cache.py` | WAL-SQLite grid cache, risk-adaptive TTL, inference audit log |
+| `backend/config.py` | Single source of truth for thresholds + academic citations |
+| `backend/schemas.py` | Pydantic v2 request/response contract |
+| `scripts/1_download_dataset.py` | Open-Meteo + Open-Topo-Data ingestion (5 Malaysian sites, 4 years: 2020–2023) |
+| `scripts/2_preprocess.py` | Feature engineering + `is_rain_event` label derivation |
+| `scripts/3_train_model.py` | Random Forest + time-based CV + classification report + feature importance |
+| `frontend/index.html` | Single-file Vue3 SPA: Leaflet map, gauge, XAI log, EN/ZH toggle |
+## Concurrency model
+* FastAPI is single-event-loop async. All blocking I/O (SQLite) is wrapped in `asyncio.to_thread` so it never stalls the loop.
+* SQLite is opened in **WAL** mode (`PRAGMA journal_mode=WAL`) so readers don't block on writers.
+* `httpx.AsyncClient` is shared across the app via `app.state.http`, instantiated in lifespan.
+* External calls use exponential-backoff retries (`tenacity`) and 15 s timeouts.
+## Cache strategy
+A naive fixed TTL is unsafe — a 10-minute-stale "Safe" verdict during a developing storm can kill someone. We use **risk-adaptive TTL**:
+| Risk score / Veto | TTL |
+|---|---|
+| Any Veto fired, or score ≥ 70 | **60 s** |
+| 40 ≤ score < 70 | 300 s |
+| Score < 40 | 600 s |
+Grid key quantises (lat, lon) to ~1.1 km cells (`GRID_RESOLUTION_DEG = 0.01`).

docs/dataset.md ADDED Viewed

	@@ -0,0 +1,111 @@

+# Dataset Specification
+# 数据集说明
+> The exact dataset structure that the supervisor approved at the 4/15 review.
+> 4 月 15 日导师 review 后确认的数据集结构。
+## 1. Source / 数据来源
+| Component | Source | URL |
+|---|---|---|
+| Hourly weather | Open-Meteo Historical Weather API (ECMWF ERA5 reanalysis) | https://open-meteo.com/en/docs/historical-weather-api |
+| Elevation     | Open-Topo-Data (SRTM 30 m DEM) | https://www.opentopodata.org/datasets/srtm/ |
+ERA5 is the gold-standard reanalysis dataset in academic meteorology, providing physically-consistent hourly values from 1940 to present.
+## 2. Spatial coverage / 空间覆盖
+Five Malaysian mountain locations, chosen to span a range of elevations and terrain types:
+| Site | Latitude | Longitude | Approx. elev. | Terrain |
+|---|---|---|---|---|
+| Genting Highlands  | 3.4225 | 101.7935 | ~1865 m | Slope |
+| Cameron Highlands  | 4.4694 | 101.3776 | ~1500 m | Highland plateau |
+| Fraser's Hill      | 3.7256 | 101.7378 | ~1300 m | Slope |
+| Klang Valley       | 3.0738 | 101.5183 |  ~100 m | Valley floor |
+| Mt Kinabalu (base) | 6.0535 | 116.5586 | ~1800 m | Mountain |
+## 3. Temporal coverage / 时间范围
+**2020-01-01 → 2023-12-31**, hourly resolution (one row per hour per site).
+Expected sample count: 5 sites × 4 years × 365.25 days × 24 hours ≈ **175 320 rows**.
+## 4. Schema / 列结构
+| Position | Column | Type | Role | Description |
+|---|---|---|---|---|
+| 0 | `site`               | str   | meta    | Site name |
+| 1 | `latitude`           | float | meta    | WGS84 |
+| 2 | `longitude`          | float | meta    | WGS84 |
+| 3 | `elevation_m`        | float | **X**   | DEM-derived altitude (static per site) |
+| 4 | `time`               | datetime | meta | Hourly UTC+8 (Asia/Kuala_Lumpur) |
+| 5 | `temperature_c`      | float | **X**   | 2 m air temperature |
+| 6 | `humidity_pct`       | float | **X**   | Relative humidity 0-100 |
+| 7 | `precipitation`      | float | (raw)   | mm in past hour — used to derive Y |
+| 8 | `wind_speed_kmh`     | float | **X**   | 10 m wind speed |
+| 9 | `wind_direction_deg` | float | **X**   | Direction FROM which wind blows, 0-360° |
+| 10 | `wind_u`            | float | **X**   | u = speed · sin(dir) |
+| 11 | `wind_v`            | float | **X**   | v = speed · cos(dir) |
+| 12 | `pressure_hpa`      | float | **X**   | Surface pressure |
+| 13 | `pressure_change_3h`| float | **X**   | Δp over preceding 3 h (storm precursor) |
+| 14 | `dew_point_c`       | float | **X**   | 2 m dew-point |
+| 15 | `dew_point_depression` | float | **X** | T − T_dew (saturation proxy) |
+| 16 | `cloud_cover_pct`   | float | **X**   | Total cloud cover 0-100 |
+| 17 | `cape_jkg`          | float | **X**   | Convective Available Potential Energy |
+| 18 | `precipitation_lag_1h` | float | **X** | Previous hour's precipitation |
+| 19–20 | `hour_sin`, `hour_cos` | float | **X** | Cyclic encoding of hour-of-day |
+| 21–22 | `month_sin`, `month_cos` | float | **X** | Cyclic encoding of month (captures monsoon) |
+| 23 | **`is_rain_event`** | **int {0,1}** | **Y** | **1 if `precipitation(t+1h) > 0.1 mm` else 0** |
+## 5. Target label derivation / 目标标签的衍生
+This is **THE** column that earlier supervisor feedback flagged as missing in the raw CSV. It is engineered explicitly in `scripts/2_preprocess.py`:
+```python
+df['is_rain_event'] = (df['precipitation'].shift(-1) > 0.1).astype(int)
+```
+Three things the panel should notice:
+1. **`.shift(-1)` means future**: features at time `t` are paired with the rain outcome at `t+1h`. The model never sees future data as input — this prevents temporal data leakage.
+2. **0.1 mm threshold**: 0.1 mm is the smallest precipitation amount conventionally reported as measurable — anything below it is recorded as a **trace** under WMO observing practice — i.e. it is *not* an arbitrary cutoff.
+3. **Binary**, not amount-of-rain. The pipeline could be extended to a regression task; we deliberately model classification because the downstream user decision is binary ("go / no-go").
+## 6. Train / test split / 划分策略
+**Time-based**, not random. The last 20 % of each site's chronological data is reserved as the hold-out test set; the remaining 80 % goes to a 5-fold `TimeSeriesSplit` cross-validation. Random splits would leak temporal autocorrelation and inflate accuracy by 5-15 percentage points.
+## 7. Class balance / 类别分布
+Empirically in tropical Malaysia, `is_rain_event = 1` holds in approximately 20-30 % of hours (more in monsoon months, less in dry season). We pass `class_weight='balanced'` to the Random Forest to prevent it from collapsing to a trivial "always predict no-rain" classifier.
+## 8. Reproducibility / 可复现性
+```bash
+# Real ERA5 path (preferred)
+python scripts/1_download_dataset.py    # ~5-10 min, network-bound
+python scripts/2_preprocess.py          # < 30 s
+python scripts/3_train_model.py         # ~30-90 s on a modern laptop
+```
+All scripts are idempotent — re-running them does not duplicate data or re-download files that already exist locally.
+## 9. Offline / synthetic-data fallback / 离线合成数据回退
+For environments without network access (e.g. exam labs, restricted classroom networks) we ship `scripts/1b_synth_dataset.py`, a deterministic physics-informed synthetic generator (seed = 42, see file header for the meteorological assumptions encoded).
+The synthetic dataset:
+- has a schema **identical** to that of the Open-Meteo download,
+- preserves Malaysia's bimodal monsoon seasonality, tropical diurnal cycle, lapse rate, hydrostatic pressure decay, and zero-inflated rain distribution,
+- yields a comparable class balance (~26 % positive),
+- lets the **entire pipeline + frontend + tests** be exercised without any external network calls.
+It is **not** a substitute for real ERA5 data in the final thesis evaluation. The recommended workflow once network is restored is:
+```bash
+rm data/raw_*.csv data/processed.csv         # clear synthetic data
+python scripts/1_download_dataset.py         # fetch real ERA5 via Open-Meteo
+python scripts/2_preprocess.py
+python scripts/3_train_model.py              # retrain on real data
+```

docs/pipeline_order.md ADDED Viewed

	@@ -0,0 +1,109 @@

+# Project pipeline order — "App is the last"
+# 项目流程顺序 —— "App 放在最后"
+> Direct response to supervisor feedback 4/15: "First identify a dataset.
+> And then train the model. And then predict it. Once everything is
+> finished, you can develop the app. App is the last."
+>
+> 4/15 导师反馈直接回应：先 dataset，再 model，再 predict，最后才是 app。
+---
+## Current state (May 2026) / 当前状态（2026 年 5 月）
+```
+┌──────────────────────────────────────────────────────────────────────┐
+│ STEP 1 — DATASET                                            ✅ DONE  │
+│ ────────────────────────────────────────────                         │
+│ Source       : Open-Meteo Historical Archive (ECMWF ERA5)            │
+│ Coverage     : 5 Malaysian mountain sites, 4 years hourly            │
+│ Rows         : 175 315                                               │
+│ Target Y     : is_rain_event ∈ {0, 1}  (next-hour rain > 0.1 mm)     │
+│ Code         : scripts/{1_download, 1b_synth, 2_preprocess}.py        │
+│ Documentation: docs/dataset.md                                       │
+└──────────────────────────────────────────────────────────────────────┘
+                                  │
+                                  ▼
+┌──────────────────────────────────────────────────────────────────────┐
+│ STEP 2 — MODEL TRAINING                                     ✅ DONE  │
+│ ────────────────────────────────────────────                         │
+│ Algorithm    : Random Forest, class_weight='balanced'                │
+│ Split        : Time-based, last 20% chronological holdout            │
+│ CV           : 5-fold TimeSeriesSplit on training portion            │
+│ Test results : ROC AUC 0.871 · PR AP 0.750 · Brier 0.138             │
+│ Operating pt : τ = 0.20  →  F2 = 0.778, Recall = 0.934               │
+│ Code         : scripts/3_train_model.py                              │
+│ Documentation: models/MODEL_CARD.md                                  │
+└──────────────────────────────────────────────────────────────────────┘
+                                  │
+                                  ▼
+┌──────────────────────────────────────────────────────────────────────┐
+│ STEP 3 — MODEL EVALUATION                                   ✅ DONE  │
+│ ────────────────────────────────────────────                         │
+│ Figures      : 6 publication-quality PNGs in figures/                │
+│   01_roc_curve.png         · ROC + AUC                               │
+│   02_pr_curve.png          · Precision-Recall + AP                   │
+│   03_calibration_curve.png · Reliability + Brier                     │
+│   04_threshold_sweep.png   · F1/F2/Precision/Recall vs threshold     │
+│   05_feature_importance.png· Top-20 features                         │
+│   06_confusion_matrix.png  · CM at F2-optimal threshold              │
+│ Summary      : figures/evaluation_summary.json                       │
+│ Code         : scripts/4_evaluate_model.py                           │
+└──────────────────────────────────────────────────────────────────────┘
+                                  │
+                                  ▼
+┌──────────────────────────────────────────────────────────────────────┐
+│ STEP 4 — RULE ENGINE (D5 proposal §3.7 P4.1-P4.6)           ✅ DONE  │
+│ ────────────────────────────────────────────                         │
+│ P4.1 Load dynamic risk rules  → backend/config.py                    │
+│ P4.2 Fetch user context        → ?activity= query parameter          │
+│ P4.3 Evaluate environmental    → 4 score_*_risk() functions          │
+│         risks (rainfall, fog, wind gust, thunderstorm)               │
+│ §3.7.2  Decision table R1-R4   → apply_decision_table_3_7_2()        │
+│ Veto cascade                   → _collect_veto_triggers()            │
+│ P4.4 Activity weighting        → apply_activity_weighting()          │
+│ P4.5 Composite risk score      → dominant-hazard + secondary         │
+│ P4.6 Actionable advice         → _normal_advice / _veto_advice       │
+│ Code         : backend/rule_engine.py                                │
+│ Documentation: docs/architecture.md, docs/thresholds.md              │
+└──────────────────────────────────────────────────────────────────────┘
+                                  │
+                                  ▼
+┌──────────────────────────────────────────────────────────────────────┐
+│ STEP 5 — APP (LAST, as instructed)                          ✅ DONE  │
+│ ────────────────────────────────────────────                         │
+│ Backend     : FastAPI + uvicorn — wraps trained model from Step 2    │
+│                + rule engine from Step 4                             │
+│ Frontend    : Vue 3 SPA — bilingual EN/ZH, 4 mini-gauges,            │
+│                R1-R4 indicators, demo scenarios, error toasts        │
+│ Container   : Multi-stage Dockerfile + docker-compose.yml            │
+│ Tests       : 70 tests, 97% backend coverage                         │
+│ CI          : .github/workflows/ci.yml                               │
+└──────────────────────────────────────────────────────────────────────┘
+                                  │
+                                  ▼
+┌──────────────────────────────────────────────────────────────────────┐
+│ STEP 6 — EVALUATION FOR THESIS CHAPTER 5                    🔄 PLAN  │
+│ ────────────────────────────────────────────                         │
+│ 6a · Hindcast validation against NaDMA flood / landslide archives    │
+│ 6b · Small user study with mountain hikers (1-month panel)           │
+│ 6c · Comparative ablation: RF only vs Rule only vs Hybrid            │
+│ 6d · Threshold sensitivity analysis (τ ∈ {0.10, 0.15, 0.20, 0.25})   │
+└──────────────────────────────────────────────────────────────────────┘
+```
+## Reading order for the supervisor / 给导师过的阅读顺序
+When walking the supervisor through the project, **strictly follow Steps 1 → 5**:
+| # | Open this | Spend |
+|---|---|---|
+| 1 | `docs/dataset.md` §4 schema, §5 Y derivation | 60 s |
+| 2 | `figures/01_roc_curve.png` + `figures/03_calibration_curve.png` | 30 s |
+| 3 | `figures/04_threshold_sweep.png` + `figures/05_feature_importance.png` | 60 s |
+| 4 | `docs/architecture.md` §"Engine B internals" — show P4.1→P4.6 mapping | 60 s |
+| 5 | `frontend/index.html` running locally — demo with the Genting & Everest scenarios | 60-90 s |
+Total ≈ 5 minutes before any Q&A. App is opened **last** as agreed.
+按这个顺序给导师过，**严格按 1→5**，整体大概 5 分钟过完再进入 Q&A。**app 一定放最后开**，跟导师上次说的完全一致。

docs/progress_update_brief.html ADDED Viewed

	@@ -0,0 +1,619 @@

+<!doctype html>
+<html lang="en">
+<head>
+<meta charset="utf-8">
+<title>Progress-Update Brief — MicroClimate-X</title>
+<style>
+  /* ============================================================
+     Print-optimised A4 progress-update brief
+     Open in browser → ⌘+P → Save as PDF, or read on screen
+     ============================================================ */
+  :root {
+    --ink:           #0b0d12;
+    --ink-soft:      #353a44;
+    --muted:         #6b7280;
+    --brand:         #2563eb;
+    --brand-soft:    #dbeafe;
+    --accent:        #b91c1c;
+    --accent-soft:   #fee2e2;
+    --ok:            #166534;
+    --ok-soft:       #dcfce7;
+    --warn:          #b45309;
+    --warn-soft:     #fef3c7;
+    --grid:          #e5e7eb;
+    --bg:            #ffffff;
+    --code-bg:       #f3f4f6;
+  }
+  * { box-sizing: border-box; }
+  html, body { margin: 0; padding: 0; background: var(--bg); color: var(--ink); }
+  body {
+    font-family: -apple-system, BlinkMacSystemFont, "SF Pro Text",
+                 "PingFang SC", "Hiragino Sans GB", "Microsoft YaHei",
+                 system-ui, sans-serif;
+    font-size: 11pt;
+    line-height: 1.45;
+  }
+  @page { size: A4; margin: 12mm 14mm; }
+  main { max-width: 200mm; margin: 0 auto; padding: 14mm 14mm; }
+  /* Headings */
+  h1 {
+    font-size: 22pt; margin: 0 0 4mm 0;
+    border-bottom: 3px solid var(--brand); padding-bottom: 3mm;
+    page-break-after: avoid;
+  }
+  h1 .zh { display: block; font-size: 13pt; color: var(--muted); font-weight: 500; margin-top: 1mm; }
+  h2 {
+    font-size: 14pt; margin: 9mm 0 3mm 0;
+    color: var(--brand);
+    border-left: 4px solid var(--brand); padding: 1mm 0 1mm 3mm;
+    page-break-after: avoid;
+  }
+  h2 .zh { display: block; font-size: 10pt; color: var(--muted); margin-top: 0.5mm; font-weight: 500; }
+  h3 {
+    font-size: 11.5pt; margin: 5mm 0 2mm 0; color: var(--ink-soft);
+    page-break-after: avoid;
+  }
+  h4 { font-size: 10.5pt; margin: 3mm 0 1mm 0; color: var(--accent); }
+  p, li { margin: 1mm 0; }
+  ul, ol { padding-left: 5mm; }
+  ul li { margin-bottom: 1mm; }
+  /* Quote / supervisor verbatim */
+  .quote {
+    background: var(--warn-soft);
+    border-left: 3px solid var(--warn);
+    padding: 2mm 3mm; margin: 2mm 0;
+    font-style: italic; font-size: 10pt;
+  }
+  .quote::before { content: "🎙️ "; font-style: normal; }
+  /* Tables */
+  table.bilingual, table.steps, table.tabs, table.plan, table {
+    border-collapse: collapse; width: 100%; margin: 2mm 0 3mm 0;
+    font-size: 10pt;
+  }
+  table.bilingual td, table.steps td, table.tabs td, table.plan td,
+  table th, table td {
+    padding: 1.5mm 2.5mm; vertical-align: top;
+    border: 1px solid var(--grid);
+  }
+  table th {
+    background: #f9fafb; font-weight: 600; text-align: left;
+    color: var(--ink-soft);
+  }
+  table.bilingual td.en { width: 50%; }
+  table.bilingual td.zh { width: 50%; background: #fafbfc; }
+  table.plan td.estimate { width: 14%; text-align: center; color: var(--brand); font-weight: 600; }
+  /* Inline callouts */
+  .callout {
+    margin: 2mm 0; padding: 2mm 3mm;
+    border-left: 3px solid; border-radius: 1mm;
+    font-size: 10pt;
+  }
+  .callout.warn { background: var(--accent-soft); border-color: var(--accent); }
+  .callout.ok   { background: var(--ok-soft); border-color: var(--ok); }
+  .callout.tip  { background: var(--brand-soft); border-color: var(--brand); }
+  .callout-title { font-weight: 700; margin-bottom: 1mm; }
+  /* Code */
+  code, pre, kbd {
+    font-family: "SF Mono", "JetBrains Mono", Menlo, Consolas, monospace;
+    font-size: 9.5pt;
+  }
+  code { background: var(--code-bg); padding: 0.3mm 1mm; border-radius: 1mm; }
+  pre {
+    background: var(--code-bg); padding: 3mm; border-radius: 2mm;
+    overflow-x: auto; margin: 2mm 0;
+    border: 1px solid var(--grid);
+  }
+  pre code { background: transparent; padding: 0; }
+  /* Step indicators */
+  .step {
+    display: flex; gap: 3mm;
+    margin: 2mm 0;
+    align-items: flex-start;
+  }
+  .step .num {
+    flex: 0 0 8mm; width: 8mm; height: 8mm; border-radius: 50%;
+    background: var(--brand); color: white; font-weight: 700;
+    display: flex; align-items: center; justify-content: center;
+    font-size: 11pt;
+  }
+  .step .body { flex: 1; }
+  /* Demo / decision blocks */
+  .demo {
+    background: #f0f9ff;
+    border: 1px solid #bae6fd;
+    border-radius: 2mm;
+    padding: 3mm;
+    margin: 3mm 0;
+  }
+  .demo .demo-title { font-weight: 700; color: #075985; margin-bottom: 1mm; }
+  .decision {
+    background: #fefce8;
+    border: 1px solid #fde047;
+    border-radius: 2mm;
+    padding: 3mm;
+    margin: 2mm 0;
+  }
+  .decision .decision-title {
+    font-weight: 700; color: #854d0e; margin-bottom: 1mm;
+    text-transform: uppercase; letter-spacing: 0.5pt; font-size: 9pt;
+  }
+  /* Status pill */
+  .pill {
+    display: inline-block; padding: 0.2mm 1.5mm;
+    border-radius: 4mm; font-size: 8.5pt; font-weight: 600;
+    vertical-align: middle;
+  }
+  .pill.done { background: var(--ok-soft); color: var(--ok); }
+  .pill.plan { background: var(--brand-soft); color: var(--brand); }
+  .pill.risk { background: var(--accent-soft); color: var(--accent); }
+  /* Checklist */
+  .check { font-family: "SF Mono", Menlo, monospace; font-size: 9.5pt; line-height: 1.7; }
+  .check .box { display: inline-block; width: 4mm; }
+  /* Page break helpers */
+  .pb { page-break-before: always; }
+  .nobreak { page-break-inside: avoid; }
+  /* Footer */
+  footer {
+    margin-top: 12mm; padding-top: 4mm;
+    border-top: 1px solid var(--grid);
+    color: var(--muted); font-size: 9pt; text-align: center;
+  }
+  /* Print refinements */
+  @media print {
+    body { font-size: 10pt; }
+    h2 { font-size: 13pt; }
+    .no-print { display: none; }
+    a { color: var(--ink); text-decoration: none; }
+  }
+  /* Toolbar (screen only) */
+  .toolbar {
+    position: sticky; top: 0; z-index: 100;
+    background: var(--brand); color: white;
+    padding: 2mm 4mm; display: flex; justify-content: space-between;
+    align-items: center; font-size: 10pt;
+  }
+  .toolbar button {
+    background: white; color: var(--brand); border: 0;
+    padding: 1.5mm 4mm; border-radius: 1mm; font-weight: 600;
+    cursor: pointer; font-size: 10pt;
+  }
+  .toolbar button:hover { background: #f3f4f6; }
+  /* Cover meta strip */
+  .cover-meta {
+    display: flex; gap: 4mm; flex-wrap: wrap;
+    margin: 3mm 0;
+    color: var(--muted); font-size: 9.5pt;
+  }
+  .cover-meta span {
+    background: var(--code-bg); padding: 0.5mm 2mm; border-radius: 1mm;
+  }
+  /* Timeline strip in §0.2 */
+  table.timeline td.block { width: 8%; text-align: center; font-weight: 700; color: var(--brand); }
+  table.timeline td.time  { width: 18%; font-family: "SF Mono", Menlo, monospace; color: var(--muted); }
+</style>
+</head>
+<body>
+<div class="toolbar no-print">
+  <strong>Progress-Update Brief · MicroClimate-X</strong>
+  <button onclick="window.print()">🖨 Print / Save as PDF</button>
+</div>
+<main>
+<h1>Supervisor Progress-Update Brief
+  <span class="zh">导师进度汇报双语逐字稿 — MicroClimate-X</span>
+</h1>
+<div class="cover-meta">
+  <span>📅 2026-05-13</span>
+  <span>🎓 UKM FYP</span>
+  <span>🏛️ KyoukoLi/microclimate-x</span>
+  <span>🚀 v1.0.0 shipped 2026-05-11</span>
+  <span>✅ 70 tests · 97% coverage</span>
+</div>
+<div class="callout tip">
+  <div class="callout-title">How to use this brief · 怎么用这份汇报稿</div>
+  Follow-up meeting after the v1.0.0 hardening pass on 2026-05-11. Walk-through order is unchanged: <strong>dataset → model → app → next steps</strong>. Open this file on screen during the meeting; <strong>do not read word-for-word</strong>.<br><br>
+  紧接 2026-05-11 v1.0.0 强化提交之后的<strong>进度汇报</strong>会议。顺序一律不变：<strong>dataset → model → app → 下一步</strong>。开会时屏幕上打开本文档，<strong>不要照念</strong>，当兜底用即可。
+</div>
+<!-- ===== Section 0: what you need to do ===== -->
+<h2>0 · What you need to do — three time windows
+  <span class="zh">你要做的事 —— 三个时间窗口</span>
+</h2>
+<h3>0.1 · Before the meeting (T-15 min) / 会前 15 分钟</h3>
+<table class="check">
+  <tr><th style="width:6%">☐</th><th>English</th><th>中文</th></tr>
+  <tr><td>☐</td><td>Charge laptop ≥ 80 %; charger in bag.</td><td>笔记本充满 ≥ 80%，充电器带上。</td></tr>
+  <tr><td>☐</td><td><code>cd ~/Projects/microclimate-x &amp;&amp; git pull &amp;&amp; git status</code> — must print "working tree clean".</td><td>拉最新代码，确认 working tree clean。</td></tr>
+  <tr><td>☐</td><td><code>make run</code> in <strong>terminal A</strong> (leave it running).</td><td>终端 A 起后端，<strong>不要关</strong>。</td></tr>
+  <tr><td>☐</td><td><code>curl -s http://localhost:8000/api/health | python3 -m json.tool</code> in <strong>terminal B</strong> — verify <code>"ml_loaded": true</code>.</td><td>终端 B 验证健康检查，<code>ml_loaded</code> 必须为 <code>true</code>。</td></tr>
+  <tr><td>☐</td><td>Open the 10 browser tabs in the order from <code>MEETING_CHEAT_SHEET.md</code> §0 — <strong>app tab is last</strong>.</td><td>按 cheat-sheet §0 顺序开 10 个标签页，<strong>app 标签放最后</strong>。</td></tr>
+  <tr><td>☐</td><td>This file (<code>progress_update_brief.html</code>) open on a separate screen / phone.</td><td>把本文档单独开在副屏或手机上。</td></tr>
+  <tr><td>☐</td><td>Phone on silent. Deep breath.</td><td>手机静音，深呼吸。</td></tr>
+</table>
+<h3>0.2 · During the meeting (≈ 8 minutes) / 会中 ≈ 8 分钟</h3>
+<table class="timeline">
+  <tr><th>Block</th><th>EN heading</th><th>中文标题</th><th>Time</th></tr>
+  <tr><td class="block">1</td><td>Opening 30 s</td><td>开场 30 秒</td><td class="time">0:00 → 0:30</td></tr>
+  <tr><td class="block">2</td><td>What changed since last meeting</td><td>自上次会以来的进展</td><td class="time">0:30 → 2:00</td></tr>
+  <tr><td class="block">3</td><td>Live demo — dataset → model → app</td><td>现场演示（顺序不变）</td><td class="time">2:00 → 5:00</td></tr>
+  <tr><td class="block">4</td><td>Next steps for Chapter 5</td><td>Chapter 5 下一步</td><td class="time">5:00 → 6:30</td></tr>
+  <tr><td class="block">5</td><td>Asks + closing</td><td>请示 + 收尾</td><td class="time">6:30 → 8:00</td></tr>
+</table>
+<h3>0.3 · After the meeting (T+24 h) / 会后 24 小时内</h3>
+<table class="check">
+  <tr><th style="width:6%">☐</th><th>English</th><th>中文</th></tr>
+  <tr><td>☐</td><td>Write meeting minutes — capture every supervisor decision in <code>docs/meeting_log_&lt;date&gt;.md</code>.</td><td>写会议纪要，把老师每条决定记到 <code>docs/meeting_log_&lt;日期&gt;.md</code>。</td></tr>
+  <tr><td>☐</td><td>Open one GitHub issue per agreed action item (label: <code>chapter-5</code>).</td><td>每个 action item 在 GitHub 开一个 issue，打 <code>chapter-5</code> 标签。</td></tr>
+  <tr><td>☐</td><td>Email a 3-bullet summary back to the supervisor for written confirmation.</td><td>给老师发 3 条要点的总结邮件，留<strong>书面确认</strong>。</td></tr>
+  <tr><td>☐</td><td>Update <code>README.md</code> §9 Roadmap — tick boxes that were signed off.</td><td>更新 <code>README.md</code> 第 9 节 Roadmap，把通过的项打勾。</td></tr>
+  <tr><td>☐</td><td>Tag a new release if scope was confirmed (<code>git tag v1.1.0-rc.1</code>).</td><td>如果范围确认了，打个新 tag (<code>v1.1.0-rc.1</code>)。</td></tr>
+</table>
+<!-- ===== Section 1: Opening ===== -->
+<h2 class="pb">1 · Opening (30 seconds)
+  <span class="zh">开场 30 秒</span>
+</h2>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, thank you for your time. Following up on our last session, I've completed a production-grade hardening pass — version 1.0.0 — and the full pipeline is now reproducible end-to-end. May I walk you through what's new in the same order as before — <strong>dataset, then model, then app</strong> — and finish with my proposed plan for Chapter 5?"</td>
+    <td class="zh">"老师感谢您抽时间。接着上次的内容，我做完了 <strong>v1.0.0 工程化强化</strong>，整条流水线现在可以<strong>端到端复现</strong>。我按上次的顺序——<strong>dataset、model、app</strong>——给您过一遍新的进展，最后讲我对 Chapter 5 的下一步计划，可以吗？"</td>
+  </tr>
+</table>
+<div class="callout ok">
+  <strong>Why this opening · 为什么这样开场</strong>: (a) restates the supervisor's preferred process order without him asking, (b) signals you've made forward progress (not just polish), (c) ends with an explicit ask for direction on Chapter 5 — which is what <em>he</em> wants to talk about.<br>
+  (a) 不用他提就主动按他的流程顺序；(b) 强调是<strong>前进了</strong>而不是只在抛光；(c) 用对 Chapter 5 的请示收尾，<strong>这正是他想聊的话题</strong>。
+</div>
+<!-- ===== Section 2: progress recap ===== -->
+<h2>2 · What changed since the last meeting
+  <span class="zh">自上次会议以来的进展</span>
+</h2>
+<p style="color: var(--muted); font-size: 9.5pt;">
+  ≈ 90 seconds. Stay on the GitHub repo tab — point to the commit history, the green CI badge, the v1.0.0 release.<br>
+  ≈ 90 秒。停在 GitHub repo 标签页，指给老师看 commit 历史、CI 绿勾、v1.0.0 release。
+</p>
+<table class="bilingual">
+  <tr><th style="width:18%">Area / 模块</th><th>English</th><th>中文</th></tr>
+  <tr>
+    <td><strong>Backend hardening</strong><br><span style="color:var(--muted);font-size:9pt">后端强化</span></td>
+    <td>"I added a request-ID middleware, a typed <code>ErrorResponse</code> contract so no bare HTML 500s leak, structured logging, and an enriched <code>/api/health</code> exposing uptime, cache stats, and the loaded ML feature schema."</td>
+    <td>"后端我加了 <strong>request-ID 中间件</strong>、<strong>类型化错误协议</strong> <code>ErrorResponse</code>（不再泄漏裸 HTML 500）、结构化日志、以及<strong>升级版 <code>/api/health</code></strong>（暴露 uptime、缓存统计、ML 特征 schema）。"</td>
+  </tr>
+  <tr>
+    <td><strong>ML pipeline</strong><br><span style="color:var(--muted);font-size:9pt">ML 流水线</span></td>
+    <td>"I shipped <code>scripts/4_evaluate_model.py</code> which produces six publication-quality figures plus a machine-readable <code>evaluation_summary.json</code>. I also wrote a HuggingFace-style <code>MODEL_CARD.md</code> covering intended use, training data, metrics, limitations, and ethical considerations."</td>
+    <td class="zh">"ML 流水线加了<strong>评估脚本</strong> <code>scripts/4_evaluate_model.py</code>，自动出 6 张论文级别图 + 一份 <code>evaluation_summary.json</code>。还写了 HuggingFace 风格的 <strong>MODEL_CARD.md</strong>，覆盖用途、训练数据、指标、局限、伦理考量。"</td>
+  </tr>
+  <tr>
+    <td><strong>Tests + CI</strong><br><span style="color:var(--muted);font-size:9pt">测试 + CI</span></td>
+    <td>"Total tests went from 19 to <strong>70</strong>, backend coverage is <strong>97 %</strong>. CI runs on Python 3.9 / 3.11 / 3.12 plus a Docker image-build smoke test."</td>
+    <td>"测试数从 19 涨到 <strong>70</strong>，<strong>后端覆盖率 97%</strong>。CI 跑 Python 3.9/3.11/3.12 矩阵，外加 Docker 镜像构建烟测。"</td>
+  </tr>
+  <tr>
+    <td><strong>Dev-ex</strong><br><span style="color:var(--muted);font-size:9pt">开发体验</span></td>
+    <td>"Multi-stage Dockerfile, docker-compose, Makefile single-word recipes, pre-commit hooks. The whole project is now <code>docker compose up --build</code> away from a clean machine."</td>
+    <td>"多阶段 Dockerfile + compose + Makefile 单词命令 + pre-commit hooks。<strong>新机器一句 <code>docker compose up --build</code> 就能跑起来</strong>。"</td>
+  </tr>
+  <tr>
+    <td><strong>Documentation</strong><br><span style="color:var(--muted);font-size:9pt">文档</span></td>
+    <td>"Three new docs — <code>architecture.md</code>, <code>thresholds.md</code> with citations for every Veto threshold, and <code>pipeline_order.md</code> which explicitly enforces the dataset → model → app order you asked for."</td>
+    <td>"三份新文档——<code>architecture.md</code>、<code>thresholds.md</code>（每个 Veto 阈值都附学术引用）、以及 <code>pipeline_order.md</code>（<strong>显式按您要求的 dataset→model→app 顺序写死</strong>）。"</td>
+  </tr>
+</table>
+<div class="callout tip">
+  <strong>Artefact to show · 展示物</strong>: GitHub commit history page; the green CI badge on the README; <code>CHANGELOG.md</code> v1.0.0 entry.<br>
+  GitHub commit 历史页；README 上的 CI 绿勾；<code>CHANGELOG.md</code> 中 v1.0.0 那一段。
+</div>
+<!-- ===== Section 3: live demo ===== -->
+<h2 class="pb">3 · Live demo — dataset → model → app
+  <span class="zh">现场演示（顺序不变）</span>
+</h2>
+<p style="color: var(--muted); font-size: 9.5pt;">
+  ≈ 3 minutes. Same order as the 5/11 dry-run script — no surprises for the supervisor.<br>
+  ≈ 3 分钟。跟 5/11 的脚本完全一样的顺序，<strong>老师不会被打乱节奏</strong>。
+</p>
+<div class="step">
+  <div class="num">1</div>
+  <div class="body">
+    <h3>Dataset (Tab <code>docs/dataset.md</code>) — 30 s</h3>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"Same dataset as last time — ERA5 reanalysis, 5 Malaysian mountain sites, 175 315 hourly rows. The Y column <code>is_rain_event</code> is derived in one line and documented in §5. <strong>No change here</strong>, just confirming the foundation is unchanged."</td>
+        <td class="zh">"数据集跟上次一样——ERA5 再分析、马来西亚 5 个山地点位、17.5 万行小时数据。Y 列 <code>is_rain_event</code> 一行代码构造，文档在 §5。<strong>这里没有变</strong>，只是确认地基没动。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<div class="step">
+  <div class="num">2</div>
+  <div class="body">
+    <h3>Model (Tabs <code>01_roc</code> → <code>03_calibration</code> → <code>04_threshold</code> → <code>05_feature_importance</code>) — 90 s</h3>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"Same model as last time — Random Forest, time-based split, τ = 0.20. Test ROC AUC <strong>0.871</strong>, PR AP <strong>0.750</strong>, Brier <strong>0.138</strong>, recall <strong>93.4 %</strong>. <strong>What's new is the 6 figures plus the model card</strong> — every number you see here is reproducible from <code>make evaluate</code>."</td>
+        <td class="zh">"模型跟上次一样——RF、时间序列切分、τ = 0.20。测试 AUC <strong>0.871</strong>、PR AP <strong>0.750</strong>、Brier <strong>0.138</strong>、召回率 <strong>93.4%</strong>。<strong>新东西</strong>是 6 张图 + model card——上面任何一个数字都可以用 <code>make evaluate</code> 复现。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<div class="step">
+  <div class="num">3</div>
+  <div class="body">
+    <h3>App (Tab <code>http://localhost:8000/app/</code>) — 60-90 s</h3>
+    <table class="bilingual">
+      <tr>
+        <td class="en">"Step 3, the app — opened <strong>last</strong> as agreed. Two demo scenarios. First, <strong>Genting Highlands</strong> — a slope at 1865 m inside the training distribution. The model gives a moderate rain probability; the rule engine picks up orographic lift; the four mini-gauges decompose the risk by hazard type."</td>
+        <td class="zh">"第三步 app——按约定<strong>最后才开</strong>。两个 demo 场景。第一个<strong>云顶高原</strong>——1865 m 的山坡，<strong>在训练分布之内</strong>。模型给中等降雨概率，规则引擎检测到地形抬升，四个 mini-gauge 把风险按灾害类型拆解。"</td>
+      </tr>
+      <tr>
+        <td class="en">"Second, <strong>Mt Everest</strong> — completely out of distribution. The model alone would say 'safe'. The Veto cascade fires three independent overrides — hypoxia, frostbite, gale — and the composite is forced to Danger. There's a unit test for exactly this: <code>test_mt_everest_veto_hypoxia</code>."</td>
+        <td class="zh">"第二个<strong>珠峰</strong>——<strong>完全分布外</strong>。光看模型会说"安全"，但 Veto 级联触发<strong>三个独立否决</strong>——缺氧、冻伤、大风——综合分被强制设为 Danger。<strong>专门有单元测试覆盖这个场景</strong>：<code>test_mt_everest_veto_hypoxia</code>。"</td>
+      </tr>
+    </table>
+  </div>
+</div>
+<!-- ===== Section 4: Chapter 5 plan ===== -->
+<h2 class="pb">4 · Next steps for Chapter 5
+  <span class="zh">Chapter 5 下一步</span>
+</h2>
+<div class="callout warn">
+  ≈ 90 seconds. <strong>This is the section the supervisor will react to most.</strong> Frame each item as a concrete deliverable + estimated time + dependency.<br>
+  ≈ 90 秒。<strong>老师反应最强烈的就是这一节</strong>。每一项都以"<strong>交付物 + 估时 + 依赖</strong>"形式呈现。
+</div>
+<h3>4.1 · Proposed Chapter 5 work plan / Chapter 5 工作计划</h3>
+<table class="plan">
+  <tr><th>#</th><th>Deliverable / 交付物</th><th>EN one-liner</th><th>中文一句话</th><th class="estimate">Estimate</th></tr>
+  <tr>
+    <td><span class="pill plan">5.1</span></td>
+    <td><strong>Comparative ablation</strong><br><span style="color:var(--muted);font-size:9pt">对比实验</span></td>
+    <td>"Train LogReg + XGBoost on the same features and report ROC / PR / F2 side-by-side with RF — answers 'why RF?' empirically."</td>
+    <td>"在同一特征集上训 LogReg + XGBoost，对比 ROC / PR / F2，<strong>用数据回答"为什么选 RF"</strong>。"</td>
+    <td class="estimate">1 week</td>
+  </tr>
+  <tr>
+    <td><span class="pill plan">5.2</span></td>
+    <td><strong>Hindcast validation</strong><br><span style="color:var(--muted);font-size:9pt">历史事件回放</span></td>
+    <td>"Replay 2020-2024 NaDMA-documented Malaysian flood / landslide events and check whether the system would have raised Warning / Danger at the right time. Reports hit-rate, lead-time, false-alarm rate."</td>
+    <td>"把 2020-2024 NaDMA 公开的马来西亚洪水/滑坡事件<strong>逐一回放</strong>，看系统能否在事发前给出 Warning/Danger。报告命中率、提前量、误报率。"</td>
+    <td class="estimate">2 weeks</td>
+  </tr>
+  <tr>
+    <td><span class="pill plan">5.3</span></td>
+    <td><strong>Threshold sensitivity</strong><br><span style="color:var(--muted);font-size:9pt">阈值灵敏度</span></td>
+    <td>"Sweep τ ∈ {0.10, 0.15, 0.20, 0.25, 0.30}, plot precision-recall trade-off, and justify the operating point with a cost-of-error analysis."</td>
+    <td>"扫 τ ∈ {0.10, 0.15, 0.20, 0.25, 0.30}，画精度-召回权衡曲线，用<strong>误差代价分析</strong>为最终选点辩护。"</td>
+    <td class="estimate">3 days</td>
+  </tr>
+  <tr>
+    <td><span class="pill plan">5.4</span></td>
+    <td><strong>Component ablation</strong><br><span style="color:var(--muted);font-size:9pt">组件消融</span></td>
+    <td>"Compare three system variants — RF only / Rule only / Hybrid — on the held-out test set and on the OOD Mt Everest case. Quantifies the rule-engine contribution."</td>
+    <td>"对比三个系统变体——<strong>纯 RF / 纯规则 / 混合</strong>——在测试集和 OOD 珠峰场景上的表现。<strong>量化规则引擎的贡献</strong>。"</td>
+    <td class="estimate">4 days</td>
+  </tr>
+  <tr>
+    <td><span class="pill risk">5.5</span></td>
+    <td><strong>Small user study</strong> <em>(optional)</em><br><span style="color:var(--muted);font-size:9pt">用户研究（可选）</span></td>
+    <td>"Recruit 5-8 mountain hikers, run a 4-week panel, log system advice vs. their field judgment. Reports inter-rater agreement (Cohen's κ)."</td>
+    <td>"招募 5-8 名登山者，4 周面板研究，记录系统建议 vs 他们现场判断，报告 Cohen's κ 一致性。"</td>
+    <td class="estimate">4 weeks</td>
+  </tr>
+  <tr>
+    <td><span class="pill done">5.6</span></td>
+    <td><strong>Thesis Chapter 5 draft</strong><br><span style="color:var(--muted);font-size:9pt">章节初稿</span></td>
+    <td>"Pull §5.1-5.5 into a single 12-15 page evaluation chapter with all figures, tables, and discussion."</td>
+    <td>"把 §5.1-5.5 整合成 12-15 页的评估章节，含全部图表和讨论。"</td>
+    <td class="estimate">1 week</td>
+  </tr>
+</table>
+<h3>4.2 · Decision tree to ask the supervisor / 请示决策树</h3>
+<div class="decision">
+  <div class="decision-title">Q1 · Priorities</div>
+  <table class="bilingual">
+    <tr>
+      <td class="en">"Sir, of the five evaluation tracks above, <strong>which two should I prioritise for the next four weeks</strong> before we converge on the Chapter 5 outline?"</td>
+      <td class="zh">"老师，上面 5 条评估方向，<strong>未来四周</strong>您建议我重点做哪两条，然后再收敛到 Chapter 5 大纲？"</td>
+    </tr>
+  </table>
+</div>
+<div class="decision">
+  <div class="decision-title">Q2 · User study yes/no</div>
+  <table class="bilingual">
+    <tr>
+      <td class="en">"Do you want me to include the user study (5.5)? It is the longest item and depends on participant recruitment — I want your call before committing."</td>
+      <td class="zh">"<strong>用户研究 (5.5) 您要不要做</strong>？这一条最长、依赖招募——想请您拍板再投入。"</td>
+    </tr>
+  </table>
+</div>
+<div class="decision">
+  <div class="decision-title">Q3 · Framing of the comparative study</div>
+  <table class="bilingual">
+    <tr>
+      <td class="en">"For the comparative ablation, do you want it framed as <strong>'why RF wins'</strong> (defending current choice) or <strong>'what if XGBoost wins'</strong> (open exploration)? The framing affects how I report inconclusive results."</td>
+      <td class="zh">"<strong>对比实验</strong>您希望框成"为什么 RF 胜出"（<strong>捍卫现有选择</strong>）还是"如果 XGBoost 更好怎么办"（<strong>开放探索</strong>）？两种 framing 对<strong>模棱两可结果</strong>的报告方式不同。"</td>
+    </tr>
+  </table>
+</div>
+<div class="decision">
+  <div class="decision-title">Q4 · Mt Everest weight in the thesis</div>
+  <table class="bilingual">
+    <tr>
+      <td class="en">"Should I treat the Mt Everest OOD test as a <strong>thesis-level contribution</strong> (a stand-alone subsection on safety) or just an <strong>appendix item</strong>?"</td>
+      <td class="zh">"<strong>珠峰 OOD 测试</strong>算论文级别的贡献（单独一节讲安全性），还是放附录就够？"</td>
+    </tr>
+  </table>
+</div>
+<!-- ===== Section 5: closing ===== -->
+<h2 class="pb">5 · Asks + closing (60 seconds)
+  <span class="zh">请示 + 收尾 60 秒</span>
+</h2>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, to summarise: since the last meeting I've shipped v1.0.0 — production-grade hardening, 70 tests at 97 % coverage, six evaluation figures, a published model card, full Docker reproducibility. The pipeline order is unchanged from what you asked: <strong>dataset, model, app</strong>. For Chapter 5 I have <strong>five evaluation tracks scoped</strong>; I'd like your guidance on which two to prioritise for the next four weeks."</td>
+    <td class="zh">"老师，总结：自上次会议以来交付了 <strong>v1.0.0</strong>——工程化强化、70 个测试 97% 覆盖率、6 张评估图、model card、Docker 全复现。流水线顺序按您要求<strong>没动</strong>：dataset、model、app。Chapter 5 我列了 <strong>5 条评估方向</strong>，<strong>接下来四周您建议我先做哪两条</strong>？"</td>
+  </tr>
+  <tr>
+    <td class="en">"I'll send you a 3-bullet email summary by tomorrow morning so we have <strong>written agreement</strong> on the priorities. Thank you for your time."</td>
+    <td class="zh">"明早之前给您发 3 条要点的邮件总结，<strong>留个书面确认</strong>。谢谢老师。"</td>
+  </tr>
+</table>
+<!-- ===== Section 6: defensive Q&A ===== -->
+<h2>6 · Q&amp;A defensive lines (this update only)
+  <span class="zh">本次进度汇报的兜底话术</span>
+</h2>
+<div class="callout tip">
+  Anticipated follow-up questions <strong>specific to this progress update</strong>. The classic Q1-Q7 from the 5/11 brief are still live — just don't repeat them here.<br>
+  <strong>针对本次进度汇报</strong>可能出现的追问。5/11 那份的经典 Q1-Q7 仍然有效，不重复罗列。
+</div>
+<h3>Q-N1 — "Why are you spending time on tests and Docker instead of the thesis?"</h3>
+<h3 style="margin-top:-2mm">Q-N1 ——为什么你在写测试和 Docker 上花时间，不写论文？</h3>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Sir, the v1.0.0 hardening was a <strong>one-time investment</strong> to make every Chapter 5 number reproducible by the examiner with a single command. Without it, every evaluation result would be a black box — the examiner could not verify the AUC of 0.871 herself. With <code>make evaluate</code> reproducing all six figures byte-for-byte, the thesis claims become <strong>falsifiable</strong>. From this point on, all my time goes to evaluation and writing."</td>
+    <td class="zh">"老师，v1.0.0 的强化是<strong>一次性投资</strong>——为了让评审老师<strong>用一行命令就能复现 Chapter 5 的每一个数字</strong>。没有它，AUC = 0.871 就是黑盒，<strong>评审无法独立验证</strong>。现在 <code>make evaluate</code> 能把 6 张图按字节复现，论文的每个 claim 都<strong>可证伪</strong>。从今天起所有时间都给评估和写作。"</td>
+  </tr>
+</table>
+<h3>Q-N2 — "Why hasn't the model improved since last time?"</h3>
+<h3 style="margin-top:-2mm">Q-N2 ——模型为什么自上次以后没提升？</h3>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Two reasons. First, the supervisor's instruction was to <em>consolidate</em> dataset and model before adding more capacity — which is what I did. Second, the bottleneck right now is <strong>not the model</strong> but the <strong>rule engine's coverage of OOD scenarios</strong>, which is a Chapter 5 contribution rather than a hyperparameter tweak. I'd rather report a defensible 0.871 with a calibrated rule engine than chase 0.88 with an unprincipled stack."</td>
+    <td class="zh">"两个理由：(1) 您上次的指示是<strong>先把 dataset 和 model 巩固好</strong>再加复杂度——我严格照做了。(2) <strong>当前瓶颈不是模型本身</strong>，而是<strong>规则引擎对 OOD 场景的覆盖</strong>——这是 Chapter 5 的研究贡献，不是调超参。我宁愿报一个<strong>可辩护的 0.871</strong> 加一个校准好的规则引擎，<strong>也不要不讲原理地堆栈到 0.88</strong>。"</td>
+  </tr>
+</table>
+<h3>Q-N3 — "Show me one concrete weakness you have not yet fixed."</h3>
+<h3 style="margin-top:-2mm">Q-N3 ——给我说一个你目前还没修的具体弱点。</h3>
+<table class="bilingual">
+  <tr>
+    <td class="en">"Honestly, Sir, the biggest one is <code>cape_jkg</code> — the ERA5 archive returns predominantly zero CAPE for these Malaysian coordinates, which is a <strong>known coverage gap</strong>. The Random Forest learns nothing from it (0 % importance). The rule engine still uses live Open-Meteo CAPE at inference time, so the production output is fine, but the <em>training</em> signal for thunderstorm risk is weaker than I'd like. I plan to address this in §5.4 ablation by quantifying how much it matters."</td>
+    <td class="zh">"老实说，老师，最大的弱点是 <code>cape_jkg</code>——ERA5 在这些马来西亚坐标上的 CAPE 几乎全为零（<strong>已知覆盖缺口</strong>），<strong>RF 完全没学到东西</strong>（特征重要性 0%）。规则引擎在推理时用的是 Open-Meteo 实时 CAPE，所以生产输出没问题，但<strong>雷暴风险的训练信号</strong>比我希望的弱。计划在 §5.4 消融实验里<strong>量化它的影响</strong>。"</td>
+  </tr>
+</table>
+<h3>Q-N4 — "When can I see the first draft of Chapter 5?"</h3>
+<h3 style="margin-top:-2mm">Q-N4 ——Chapter 5 初稿什么时候能给我看？</h3>
+<table class="bilingual">
+  <tr>
+    <td class="en">"If you sign off on tracks <strong>5.1 + 5.2 + 5.4</strong> today, the data collection finishes in 3 weeks, writing takes 1 week, so you'd have a draft in <strong>4 weeks from today</strong>. If you also want 5.5 (user study), add 4 weeks. <strong>I'll lock the date the moment you confirm the scope.</strong>"</td>
+    <td class="zh">"如果今天您拍板 <strong>5.1 + 5.2 + 5.4</strong> 三条，<strong>3 周收数据 + 1 周写作 = 4 周后给您初稿</strong>。如果再加 <strong>5.5（用户研究）</strong>，再加 4 周。<strong>您一确认范围，我立刻锁定交稿日</strong>。"</td>
+  </tr>
+</table>
+<!-- ===== Section 7: pre-flight checklist ===== -->
+<h2 class="pb">7 · Pre-flight checklist (T-60 sec)
+  <span class="zh">起飞前 60 秒自检</span>
+</h2>
+<div class="check">
+<pre><code>☐ Laptop ≥ 80 % battery, charger in bag
+☐ Terminal A: `make run` is running, do not close
+☐ Terminal B: `curl /api/health` returned ml_loaded: true within last 5 min
+☐ 10 browser tabs open in cheat-sheet §0 order — app tab is LAST
+☐ This file open on a separate screen / phone, NOT to be read aloud
+☐ docs/MEETING_CHEAT_SHEET.md open as a fall-back
+☐ models/MODEL_CARD.md open in case any number is challenged
+☐ figures/evaluation_summary.json downloadable on demand
+☐ Phone on silent
+☐ One deep breath. You shipped v1.0.0. You're prepared.</code></pre>
+</div>
+<div class="check">
+<pre><code>☐ 笔记本电池 ≥ 80%，充电器已带
+☐ 终端 A：`make run` 跑着，不要关
+☐ 终端 B：5 分钟内 `curl /api/health` 返回 ml_loaded: true
+☐ 10 个浏览器标签页按 cheat-sheet §0 顺序开好——app 标签放最后
+☐ 本文档开在副屏 / 手机，不要照念
+☐ docs/MEETING_CHEAT_SHEET.md 开着兜底
+☐ models/MODEL_CARD.md 开着，老师质疑任何数字立刻打开
+☐ figures/evaluation_summary.json 随时可发
+☐ 手机静音
+☐ 深呼吸。v1.0.0 已经交付。你准备好了。</code></pre>
+</div>
+<!-- ===== Section 8: cross references ===== -->
+<h2>8 · Cross-references
+  <span class="zh">相关文档索引</span>
+</h2>
+<table>
+  <tr><th>Topic / 主题</th><th>File / 文件</th></tr>
+  <tr><td>Original 5/11 reply to 4/15 feedback</td><td><a href="supervisor_meeting_brief.md"><code>supervisor_meeting_brief.md</code></a></td></tr>
+  <tr><td>One-page cheat sheet (tab order, demo script)</td><td><a href="MEETING_CHEAT_SHEET.html"><code>MEETING_CHEAT_SHEET.html</code></a></td></tr>
+  <tr><td>Pipeline order ASCII chart</td><td><a href="pipeline_order.md"><code>pipeline_order.md</code></a></td></tr>
+  <tr><td>Dataset spec + Y derivation</td><td><a href="dataset.md"><code>dataset.md</code></a></td></tr>
+  <tr><td>Architecture deep-dive</td><td><a href="architecture.md"><code>architecture.md</code></a></td></tr>
+  <tr><td>Threshold citations</td><td><a href="thresholds.md"><code>thresholds.md</code></a></td></tr>
+  <tr><td>Model card</td><td><a href="../models/MODEL_CARD.md"><code>../models/MODEL_CARD.md</code></a></td></tr>
+  <tr><td>Evaluation summary JSON</td><td><a href="../figures/evaluation_summary.json"><code>../figures/evaluation_summary.json</code></a></td></tr>
+  <tr><td>What changed in v1.0.0</td><td><a href="../CHANGELOG.md"><code>../CHANGELOG.md</code></a></td></tr>
+</table>
+<footer>
+  Generated 2026-05-13 for the MicroClimate-X progress-update meeting at UKM.<br>
+  此页为 2026-05-13 UKM 毕业设计 MicroClimate-X 进度汇报准备文档。<br>
+  <span style="color: var(--brand);">L.ZH @ UKM · KyoukoLi/microclimate-x</span>
+</footer>
+</main>
+</body>
+</html>

docs/progress_update_brief.md ADDED Viewed

	@@ -0,0 +1,235 @@

+# Supervisor Progress-Update Brief — bilingual script
+# 导师进度汇报双语逐字稿
+> Follow-up meeting after the v1.0.0 hardening pass on 2026-05-11.
+> Walk-through order is unchanged: **dataset → model → app → next steps**.
+> Open this file on screen during the meeting; do not read word-for-word.
+>
+> 紧接 2026-05-11 v1.0.0 强化提交之后的**进度汇报**会议。
+> 顺序一律不变：**dataset → model → app → 下一步**。
+> 开会时屏幕上打开本文档，**不要照念**，当兜底用即可。
+---
+## 0. What you need to do — three time windows
+## 0. 你要做的事 —— 三个时间窗口
+### 0.1 Before the meeting (T-15 min) / 会前 15 分钟
+| ☐ | English | 中文 |
+|---|---|---|
+| ☐ | Charge laptop ≥ 80 %; charger in bag. | 笔记本充满 ≥ 80%，充电器带上。 |
+| ☐ | `cd ~/Projects/microclimate-x && git pull && git status` — must print "working tree clean". | 拉最新代码，确认 working tree clean。 |
+| ☐ | `make run` in **terminal A** (leave it running). | 终端 A 起后端，**不要关**。 |
+| ☐ | `curl -s http://localhost:8000/api/health \| python3 -m json.tool` in **terminal B** — verify `"ml_loaded": true`. | 终端 B 验证健康检查，`ml_loaded` 必须为 `true`。 |
+| ☐ | Open the 10 browser tabs in the order from `docs/MEETING_CHEAT_SHEET.md` §0 — **app tab is last**. | 按 cheat-sheet §0 顺序开 10 个标签页，**app 标签放最后**。 |
+| ☐ | This file (`docs/progress_update_brief.md`) open on a separate screen / phone. | 把本文档单独开在副屏或手机上。 |
+| ☐ | Phone on silent. Deep breath. | 手机静音，深呼吸。 |
+### 0.2 During the meeting (≈ 8 minutes) / 会中 ≈ 8 分钟
+| Block | EN heading | 中文标题 | Time |
+|---|---|---|---|
+| 1 | Opening 30 s | 开场 30 秒 | 0:00 → 0:30 |
+| 2 | What changed since last meeting | 自上次会以来的进展 | 0:30 → 2:00 |
+| 3 | Live demo — dataset → model → app | 现场演示（顺序不变） | 2:00 → 5:00 |
+| 4 | Next steps for Chapter 5 | Chapter 5 下一步 | 5:00 → 6:30 |
+| 5 | Asks + closing | 请示 + 收尾 | 6:30 → 8:00 |
+### 0.3 After the meeting (T+24 h) / 会后 24 小时内
+| ☐ | English | 中文 |
+|---|---|---|
+| ☐ | Write meeting minutes — capture every supervisor decision in `docs/meeting_log_<date>.md`. | 写会议纪要，把老师每条决定记到 `docs/meeting_log_<日期>.md`。 |
+| ☐ | Open one GitHub issue per agreed action item (label: `chapter-5`). | 每个 action item 在 GitHub 开一个 issue，打 `chapter-5` 标签。 |
+| ☐ | Email a 3-bullet summary back to the supervisor for written confirmation. | 给老师发 3 条要点的总结邮件，留书面确认。 |
+| ☐ | Update `README.md` §9 Roadmap — tick boxes that were signed off. | 更新 `README.md` 第 9 节 Roadmap，把通过的项打勾。 |
+| ☐ | Tag a new release if scope was confirmed (`git tag v1.1.0-rc.1`). | 如果范围确认了，打个新 tag (`v1.1.0-rc.1`)。 |
+---
+## 1. Opening 30 seconds / 开场 30 秒
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "Sir, thank you for your time. Following up on our last session, I've completed a production-grade hardening pass — version 1.0.0 — and the full pipeline is now reproducible end-to-end. May I walk you through what's new in the same order as before — dataset, then model, then app — and finish with my proposed plan for Chapter 5?" | "老师感谢您抽时间。接着上次的内容，我做完了**v1.0.0 工程化强化**，整条流水线现在可以**端到端复现**。我按上次的顺序——**dataset、model、app**——给您过一遍新的进展，最后讲我对 Chapter 5 的下一步计划，可以吗？" |
+**Why this opening**: it (a) restates the supervisor's preferred process order without him asking, (b) signals you've made forward progress, not just polish, and (c) ends with an explicit ask for direction on Chapter 5 — which is what *he* wants to talk about.
+**为什么这样开场**：(a) 不用他提就主动按他的流程顺序；(b) 强调是**前进了**而不是只在抛光；(c) 用对 Chapter 5 的请示收尾，**这正是他想聊的话题**。
+---
+## 2. What changed since the last meeting / 自上次会议以来的进展
+> ≈ 90 seconds. Stay on the GitHub repo tab — point to the commit history,
+> the green CI badge, the v1.0.0 release.
+>
+> ≈ 90 秒。停在 GitHub repo 标签页，指给老师看 commit 历史、CI 绿勾、v1.0.0 release。
+| Area | English | 中文 |
+|---|---|---|
+| **Backend hardening** | "I added a request-ID middleware, a typed `ErrorResponse` contract so no bare HTML 500s leak, structured logging, and an enriched `/api/health` exposing uptime, cache stats, and the loaded ML feature schema." | "后端我加了 **request-ID 中间件**、**类型化错误协议** `ErrorResponse`（不再泄漏裸 HTML 500）、结构化日志、以及**升级版 `/api/health`**（暴露 uptime、缓存统计、ML 特征 schema）。" |
+| **ML pipeline** | "I shipped `scripts/4_evaluate_model.py` which produces six publication-quality figures plus a machine-readable `evaluation_summary.json`. I also wrote a HuggingFace-style `MODEL_CARD.md` covering intended use, training data, metrics, limitations, and ethical considerations." | "ML 流水线加了 **评估脚本** `scripts/4_evaluate_model.py`，自动出 6 张论文级别图 + 一份 `evaluation_summary.json`。还写了 HuggingFace 风格的 **MODEL_CARD.md**，覆盖用途、训练数据、指标、局限、伦理考量。" |
+| **Tests + CI** | "Total tests went from 19 to **70**, backend coverage is **97 %**. CI runs on Python 3.9 / 3.11 / 3.12 plus a Docker image-build smoke test." | "测试数从 19 涨到 **70**，**后端覆盖率 97%**。CI 跑 Python 3.9/3.11/3.12 矩阵，外加 Docker 镜像构建烟测。" |
+| **Dev-ex** | "Multi-stage Dockerfile, docker-compose, Makefile single-word recipes, pre-commit hooks. The whole project is now `docker compose up --build` away from a clean machine." | "多阶段 Dockerfile + compose + Makefile 单词命令 + pre-commit hooks。**新机器一句 `docker compose up --build` 就能跑起来**。" |
+| **Documentation** | "Three new docs — `architecture.md`, `thresholds.md` with citations for every Veto threshold, and `pipeline_order.md` which explicitly enforces the dataset → model → app order you asked for." | "三份新文档——`architecture.md`、`thresholds.md`（每个 Veto 阈值都附学术引用）、以及 `pipeline_order.md`（**显式按您要求的 dataset→model→app 顺序写死**）。" |
+**Artefact to show**: the GitHub commit history page; the green CI badge on the README; `CHANGELOG.md` v1.0.0 entry.
+**展示物**：GitHub commit 历史页；README 上的 CI 绿勾；`CHANGELOG.md` 中 v1.0.0 那一段。
+---
+## 3. Live demo — dataset → model → app / 现场演示（顺序不变）
+> ≈ 3 minutes. Same order as the 5/11 dry-run script — no surprises for the supervisor.
+>
+> ≈ 3 分钟。跟 5/11 的脚本完全一样的顺序，**老师不会被打乱节奏**。
+### 3.1 Dataset (Tab `docs/dataset.md`) — 30 s
+| EN | 中文 |
+|---|---|
+| "Same dataset as last time — ERA5 reanalysis, 5 Malaysian mountain sites, 175 315 hourly rows. The Y column `is_rain_event` is derived in one line and documented in §5. No change here, just confirming the foundation is unchanged." | "数据集跟上次一样——ERA5 再分析、马来西亚 5 个山地点位、17.5 万行小时数据。Y 列 `is_rain_event` 一行代码构造，文档在 §5。**这里没有变**，只是确认地基没动。" |
+### 3.2 Model (Tabs `01_roc_curve.png` → `03_calibration_curve.png` → `04_threshold_sweep.png` → `05_feature_importance.png`) — 90 s
+| EN | 中文 |
+|---|---|
+| "Same model as last time — Random Forest, time-based split, τ = 0.20. Test ROC AUC **0.871**, PR AP **0.750**, Brier **0.138**, recall **93.4 %**. What's new is the **6 figures plus the model card** — every number you see here is reproducible from `make evaluate`." | "模型跟上次一样——RF、时间序列切分、τ = 0.20。测试 AUC **0.871**、PR AP **0.750**、Brier **0.138**、召回率 **93.4%**。**新东西**是 6 张图 + model card——上面任何一个数字都可以用 `make evaluate` 复现。" |
+### 3.3 App (Tab `http://localhost:8000/app/`) — 60-90 s
+| EN | 中文 |
+|---|---|
+| "Step 3, the app — opened **last** as agreed. Two demo scenarios. First, Genting Highlands — a slope at 1865 m inside the training distribution. The model gives a moderate rain probability; the rule engine picks up orographic lift; the four mini-gauges decompose the risk by hazard type." | "第三步 app——按约定**最后才开**。两个 demo 场景。第一个云顶高原——1865 m 的山坡，**在训练分布之内**。模型给中等降雨概率，规则引擎检测到地形抬升，四个 mini-gauge 把风险按灾害类型拆解。" |
+| "Second, Mt Everest — completely out of distribution. The model alone would say 'safe'. The Veto cascade fires three independent overrides — hypoxia, frostbite, gale — and the composite is forced to Danger. There's a unit test for exactly this: `test_mt_everest_veto_hypoxia`." | "第二个珠峰——**完全分布外**。光看模型会说"安全"，但 Veto 级联触发**三个独立否决**——缺氧、冻伤、大风——综合分被强制设为 Danger。**专门有单元测试覆盖这个场景**：`test_mt_everest_veto_hypoxia`。" |
+---
+## 4. Next steps for Chapter 5 / Chapter 5 下一步
+> ~ 90 seconds. **This is the section the supervisor will react to most.**
+> Frame each item as a concrete deliverable + estimated time + dependency.
+>
+> ≈ 90 秒。**老师反应最强烈的就是这一节**。每一项都以"**交付物 + 估时 + 依赖**"形式呈现。
+### 4.1 Proposed Chapter 5 work plan / Chapter 5 工作计划
+| # | Deliverable | EN one-liner | 中文一句话 | Estimate |
+|---|---|---|---|---|
+| 5.1 | **Comparative ablation** | "Train LogReg + XGBoost on the same features and report ROC / PR / F2 side-by-side with RF — answers 'why RF?' empirically." | "在同一特征集上训 LogReg + XGBoost，对比 ROC / PR / F2，**用数据回答"为什么选 RF"**。" | 1 week |
+| 5.2 | **Hindcast validation** | "Replay 2020-2024 NaDMA-documented Malaysian flood / landslide events and check whether the system would have raised Warning / Danger at the right time. Reports hit-rate, lead-time, false-alarm rate." | "把 2020-2024 NaDMA 公开的马来西亚洪水/滑坡事件**逐一回放**，看系统能否在事发前给出 Warning/Danger。报告命中率、提前量、误报率。" | 2 weeks |
+| 5.3 | **Threshold sensitivity** | "Sweep τ ∈ {0.10, 0.15, 0.20, 0.25, 0.30}, plot precision-recall trade-off, and justify the operating point with a cost-of-error analysis." | "扫 τ ∈ {0.10, 0.15, 0.20, 0.25, 0.30}，画精度-召回权衡曲线，用**误差代价分析**为最终选点辩护。" | 3 days |
+| 5.4 | **Component ablation** | "Compare three system variants — RF only / Rule only / Hybrid — on the held-out test set and on the OOD Mt Everest case. Quantifies the rule-engine contribution." | "对比三个系统变体——**纯 RF / 纯规则 / 混合**——在测试集和 OOD 珠峰场景上的表现。**量化规则引擎的贡献**。" | 4 days |
+| 5.5 | **Small user study** *(optional)* | "Recruit 5-8 mountain hikers, run a 4-week panel, log system advice vs. their field judgment. Reports inter-rater agreement (Cohen's κ)." | "招募 5-8 名登山者，4 周面板研究，记录系统建议 vs 他们现场判断，报告 Cohen's κ 一致性。" | 4 weeks |
+| 5.6 | **Thesis Chapter 5 draft** | "Pull §5.1-5.5 into a single 12-15 page evaluation chapter with all figures, tables, and discussion." | "把 §5.1-5.5 整合成 12-15 页的评估章节，含全部图表和讨论。" | 1 week (after 5.1-5.4) |
+### 4.2 Decision tree to ask the supervisor / 请示决策树
+| Question to ask | EN | 中文 |
+|---|---|---|
+| **Q1** | "Sir, of the five evaluation tracks above, which two should I prioritise for the **next four weeks** before we converge on the Chapter 5 outline?" | "老师，上面 5 条评估方向，**未来四周**您建议我重点做哪两条，然后再收敛到 Chapter 5 大纲？" |
+| **Q2** | "Do you want me to include the user study (5.5)? It is the longest item and depends on participant recruitment — I want your call before committing." | "**用户研究 (5.5) 您要不要做**？这一条最长、依赖招募——想请您拍板再投入。" |
+| **Q3** | "For the comparative ablation, do you want the comparison framed as 'why RF wins' (defending current choice) or 'what if XGBoost wins' (open exploration)? The framing affects how I report inconclusive results." | "**对比实验**您希望框成"为什么 RF 胜出"（**捍卫现有选择**）还是"如果 XGBoost 更好怎么办"（**开放探索**）？两种 framing 对**模棱两可结果**的报告方式不同。" |
+| **Q4** | "Should I treat the Mt Everest OOD test as a thesis-level contribution (a stand-alone subsection on safety) or just an appendix item?" | "**珠峰 OOD 测试**算论文级别的贡献（单独一节讲安全性），还是放附录就够？" |
+---
+## 5. Asks + closing 60 seconds / 请示 + 收尾 60 秒
+| EN (say this) | 中文（口头要点） |
+|---|---|
+| "Sir, to summarise: since the last meeting I've shipped v1.0.0 — production-grade hardening, 70 tests at 97 % coverage, six evaluation figures, a published model card, full Docker reproducibility. The pipeline order is unchanged from what you asked: dataset, model, app. For Chapter 5 I have five evaluation tracks scoped; I'd like your guidance on which two to prioritise for the next four weeks." | "老师，总结：自上次会议以来交付了 **v1.0.0**——工程化强化、70 个测试 97% 覆盖率、6 张评估图、model card、Docker 全复现。流水线顺序按您要求**没动**：dataset、model、app。Chapter 5 我列了 5 条评估方向，**接下来四周您建议我先做哪两条**？" |
+| "I'll send you a 3-bullet email summary by tomorrow morning so we have written agreement on the priorities. Thank you for your time." | "明早之前给您发 3 条要点的邮件总结，**留个书面确认**。谢谢老师。" |
+---
+## 6. Q&A defensive lines / Q&A 兜底话术
+> Anticipated follow-up questions from this update specifically (not the
+> classics from the 5/11 brief — those are still live, just don't repeat
+> them here).
+>
+> **针对本次进度汇报**可能出现的追问（5/11 那份的经典 Q1-Q7 仍然有效，
+> 不重复罗列）。
+### Q-N1 — "Why are you spending time on tests and Docker instead of the thesis?"
+### Q-N1 ——为什么你在写测试和 Docker 上花时间，不写论文？
+| EN | 中文 |
+|---|---|
+| "Sir, the v1.0.0 hardening was a one-time investment to make every Chapter 5 number reproducible by the examiner with a single command. Without it, every evaluation result would be a black box — the examiner could not verify the AUC of 0.871 herself. With `make evaluate` reproducing all six figures byte-for-byte, the thesis claims become falsifiable. From this point on, all my time goes to evaluation and writing." | "老师，v1.0.0 的强化是**一次性投资**——为了让评审老师**用一行命令就能复现 Chapter 5 的每一个数字**。没有它，AUC = 0.871 就是黑盒，**评审无法独立验证**。现在 `make evaluate` 能把 6 张图按字节复现，论文的每个 claim 都**可证伪**。从今天起所有时间都给评估和写作。" |
+### Q-N2 — "Why hasn't the model improved since last time?"
+### Q-N2 ——模型为什么自上次以后没提升？
+| EN | 中文 |
+|---|---|
+| "Two reasons. First, the supervisor's instruction was to *consolidate* dataset and model before adding more capacity — which is what I did. Second, the bottleneck right now is **not the model** but the **rule engine's coverage of OOD scenarios**, which is a Chapter 5 contribution rather than a hyperparameter tweak. I'd rather report a defensible 0.871 with a calibrated rule engine than chase 0.88 with an unprincipled stack." | "两个理由：(1) 您上次的指示是**先把 dataset 和 model 巩固好**再加复杂度——我严格照做了。(2) **当前瓶颈不是模型本身**，而是**规则引擎对 OOD 场景的覆盖**——这是 Chapter 5 的研究贡献，不是调超参。我宁愿报一个**可辩护的 0.871** 加一个校准好的规则引擎，**也不要不讲原理地堆栈到 0.88**。" |
+### Q-N3 — "Show me one concrete weakness you have not yet fixed."
+### Q-N3 ——给我说一个你目前**还没修**的具体弱点。
+| EN | 中文 |
+|---|---|
+| "Honestly, Sir, the biggest one is `cape_jkg` — the ERA5 archive returns predominantly zero CAPE for these Malaysian coordinates, which is a known coverage gap. The Random Forest learns nothing from it (0 % importance). The rule engine still uses live Open-Meteo CAPE at inference time, so the production output is fine, but the *training* signal for thunderstorm risk is weaker than I'd like. I plan to address this in §5.4 ablation by quantifying how much it matters." | "老实说，老师，最大的弱点是 **`cape_jkg`**——ERA5 在这些马来西亚坐标上的 CAPE 几乎全为零（**已知覆盖缺口**），**RF 完全没学到东西**（特征重要性 0%）。规则引擎在推理时用的是 Open-Meteo 实时 CAPE，所以生产输出没问题，但**雷暴风险的训练信号**比我希望的弱。计划在 §5.4 消融实验里**量化它的影响**。" |
+### Q-N4 — "When can I see the first draft of Chapter 5?"
+### Q-N4 ——Chapter 5 初稿什么时候能给我看？
+| EN | 中文 |
+|---|---|
+| "If you sign off on tracks 5.1 + 5.2 + 5.4 today, the data collection finishes in 3 weeks, writing takes 1 week, so you'd have a draft in **4 weeks from today**. If you also want 5.5 (user study), add 4 weeks. I'll lock the date the moment you confirm the scope." | "如果今天您拍板 **5.1 + 5.2 + 5.4** 三条，**3 周收数据 + 1 周写作 = 4 周后给您初稿**。如果再加 **5.5（用户研究）**，再加 4 周。**您一确认范围，我立刻锁定交稿日**。" |
+---
+## 7. Materials checklist before walking in / 开会前自检清单
+```
+☐ Laptop ≥ 80 % battery, charger in bag
+☐ Terminal A: `make run` is running, do not close
+☐ Terminal B: `curl /api/health` returned ml_loaded: true within last 5 min
+☐ 10 browser tabs open in cheat-sheet §0 order — app tab is LAST
+☐ This file open on a separate screen / phone, NOT to be read aloud
+☐ docs/MEETING_CHEAT_SHEET.md open as a fall-back
+☐ models/MODEL_CARD.md open in case any number is challenged
+☐ figures/evaluation_summary.json downloadable on demand
+☐ Phone on silent
+☐ One deep breath. You shipped v1.0.0. You're prepared.
+```
+```
+☐ 笔记本电池 ≥ 80%，充电器已带
+☐ 终端 A：`make run` 跑着，不要关
+☐ 终端 B：5 分钟内 `curl /api/health` 返回 ml_loaded: true
+☐ 10 个浏览器标签页按 cheat-sheet §0 顺序开好——app 标签放最后
+☐ 本文档开在副屏 / 手机，不要照念
+☐ docs/MEETING_CHEAT_SHEET.md 开着兜底
+☐ models/MODEL_CARD.md 开着，老师质疑任何数字立刻打开
+☐ figures/evaluation_summary.json 随时可发
+☐ 手机静音
+☐ 深呼吸。v1.0.0 已经交付。你准备好了。
+```
+---
+## 8. Cross-references / 相关文档索引
+| Topic | File |
+|---|---|
+| Original 5/11 reply to 4/15 feedback | [`supervisor_meeting_brief.md`](supervisor_meeting_brief.md) |
+| One-page cheat sheet (tab order, demo script) | [`MEETING_CHEAT_SHEET.md`](MEETING_CHEAT_SHEET.md) |
+| Pipeline order ASCII chart | [`pipeline_order.md`](pipeline_order.md) |
+| Dataset spec + Y derivation | [`dataset.md`](dataset.md) |
+| Architecture deep-dive | [`architecture.md`](architecture.md) |
+| Threshold citations | [`thresholds.md`](thresholds.md) |
+| Model card | [`../models/MODEL_CARD.md`](../models/MODEL_CARD.md) |
+| Evaluation summary JSON | [`../figures/evaluation_summary.json`](../figures/evaluation_summary.json) |
+| What changed in v1.0.0 | [`../CHANGELOG.md`](../CHANGELOG.md) |
+---
+> *Generated 2026-05-13 for the MicroClimate-X progress-update meeting at UKM.
+> 此页为 2026-05-13 UKM 毕业设计 MicroClimate-X 进度汇报准备文档。*

docs/supervisor_meeting_brief.md ADDED Viewed

	@@ -0,0 +1,161 @@

+# Supervisor Meeting Brief — bilingual script
+# 导师开会双语逐字稿
+> Single-page meeting brief addressing every point of feedback from the
+> 4/15 supervisor session. Bring this document open on screen during the
+> meeting and walk through it in order.
+>
+> 一页式开会简报，逐条回应 4/15 导师 review 的所有反馈。开会时直接打开
+> 此页，按顺序走一遍即可。
+---
+## Opening 30 seconds / 开场 30 秒
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "Sir, since our last meeting I have addressed every point of your feedback. May I walk you through them in the correct order — dataset first, then model, then app — as you instructed?" | "老师，按您上次反馈，我已经把每一条都改了。我按您要求的顺序——**先 dataset，再 model，最后才是 app**——给您过一遍可以吗？" |
+**Why this opening works**: it explicitly *names* the supervisor's #1 process complaint ("app is last"). He'll relax immediately because he can see you listened.
+---
+## Concern #1 — Y target was missing
+## 反馈一 · 缺少目标列 Y
+**His original words**: "Y is missing. I don't have the output variable. If you don't have target, you cannot train a machine learning model."
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "Sir, you were right — the raw Open-Meteo CSV has no Y column. I have engineered the target explicitly. The variable is called `is_rain_event` and it is defined as 1 if the precipitation in the **next hour** is greater than 0.1 mm, else 0. The code is one line in `scripts/2_preprocess.py`." | "老师您说得对，原始 Open-Meteo CSV 确实没有 Y 列。我现在已经显式构造了目标变量，叫做 **`is_rain_event`**，定义是：**下一小时降雨量 > 0.1 mm 则为 1，否则为 0**。代码就一行，写在 `scripts/2_preprocess.py`。" |
+| [Show this code on screen:] `df['is_rain_event'] = (df['precipitation'].shift(-1) > 0.1).astype(int)` | （把这一行代码投出来给老师看） |
+| "Three things to notice: `.shift(-1)` means I use **future** rain as the label — features at hour t predict outcome at t+1h, so there is no temporal leakage. The 0.1 mm threshold matches the **WMO definition** of trace precipitation, not an arbitrary choice. And it is binary classification, not regression, because the downstream decision is binary." | "三个要点：(1) `.shift(-1)` 表示用**下一小时**的降雨作为标签，特征是 t 时刻、预测的是 t+1 小时——没有时间泄漏。(2) 0.1 mm 这个阈值不是我随便定的，对应 **WMO 微量降水标准**。(3) 是二分类不是回归，因为下游用户决策本身就是二元的（去 / 不去）。" |
+**Artefact to show**: `docs/dataset.md` §5 (Target label derivation) — has all three points written out.
+---
+## Concern #2 — features in the document did not match the Excel
+## 反馈二 · 文档里的特征跟 CSV 列名对不上
+**His original words**: "The features that you presented here, not... not mentioned in the Excel. So, it must be matched."
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "Sir, that was also a fair point. I have rewritten the dataset specification so the documentation lists exactly the **same column names** that appear in the CSV. There is a one-to-one mapping in `docs/dataset.md` §4." | "老师，这条您也说对了。我已经把数据集文档完全重写，文档里列出的就是 CSV 里的**真实列名**，一一对应。在 `docs/dataset.md` 第 4 节。" |
+| [Open dataset.md §4 schema table] "Every row in this table is one column in the actual CSV. The role column says whether it is a feature (X), the target (Y), or just metadata." | （打开 dataset.md §4 列结构表）"表里每一行就是 CSV 里的一列，role 列写明了它是 feature（X）、target（Y）还是 metadata。" |
+**Artefact to show**: `docs/dataset.md` §4 — single canonical schema table.
+---
+## Concern #3 — study the data source
+## 反馈三 · 研究数据源本身
+**His original words**: "Please study the link. What is the purpose of the dataset? What is design for? What is the output variable?"
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "I read the Open-Meteo API documentation carefully. The dataset I use is the **ERA5 reanalysis archive**, which is ECMWF's gold-standard hourly reanalysis — they use it to validate other forecast models. It is *not* a forecast, it is a physically-consistent reconstruction of past weather, which is why it is the right dataset for training: the labels are reliable ground truth." | "我把 Open-Meteo 文档仔细读了。我用的是 **ERA5 再分析数据**，是 ECMWF 出的同化产品，气象学界用它当作**真值**去校验别的预报模型。它**不是**预报，而是对过去天气的物理一致的重建。所以用来训练 ML 是合适的——标签是可靠的 ground truth。" |
+| "Spatial coverage: 5 Malaysian mountain sites — Genting, Cameron, Fraser's Hill, Klang Valley, Kinabalu — chosen to span elevations from 100 m to 1865 m and terrain types from valley to slope." | "空间覆盖 5 个马来西亚山地点位——云顶、金马仑、福隆港、巴生谷、神山——海拔从 100 m 到 1865 m，地形从山谷到山坡都有。" |
+| "Temporal coverage: 5 years, hourly, 175 315 rows in total." | "时间范围 5 年，每小时一行，总共 175 315 行。" |
+**Artefact to show**: `docs/dataset.md` §1-3, or open the Open-Meteo documentation page itself if he wants the original source.
+---
+## Concern #4 — process order was wrong: app should be last
+## 反馈四 · 流程顺序错了，app 应该最后做
+**His original words**: "First, identify a dataset. Identify a dataset. And then train the model. And then predict it. First. Once everything is finished... okay, you can develop the app. App is the last."
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "Yes Sir, I followed your process. The current state is: Step 1 dataset is identified and documented. Step 2 the model is trained — let me show you the results before I open the app." | "好的老师，我严格按您的流程做的。当前状态是：**第一步 dataset 已确认并文档化**；**第二步模型已训练完毕**——在打开 app 之前，先给您看训练结果。" |
+| [Open `figures/01_roc_curve.png`] "Test ROC AUC is 0.871 on 35 063 held-out hourly samples. The hold-out is the **last 20 % chronologically**, not a random split — random splits leak temporal autocorrelation and would inflate accuracy unrealistically." | （打开 ROC 图）"测试集 35 063 行，ROC AUC = **0.871**。划分用的是**按时间排序的最后 20%**，不是随机划分——随机划分会泄漏时间自相关，把准确率虚高 5-15 个百分点。" |
+| [Open `figures/03_calibration_curve.png`] "Brier score is 0.138, which means the predicted probabilities are well-calibrated — when the model says 70 % chance of rain, the actual rate is close to 70 %." | （打开 calibration 图）"Brier 分数 = 0.138，说明预测概率**校准良好**——模型说 70% 下雨概率时，实际频率接近 70%。" |
+| [Open `figures/04_threshold_sweep.png`] "I optimised the decision threshold for **F2 score**, not F1, because in this safety-critical application a missed rain event on a windward slope can lead to flash flooding — false negatives are much worse than false positives. F2 treats recall as twice as important as precision (β = 2, so recall carries a β² = 4 weight in the F-score formula). The optimal threshold is τ = 0.20, giving F2 = 0.778 and **93.4 % recall**." | （打开阈值扫描图）"我用 **F2 分数**而不是 F1 来选最优阈值——因为这是安全关键应用，**漏报**比误报严重得多（在迎风坡漏掉一次降雨可能引发山洪）。F2 把召回率看作精度的 2 倍重要（β = 2，公式中召回率的权重系数为 β² = 4），最优阈值是 τ = 0.20，F2 = 0.778，**召回率 93.4%**。" |
+| [Open `figures/05_feature_importance.png`] "Top-3 features the model relies on: previous hour's rain, time-of-day cyclic encoding, and 3-hour pressure tendency. These match the meteorological literature — autocorrelation, diurnal cycle, and storm precursor." | （打开特征重要性图）"模型最看重的 3 个特征：上一小时降水、时间周期编码、3 小时气压变化。这跟气象文献吻合——自相关、日变化、风暴前兆。" |
+| **[NOW open the app]** "Step 3, the app. This is FastAPI + Vue using the trained model. When I click a coordinate, the system returns the probability and the four hazard sub-scores per the proposal §3.7." | **（这时才打开 app）**"第三步，app。这是 FastAPI + Vue 调用上面训好的模型。我点地图任意一点，系统返回概率和四个分项灾害评分（按开题 §3.7）。" |
+**Why this order matters**: he literally said "App is the last" three times. Showing dataset → ROC → calibration → threshold → importance → THEN the app is exactly the order he asked for. Each chart takes 20-30 seconds to explain; total before opening the app ≈ 2-3 minutes.
+---
+## Concern #5 — regression or classification?
+## 反馈五 · 回归还是分类？
+**His original words**: "I don't think this is a classification problem because there is no class label. So I think this is a regression problem."
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "Sir, when you first looked at the raw CSV, there was no class label, so regression looked like the only option. I considered both. I chose **binary classification** for three reasons:" | "老师，您当时看原始 CSV 的时候确实没有 class label，所以看上去像 regression。我两个都考虑过，最后选了**二分类**，三个理由：" |
+| **(1)** "The downstream decision is binary — go outside or don't. Regressing on mm of rain would still need a threshold to convert to a go/no-go output, so I would have to pick the threshold anyway." | **(1)** "下游决策本身就是二元的——出门 vs 不出门。即使做回归预测降雨毫米数，最后也要拿一个阈值转成 go/no-go，**那个阈值反正要选**。" |
+| **(2)** "Classification lets me optimise **F2 score**, which is the right metric for a safety-critical setting where recall matters more than precision. I cannot directly optimise F2 on a regression target." | **(2)** "做分类才能直接优化 **F2 分数**——安全关键场景下召回比精度更重要，**这个指标只在分类任务下有意义**。" |
+| **(3)** "But I still expose the **raw probability** in the API response, so any downstream component that needs a continuous score (e.g. the rule engine's rainfall sub-scorer) can still use it. So I keep the best of both worlds." | **(3)** "但 API 还是把**原始概率**暴露出来了，下游需要连续分数的组件（比如规则引擎的降雨子评分器）照样能用。**两全其美**。" |
+---
+## Likely follow-up questions / 老师可能追问的问题
+### Q1 — "Why Random Forest and not deep learning / LSTM?"
+### Q1 ——为什么选 Random Forest 而不是深度学习 / LSTM？
+| English | 中文 |
+|---|---|
+| "Three reasons. First, **interpretability**: feature importance lets me defend why the model predicts what it predicts — essential for a safety-critical application. A neural net is a black box. Second, **data efficiency**: with 175 K samples, Random Forest reaches state-of-the-art performance; LSTM would need an order of magnitude more data to outperform it. Third, **inference latency**: RF inference is sub-millisecond, which the FastAPI + cache architecture depends on. LSTM would be at least 10× slower and require GPU at inference time." | "三个理由：(1) **可解释性**——feature importance 让我能为每个预测**辩护**，安全关键应用必须有这一点，神经网络是黑盒。(2) **数据效率**——17 万样本下 RF 已经达到 SOTA，LSTM 需要至少 10 倍数据才能超过它。(3) **推理延迟**——RF 推理 < 1 ms，FastAPI + 缓存架构依赖这一点；LSTM 至少慢 10 倍且推理时需要 GPU。" |
+### Q2 — "How do you handle out-of-distribution input (e.g. Mt Everest)?"
+### Q2 ——分布外输入怎么处理（比如珠峰）？
+| English | 中文 |
+|---|---|
+| "This is exactly what the **hybrid architecture** is for, Sir. The Random Forest only saw Malaysian mountains, so on Everest it returns a low probability. But the rule engine's Veto cascade catches three independent failures — altitude > 3500 m triggers hypoxia veto, temperature ≤ -5 °C triggers frostbite veto, and wind ≥ 40 km/h triggers gale veto. The composite output goes to Danger regardless of the ML probability. There is a unit test for exactly this scenario — `test_mt_everest_veto_hypoxia` in `tests/test_rule_engine.py`." | "老师，这正是我做**混合架构**的原因。RF 只见过马来西亚的山，所以在珠峰上会返回很低的概率。但**规则引擎的 Veto 级联**会捕获三个独立的失败：海拔 > 3500 m 触发缺氧 Veto，温度 ≤ -5°C 触发冻伤 Veto，风速 ≥ 40 km/h 触发大风 Veto。无论 ML 给什么概率，输出都被强制设为 Danger。我专门为这个场景写了单元测试 `test_mt_everest_veto_hypoxia`。" |
+### Q3 — "What is the contribution of the topographic rule engine? Could you just use the ML model alone?"
+### Q3 ——地形规则引擎的贡献是什么？只用 ML 不行吗？
+| English | 中文 |
+|---|---|
+| "ML alone is statistical — it learns averages. But terrain in complex mountainous regions amplifies precipitation locally by orders of magnitude (Roe, 2005, *Annual Review of Earth & Planetary Sciences*). The decision-table R1 in proposal §3.7.2 captures exactly this: when macro rain probability is low but the wind impinges on a windward slope with falling pressure, hidden rain risk emerges. The ML model would say 'safe' here; the rule engine fires R1 and warns the user. This is the **Neuro-Symbolic AI** paradigm — learn what is learnable, hand-code what is physical." | "纯 ML 是统计性的——它学的是平均值。但复杂山地的地形会把降水**局部放大几个数量级**（Roe 2005, Annual Review of Earth & Planetary Sciences）。开题 §3.7.2 的决策表 R1 抓住的正是这一点：宏观降雨概率低、但风正对迎风坡且气压在下降时——存在**隐藏的降雨风险**。ML 在这种情况下会说"安全"；规则引擎会触发 R1 警告用户。这是 **Neuro-Symbolic AI** 范式——能学的让 ML 学，物理规律手工编码。" |
+### Q4 — "Did you do cross-validation? Did you check for overfitting?"
+### Q4 ——做过交叉验证吗？检查过过拟合吗？
+| English | 中文 |
+|---|---|
+| "Yes Sir, **time-series cross-validation** with 5 folds on the training portion — not random K-fold, which would leak temporal information. The fold AUCs range from 0.828 to 0.908, mean ≈ 0.858, which is very close to the held-out test AUC of 0.871. This consistency confirms the model is not overfitting to a single temporal slice. All fold metrics are in `models/training_report.json` and the model card." | "做了，老师。**时间序列交叉验证**，5 折，**不是**随机 K 折——随机划分会泄漏时间信息。各折 AUC 在 0.828 到 0.908 之间，均值约 0.858，跟独立测试集 AUC 0.871 非常接近——说明模型没有对某个时间段过拟合。所有指标都在 `models/training_report.json` 和 model card 里。" |
+### Q5 — "How will you validate this in the real world?"
+### Q5 ——你怎么在真实世界验证这套系统？
+| English | 中文 |
+|---|---|
+| "Two-pronged plan for Chapter 5 evaluation. First, **hindcast validation** — I will replay the system against publicly documented Malaysian flood and landslide events from NaDMA archives and check whether the system would have produced a Warning or Danger verdict at the right time. Second, **user study** — a small panel of mountain hikers will compare the system's recommendations against their own field judgment over a one-month period. Both methodologies follow standard practice in the operational meteorology literature." | "Chapter 5 评估两条腿走路：(1) **历史事件回放** —— 用 NaDMA 公开记录的马来西亚洪水/滑坡事件，看系统在事件发生时是否会给出 Warning 或 Danger。(2) **用户研究** —— 找一小批登山者，一个月内对比系统建议和他们自己的判断。两种方法都是业务气象学界的标准做法。" |
+---
+## Closing 30 seconds / 收尾 30 秒
+| English (say this) | 中文（口头要点） |
+|---|---|
+| "Sir, to summarise: I have addressed every point of your feedback — the missing Y is now derived, the documentation matches the data, the model is trained and evaluated before the app, and the choice of classification over regression is justified by the safety-critical nature of the application. The code is on GitHub at `KyoukoLi/microclimate-x` with CI passing, 97 % test coverage, and a published model card. May I have your guidance on the next priorities for Chapter 5?" | "老师，总结一下：您每条反馈我都已经回应——Y 已经构造好、文档跟数据完全对齐、模型在 app 之前就训好并评估过、分类而不是回归是因为应用本身就是安全关键。代码在 GitHub `KyoukoLi/microclimate-x`，CI 全过、测试覆盖率 97%、有完整的 model card。请问 Chapter 5 接下来您建议我重点做哪部分？" |
+---
+## Materials checklist before walking in / 开会前自检清单
+- [ ] Laptop charged, browser tab open to `docs/dataset.md`.
+- [ ] All 6 figures in `figures/` rendered to a quick-flip slide deck (or just keep the PNG files in a single Finder window).
+- [ ] GitHub repo page open in another tab, ready to show CI green badge + commit history.
+- [ ] Frontend `frontend/index.html` ready to demo (start `make run` in a terminal **before** the meeting — not during).
+- [ ] `models/MODEL_CARD.md` open in a third tab, in case the supervisor asks for written evidence of any number you quote.
+- [ ] This brief (`docs/supervisor_meeting_brief.md`) open on screen — but **don't read from it word-for-word**, treat it as your safety net only.
+中文版：
+- [ ] 笔记本充满电，浏览器开好 `docs/dataset.md`
+- [ ] `figures/` 里 6 张图全部预先点开过一次（图片预览快进就行，避免临时加载）
+- [ ] GitHub repo 页面开另一个标签页，CI 绿勾 + commit 历史随时可看
+- [ ] 前端 `make run` **提前**起好（不要开会时才起）
+- [ ] `models/MODEL_CARD.md` 第三个标签页，老师追问任何数字时打开它
+- [ ] **本文档**开着但**不要照念**，当兜底用即可

docs/thresholds.md ADDED Viewed

	@@ -0,0 +1,150 @@

+# Veto Thresholds & Academic Citations
+# 一票否决阈值与学术引用
+> **Why this document exists**: the thesis defence panel will ask "why 3500 m?", "why -5 °C?", "why 40 km/h?". Every numeric threshold in `backend/config.py` is justified here against authoritative literature so no value is "magic".
+---
+## 1. Altitude hypoxia — `ALTITUDE_HYPOXIA_M = 3500 m`
+**Rule**: any query whose elevation exceeds 3500 m above mean sea level (AMSL) immediately receives a Veto.
+**Citation**: Luks, A. M., Auerbach, P. S., Freer, L., Grissom, C. K., Keyes, L. E., McIntosh, S. E., Rodway, G. W., Schoene, R. B., Zafren, K., & Hackett, P. H. (2019). *Wilderness Medical Society Clinical Practice Guidelines for the Prevention and Treatment of Acute Altitude Illness: 2019 Update*. **Wilderness & Environmental Medicine**, 30(4), S3-S18. https://doi.org/10.1016/j.wem.2019.04.006
+**Justification**: Acute mountain sickness (AMS) onset is clinically significant above 2500 m and severe physiological hypoxia is the norm above 3500 m without acclimatisation. We adopt 3500 m as the *hard* Veto and 2500-3500 m as a sub-Veto penalty band.
+---
+## 2. Extreme cold — `EXTREME_COLD_C = -5 °C`
+**Rule**: ambient temperature ≤ -5 °C triggers a Veto (frostbite risk).
+**Citation**: Petrone, P., et al. (2014). *Management of accidental hypothermia and cold injury*. **Current Problems in Surgery**, 51(10), 417-431; see also UIAA Medical Commission Standard No. 19 (2017), *Frostbite*. https://www.theuiaa.org/medical_advice/
+**Justification**: Exposed-skin frostbite becomes a real risk when ambient temperatures fall below -5 °C, particularly with any wind. Field guidance from UIAA medical advisors uses -5 °C as a "high vigilance" threshold for outdoor activity.
+---
+## 3. Gale-force winds — `GALE_WIND_KMH = 40 km/h`
+**Rule**: wind speed ≥ 40 km/h triggers a Veto.
+**Citation**: World Meteorological Organization. (2024). *International Codes — Beaufort Wind Force Scale*. https://www.wmo.int/
+**Justification**: Beaufort Force 6 ("Strong Breeze") covers 39-49 km/h, defined as the regime where "umbrellas are used with difficulty" and walking against the wind becomes hazardous. Above 40 km/h, balance loss and being struck by wind-borne debris become real risks for ridge / exposed-slope hikers.
+---
+## 4. High CAPE (lightning) — `HIGH_CAPE_JKG = 1000 J/kg`
+**Rule**: Convective Available Potential Energy ≥ 1000 J/kg triggers a Veto.
+**Citation**: National Weather Service. *Convective Forecasting Handbook* (latest edition). U.S. National Oceanic and Atmospheric Administration.
+**Justification**: NWS guidance characterises CAPE > 1000 J/kg as "moderate instability" capable of sustaining thunderstorms with lightning. CAPE > 2500 J/kg is "strong". For a safety-critical application aimed at hikers, the 1000 J/kg threshold provides early warning before lightning becomes likely.
+---
+## 5. Low visibility — `LOW_VISIBILITY_M = 100 m`
+**Rule**: surface visibility below 100 m triggers a Veto.
+**Citation**: Federal Aviation Administration. (2024). *Aeronautical Information Manual* §7-1-12. https://www.faa.gov/
+**Justification**: AIM defines Category III approach conditions as visibility below 200 m. For non-instrument human navigation, 100 m is the conventional "whiteout / dense fog" threshold below which dead-reckoning over alpine terrain becomes infeasible.
+---
+## 6. Orographic uplift — `OROGRAPHIC_DOT_THRESHOLD = 0.7`
+**Rule**: when the wind-vs-slope-normal dot product ≥ 0.7 AND ML rain probability ≥ 0.5 on a Slope terrain, a Veto fires.
+**Citation**: Roe, G. H. (2005). *Orographic precipitation*. **Annual Review of Earth and Planetary Sciences**, 33, 645-671. https://doi.org/10.1146/annurev.earth.33.092203.122541
+**Justification**: Forced ascent of moisture-laden air over a windward slope is one of the highest-rainfall meteorological mechanisms on Earth — entire climate regimes (e.g. Cherrapunji, India) are produced by it. Even when bulk ML probability is moderate, terrain-forced uplift can locally multiply precipitation by an order of magnitude.
+---
+## 7. Valley flash-flood — `VALLEY_FLOOD_PROB = 0.80`
+**Rule**: ML rain probability ≥ 80 % combined with Valley terrain triggers a Veto.
+**Citation**: Bhuiyan, M. A. E., Anagnostou, E. N., & Kruzdlo, R. (2020). *Improving satellite-based precipitation estimates over complex terrain using machine learning algorithms*. **Journal of Hydrology**, 588, 125060.
+**Justification**: Valley floors collect water from the entire upstream basin. Even modest rainfall amounts upstream concentrate hydrologically downstream, producing flash floods on timescales as short as 30 minutes. The literature documents disproportionate fatality rates from flash floods relative to other rain-driven hazards.
+---
+## 8. Fog sub-hazard — `FOG_HUMIDITY_PCT = 95 %`, `FOG_DEW_DEP_MAX_C = 2 °C`, `FOG_CLOUD_BASE_MAX_M = 800 m`
+**Rule**: the fog sub-scorer awards near-maximum contribution when humidity ≥ 95 %, dew-point depression ≤ 2 °C, and cloud base ≤ 800 m.
+**Citation**: World Meteorological Organization. (2019). *Guide to Meteorological Instruments and Methods of Observation (CIMO Guide)*, WMO-No. 8, Chapter on Visibility. https://library.wmo.int/idurl/4/68695
+**Justification**: WMO surface synoptic codes define fog as visibility < 1 km, which is observed most reliably when humidity is near saturation (typically > 95 %) and dew-point depression is below 2 °C. The 800 m cloud-base ceiling is the value used in the D5 §3.7.2 decision table to detect "low cloud meeting terrain".
+---
+## 9. Wind gust sub-hazard — `GUST_WIND_MIN_KMH = 25 km/h`
+**Rule**: wind gust sub-score scales linearly with sustained wind from 25 km/h up to the gale Veto at 40 km/h, with terrain amplification for ridges and exposed slopes.
+**Citation**: WMO Beaufort Wind Force Scale; Holton, J. R. (2004). *An Introduction to Dynamic Meteorology*, 4th ed., on mountain-wave and pass-acceleration phenomena.
+**Justification**: On exposed ridges and through mountain passes, sustained winds of 25 km/h commonly gust 1.3-1.8× higher (Beaufort F6 territory). Trees and shrubs near peaks become wind-snap hazards, and weight-of-pack stability margins narrow significantly above ~30 km/h sustained.
+---
+## 10. Thunderstorm sub-hazard — `THUNDER_CAPE_MIN_JKG = 500 J/kg`, `THUNDER_PRESSURE_DROP = -2 hPa / 3 h`
+**Rule**: the thunderstorm sub-scorer adds a significant contribution when CAPE ≥ 500 J/kg, with an additional boost when pressure has dropped ≥ 2 hPa over the past 3 hours.
+**Citation**: National Weather Service Convective Outlook reference values; Doswell, C. A. III, & Schultz, D. M. (2006). *On the Use of Indices and Parameters in Forecasting Severe Storms*. **E-Journal of Severe Storms Meteorology**, 1(3).
+**Justification**: CAPE ≥ 500 J/kg is the conventional "marginal instability" floor at which convective storms become possible (1000 J/kg, the "moderate instability" level, is the *Veto* — at that level lightning is likely). A 2 hPa / 3 h pressure fall is a textbook frontal-passage / mesoscale-convective-system precursor, well below the rapid-pressure-fall thresholds used in operational forecasting.
+---
+## 11. D5 §3.7.2 / Table 4.2 Decision Table — R1-R4
+| Rule | Trigger | Conclusion |
+|---|---|---|
+| **R1** | macro rain prob ≤ 30 %, humidity > 85 %, wind into a windward slope, pressure tendency < -1.5 hPa/3h, cloud base < 800 m | Hidden orographic-rain risk despite low macro probability |
+| **R2** | Same humidity / pressure / cloud-base as R1, but wind NOT into slope, terrain leeward or valley | No significant rain — macro forecast is correct |
+| **R3** | macro rain prob ≥ 70 %, wind into a windward slope | Heavy downpour incoming — avoid mountains and valleys |
+| **R4** | macro rain prob ≥ 70 %, no terrain amplification | Standard-rain precautions; no orographic amplification |
+**Citation**: D5 Proposal — "MicroClimate-X" §3.7.2 Decision Table 4.2 (own work, derived from Roe 2005 orographic-precipitation theory and standard synoptic-meteorology pressure-tendency / cloud-base rules of thumb).
+**Justification**: This 4-row decision table captures the *thesis-original* contribution — converting macro-scale model output (probability of rain in a coarse grid cell) into a *terrain-aware verdict* by combining wind alignment, humidity, and pressure tendency. The fact that R1 (hidden rain) and R3 (heavy downpour) can both fire on a windward slope while R2 (no risk) fires on a leeward valley with otherwise-identical macro probability is the table's discriminative value.
+---
+## 12. Activity weights — D5 §3.7 / P4.4
+| Activity | Rainfall | Fog | Wind Gust | Thunderstorm |
+|---|---|---|---|---|
+| **hiker**        | 1.0 | **1.3** | 1.0 | **1.4** |
+| **driver**       | 0.8 | **1.5** | 1.3 | 0.9 |
+| **construction** | 1.0 | 0.8 | **1.5** | **1.4** |
+| **general**      | 1.0 | 1.0 | 1.0 | 1.0 |
+**Justification**:
+- *Hikers* die above tree line from lightning and disorientation in fog (NOLS Wilderness Medicine, 2020 incident review).
+- *Drivers* lose vehicle control most often in fog (visibility), with wind a secondary hazard for high-sided vehicles (FHWA *Road Weather Management* program, 2019).
+- *Construction* workers care about wind (crane / scaffolding) and lightning (OSHA 29 CFR §1926.95 *PPE*).
+- *General* preserves a calibration baseline against which the other profiles can be benchmarked.
+Per-sub-score weight is multiplied, then per-hazard score is clipped to 100 so a weight of 1.5 cannot push a single sub-score past saturation; the composite formula then aggregates with 80 % weight on the dominant (worst) hazard.
+---
+## Composite-index validity / 复合指数的效度
+The final 0-100 risk score is a **composite indicator**, not a calibrated probability. Following the methodology of established indices (Fire Weather Index — van Wagner, 1987; Heat Index — Steadman, 1979), validity is established through:
+1. **Construct validity** — each component has an independent scientific basis.
+2. **Discriminant validity** — extreme samples (Mt Everest, hot calm tropical valley) produce extreme outputs in the expected direction.
+3. **Face validity** — domain experts agree the categorical bins (Safe / Caution / Warning / Danger) map sensibly onto action recommendations.
+A future *hindcast validation* against published Malaysian flood / landslide events is a planned thesis Chapter 5 contribution.

docs/项目大白话讲解.html ADDED Viewed

	@@ -0,0 +1,883 @@

+<!doctype html>
+<html lang="zh-CN">
+<head>
+<meta charset="utf-8">
+<title>项目大白话讲解 — MicroClimate-X</title>
+<style>
+  /* ============================================================
+     Long-form reading layout — comfortable for understanding,
+     not just glancing. Optimised for screen first, print second.
+     ============================================================ */
+  :root {
+    --ink:           #1a1d24;
+    --ink-soft:      #353a44;
+    --muted:         #6b7280;
+    --brand:         #2563eb;
+    --brand-soft:    #dbeafe;
+    --accent:        #b91c1c;
+    --accent-soft:   #fee2e2;
+    --ok:            #166534;
+    --ok-soft:       #dcfce7;
+    --warn:          #b45309;
+    --warn-soft:     #fef3c7;
+    --highlight:     #fef08a;
+    --grid:          #e5e7eb;
+    --bg:            #fafafa;
+    --paper:         #ffffff;
+    --code-bg:       #f3f4f6;
+  }
+  * { box-sizing: border-box; }
+  html, body { margin: 0; padding: 0; background: var(--bg); color: var(--ink); }
+  body {
+    font-family: -apple-system, BlinkMacSystemFont, "SF Pro Text",
+                 "PingFang SC", "Hiragino Sans GB", "Microsoft YaHei",
+                 system-ui, sans-serif;
+    font-size: 16px;
+    line-height: 1.75;
+    letter-spacing: 0.01em;
+  }
+  @page { size: A4; margin: 14mm 16mm; }
+  /* Two-column layout: TOC sidebar + article body */
+  .layout {
+    display: grid;
+    grid-template-columns: 220px 1fr;
+    max-width: 1100px;
+    margin: 0 auto;
+    gap: 0;
+  }
+  aside.toc {
+    position: sticky;
+    top: 70px;
+    align-self: start;
+    padding: 32px 16px 32px 32px;
+    height: calc(100vh - 90px);
+    overflow-y: auto;
+    border-right: 1px solid var(--grid);
+    font-size: 13px;
+  }
+  aside.toc h3 {
+    font-size: 11px;
+    text-transform: uppercase;
+    letter-spacing: 1.5px;
+    color: var(--muted);
+    margin: 0 0 12px 0;
+  }
+  aside.toc ol {
+    list-style: none;
+    padding: 0;
+    margin: 0;
+  }
+  aside.toc ol li {
+    margin: 6px 0;
+    line-height: 1.4;
+  }
+  aside.toc a {
+    color: var(--ink-soft);
+    text-decoration: none;
+    display: block;
+    padding: 4px 8px;
+    border-radius: 4px;
+    border-left: 2px solid transparent;
+  }
+  aside.toc a:hover {
+    background: var(--brand-soft);
+    color: var(--brand);
+    border-left-color: var(--brand);
+  }
+  aside.toc a .num { color: var(--muted); margin-right: 6px; font-variant-numeric: tabular-nums; }
+  main {
+    background: var(--paper);
+    padding: 48px 56px 80px 56px;
+    box-shadow: 0 0 0 1px var(--grid);
+    min-height: 100vh;
+  }
+  /* Headings */
+  h1 {
+    font-size: 32px;
+    font-weight: 700;
+    margin: 0 0 8px 0;
+    line-height: 1.2;
+  }
+  .subtitle {
+    font-size: 15px;
+    color: var(--muted);
+    margin: 0 0 8px 0;
+  }
+  .meta {
+    display: flex; gap: 8px; flex-wrap: wrap;
+    margin: 16px 0 32px 0;
+    font-size: 12px;
+  }
+  .meta span {
+    background: var(--code-bg);
+    padding: 3px 10px;
+    border-radius: 12px;
+    color: var(--muted);
+  }
+  h2 {
+    font-size: 24px;
+    margin: 56px 0 16px 0;
+    padding-bottom: 8px;
+    border-bottom: 2px solid var(--brand);
+    color: var(--ink);
+    scroll-margin-top: 80px;
+  }
+  h2 .num {
+    color: var(--brand);
+    font-weight: 700;
+    margin-right: 12px;
+  }
+  h3 {
+    font-size: 18px;
+    margin: 32px 0 12px 0;
+    color: var(--ink-soft);
+    font-weight: 600;
+  }
+  h4 {
+    font-size: 15px;
+    margin: 20px 0 8px 0;
+    color: var(--accent);
+    font-weight: 600;
+  }
+  /* Paragraphs / lists */
+  p { margin: 12px 0; }
+  ul, ol { padding-left: 24px; margin: 12px 0; }
+  ul li, ol li { margin: 6px 0; }
+  strong { color: var(--ink); font-weight: 600; }
+  em { color: var(--ink-soft); }
+  /* Highlight = the BIG punchline sentences */
+  .highlight, mark {
+    background: var(--highlight);
+    padding: 1px 4px;
+    border-radius: 3px;
+    color: var(--ink);
+  }
+  /* Blockquote = "the big punchline" */
+  blockquote {
+    margin: 20px 0;
+    padding: 16px 20px;
+    background: var(--brand-soft);
+    border-left: 4px solid var(--brand);
+    border-radius: 6px;
+    font-size: 16px;
+    color: var(--ink);
+  }
+  blockquote p { margin: 4px 0; }
+  blockquote strong { color: var(--brand); }
+  /* Quote box for supervisor verbatim */
+  .quote {
+    background: var(--warn-soft);
+    border-left: 4px solid var(--warn);
+    padding: 12px 16px;
+    margin: 16px 0;
+    font-style: italic;
+    font-size: 14px;
+    border-radius: 4px;
+  }
+  .quote::before { content: "🎙️ "; font-style: normal; }
+  /* Analogy / metaphor box */
+  .analogy {
+    background: #f0fdf4;
+    border: 1px dashed var(--ok);
+    padding: 16px 20px;
+    border-radius: 8px;
+    margin: 20px 0;
+    font-size: 15px;
+  }
+  .analogy::before {
+    content: "💡 比喻";
+    display: block;
+    font-size: 12px;
+    color: var(--ok);
+    font-weight: 700;
+    margin-bottom: 6px;
+    letter-spacing: 0.5px;
+  }
+  /* Callouts */
+  .callout {
+    margin: 20px 0;
+    padding: 14px 18px;
+    border-left: 4px solid;
+    border-radius: 4px;
+    font-size: 15px;
+  }
+  .callout.warn { background: var(--accent-soft); border-color: var(--accent); }
+  .callout.ok   { background: var(--ok-soft); border-color: var(--ok); }
+  .callout.tip  { background: var(--brand-soft); border-color: var(--brand); }
+  .callout-title {
+    font-weight: 700;
+    margin-bottom: 4px;
+    text-transform: uppercase;
+    letter-spacing: 0.5px;
+    font-size: 11px;
+  }
+  .callout.warn .callout-title { color: var(--accent); }
+  .callout.ok .callout-title   { color: var(--ok); }
+  .callout.tip .callout-title  { color: var(--brand); }
+  /* Code */
+  code, pre, kbd {
+    font-family: "SF Mono", "JetBrains Mono", Menlo, Consolas, monospace;
+  }
+  code {
+    background: var(--code-bg);
+    padding: 1px 6px;
+    border-radius: 3px;
+    font-size: 13px;
+    color: var(--accent);
+  }
+  pre {
+    background: #0f172a;
+    color: #e2e8f0;
+    padding: 16px 20px;
+    border-radius: 8px;
+    overflow-x: auto;
+    margin: 16px 0;
+    font-size: 13px;
+    line-height: 1.6;
+  }
+  pre code { background: transparent; padding: 0; color: inherit; font-size: 13px; }
+  /* Tables */
+  table {
+    border-collapse: collapse;
+    width: 100%;
+    margin: 16px 0;
+    font-size: 14px;
+    background: white;
+  }
+  th, td {
+    padding: 10px 12px;
+    text-align: left;
+    vertical-align: top;
+    border: 1px solid var(--grid);
+  }
+  th {
+    background: #f9fafb;
+    font-weight: 600;
+    color: var(--ink-soft);
+    font-size: 13px;
+  }
+  tbody tr:nth-child(even) { background: #fafbfc; }
+  tbody tr:hover { background: var(--brand-soft); }
+  /* Numbered "step" boxes */
+  .step-box {
+    background: white;
+    border: 1px solid var(--grid);
+    border-left: 4px solid var(--brand);
+    border-radius: 6px;
+    padding: 16px 20px;
+    margin: 16px 0;
+  }
+  .step-box .step-label {
+    font-size: 11px;
+    text-transform: uppercase;
+    letter-spacing: 1px;
+    color: var(--brand);
+    font-weight: 700;
+    margin-bottom: 4px;
+  }
+  /* Compare table — two scenarios side-by-side */
+  table.compare td.bad {
+    background: #fef2f2;
+    border-left: 3px solid var(--accent);
+  }
+  table.compare td.good {
+    background: #f0fdf4;
+    border-left: 3px solid var(--ok);
+  }
+  /* Toolbar */
+  .toolbar {
+    position: sticky; top: 0; z-index: 100;
+    background: var(--brand); color: white;
+    padding: 10px 24px;
+    display: flex; justify-content: space-between;
+    align-items: center;
+    font-size: 14px;
+    box-shadow: 0 2px 8px rgba(0,0,0,0.1);
+  }
+  .toolbar button {
+    background: white; color: var(--brand); border: 0;
+    padding: 6px 16px; border-radius: 4px; font-weight: 600;
+    cursor: pointer; font-size: 13px;
+  }
+  .toolbar button:hover { background: #f3f4f6; }
+  /* Mantra at the end — final 5-sentence summary */
+  .mantra {
+    background: linear-gradient(135deg, #fef3c7 0%, #fde68a 100%);
+    border-radius: 12px;
+    padding: 24px 28px;
+    margin: 24px 0;
+  }
+  .mantra ol {
+    counter-reset: mantra;
+    list-style: none;
+    padding: 0;
+  }
+  .mantra ol li {
+    counter-increment: mantra;
+    position: relative;
+    padding: 12px 12px 12px 56px;
+    margin: 8px 0;
+    background: white;
+    border-radius: 8px;
+    font-size: 15px;
+    line-height: 1.6;
+  }
+  .mantra ol li::before {
+    content: counter(mantra);
+    position: absolute;
+    left: 12px; top: 50%;
+    transform: translateY(-50%);
+    width: 32px; height: 32px;
+    background: var(--accent);
+    color: white;
+    border-radius: 50%;
+    display: flex; align-items: center; justify-content: center;
+    font-weight: 700;
+  }
+  /* Footer */
+  footer {
+    margin-top: 80px;
+    padding-top: 24px;
+    border-top: 1px solid var(--grid);
+    color: var(--muted);
+    font-size: 13px;
+    text-align: center;
+  }
+  /* Responsive — hide TOC on small screens */
+  @media (max-width: 900px) {
+    .layout { grid-template-columns: 1fr; }
+    aside.toc { display: none; }
+    main { padding: 24px 24px 60px 24px; }
+  }
+  /* Print refinements */
+  @media print {
+    body { background: white; }
+    .layout { grid-template-columns: 1fr; }
+    aside.toc, .toolbar { display: none; }
+    main { padding: 0; box-shadow: none; }
+    h2 { page-break-after: avoid; }
+    pre, blockquote, .analogy, .callout { page-break-inside: avoid; }
+  }
+</style>
+</head>
+<body>
+<div class="toolbar">
+  <strong>项目大白话讲解 · MicroClimate-X</strong>
+  <button onclick="window.print()">🖨 打印 / 存为 PDF</button>
+</div>
+<div class="layout">
+<aside class="toc">
+  <h3>目录</h3>
+  <ol>
+    <li><a href="#s0"><span class="num">0</span>一句话讲清楚</a></li>
+    <li><a href="#s1"><span class="num">1</span>为什么有意义</a></li>
+    <li><a href="#s2"><span class="num">2</span>三块拼图</a></li>
+    <li><a href="#s3"><span class="num">3</span>Dataset 数据集</a></li>
+    <li><a href="#s4"><span class="num">4</span>Model 模型</a></li>
+    <li><a href="#s5"><span class="num">5</span>App 应用</a></li>
+    <li><a href="#s6"><span class="num">6</span>做对了什么</a></li>
+    <li><a href="#s7"><span class="num">7</span>回应老师 3 大疑惑</a></li>
+    <li><a href="#s8"><span class="num">8</span>汇报 4 步动作</a></li>
+    <li><a href="#s9"><span class="num">9</span>傻问题速查</a></li>
+    <li><a href="#s10"><span class="num">10</span>终极心法 5 句话</a></li>
+  </ol>
+</aside>
+<main>
+<h1>你的毕业设计 —— 大白话讲解版</h1>
+<p class="subtitle">看完这篇文章，你就能用自己的话把项目讲给完全不懂技术的朋友听。</p>
+<p class="subtitle">不需要背任何术语，理解了原理，老师怎么追问你都不慌。</p>
+<div class="meta">
+  <span>📅 2026-05-13</span>
+  <span>🎓 UKM FYP</span>
+  <span>📖 阅读时间约 30 分钟</span>
+  <span>🎯 目标：彻底搞懂项目</span>
+</div>
+<!-- ===== 0 ===== -->
+<h2 id="s0"><span class="num">0.</span>先用一句话讲清楚你做了什么</h2>
+<blockquote>
+  <p><strong>你做了一个"山区天气危险预警 App" —— 专门给登山者用的，比手机上的天气预报靠谱得多。</strong></p>
+</blockquote>
+<p>就这么简单。下面解释为什么"比手机预报靠谱"。</p>
+<!-- ===== 1 ===== -->
+<h2 id="s1"><span class="num">1.</span>为什么这个项目有意义？（痛点）</h2>
+<p>打开你手机上的天气 App，它告诉你"吉隆坡今天有雨"。</p>
+<p><strong>问题来了</strong>：吉隆坡有几千平方公里，里面有平地、有山、有山谷、有山顶。</p>
+<p>天气预报背后的网格大概是 <strong>20 公里 × 20 公里</strong> 一格 —— 也就是说，<strong>山顶、山谷、迎风坡共用同一个预报</strong>。但实际上：</p>
+<ul>
+  <li><strong>山顶</strong>可能在下暴雨</li>
+  <li><strong>山谷</strong>可能阳光明媚</li>
+  <li><strong>迎风坡</strong>可能起大雾</li>
+</ul>
+<blockquote>
+  <p>这就像有人告诉你"中国今天天气晴" —— 这种粗粒度的信息对登山者<strong>毫无用处</strong>。</p>
+</blockquote>
+<p><strong>你做的事</strong>：把预报精度从 20 公里降到一个具体坐标点，让登山者点地图上任意一个点，就能知道那个具体位置的风险。</p>
+<!-- ===== 2 ===== -->
+<h2 id="s2"><span class="num">2.</span>整个项目分三块：Dataset → Model → App</h2>
+<p>这是导师上次反复强调的顺序 —— <mark>先有数据，再训模型，最后才做 App</mark>。</p>
+<div class="analogy">
+  <p>你要教一个小孩看天气判断会不会下雨：</p>
+  <table>
+    <tr><th>步骤</th><th>比喻</th><th>项目里对应什么</th></tr>
+    <tr><td>1</td><td>找一本天气百科全书给小孩看</td><td><strong>Dataset</strong>（数据集）</td></tr>
+    <tr><td>2</td><td>让小孩反复看书，学会判断规律</td><td><strong>Model</strong>（训练模型）</td></tr>
+    <tr><td>3</td><td>把小孩装到一个"天气问答机器人"里，让别人能问他</td><td><strong>App</strong>（应用）</td></tr>
+  </table>
+</div>
+<!-- ===== 3 ===== -->
+<h2 id="s3"><span class="num">3.</span>Dataset（数据集）—— 你拿什么"教"电脑</h2>
+<h3>3.1 这一步在干什么</h3>
+<p>机器学习的本质是 <strong>"喂样本，让它自己找规律"</strong>。所以第一件事：<strong>准备样本</strong>。</p>
+<h3>3.2 你的数据从哪来？</h3>
+<p><strong>来源</strong>：欧洲气象中心（ECMWF）的 <strong>ERA5 数据库</strong>。</p>
+<p>这个数据库<strong>不是预报</strong>，是<strong>对过去天气的"完美回放"</strong> —— 气象学家会把所有历史观测数据（卫星、气球、地面站）综合起来，反推出"那一天那一刻那个地方真实的天气是怎样的"。</p>
+<div class="analogy">
+  警察破案时调看监控录像 —— 录像就是 ERA5，是<strong>已经发生的事实</strong>。<br>
+  而手机预报是"预测未来"，那是另一回事。
+</div>
+<p><strong>学术界把 ERA5 当作真值</strong> —— 其他预报系统都拿 ERA5 来校准自己。所以拿它训练 ML 模型最合适，因为<mark>答案是可信的</mark>。</p>
+<h3>3.3 你要了多少数据？</h3>
+<table>
+  <tr><th>项</th><th>数值</th></tr>
+  <tr><td>地点</td><td>5 个马来西亚山区（云顶、金马仑、福隆港、巴生谷、神山）</td></tr>
+  <tr><td>时间</td><td>2020-01-01 到 2024-12-31，整整 5 年</td></tr>
+  <tr><td>频率</td><td>每小时一行</td></tr>
+  <tr><td><strong>总行数</strong></td><td><strong>175 315 行</strong>（17.5 万行）</td></tr>
+  <tr><td>每行包含</td><td>温度、湿度、风速、风向、气压、降雨量等十几个数字</td></tr>
+</table>
+<h3>3.4 ⭐ 关键问题：原始数据里<u>没有"答案"</u></h3>
+<div class="callout warn">
+  <div class="callout-title">这是上次老师最大的疑惑</div>
+  原始数据只有"现象"，没有"标签"。
+</div>
+<p>原始数据长这样（简化）：</p>
+<pre><code>时间                   温度   湿度   降雨量
+2023-06-01 14:00      25°C   80%   0.0 mm
+2023-06-01 15:00      24°C   85%   0.3 mm
+2023-06-01 16:00      23°C   90%   1.2 mm</code></pre>
+<p>老师看了说：<em>"这里面没有"答案"啊！没有一列告诉电脑'这是会下雨的情况'还是'这是不会下雨的情况' —— 你怎么训练模型？"</em></p>
+<p><strong>他说的完全正确</strong>。原始数据只有"现象"，没有"标签"。</p>
+<h3>3.5 你的解决方案：自己<u>造</u>一个答案列</h3>
+<p>你想了一个聪明的办法 —— <strong>用未来发生的事，反过来当现在的答案</strong>：</p>
+<pre><code>df['is_rain_event'] = (df['precipitation'].shift(-1) > 0.1).astype(int)</code></pre>
+<p>翻译成大白话：</p>
+<blockquote>
+  <p>看每一行的"下一个小时" —— 如果下一小时下雨超过 0.1 毫米，就在这一行标记 <strong>1</strong>（会下雨）；否则标记 <strong>0</strong>（不会下雨）。</p>
+</blockquote>
+<table>
+  <tr><th>时间</th><th>温度</th><th>湿度</th><th>降雨量</th><th>答案 is_rain_event</th></tr>
+  <tr><td>2023-06-01 14:00</td><td>25°C</td><td>80%</td><td>0.0</td><td><strong>1</strong>（下一小时 0.3 &gt; 0.1）</td></tr>
+  <tr><td>2023-06-01 15:00</td><td>24°C</td><td>85%</td><td>0.3</td><td><strong>1</strong>（下一小时 1.2 &gt; 0.1）</td></tr>
+  <tr><td>2023-06-01 16:00</td><td>23°C</td><td>90%</td><td>1.2</td><td><strong>1</strong></td></tr>
+</table>
+<div class="callout tip">
+  <div class="callout-title">核心思想</div>
+  训练时电脑看到 14:00 那一行的所有特征（温度湿度等），它要预测的"答案"是<strong>那一刻之后会不会下雨</strong>。<br>
+  这样训练完，未来给它一组当前的天气数据，它就能预测"接下来会不会下雨"。
+</div>
+<h3>3.6 这一步有 3 个<u>必须能讲出来</u>的细节</h3>
+<div class="step-box">
+  <div class="step-label">细节 ①</div>
+  <h4 style="margin-top:0"><code>.shift(-1)</code> 的意义 —— 没有"作弊"</h4>
+  <p><code>.shift(-1)</code> 意思是"用未来的数据当答案"。这听起来像作弊，但其实<strong>完全正确</strong>：</p>
+  <ul>
+    <li>训练时：电脑只看"当前"特征，预测"未来"答案</li>
+    <li>预测时（真实使用）：用户给当前特征，模型预测未来 —— <strong>用法一致</strong></li>
+    <li>如果用"当前"特征预测"当前"是否下雨 —— 那不是预测，是<strong>作弊</strong></li>
+  </ul>
+  <p>专业术语叫 <strong>"无时间泄漏"</strong>（no temporal leakage）。</p>
+</div>
+<div class="step-box">
+  <div class="step-label">细节 ②</div>
+  <h4 style="margin-top:0">为什么是 0.1 毫米？—— 不是拍脑袋</h4>
+  <p>0.1 mm 是 <strong>WMO（世界气象组织）观测规范里"可测量降水"的下限</strong> —— 达到 0.1 毫米才算真的下雨，更少的只记为"微量"（trace），不算一次降水。</p>
+  <p>这是<strong>国际标准</strong>，不是你随便定的。老师追问时这一点很重要 —— 证明你<strong>读过文献</strong>。</p>
+</div>
+<div class="step-box">
+  <div class="step-label">细节 ③</div>
+  <h4 style="margin-top:0">为什么是 0/1 二分类，不是预测毫米数？</h4>
+  <p>这是上次老师的<strong>第二大疑惑</strong> —— 他认为应该做"回归"（预测降雨多少毫米）。</p>
+  <p>你的答案 3 条：</p>
+  <ol>
+    <li><strong>下游决策本身就是二选一</strong>：登山者只关心"今天能不能去爬山" —— 出门或不出门，<strong>就是 0/1</strong></li>
+    <li><strong>回归还是要选阈值</strong>：哪怕你预测出 5.2 mm，最后还是要拿一个阈值（比如 1 mm）转成"出门 / 不出门" —— <strong>那个阈值反正要选</strong>，不如一开始就用分类</li>
+    <li><strong>退路</strong>：API 仍然返回<strong>概率值</strong>（比如"70% 会下雨"），需要连续值的下游组件照样能用 —— <strong>两全其美</strong></li>
+  </ol>
+</div>
+<!-- ===== 4 ===== -->
+<h2 id="s4"><span class="num">4.</span>Model（模型）—— 让电脑学会判断</h2>
+<h3>4.1 这一步在干什么</h3>
+<p>把 17.5 万行数据<strong>喂</strong>给一个算法，让它<strong>自己找规律</strong>。</p>
+<p>学完之后，未来给它任何一组新天气数据，它能立刻输出"会下雨的概率是 X%"。</p>
+<h3>4.2 你用了什么算法？</h3>
+<p><strong>Random Forest（随机森林）</strong> —— 一种经典的传统机器学习算法。</p>
+<div class="analogy">
+  <p><strong>随机森林 = 一群医生会诊</strong></p>
+  <p>想象你身体不舒服，你不只看一个医生，而是<strong>找 100 个医生分别诊断</strong> ——</p>
+  <ul>
+    <li>每个医生看的"病例资料"略有不同（随机抽一部分）</li>
+    <li>每个医生只关注几个症状（不是全部）</li>
+    <li>最后 <strong>100 个医生投票</strong>，多数说"感冒"那就是感冒</li>
+  </ul>
+  <p>随机森林就是这个原理 —— 它训练 100 棵小决策树，每棵树看一部分数据、问一部分特征，最后投票决定结果。</p>
+</div>
+<h3>4.3 为什么选随机森林，不用 ChatGPT 那种深度学习？</h3>
+<p>老师<strong>很可能问这个</strong>。3 条理由：</p>
+<div class="step-box">
+  <div class="step-label">理由 ①</div>
+  <h4 style="margin-top:0">可解释性</h4>
+  <p>随机森林能告诉你"<strong>它为什么这么判断</strong>" —— 比如"我看到上一小时下了 0.3 毫米雨，所以判断接下来还会下"。</p>
+  <p>深度学习是<strong>黑盒</strong> —— 它说会下雨，<strong>没人知道它为什么这么说</strong>。</p>
+  <p>在<strong>安全关键</strong>应用里（关系到登山者性命），可解释性必须有。</p>
+</div>
+<div class="step-box">
+  <div class="step-label">理由 ②</div>
+  <h4 style="margin-top:0">数据量</h4>
+  <p>深度学习需要<strong>几百万到几千万</strong>条数据才能发挥优势。你只有 17.5 万行 —— <strong>太少了</strong>，深度学习反而不如随机森林。</p>
+</div>
+<div class="step-box">
+  <div class="step-label">理由 ③</div>
+  <h4 style="margin-top:0">速度</h4>
+  <p>随机森林预测一次 <strong>&lt; 1 毫秒</strong>。深度学习要 10 倍以上时间，还要 GPU。</p>
+  <p>你的 App 要做到"用户点地图立刻出结果" —— 快是必须的。</p>
+</div>
+<h3>4.4 模型训练得怎么样？（这是老师最关心的数字）</h3>
+<h4>你必须能背的 4 个数字</h4>
+<table>
+  <tr><th>指标</th><th>数值</th><th>大白话翻译</th></tr>
+  <tr><td><strong>ROC AUC</strong></td><td><strong>0.871</strong></td><td>整体准确度的综合分，<strong>满分 1.0</strong> —— 0.87 算"很好"</td></tr>
+  <tr><td><strong>Recall（召回率）</strong></td><td><strong>93.4%</strong></td><td>真的下了雨的 100 次里，模型成功预警了 93 次（<strong>只漏报 7 次</strong>）</td></tr>
+  <tr><td><strong>Brier Score</strong></td><td><strong>0.138</strong></td><td>概率校准度 —— <strong>越低越好</strong>，0.14 算"校准良好"</td></tr>
+  <tr><td><strong>测试样本数</strong></td><td><strong>35 063 条</strong></td><td>用来打分的数据量（占总数据的 20%）</td></tr>
+</table>
+<h4>怎么"考试"？—— 时间序列切分</h4>
+<p>你<strong>没有</strong>用随机切分（很多人会犯的错）。</p>
+<div class="analogy">
+  老师出期末考试，如果他用学生<strong>平时做过的题</strong>来考 —— 那是作弊。必须用<strong>新的</strong>、学生没见过的题。
+</div>
+<p>你的做法：把 5 年数据按时间顺序排，<strong>最后 1 年（20%）扣下来不给电脑看</strong>，只用前 4 年训练。训练完，拿最后 1 年的数据"考试" —— 这才公平。</p>
+<h4>为什么不用准确率（accuracy）？</h4>
+<p>很多人会问"模型准确率多少"。<strong>陷阱</strong>：</p>
+<ul>
+  <li>马来西亚山区只有 30% 的时间下雨</li>
+  <li>一个<strong>永远预测"不下雨"的傻瓜模型</strong>，准确率自动是 70%</li>
+  <li>但它<strong>永远漏报</strong>，登山者会被淋成落汤鸡</li>
+</ul>
+<p>所以你用 <strong>F2 分数</strong> + <strong>召回率</strong> 而不是准确率 —— 这两个指标<strong>重视"不漏报"</strong>。</p>
+<blockquote>
+  老师如果追问，就说："<strong>安全关键应用，漏报比误报严重得多。漏一次真下雨，登山者可能丧命；误报一次，登山者最多取消行程。所以我用 F2 分数，它把召回率的重要性视为精度的 2 倍（β = 2，公式中的权重系数 β² = 4）。</strong>"
+</blockquote>
+<h3>4.5 模型学到了什么？（特征重要性）</h3>
+<p>电脑学完之后，能告诉你"它最看重哪些信号"。前 4 个是：</p>
+<table>
+  <tr><th>排名</th><th>特征</th><th>大白话</th></tr>
+  <tr><td>1</td><td>上一小时降雨量</td><td>"刚才下了，接下来很可能继续下" —— <strong>雨的惯性</strong></td></tr>
+  <tr><td>2-3</td><td>时间（一天中的几点）</td><td>马来西亚山区<strong>下午 3-5 点最爱下雨</strong> —— 电脑学会了这个规律</td></tr>
+  <tr><td>4</td><td>3 小时气压变化</td><td><strong>气压下降预示风暴来临</strong> —— 这是经典气象学常识，电脑自己学到了</td></tr>
+</table>
+<div class="callout ok">
+  <div class="callout-title">这一段非常加分</div>
+  证明<strong>你的模型学到的是"物理上有意义"的规律</strong>，不是乱猜。
+</div>
+<!-- ===== 5 ===== -->
+<h2 id="s5"><span class="num">5.</span>App（应用）—— 把模型包装成产品</h2>
+<h3>5.1 这一步在干什么</h3>
+<p>模型本身只是个 <code>.pkl</code> 文件 —— 一个 Python 对象。<strong>没法用</strong>。</p>
+<p>App 的工作是：<strong>让用户能用浏览器点地图，立刻看到那个地方的风险评分</strong>。</p>
+<h3>5.2 整个 App 长什么样？</h3>
+<pre><code>用户在浏览器点地图上一个点 (lat, lon)
+            │
+            ▼
+    前端（Vue + Leaflet 地图）
+            │
+            │  HTTP 请求
+            ▼
+    后端（FastAPI）
+            │
+            ├──► 调用 Open-Meteo API：获取这个点当前的实时天气
+            ├──► 调用 Open Topo Data：获取这个点的海拔高度
+            │
+            ├──► 引擎 A：把天气数据喂给训练好的 RF 模型 → 得到下雨概率
+            ├──► 引擎 B：用一组手写规则评估其他危险（雾、风、雷暴）
+            │
+            ▼
+    综合评分（0-100）+ 双语建议返回前端
+            │
+            ▼
+    前端显示：彩色仪表盘 + "建议：可以安全出行" / "警告：暴雨风险"</code></pre>
+<h3>5.3 ⭐ 双引擎架构 —— 这是项目的<u>核心创新</u></h3>
+<div class="callout tip">
+  <div class="callout-title">这是整个项目最值得吹的地方</div>
+  老师追问"为什么混合架构"时你要能讲清楚。
+</div>
+<h4>引擎 A：随机森林 = "经验主义"</h4>
+<p>学过 17.5 万条历史数据的"经验" —— <strong>它见过的天气模式</strong>它能很准地预测。</p>
+<h4>引擎 B：手写规则 = "原则主义"</h4>
+<p>一组<strong>人工写的物理规则</strong>：</p>
+<pre><code>如果 海拔 > 3500 米     →  缺氧危险（不管模型说什么，强制报警）
+如果 温度 ≤ -5°C         →  冻伤危险
+如果 风速 ≥ 40 km/h      →  大风危险
+如果 风向 + 地形 = 迎风坡  →  地形抬升造雨风险</code></pre>
+<h4>为什么必须两个一起用？—— 珠峰例子</h4>
+<p><strong>情景</strong>：用户点了一下珠穆朗玛峰（8 848 米）。</p>
+<table class="compare">
+  <tr><th>只用引擎 A（纯 ML）</th><th>你的混合架构</th></tr>
+  <tr>
+    <td class="bad">模型只见过马来西亚的山（最高 1865 米）</td>
+    <td class="good">模型仍然给出低概率（"看起来不像会下雨"）</td>
+  </tr>
+  <tr>
+    <td class="bad">它说"下雨概率 5%"</td>
+    <td class="good"><strong>但引擎 B 立刻发现</strong>：海拔 &gt; 3500 → 缺氧；温度 -30°C → 冻伤；风速 80 km/h → 大风</td>
+  </tr>
+  <tr>
+    <td class="bad">系统返回"安全" ❌</td>
+    <td class="good"><strong>三个独立否决（Veto）触发</strong></td>
+  </tr>
+  <tr>
+    <td class="bad">登山者去了 → 死</td>
+    <td class="good">综合评分被强制设为 100 = <strong>危险</strong> ✅</td>
+  </tr>
+</table>
+<blockquote>
+  <p><strong>学术上这叫 "Neuro-Symbolic AI（神经-符号 AI）"</strong> —— 能学的让机器学（神经），物理规律手工编码（符号）。</p>
+  <p>这不是你瞎编的，是 2020 年后学术界的热门方向，参考文献 Garcez &amp; Lamb 2020。</p>
+</blockquote>
+<h3>5.4 App 的技术栈（被问到时回答）</h3>
+<table>
+  <tr><th>部分</th><th>用了什么</th><th>一句话解释</th></tr>
+  <tr><td>前端</td><td>Vue 3 + Leaflet + ECharts</td><td>浏览器里的页面，地图，图表</td></tr>
+  <tr><td>后端</td><td>FastAPI（Python）</td><td>处理用户请求，调模型，返回结果</td></tr>
+  <tr><td>缓存</td><td>SQLite</td><td>同一个点 10 分钟内重复查不用每次都算</td></tr>
+  <tr><td>部署</td><td>Docker</td><td>一键就能在任何机器上跑起来</td></tr>
+</table>
+<!-- ===== 6 ===== -->
+<h2 id="s6"><span class="num">6.</span>整个项目你"做对了什么" —— 别人吹起来的话</h2>
+<table>
+  <tr><th>#</th><th>做对的事</th><th>为什么加分</th></tr>
+  <tr><td>1</td><td>数据来自 ERA5 而不是网上随便爬的</td><td><strong>业内金标准</strong>，老师不会质疑数据质量</td></tr>
+  <tr><td>2</td><td>答案列自己工程构造，方法符合 WMO 标准</td><td>证明<strong>读过文献</strong>，不是拍脑袋</td></tr>
+  <tr><td>3</td><td>时间序列切分而不是随机切分</td><td>证明<strong>懂 ML 基础</strong>，没有数据泄漏</td></tr>
+  <tr><td>4</td><td>用 F2 分数选阈值而不是 F1</td><td>证明<strong>理解任务背景</strong> —— 安全关键场景重视召回</td></tr>
+  <tr><td>5</td><td>混合架构（ML + 规则）而不是纯 ML</td><td>项目的<strong>核心研究贡献</strong></td></tr>
+  <tr><td>6</td><td>写了 70 个测试，覆盖率 97%</td><td>证明<strong>工程能力</strong> —— 老师不会怀疑代码可靠性</td></tr>
+  <tr><td>7</td><td>一行命令 <code>make evaluate</code> 复现所有数字</td><td>评审老师能<strong>独立验证</strong>论文里的每个 claim</td></tr>
+</table>
+<!-- ===== 7 ===== -->
+<h2 id="s7"><span class="num">7.</span>上次汇报老师的 3 大疑惑 —— 逐条解决</h2>
+<table>
+  <tr><th>#</th><th>老师疑惑</th><th>你现在的回答</th></tr>
+  <tr>
+    <td>1</td>
+    <td>"App is the last（顺序错了）"</td>
+    <td>严格按 dataset → model → app 顺序展示，写在 <code>pipeline_order.md</code> 里</td>
+  </tr>
+  <tr>
+    <td>2</td>
+    <td>"Y is missing（没有答案列）"</td>
+    <td>自己工程构造的 <code>is_rain_event</code>，方法符合 WMO 标准</td>
+  </tr>
+  <tr>
+    <td>3</td>
+    <td>"应该做回归不是分类"</td>
+    <td>下游决策是二元的、F2 分数只在分类下有意义、API 仍暴露概率</td>
+  </tr>
+</table>
+<!-- ===== 8 ===== -->
+<h2 id="s8"><span class="num">8.</span>这次汇报你只需要做 4 件事</h2>
+<h3>8.1 开场（30 秒）</h3>
+<blockquote>
+  "老师感谢您抽时间。接着上次的内容，我做完了 v1.0.0 工程化强化，整条流水线现在可以端到端复现。我按上次的顺序 —— <strong>dataset、model、app</strong> —— 给您过一遍新的进展，最后讲我对 Chapter 5 的下一步计划，可以吗？"
+</blockquote>
+<h3>8.2 按顺序展示（5 分钟）</h3>
+<table>
+  <tr><th>步骤</th><th>打开</th><th>讲什么</th><th>时长</th></tr>
+  <tr><td>1</td><td><code>docs/dataset.md</code></td><td>"数据来自 ERA5，5 个山点 5 年共 17.5 万行；答案列 <code>is_rain_event</code> 我自己构造的，定义在 §5"</td><td>30 秒</td></tr>
+  <tr><td>2</td><td><code>figures/01_roc_curve.png</code></td><td>"测试 AUC 0.871，召回率 93.4%"</td><td>30 秒</td></tr>
+  <tr><td>3</td><td><code>figures/03_calibration_curve.png</code></td><td>"Brier 分数 0.138，校准良好"</td><td>20 秒</td></tr>
+  <tr><td>4</td><td><code>figures/04_threshold_sweep.png</code></td><td>"用 F2 分数选阈值 —— 安全关键场景重视召回"</td><td>20 秒</td></tr>
+  <tr><td>5</td><td><code>figures/05_feature_importance.png</code></td><td>"排名前 4 的特征分 3 类：上一小时降雨、时间周期、气压变化 —— 和气象学文献吻合"</td><td>20 秒</td></tr>
+  <tr><td>6</td><td>App（<strong>最后</strong>才打开）</td><td>演示云顶 + 珠峰两个场景</td><td>90 秒</td></tr>
+</table>
+<h3>8.3 讲下一步（90 秒）</h3>
+<p>打开 <code>docs/progress_update_brief.html</code> §4，照着 5 条 Chapter 5 方向讲一遍，然后<strong>请老师拍板：先做哪两条</strong>？</p>
+<h3>8.4 收尾（30 秒）</h3>
+<blockquote>
+  "明早之前给您发 3 条要点的邮件总结，留个书面确认。谢谢老师。"
+</blockquote>
+<!-- ===== 9 ===== -->
+<h2 id="s9"><span class="num">9.</span>老师可能问的"傻"问题（其实不傻）</h2>
+<table>
+  <tr><th>问题</th><th>你的回答</th></tr>
+  <tr><td>"你的模型是什么？"</td><td>"Random Forest，随机森林"</td></tr>
+  <tr><td>"为什么不用深度学习？"</td><td>"数据量不够，需要可解释性，而且要快"</td></tr>
+  <tr><td>"测试准确率多少？"</td><td>"AUC 0.871，召回率 93.4% —— 我没用准确率，因为类别不平衡"</td></tr>
+  <tr><td>"怎么知道没过拟合？"</td><td>"做了 5 折时间序列交叉验证，每折 AUC 都在 0.83-0.91"</td></tr>
+  <tr><td>"Y 是怎么来的？"</td><td>"从 precipitation 列工程构造的：下一小时 &gt; 0.1 mm 标 1，0.1 mm 是 WMO 标准"</td></tr>
+  <tr><td>"为什么是分类不是回归？"</td><td>"下游决策本身就是二元的，而且只有分类才能直接优化 F2 分数"</td></tr>
+  <tr><td>"规则引擎为什么必要？"</td><td>"纯 ML 学的是平均，遇到分布外输入（比如珠峰）会失效 —— 规则引擎兜底"</td></tr>
+  <tr><td>"万一哪天模型挂了？"</td><td>"三层降级：模型挂了走启发式 / 异常返回类型化错误 / 规则引擎独立运行"</td></tr>
+</table>
+<!-- ===== 10 ===== -->
+<h2 id="s10"><span class="num">10.</span>终极心法 —— 你只要记住这 5 句话</h2>
+<div class="mantra">
+  <ol>
+    <li>"我做的是给登山者用的<strong>山区天气危险预警 App</strong>。"<br><em style="color:var(--muted);font-size:13px">→ 一句话讲清项目</em></li>
+    <li>"我用 ERA5 历史天气数据，<strong>自己构造了答案列 <code>is_rain_event</code></strong>，训了一个随机森林模型。"<br><em style="color:var(--muted);font-size:13px">→ 数据 + 模型</em></li>
+    <li>"测试 <strong>AUC 0.871，召回率 93.4%</strong> —— 我重视召回因为漏报比误报危险。"<br><em style="color:var(--muted);font-size:13px">→ 核心数字</em></li>
+    <li>"我用<strong>混合架构 —— 机器学习 + 手写规则</strong>，规则引擎在分布外场景兜底。"<br><em style="color:var(--muted);font-size:13px">→ 核心创新</em></li>
+    <li>"接下来 Chapter 5 我列了 <strong>5 个评估方向</strong>，请老师建议先做哪两个。"<br><em style="color:var(--muted);font-size:13px">→ 请示</em></li>
+  </ol>
+</div>
+<div class="callout ok">
+  <div class="callout-title">关键心法</div>
+  <strong>这 5 句话能完整回答 90% 的追问。</strong>其余的细节，遇到了再翻这份文档。
+</div>
+<footer>
+  写这份文档的目的：让你<strong>真的懂</strong>自己的项目，而不是背稿子。<br>
+  懂了，老师怎么问你都不慌 —— 因为你说出来的每一句话都是<strong>你自己想清楚的</strong>。<br><br>
+  <span style="color: var(--brand);">L.ZH @ UKM · KyoukoLi/microclimate-x · 2026-05-13</span>
+</footer>
+</main>
+</div>
+<script>
+  // Highlight current TOC item on scroll
+  const tocLinks = document.querySelectorAll('aside.toc a');
+  const sections = Array.from(tocLinks).map(link => document.getElementById(link.getAttribute('href').slice(1)));
+  function highlightCurrent() {
+    let current = 0;
+    sections.forEach((sec, i) => {
+      if (sec && sec.getBoundingClientRect().top < 100) current = i;
+    });
+    tocLinks.forEach((link, i) => {
+      link.style.background = i === current ? 'var(--brand-soft)' : '';
+      link.style.color = i === current ? 'var(--brand)' : '';
+      link.style.borderLeftColor = i === current ? 'var(--brand)' : 'transparent';
+      link.style.fontWeight = i === current ? '600' : '400';
+    });
+  }
+  window.addEventListener('scroll', highlightCurrent);
+  highlightCurrent();
+</script>
+</body>
+</html>

docs/项目大白话讲解.md ADDED Viewed

	@@ -0,0 +1,383 @@

+# 你的毕业设计——大白话讲解版
+> 看完这篇文章，你就能用自己的话把项目讲给完全不懂技术的朋友听。
+> 不需要背任何术语，理解了原理，老师怎么追问你都不慌。
+---
+## 0. 先用一句话讲清楚你做了什么
+> **你做了一个"山区天气危险预警 App"——专门给登山者用的，比手机上的天气预报靠谱得多。**
+就这么简单。下面解释为什么"比手机预报靠谱"。
+---
+## 1. 为什么这个项目有意义？（痛点）
+打开你手机上的天气 App，它告诉你"吉隆坡今天有雨"。
+**问题来了**：吉隆坡有几千平方公里，里面有平地、有山、有山谷、有山顶。
+天气预报背后的网格大概是 **20 公里 × 20 公里** 一格——也就是说，**山顶、山谷、迎风坡共用同一个预报**。但实际上：
+- **山顶**可能在下暴雨
+- **山谷**可能阳光明媚
+- **迎风坡**可能起大雾
+> 这就像有人告诉你"中国今天天气晴"——这种粗粒度的信息对登山者**毫无用处**。
+你做的事：**把预报精度从 20 公里降到一个具体坐标点**，让登山者点地图上任意一个点，就能知道那个具体位置的风险。
+---
+## 2. 整个项目分三块：Dataset → Model → App
+这是导师上次反复强调的顺序——**先有数据，再训模型，最后才做 App**。
+### 想象一个比喻
+你要教一个小孩看天气判断会不会下雨：
+| 步骤 | 比喻 | 项目里对应什么 |
+|---|---|---|
+| 1 | 找一本天气百科全书给小孩看 | **Dataset**（数据集） |
+| 2 | 让小孩反复看书，学会判断规律 | **Model**（训练模型） |
+| 3 | 把小孩装到一个"天气问答机器人"里，让别人能问他 | **App**（应用） |
+---
+## 3. Dataset（数据集）—— 你拿什么"教"电脑
+### 3.1 这一步在干什么
+机器学习的本质是 **"喂样本，让它自己找规律"**。所以第一件事：**准备样本**。
+### 3.2 你的数据从哪来？
+**来源**：欧洲气象中心（ECMWF）的 **ERA5 数据库**。
+这个数据库**不是预报**，是**对过去天气的"完美回放"**——气象学家会把所有历史观测数据（卫星、气球、地面站）综合起来，反推出"那一天那一刻那个地方真实的天气是怎样的"。
+> **类比**：警察破案时调看监控录像——录像就是 ERA5，是已经发生的事实。
+> 而手机预报是"预测未来"，那是另一回事。
+**学术界把 ERA5 当作真值**——其他预报系统都拿 ERA5 来校准自己。所以拿它训练 ML 模型最合适，因为**答案是可信的**。
+### 3.3 你要了多少数据？
+| 项 | 数值 |
+|---|---|
+| 地点 | 5 个马来西亚山区（云顶、金马仑、福隆港、巴生谷、神山） |
+| 时间 | 2020-01-01 到 2024-12-31，整整 5 年 |
+| 频率 | 每小时一行 |
+| **总行数** | **175 315 行**（17.5 万行） |
+| 每行包含 | 温度、湿度、风速、风向、气压、降雨量等十几个数字 |
+### 3.4 ⭐ 关键问题：原始数据里**没有"答案"**
+这是上次老师**最大的疑惑**。
+原始数据长这样（简化）：
+```
+时间                   温度   湿度   降雨量
+2023-06-01 14:00      25°C   80%   0.0 mm
+2023-06-01 15:00      24°C   85%   0.3 mm
+2023-06-01 16:00      23°C   90%   1.2 mm
+...
+```
+老师看了说："**这里面没有"答案"啊！** 没有一列告诉电脑'这是会下雨的情况'还是'这是不会下雨的情况'——你怎么训练模型？"
+**他说的完全正确**。原始数据只有"现象"，没有"标签"。
+### 3.5 你的解决方案：自己**造**一个答案列
+你想了一个聪明的办法——**用未来发生的事，反过来当现在的答案**：
+```python
+df['is_rain_event'] = (df['precipitation'].shift(-1) > 0.1).astype(int)
+```
+翻译成大白话：**看每一行的"下一个小时"——如果下一小时下雨超过 0.1 毫米，就在这一行标记 1（会下雨）；否则标记 0（不会下雨）。**
+| 时间                | 温度  | 湿度 | 降雨量 | **答案 is_rain_event** |
+|---|---|---|---|---|
+| 2023-06-01 14:00   | 25°C | 80% | 0.0   | **1**（下一小时 0.3 > 0.1） |
+| 2023-06-01 15:00   | 24°C | 85% | 0.3   | **1**（下一小时 1.2 > 0.1） |
+| 2023-06-01 16:00   | 23°C | 90% | 1.2   | **1** |
+> **核心思想**：训练时电脑看到 14:00 那一行的所有特征（温度湿度等），它要预测的"答案"是**那一刻之后会不会下雨**。
+> 这样训练完，未来给它一组当前的天气数据，它就能预测"接下来会不会下雨"。
+### 3.6 这一步有 3 个**必须能讲出来**的细节
+老师如果追问，你要能讲清楚下面这 3 点：
+#### 细节 ① `.shift(-1)` 的意义 —— 没有"作弊"
+`.shift(-1)` 意思是"用未来的数据当答案"。这听起来像作弊，但其实**完全正确**：
+- 训练时：电脑只看"当前"特征，预测"未来"答案
+- 预测时（真实使用）：用户给当前特征，模型预测未来——**用法一致**
+- 如果用"当前"特征预测"当前"是否下雨——那不是预测，是**作弊**
+**专业术语叫"无时间泄漏"**（no temporal leakage）。
+#### 细节 ② 为什么是 0.1 毫米？—— 不是拍脑袋
+0.1 mm 是 **WMO（世界气象组织）官方定义的"微量降水"阈值**——下到 0.1 毫米才算真的下雨，更少的算"湿润空气"。
+这是**国际标准**，不是你随便定的。老师追问时这一点很重要——证明你**读了文献**。
+#### 细节 ③ 为什么是 0/1 二分类，不是预测毫米数？
+这是上次老师的**第二大疑惑**——他认为应该做"回归"（预测降雨多少毫米）。
+你的答案 3 条：
+1. **下游决策本身就是二选一**：登山者只关心"今天能不能去爬山"——出门或不出门，**就是 0/1**
+2. **回归还是要选阈值**：哪怕你预测出 5.2 mm，最后还是要拿一个阈值（比如 1 mm）转成"出门 / 不出门"——**那个阈值反正要选**，不如一开始就用分类
+3. **退路**：API 仍然返回**概率值**（比如"70% 会下雨"），需要连续值的下游组件照样能用——**两全其美**
+---
+## 4. Model（模型）—— 让电脑学会判断
+### 4.1 这一步在干什么
+把 17.5 万行数据**喂**给一个算法，让它**自己找规律**。
+学完之后，未来给它任何一组新天气数据，它能立刻输出"会下雨的概率是 X%"。
+### 4.2 你用了什么算法？
+**Random Forest（随机森林）**——一种经典的传统机器学习算法。
+#### 比喻：随机森林 = 一群医生会诊
+想象你身体不舒服，你不只看一个医生，而是**找 100 个医生分别诊断**——
+- 每个医生看的"病例资料"略有不同（随机抽一部分）
+- 每个医生只关注几个症状（不是全部）
+- 最后**100 个医生投票**，多数说"感冒"那就是感冒
+随机森林就是这个原理——它训练 100 棵小决策树，每棵树看一部分数据、问一部分特征，最后投票决定结果。
+### 4.3 为什么选随机森林，不用 ChatGPT 那种深度学习？
+老师**很可能问这个**。3 条理由：
+#### 理由 ① 可解释性
+随机森林能告诉你"**它为什么这么判断**"——比如"我看到上一小时下了 0.3 毫米雨，所以判断接下来还会下"。
+深度学习是黑盒——它说会下雨，**没人知道它为什么这么说**。
+> 在**安全关键**应用里（关系到登山者性命），可解释性必须有。
+#### 理由 ② 数据量
+深度学习需要**几百万到几千万**条数据才能发挥优势。你只有 17.5 万行——**太少了**，深度学习反而不如随机森林。
+#### 理由 ③ 速度
+随机森林预测一次 **< 1 毫秒**。深度学习要 10 倍以上时间，还要 GPU。
+> 你的 App 要做到"用户点地图立刻出结果"——快是必须的。
+### 4.4 模型训练得怎么样？（这是老师最关心的数字）
+#### 你必须能背的 4 个数字
+| 指标 | 数值 | 大白话翻译 |
+|---|---|---|
+| **ROC AUC** | **0.871** | 整体区分能力的综合分（能否把"会下雨"和"不会下雨"分开），**满分 1.0**——0.87 算"很好" |
+| **Recall（召回率）** | **93.4%** | 真的下了雨的 100 次里，模型成功预警了 93 次（**只漏报 7 次**） |
+| **Brier Score** | **0.138** | 概率校准度——**越低越好**，0.14 算"校准良好" |
+| **测试样本数** | **35 063 条** | 用来打分的数据量（占总数据的 20%） |
+#### 怎么"考试"？—— 时间序列切分
+你**没有**用随机切分（很多人会犯的错）。
+**比喻**：老师出期末考试，如果他用学生平时做过的题来考——那是作弊。必须用**新的**、学生没见过的题。
+你的做法：把 5 年数据按时间顺序排，**最后 1 年（20%）扣下来不给电脑看**，只用前 4 年训练。训练完，拿最后 1 年的数据"考试"——这才公平。
+#### 为什么不用准确率（accuracy）？
+很多人会问"模型准确率多少"。**陷阱**：
+- 马来西亚山区只有 30% 的时间下雨
+- 一个**永远预测"不下雨"的傻瓜模型**，准确率自动是 70%
+- 但它**永远漏报**，登山者会被淋成落汤鸡
+所以你用 **F2 分数** + **召回率** 而不是准确率——这两个指标**重视"不漏报"**。
+> 老师如果追问，就说：**"安全关键应用，漏报比误报严重得多。漏一次真下雨，登山者可能丧命；误报一次，登山者最多取消行程。所以我用 F2 分数，它认为召回率的重要性是精度的 2 倍（β = 2，公式里召回率一侧的权重系数是 β² = 4）。"**
+### 4.5 模型学到了什么？（特征重要性）
+电脑学完之后，能告诉你"它最看重哪些信号"。前 4 个是：
+| 排名 | 特征 | 大白话 |
+|---|---|---|
+| 1 | 上一小时降雨量 | "刚才下了，接下来很可能继续下"——**雨的惯性** |
+| 2-3 | 时间（一天中的几点） | 马来西亚山区**下午 3-5 点最爱下雨**——电脑学会了这个规律 |
+| 4 | 3 小时气压变化 | **气压下降预示风暴来临**——这是经典气象学常识，电脑自己学到了 |
+> 这一段非常加分——证明**你的模型学到的是"物理上有意义"的规律**，不是乱猜。
+---
+## 5. App（应用）—— 把模型包装成产品
+### 5.1 这一步在干什么
+模型本身只是个 `.pkl` 文件——一个 Python 对象。**没法用**。
+App 的工作是：**让用户能用浏览器点地图，立刻看到那个地方的风险评分**。
+### 5.2 整个 App 长什么样？
+```
+用户在浏览器点地图上一个点 (lat, lon)
+            │
+            ▼
+    前端（Vue + Leaflet 地图）
+            │
+            │  HTTP 请求
+            ▼
+    后端（FastAPI）
+            │
+            ├──► 调用 Open-Meteo API：获取这个点当前的实时天气
+            ├──► 调用 Open Topo Data：获取这个点的海拔高度
+            │
+            ├──► 引擎 A：把天气数据喂给训练好的 RF 模型 → 得到下雨概率
+            ├──► 引擎 B：用一组手写规则评估其他危险（雾、风、雷暴）
+            │
+            ▼
+    综合评分（0-100）+ 双语建议返回前端
+            │
+            ▼
+    前端显示：彩色仪表盘 + "建议：可以安全出行" / "警告：暴雨风险"
+```
+### 5.3 ⭐ 双引擎架构 —— 这是项目的**核心创新**
+这是整个项目最值得吹的地方。**老师追问"为什么混合架构"时**你要能讲清楚。
+#### 引擎 A：随机森林 = "经验主义"
+学过 17.5 万条历史数据的"经验"——**它见过的天气模式**它能很准地预测。
+#### 引擎 B：手写规则 = "原则主义"
+一组**人工写的物理规则**：
+```
+如果 海拔 > 3500 米 → 缺氧危险（不管模型说什么，强制报警）
+如果 温度 ≤ -5°C → 冻伤危险
+如果 风速 ≥ 40 km/h → 大风危险
+如果 风向 + 地形 = 迎风坡 → 地形抬升造雨风险
+```
+#### 为什么必须两个一起用？—— 珠峰例子
+**情景**：用户点了一下珠穆朗玛峰（8 848 米）。
+| 只用引擎 A（纯 ML） | 你的混合架构 |
+|---|---|
+| 模型只见过马来西亚的山（最高 1865 米） | 模型仍然给出低概率（"看起来不像会下雨"） |
+| 它说"下雨概率 5%" | **但引擎 B 立刻发现**：海拔 > 3500 → 缺氧；温度 -30°C → 冻伤；风速 80 km/h → 大风 |
+| 系统返回"安全" ❌ | **三个独立否决（Veto）触发** |
+| 登山者去了 → 死 | 综合评分被强制设为 100 = **危险** ✅ |
+> **学术上这叫"Neuro-Symbolic AI（神经-符号 AI）"**——能学的让机器学（神经），物理规律手工编码（符号）。
+> 这不是你瞎编的，是 2020 年后学术界的热门方向，参考文献 Garcez & Lamb 2020。
+### 5.4 App 的技术栈（被问到时回答）
+| 部分 | 用了什么 | 一句话解释 |
+|---|---|---|
+| 前端 | Vue 3 + Leaflet + ECharts | 浏览器里的页面，地图，图表 |
+| 后端 | FastAPI（Python） | 处理用户请求，调模型，返回结果 |
+| 缓存 | SQLite | 同一个点 10 分钟内重复查不用每次都算 |
+| 部署 | Docker | 一键就能在任何机器上跑起来 |
+---
+## 6. 整个项目你"做对了什么"—— 别人吹起来的话
+| # | 做对的事 | 为什么加分 |
+|---|---|---|
+| 1 | 数据来自 ERA5 而不是网上随便爬的 | **业内金标准**，老师不会质疑数据质量 |
+| 2 | 答案列自己工程构造，方法符合 WMO 标准 | 证明**读过文献**，不是拍脑袋 |
+| 3 | 时间序列切分而不是随机切分 | 证明**懂 ML 基础**，没有数据泄漏 |
+| 4 | 用 F2 分数选阈值而不是 F1 | 证明**理解任务背景**——安全关键场景重视召回 |
+| 5 | 混合架构（ML + 规则）而不是纯 ML | 项目的**核心研究贡献** |
+| 6 | 写了 70 个测试，覆盖率 97% | 证明**工程能力**——老师不会怀疑代码可靠性 |
+| 7 | 一行命令 `make evaluate` 复现所有数字 | 评审老师能**独立验证**论文里的每个 claim |
+---
+## 7. 上次汇报老师的 3 大疑惑——逐条解决
+| # | 老师疑惑 | 你现在的回答 |
+|---|---|---|
+| 1 | "App is the last（顺序错了）" | 严格按 dataset → model → app 顺序展示，写在 `pipeline_order.md` 里 |
+| 2 | "Y is missing（没有答案列）" | 自己工程构造的 `is_rain_event`，方法符合 WMO 标准 |
+| 3 | "应该做回归不是分类" | 下游决策是二元的、F2 分数只在分类下有意义、API 仍暴露概率 |
+---
+## 8. 这次汇报你只需要做 4 件事
+### 8.1 开场（30 秒）
+> "老师，感谢您抽时间。接着上次的内容，我做完了 v1.0.0 工程化强化，整条流水线现在可以端到端复现。我按上次的顺序——**dataset、model、app**——给您过一遍新的进展，最后讲我对 Chapter 5 的下一步计划，可以吗？"
+### 8.2 按顺序展示（5 分钟）
+| 步骤 | 打开 | 讲什么 | 时长 |
+|---|---|---|---|
+| 1 | `docs/dataset.md` | "数据来自 ERA5，5 个山点 5 年共 17.5 万行；答案列 `is_rain_event` 我自己构造的，定义在 §5" | 30 秒 |
+| 2 | `figures/01_roc_curve.png` | "测试 AUC 0.871，召回率 93.4%" | 30 秒 |
+| 3 | `figures/03_calibration_curve.png` | "Brier 分数 0.138，校准良好" | 20 秒 |
+| 4 | `figures/04_threshold_sweep.png` | "用 F2 分数选阈值——安全关键场景重视召回" | 20 秒 |
+| 5 | `figures/05_feature_importance.png` | "前 4 个特征：上一小时降雨、时间周期（第 2-3 名）、气压变化——和气象学文献吻合" | 20 秒 |
+| 6 | App（**最后**才打开） | 演示云顶 + 珠峰两个场景 | 90 秒 |
+### 8.3 讲下一步（90 秒）
+打开 `docs/progress_update_brief.html` §4，照着 5 条 Chapter 5 方向讲一遍，然后**请老师拍板：先做哪两条**？
+### 8.4 收尾（30 秒）
+> "明早之前给您发 3 条要点的邮件总结，留个书面确认。谢谢老师。"
+---
+## 9. 老师可能问的"傻"问题（其实不傻）
+| 问题 | 你的回答 |
+|---|---|
+| "你的模型是什么？" | "Random Forest，随机森林" |
+| "为什么不用深度学习？" | "数据量不够，需要可解释性，而且要快" |
+| "测试准确率多少？" | "AUC 0.871，召回率 93.4%——我没用准确率，因为类别不平衡" |
+| "怎么知道没过拟合？" | "做了 5 折时间序列交叉验证，每折 AUC 都在 0.83-0.91" |
+| "Y 是怎么来的？" | "从 precipitation 列工程构造的：下一小时 > 0.1 mm 标 1，0.1 mm 是 WMO 标准" |
+| "为什么是分类不是回归？" | "下游决策本身就是二元的，而且只有分类才能直接优化 F2 分数" |
+| "规则引擎为什么必要？" | "纯 ML 学的是平均，遇到分布外输入（比如珠峰）会失效——规则引擎兜底" |
+| "万一哪天模型挂了？" | "三层降级：模型挂了走启发式 / 异常返回类型化错误 / 规则引擎独立运行" |
+---
+## 10. 终极心法 —— 你只要记住这 5 句话
+1. **"我做的是给登山者用的山区天气危险预警 App。"**（一句话讲清项目）
+2. **"我用 ERA5 历史天气数据，自己构造了答案列 `is_rain_event`，训了一个随机森林模型。"**（数据 + 模型）
+3. **"测试 AUC 0.871，召回率 93.4%——我重视召回因为漏报比误报危险。"**（核心数字）
+4. **"我用混合架构——机器学习 + 手写规则，规则引擎在分布外场景兜底。"**（核心创新）
+5. **"接下来 Chapter 5 我列了 5 个评估方向，请老师建议先做哪两个。"**（请示）
+**这 5 句话能完整回答 90% 的追问。** 其余的细节，遇到了再翻这份文档。
+---
+> 写这份文档的目的：让你**真的懂**自己的项目，而不是背稿子。
+> 懂了，老师怎么问你都不慌——因为你说出来的每一句话都是**你自己想清楚的**。

frontend/index.html ADDED Viewed

	@@ -0,0 +1,579 @@

+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="UTF-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1.0" />
+  <title>MicroClimate-X — Hybrid Microclimate Risk</title>
+  <meta name="description" content="Intelligent meteorological analysis for complex terrain." />
+  <!-- CDN deps -->
+  <script src="https://cdn.tailwindcss.com"></script>
+  <link rel="stylesheet" href="https://unpkg.com/leaflet@1.9.4/dist/leaflet.css" />
+  <script src="https://unpkg.com/leaflet@1.9.4/dist/leaflet.js"></script>
+  <script src="https://unpkg.com/vue@3/dist/vue.global.prod.js"></script>
+  <style>
+    :root { color-scheme: dark; }
+    body { background:#0b0f17; color:#cbd5e1; font-family: ui-sans-serif, system-ui, -apple-system, "Segoe UI", Roboto, "Helvetica Neue", Arial; }
+    .mono { font-family: ui-monospace, "SF Mono", Menlo, Monaco, Consolas, monospace; }
+    .panel { background:#111827; border:1px solid #1f2937; border-radius:14px; }
+    .leaflet-container { background:#0b0f17; }
+    .ring-gauge { transition: stroke-dashoffset 0.8s ease, stroke 0.4s ease; }
+    .log-line { animation: fadeUp 0.25s ease-out both; }
+    @keyframes fadeUp { from { opacity:0; transform: translateY(4px); } to { opacity:1; transform:none; } }
+    .veto-row { animation: blink 1.2s ease-in-out infinite; }
+    @keyframes blink { 0%,100%{opacity:1} 50%{opacity:.55} }
+    .kbd { background:#1f2937; border:1px solid #374151; padding:1px 6px; border-radius:6px; font-size:11px; }
+    .mini-gauge-svg { transition: stroke-dashoffset 0.6s ease, stroke 0.4s ease; }
+    .pill { padding: 4px 10px; border-radius: 999px; font-size: 11px; border:1px solid #374151;
+            color:#94a3b8; transition: background .15s, color .15s, border-color .15s; cursor:pointer; }
+    .pill:hover { color:#e2e8f0; }
+    .pill:focus-visible { outline: 2px solid #34d399; outline-offset: 2px; }
+    .pill-active { background:#34d399; color:#052e2b; border-color:#34d399; font-weight:600; }
+    .rule-badge { padding:2px 6px; font-size:10px; border-radius:6px; background:#1f2937;
+                  border:1px solid #374151; color:#94a3b8; font-family: ui-monospace, monospace; }
+    .rule-badge-fired { background: #422006; border-color: #b45309; color: #fbbf24; }
+    /* Loading spinner — overlays panels while a request is in flight. */
+    .spinner { width:18px; height:18px; border:2px solid #1f2937; border-top-color:#34d399;
+               border-radius:50%; animation: spin 0.75s linear infinite; display:inline-block; }
+    @keyframes spin { to { transform: rotate(360deg); } }
+    /* Toast — bottom-right notification stack. */
+    #toast-host { position: fixed; bottom: 18px; right: 18px; z-index: 9999;
+                  display: flex; flex-direction: column; gap: 8px; pointer-events: none; }
+    .toast { pointer-events: auto; min-width: 240px; max-width: 360px;
+             background:#1f2937; border:1px solid #374151; border-radius:10px;
+             padding: 10px 14px; color:#e2e8f0; font-size:12px;
+             box-shadow: 0 6px 16px rgba(0,0,0,.5);
+             animation: slideIn .25s ease-out; }
+    .toast-err { border-color: #b91c1c; background:#2a0f10; }
+    .toast-ok  { border-color: #047857; background:#062b22; }
+    @keyframes slideIn { from { transform: translateX(20px); opacity:0; } }
+    /* Mobile-first compaction. */
+    @media (max-width: 640px) {
+      .pill { padding: 3px 7px; font-size: 10px; }
+      .activity-bar { gap: 4px; }
+    }
+  </style>
+</head>
+<body class="min-h-screen">
+  <div id="app" class="min-h-screen flex flex-col">
+    <!-- ─── Header ─────────────────────────────────────── -->
+    <header class="border-b border-slate-800 px-5 py-3 flex items-center justify-between">
+      <div class="flex items-center gap-3">
+        <div class="w-9 h-9 rounded-lg bg-emerald-500/15 ring-1 ring-emerald-400/40 flex items-center justify-center text-emerald-300 font-bold">μ</div>
+        <div>
+          <div class="text-slate-100 font-semibold tracking-tight">MicroClimate-X</div>
+          <div class="text-[11px] text-slate-500 mono">Hybrid Microclimate Risk Engine · UKM FYP</div>
+        </div>
+      </div>
+      <div class="flex items-center gap-3 flex-wrap activity-bar">
+        <!-- Demo scenarios -->
+        <select v-model="selectedScenario"
+                @change="onScenarioChange"
+                class="bg-slate-800 text-slate-200 border border-slate-700 rounded-md text-[11px] px-2 py-1 focus:outline-none focus:ring-1 focus:ring-emerald-400"
+                :aria-label="t.scenarios">
+          <option value="" disabled>{{ t.scenarios }}</option>
+          <option v-for="s in SCENARIOS" :key="s.key" :value="s.key">{{ t.scenarioLabels[s.key] }}</option>
+        </select>
+        <!-- Activity selector -->
+        <div class="flex items-center gap-1">
+          <span class="text-[11px] text-slate-500 mr-1 hidden md:inline">{{ t.activity }}</span>
+          <button v-for="a in ACTIVITIES" :key="a"
+                  @click="setActivity(a)"
+                  :aria-label="t.activities[a]"
+                  :aria-pressed="activity===a"
+                  :class="['pill', activity===a && 'pill-active']">
+            {{ t.activities[a] }}
+          </button>
+        </div>
+        <span class="text-slate-700">|</span>
+        <button @click="lang='en'" :class="['px-2.5 py-1 rounded text-xs ring-1 ring-slate-700',
+                                              lang==='en' ? 'bg-emerald-500/20 text-emerald-300 ring-emerald-500/40' : 'text-slate-400 hover:text-slate-200']">EN</button>
+        <button @click="lang='zh'" :class="['px-2.5 py-1 rounded text-xs ring-1 ring-slate-700',
+                                              lang==='zh' ? 'bg-emerald-500/20 text-emerald-300 ring-emerald-500/40' : 'text-slate-400 hover:text-slate-200']">中文</button>
+        <span v-if="loading" class="spinner ml-1" :title="t.loading"></span>
+        <div class="hidden md:flex items-center text-[11px] text-slate-500 gap-2">
+          <span class="kbd">click</span>
+          <span>{{ t.clickHint }}</span>
+        </div>
+      </div>
+    </header>
+    <!-- ─── Main ───────────────────────────────────────── -->
+    <main class="flex-1 grid grid-cols-12 gap-3 p-3">
+      <!-- Map -->
+      <section class="col-span-12 lg:col-span-7 panel overflow-hidden" style="min-height: 60vh;">
+        <div id="map" class="w-full h-full" style="min-height: 60vh;"></div>
+      </section>
+      <!-- Right column -->
+      <aside class="col-span-12 lg:col-span-5 flex flex-col gap-3">
+        <!-- Score card -->
+        <div class="panel p-5">
+          <div class="flex items-center gap-5">
+            <!-- Gauge -->
+            <div class="relative w-28 h-28 shrink-0">
+              <svg viewBox="0 0 120 120" class="w-full h-full -rotate-90">
+                <circle cx="60" cy="60" r="52" stroke="#1f2937" stroke-width="10" fill="none"/>
+                <circle cx="60" cy="60" r="52" :stroke="riskColor" stroke-width="10" fill="none"
+                        stroke-linecap="round"
+                        :stroke-dasharray="2 * Math.PI * 52"
+                        :stroke-dashoffset="2 * Math.PI * 52 * (1 - riskFraction)"
+                        class="ring-gauge"/>
+              </svg>
+              <div class="absolute inset-0 flex items-center justify-center flex-col">
+                <div class="text-3xl font-semibold tracking-tight" :style="{color: riskColor}">{{ display.risk_score ?? '—' }}</div>
+                <div class="text-[10px] uppercase tracking-widest text-slate-500 mono">risk</div>
+              </div>
+            </div>
+            <!-- Meta -->
+            <div class="flex-1 min-w-0">
+              <div class="text-xs uppercase tracking-widest text-slate-500 mono">{{ t.status }}</div>
+              <div class="text-xl font-medium" :style="{color: riskColor}">{{ riskLevelText }}</div>
+              <div class="mt-2 text-xs text-slate-400 mono break-words">
+                <span v-if="display.latitude != null">{{ display.latitude.toFixed(4) }}, {{ display.longitude.toFixed(4) }}</span>
+                <span v-else>{{ t.awaiting }}</span>
+              </div>
+              <div class="mt-1 text-[11px] text-slate-500 mono">
+                <span v-if="display.terrain">{{ t.terrain }}: <span class="text-slate-300">{{ display.terrain }}</span></span>
+                <span v-if="display.elevation_m != null"> · {{ Math.round(display.elevation_m) }} m</span>
+                <span v-if="display.cached" class="ml-2 text-emerald-400">⚡ cached ({{ display.cache_ttl }} s)</span>
+              </div>
+            </div>
+          </div>
+          <p v-if="display.advice_en || display.advice_zh"
+             class="mt-4 text-sm leading-relaxed border-l-2 pl-3"
+             :style="{borderColor: riskColor}">
+            {{ lang === 'zh' ? display.advice_zh : display.advice_en }}
+          </p>
+        </div>
+        <!-- Sub-hazard mini-gauges (D5 §3.7 / P4.3) -->
+        <div class="panel p-4">
+          <div class="flex items-center justify-between text-xs uppercase tracking-widest text-slate-500 mono mb-3">
+            <span>{{ t.subHazards }}</span>
+            <span class="text-slate-600">P4.3 · P4.4</span>
+          </div>
+          <div class="grid grid-cols-4 gap-2">
+            <div v-for="h in HAZARDS" :key="h.key"
+                 class="flex flex-col items-center gap-1"
+                 :title="t.hazardTooltip[h.key]"
+                 :aria-label="t.hazards[h.key] + ' ' + (display.hazard_subscores?.[h.key] ?? '?') + '/100'">
+              <div class="relative w-14 h-14">
+                <svg viewBox="0 0 60 60" class="w-full h-full -rotate-90">
+                  <circle cx="30" cy="30" r="24" stroke="#1f2937" stroke-width="6" fill="none"/>
+                  <circle cx="30" cy="30" r="24" :stroke="subHazardColor(display.hazard_subscores?.[h.key])"
+                          stroke-width="6" fill="none" stroke-linecap="round"
+                          :stroke-dasharray="2 * Math.PI * 24"
+                          :stroke-dashoffset="2 * Math.PI * 24 * (1 - ((display.hazard_subscores?.[h.key] ?? 0) / 100))"
+                          class="mini-gauge-svg"/>
+                </svg>
+                <div class="absolute inset-0 flex items-center justify-center">
+                  <div class="text-[13px] font-semibold mono"
+                       :style="{color: subHazardColor(display.hazard_subscores?.[h.key])}">
+                    {{ display.hazard_subscores?.[h.key] ?? '–' }}
+                  </div>
+                </div>
+              </div>
+              <div class="text-[10px] text-slate-400 text-center leading-tight">
+                {{ t.hazards[h.key] }}
+              </div>
+            </div>
+          </div>
+          <div class="mt-3 flex items-center justify-between text-[10px] text-slate-500 mono">
+            <span>Activity weight: {{ t.activities[display.activity || activity] }}</span>
+            <span>Composite ← max-dominant + 0.2 · others</span>
+          </div>
+        </div>
+        <!-- D5 §3.7.2 Decision Table R1-R4 -->
+        <div class="panel p-4">
+          <div class="flex items-center justify-between text-xs uppercase tracking-widest text-slate-500 mono mb-2">
+            <span>{{ t.decisionTable }}</span>
+            <span class="text-slate-600">§3.7.2 Table 4.2</span>
+          </div>
+          <div class="flex gap-1.5 mb-2">
+            <span v-for="r in ['R1','R2','R3','R4']" :key="r"
+                  :class="['rule-badge', ruleFired(r) && 'rule-badge-fired']">{{ r }}</span>
+          </div>
+          <div v-if="display.decision_table_matches && display.decision_table_matches.length">
+            <p v-for="m in display.decision_table_matches" :key="m.rule"
+               class="text-[12px] text-amber-200 leading-snug pl-1">
+              <span class="mono text-amber-400">{{ m.rule }}</span>
+              · {{ lang === 'zh' ? m.conclusion_zh : m.conclusion_en }}
+            </p>
+          </div>
+          <p v-else class="text-[11px] text-slate-500">{{ t.noRuleFired }}</p>
+        </div>
+        <!-- Veto block -->
+        <div v-if="display.veto_triggers && display.veto_triggers.length"
+             class="panel p-4 border-red-500/40">
+          <div class="text-xs uppercase tracking-widest text-red-400 mono mb-2">{{ t.veto }}</div>
+          <ul class="space-y-1.5">
+            <li v-for="v in display.veto_triggers" :key="v.rule"
+                class="veto-row text-sm text-red-200 flex gap-2">
+              <span class="text-red-400 mono shrink-0">▶</span>
+              <span>{{ lang === 'zh' ? v.message_zh : v.message_en }}</span>
+            </li>
+          </ul>
+        </div>
+        <!-- ML probability bar -->
+        <div class="panel p-4">
+          <div class="flex items-center justify-between text-xs text-slate-400 mono mb-2">
+            <span>{{ t.mlProb }}</span>
+            <span class="text-slate-200">{{ display.ml_rain_probability != null ? (display.ml_rain_probability * 100).toFixed(1) + '%' : '—' }}</span>
+          </div>
+          <div class="w-full h-2 bg-slate-800 rounded-full overflow-hidden">
+            <div class="h-full transition-all duration-700" :style="{
+                  width: ((display.ml_rain_probability ?? 0) * 100) + '%',
+                  background: 'linear-gradient(90deg, #34d399, #fbbf24, #ef4444)'
+                }"></div>
+          </div>
+          <div class="mt-1 text-[10px] text-slate-500 mono">Engine A · Random Forest</div>
+        </div>
+        <!-- XAI log -->
+        <div class="panel p-4 flex-1 min-h-[200px] flex flex-col">
+          <div class="flex items-center justify-between text-xs uppercase tracking-widest text-slate-500 mono mb-2">
+            <span>{{ t.inferenceLog }}</span>
+            <span class="text-slate-600">XAI</span>
+          </div>
+          <div ref="logScroll" class="flex-1 overflow-auto text-[12px] mono space-y-1 pr-1">
+            <div v-if="!display.inference_log || !display.inference_log.length" class="text-slate-600">{{ t.awaiting }}</div>
+            <div v-for="(s, i) in display.inference_log" :key="i"
+                 class="log-line flex gap-2"
+                 :class="logColor(s.kind)">
+              <span class="shrink-0 w-12 text-slate-500">[{{ s.kind }}]</span>
+              <span>{{ lang === 'zh' ? s.text_zh : s.text_en }}</span>
+            </div>
+          </div>
+        </div>
+      </aside>
+    </main>
+    <!-- ─── Footer ─────────────────────────────────────── -->
+    <footer class="px-5 py-2 text-[11px] mono text-slate-600 border-t border-slate-800 flex flex-wrap items-center justify-between gap-2">
+      <span>API: <span class="text-slate-400">{{ apiBase }}</span></span>
+      <span>{{ t.disclaimer }}</span>
+    </footer>
+    <!-- ─── Toast host ─────────────────────────────────── -->
+    <div id="toast-host" aria-live="polite">
+      <div v-for="t in toasts" :key="t.id"
+           :class="['toast', t.kind === 'error' ? 'toast-err' : 'toast-ok']"
+           role="status">
+        {{ t.text }}
+      </div>
+    </div>
+  </div>
+  <script>
+    const { createApp, reactive, computed, ref, onMounted, watch, nextTick } = Vue;
+    // Activity profiles rendered as selector pills in the header; the selected
+    // value is sent as the `activity` query parameter of /api/predict.
+    const ACTIVITIES = ["hiker", "driver", "construction", "general"];
+    // Sub-hazard keys rendered as mini-gauges. Each key indexes
+    // display.hazard_subscores and the I18N `hazards` / `hazardTooltip` maps.
+    const HAZARDS = [
+      { key: "rainfall" },
+      { key: "fog" },
+      { key: "wind_gust" },
+      { key: "thunderstorm" },
+    ];
+    // Preset demo locations for the "Quick scenarios" dropdown. `key` indexes
+    // I18N `scenarioLabels`; lat/lon are what onScenarioChange flies to and queries.
+    const SCENARIOS = [
+      { key: "genting",      lat: 3.4225,   lon: 101.7935 },   // Genting Highlands
+      { key: "cameron",      lat: 4.4710,   lon: 101.3779 },   // Cameron valley
+      { key: "kinabalu",     lat: 6.0747,   lon: 116.5586 },   // Mt Kinabalu
+      { key: "everest",      lat: 27.9881,  lon: 86.9250  },   // Mt Everest (OOD)
+      { key: "singapore",    lat: 1.3521,   lon: 103.8198 },   // Flat tropical
+    ];
+    const I18N = {
+      en: {
+        clickHint: "any point on the map for analysis",
+        status:    "Status",
+        awaiting:  "Click any coordinate to analyse…",
+        terrain:   "Terrain",
+        mlProb:    "Rain probability (next hour)",
+        veto:      "Veto triggers",
+        inferenceLog: "Inference log",
+        disclaimer: "Decision-support only. Always consult official forecasts.",
+        levels: { Safe:"Safe", Caution:"Caution", Warning:"Warning", Danger:"Danger" },
+        activity: "Activity",
+        activities: { hiker:"🥾 Hiker", driver:"🚗 Driver", construction:"🏗️ Construction", general:"🧭 General" },
+        subHazards:  "Hazard breakdown",
+        hazards: { rainfall:"Rainfall", fog:"Fog", wind_gust:"Wind gust", thunderstorm:"Thunderstorm" },
+        hazardTooltip: {
+          rainfall:     "Macro rain probability + terrain amplification.",
+          fog:          "Humidity, dew-point depression, cloud cover & basin geometry.",
+          wind_gust:    "Sustained wind + ridge/pass acceleration.",
+          thunderstorm: "CAPE instability + falling pressure precursor.",
+        },
+        decisionTable: "Decision table",
+        noRuleFired:   "No D5 §3.7.2 rule fired for this scenario.",
+        scenarios:     "Quick scenarios",
+        scenarioLabels: {
+          genting:   "🇲🇾 Genting Highlands · slope",
+          cameron:   "🇲🇾 Cameron Highlands · valley",
+          kinabalu:  "🇲🇾 Mt Kinabalu · 4 095 m peak",
+          everest:   "🏔️ Mt Everest · 8 848 m (OOD)",
+          singapore: "🌴 Singapore · flat tropical",
+        },
+        loading: "Loading…",
+        errorTitle: "Request failed",
+      },
+      zh: {
+        clickHint: "点击地图任意位置开始分析",
+        status:    "状态",
+        awaiting:  "请在地图上点击任意坐标开始分析…",
+        terrain:   "地形",
+        mlProb:    "未来一小时降雨概率",
+        veto:      "一票否决",
+        inferenceLog: "推理日志",
+        disclaimer: "仅供辅助决策，请同时参考官方气象预报。",
+        levels: { Safe:"安全", Caution:"注意", Warning:"警告", Danger:"危险" },
+        activity: "活动",
+        activities: { hiker:"🥾 徒步", driver:"🚗 驾驶", construction:"🏗️ 施工", general:"🧭 通用" },
+        subHazards:  "分项灾害评分",
+        hazards: { rainfall:"降雨", fog:"雾", wind_gust:"阵风", thunderstorm:"雷暴" },
+        hazardTooltip: {
+          rainfall:     "宏观降雨概率 + 地形放大。",
+          fog:          "湿度、露点温差、云量、盆地汇雾。",
+          wind_gust:    "持续风速 + 山脊/山口加速。",
+          thunderstorm: "CAPE 不稳定 + 气压骤降前兆。",
+        },
+        decisionTable: "决策表",
+        noRuleFired:   "当前场景未触发 D5 §3.7.2 中的任何规则。",
+        scenarios:     "快速场景",
+        scenarioLabels: {
+          genting:   "🇲🇾 云顶高原 · 山坡",
+          cameron:   "🇲🇾 金马仑高原 · 山谷",
+          kinabalu:  "🇲🇾 神山 · 4 095 m 山峰",
+          everest:   "🏔️ 珠穆朗玛 · 8 848 m （OOD）",
+          singapore: "🌴 新加坡 · 热带平原",
+        },
+        loading: "加载中…",
+        errorTitle: "请求失败",
+      },
+    };
+    createApp({
+      setup() {
+        const lang = ref(localStorage.getItem("mcx_lang") || "en");
+        const activity = ref(localStorage.getItem("mcx_activity") || "hiker");
+        const loading = ref(false);
+        const toasts = reactive([]);
+        const selectedScenario = ref("");
+        const t = computed(() => I18N[lang.value]);
+        watch(lang, v => localStorage.setItem("mcx_lang", v));
+        const apiBase = (() => {
+          const meta = document.querySelector('meta[name="api-base"]');
+          if (meta) return meta.content;
+          if (location.protocol === "file:") return "http://localhost:8000";
+          return location.origin;
+        })();
+        // Reactive view-model bound to the template. The values below are the
+        // empty state shown before any response arrives; fetchPrediction merges
+        // the /api/predict JSON payload into this object with Object.assign.
+        // NOTE(review): field names presumably mirror the backend response
+        // schema — confirm against the API before renaming anything here.
+        const display = reactive({
+          latitude: null,
+          longitude: null,
+          elevation_m: null,
+          terrain: null,
+          ml_rain_probability: null,
+          risk_score: null,
+          risk_level: null,
+          veto_triggers: [],
+          inference_log: [],
+          advice_en: "",
+          advice_zh: "",
+          cached: false,
+          cache_ttl: 0,
+          hazard_subscores: null,
+          decision_table_matches: [],
+          activity: null,
+        });
+        const riskFraction = computed(() =>
+          display.risk_score == null ? 0 : Math.max(0, Math.min(1, display.risk_score / 100))
+        );
+        const riskColor = computed(() => {
+          const s = display.risk_score ?? -1;
+          if (s < 0) return "#475569";
+          if (s >= 80) return "#ef4444";
+          if (s >= 55) return "#f97316";
+          if (s >= 30) return "#fbbf24";
+          return "#34d399";
+        });
+        const riskLevelText = computed(() => {
+          if (!display.risk_level) return "—";
+          return t.value.levels[display.risk_level] || display.risk_level;
+        });
+        const logColor = (kind) => ({
+          info:     "text-slate-300",
+          ml:       "text-cyan-300",
+          rule:     "text-amber-300",
+          veto:     "text-red-400 font-medium",
+          score:    "text-emerald-300",
+          hazard:   "text-violet-300",
+          table:    "text-amber-200 font-medium",
+          activity: "text-emerald-200",
+        }[kind] || "text-slate-400");
+        const subHazardColor = (score) => {
+          if (score == null) return "#475569";
+          if (score >= 80) return "#ef4444";
+          if (score >= 55) return "#f97316";
+          if (score >= 30) return "#fbbf24";
+          return "#34d399";
+        };
+        const ruleFired = (rule) =>
+          (display.decision_table_matches || []).some(m => m.rule === rule);
+        const logScroll = ref(null);
+        watch(() => display.inference_log, async () => {
+          await nextTick();
+          if (logScroll.value) logScroll.value.scrollTop = logScroll.value.scrollHeight;
+        }, { deep: true });
+        let map, marker;
+        function pushToast(text, kind = "ok", ttl = 4500) {
+          const item = { id: Date.now() + Math.random(), text, kind };
+          toasts.push(item);
+          setTimeout(() => {
+            const i = toasts.findIndex(x => x.id === item.id);
+            if (i >= 0) toasts.splice(i, 1);
+          }, ttl);
+        }
+        async function fetchPrediction(lat, lon) {
+          // typewriter — pre-clear and show "thinking"
+          display.inference_log = [
+            { kind: "info",
+              text_en: `Querying (${lat.toFixed(4)}, ${lon.toFixed(4)}) for activity=${activity.value}…`,
+              text_zh: `查询坐标 (${lat.toFixed(4)}, ${lon.toFixed(4)})，活动类型 ${activity.value}…` },
+          ];
+          loading.value = true;
+          try {
+            const r = await fetch(
+              `${apiBase}/api/predict?lat=${lat}&lon=${lon}&activity=${encodeURIComponent(activity.value)}`
+            );
+            if (!r.ok) {
+              let body;
+              try { body = await r.json(); } catch (_) { body = {}; }
+              const msg = body?.detail || `HTTP ${r.status}`;
+              throw new Error(msg);
+            }
+            const data = await r.json();
+            Object.assign(display, data);
+            const full = data.inference_log || [];
+            display.inference_log = [];
+            for (let i = 0; i < full.length; i++) {
+              await new Promise(res => setTimeout(res, 90));
+              display.inference_log.push(full[i]);
+            }
+          } catch (err) {
+            const text = (lang.value === "zh"
+              ? `${t.value.errorTitle}：${err.message}`
+              : `${t.value.errorTitle}: ${err.message}`);
+            pushToast(text, "error", 6000);
+            display.inference_log.push({
+              kind: "veto",
+              text_en: `Request failed: ${err.message}. Is the API running on ${apiBase}?`,
+              text_zh: `请求失败：${err.message}。请确认 API 是否运行在 ${apiBase}。`,
+            });
+          } finally {
+            loading.value = false;
+          }
+        }
+        function onClick(e) {
+          const { lat, lng } = e.latlng;
+          display.latitude  = lat;
+          display.longitude = lng;
+          if (marker) marker.setLatLng([lat, lng]);
+          else marker = L.marker([lat, lng]).addTo(map);
+          fetchPrediction(lat, lng);
+        }
+        function setActivity(a) {
+          activity.value = a;
+          localStorage.setItem("mcx_activity", a);
+          if (display.latitude != null && display.longitude != null) {
+            fetchPrediction(display.latitude, display.longitude);
+          }
+        }
+        function onScenarioChange() {
+          const s = SCENARIOS.find(x => x.key === selectedScenario.value);
+          if (!s) return;
+          display.latitude  = s.lat;
+          display.longitude = s.lon;
+          map.flyTo([s.lat, s.lon], 10, { duration: 1.2 });
+          if (marker) marker.setLatLng([s.lat, s.lon]);
+          else marker = L.marker([s.lat, s.lon]).addTo(map);
+          fetchPrediction(s.lat, s.lon);
+        }
+        async function checkBackendHealth() {
+          try {
+            const r = await fetch(`${apiBase}/api/health`, { cache: "no-store" });
+            if (!r.ok) throw new Error(`HTTP ${r.status}`);
+            const h = await r.json();
+            if (!h.ml_loaded) {
+              pushToast(
+                lang.value === "zh"
+                  ? "未检测到训练模型，正在使用启发式回退。运行 make train 后即可启用 Random Forest。"
+                  : "No trained model found — running on heuristic fallback. Run `make train` to enable Random Forest.",
+                "error", 7000);
+            }
+          } catch (_e) {
+            // The first /api/predict call will surface its own error toast.
+          }
+        }
+        onMounted(() => {
+          map = L.map("map", {
+            center: [3.4225, 101.7935],  // Genting Highlands
+            zoom: 9,
+            zoomControl: true,
+          });
+          const dark = L.tileLayer(
+            "https://{s}.basemaps.cartocdn.com/dark_all/{z}/{x}/{y}{r}.png",
+            { attribution: "© OpenStreetMap, © CARTO", maxZoom: 19 }
+          );
+          const topo = L.tileLayer(
+            "https://{s}.tile.opentopomap.org/{z}/{x}/{y}.png",
+            { attribution: "© OpenTopoMap, © OpenStreetMap", maxZoom: 17 }
+          );
+          dark.addTo(map);
+          L.control.layers(
+            { "Dark": dark, "Topographic": topo },
+            {}, { position: "bottomleft", collapsed: true }
+          ).addTo(map);
+          map.on("click", onClick);
+          checkBackendHealth();
+          // Auto-trigger an initial demo query for Genting Highlands.
+          setTimeout(() => onClick({ latlng: { lat: 3.4225, lng: 101.7935 } }), 600);
+        });
+        return {
+          lang, t, display, riskFraction, riskColor, riskLevelText,
+          logColor, logScroll, apiBase,
+          activity, setActivity, subHazardColor, ruleFired,
+          ACTIVITIES, HAZARDS, SCENARIOS,
+          selectedScenario, onScenarioChange,
+          loading, toasts,
+        };
+      },
+    }).mount("#app");
+  </script>
+</body>
+</html>

models/.gitkeep ADDED Viewed

File without changes

models/MODEL_CARD.md ADDED Viewed

	@@ -0,0 +1,133 @@

+# Model Card — MicroClimate-X Rain Predictor (Random Forest v1.0)
+> Following the *Model Card* methodology of Mitchell et al. (2019).
+> Authored: 2026-05-11 · UKM Final Year Project · KyoukoLi
+---
+## 1. Model Details
+| Field | Value |
+|---|---|
+| **Model name** | MicroClimate-X RF Rain Predictor |
+| **Version** | 1.0.0 |
+| **Architecture** | `sklearn.ensemble.RandomForestClassifier` |
+| **Hyper-parameters** | `n_estimators=200, max_depth=None, class_weight='balanced', n_jobs=-1, random_state=42` |
+| **Features (n=18)** | `elevation_m`, `temperature_c`, `humidity_pct`, `wind_speed_kmh`, `wind_direction_deg`, `pressure_hpa`, `dew_point_c`, `cloud_cover_pct`, `cape_jkg`, `wind_u`, `wind_v`, `hour_sin`, `hour_cos`, `month_sin`, `month_cos`, `dew_point_depression`, `pressure_change_3h`, `precipitation_lag_1h` (the exact training-time order is recorded in `models/feature_columns.json`) |
+| **Target** | `is_rain_event` ∈ {0, 1} — defined as `precipitation(t+1h) > 0.1 mm` |
+| **Output** | `predict_proba(...)[:, 1]` — probability of rain in the next hour (raw Random Forest output; no post-hoc calibration is applied, see §4.2) |
+| **Author / Contact** | Li Zhenyue (`KyoukoLi`), Faculty of Information Science & Technology, UKM |
+| **Licence** | MIT (see `LICENSE`) |
+---
+## 2. Intended Use
+* **Primary use case**: terrain-aware rain-risk decision support inside the MicroClimate-X *hybrid* pipeline. The RF probability is one input among many — the topographic Rule Engine has *final authority* (Veto cascade + R1-R4 decision table).
+* **Intended users**: hikers, drivers, construction crews, and other outdoor decision makers in complex terrain (initially Malaysian mountain regions).
+* **Out-of-scope uses**:
+  * Lightning forecasting (CAPE → thunderstorm risk is handled by the rule engine sub-scorer, not by this model).
+  * Multi-hour quantitative precipitation forecasting.
+  * Aviation, marine, or any life-critical use without the Rule Engine veto layer in the loop.
+---
+## 3. Training Data
+| Field | Value |
+|---|---|
+| **Source** | ECMWF ERA5 Reanalysis (via Open-Meteo Historical Archive API) |
+| **Spatial coverage** | 5 sites across Peninsular Malaysia and Borneo (Genting Highlands, Cameron Highlands, Fraser's Hill, Klang Valley, Mt Kinabalu base) |
+| **Temporal coverage** | 2020-01-01 → 2023-12-31 (4 years, hourly) |
+| **Total rows** | 175 315 |
+| **Class balance** | 29.2 % positive (rain-event), 70.8 % negative |
+| **Train / test split** | Time-based; 80 % oldest → train; 20 % newest → test. **No random shuffling** — would leak temporal autocorrelation. |
+| **Synthetic fallback** | `scripts/1b_synth_dataset.py` generates a physically-plausible synthetic replacement when the Open-Meteo API is unreachable. The synthetic data set has the same schema and is sufficient for end-to-end pipeline verification but should **not** be used to ship a production model. |
+---
+## 4. Evaluation — Held-out 20 % temporal test set (n = 35 063)
+Numbers below come from `figures/evaluation_summary.json`, reproducible via `make evaluate`.
+### 4.1 Discrimination
+| Metric | Value |
+|---|---|
+| ROC AUC | **0.871** |
+| PR Average Precision | **0.750** |
+| Test-set base rate | 0.292 |
+### 4.2 Calibration
+| Metric | Value |
+|---|---|
+| Brier score | **0.138** (lower is better; 0 is perfect, 0.25 is the score of an uninformative constant-0.5 forecast) |
+The reliability diagram (`figures/03_calibration_curve.png`) shows the predicted probability tracks the empirical frequency closely; no post-hoc calibration (Platt / isotonic) was deemed necessary.
+### 4.3 Operating point — safety-critical threshold
+| Threshold τ | F1 | F2 | Precision | Recall |
+|---|---|---|---|---|
+| 0.50 (default) | 0.696 | 0.694 | 0.700 | 0.692 |
+| **0.20 (chosen)** | 0.621 | **0.778** | 0.466 | **0.934** |
+We adopt **τ = 0.20** because the application is **safety-critical**: a missed rain event (false negative) on a windward slope can cascade into orographic flash flooding. F2 (β = 2) treats recall as twice as important as precision (recall enters the F-β formula with weight β² = 4) and is the appropriate metric for this regime (Sasaki, 2007).
+### 4.4 Confusion matrix at τ = 0.20
+|              | Pred = 0 | Pred = 1 |
+|---|---|---|
+| **True = 0** | 13 877 (TN) | 10 950 (FP) |
+| **True = 1** | 679 (FN)    | 9 557 (TP) |
+Recall = 9 557 / (9 557 + 679) = **93.4 %** — the operationally important metric for "do not let people walk into a storm".
+### 4.5 Top feature importances
+1. `precipitation_lag_1h` — recent rain is by far the strongest signal (rain begets rain).
+2. `hour_cos` / `hour_sin` — diurnal cycle (afternoon convective storms in tropical climates).
+3. `pressure_change_3h` — falling pressure is a classical storm precursor.
+4. `wind_v` — meridional wind component, relevant for monsoon-driven precipitation.
+5. `dew_point_c` / `dew_point_depression` / `temperature_c` — moisture saturation indicators.
+---
+## 5. Quantitative Limitations
+* **Geographic generalisation** — the model has only seen five Malaysian sites. Hindcast validation in other tropical mountainous regions is a planned thesis Chapter 5 contribution; until then, the Rule Engine Veto cascade is the only safety net for out-of-distribution coordinates (e.g. Himalayas).
+* **Convective forecasting** — the model uses *current-hour* features to predict *next-hour* rain. Forecasting horizon > 1 h would degrade accuracy substantially.
+* **Class imbalance** — addressed via `class_weight='balanced'` and the F2-optimal threshold, but precision at τ = 0.20 is moderate (47 %). False positives are tolerable because they only inflate the *rainfall sub-score*; the composite-score formula combines this with three other hazards.
+* **Calibration drift** — Brier = 0.138 on the temporal hold-out (the newest 20 % of the data). Calibration should be re-checked annually as climate signals shift.
+---
+## 6. Ethical / Safety Considerations
+* **Decision-support only.** The system is explicitly **not** a substitute for official meteorological forecasts; the disclaimer is shown in every UI footer.
+* **Hidden risk surfaced, not hidden.** The R1 decision-table rule deliberately raises an alarm when *macro* model probability is low but local terrain inputs suggest hidden orographic rain — this is the OPPOSITE of the harmful failure mode where ML over-confidently says "safe".
+* **Mt-Everest test (worst-case OOD).** When fed coordinates the model has never seen, the RF returns ~0 % rain probability — and the Rule Engine then immediately vetoes on `altitude_hypoxia + extreme_cold + gale_wind`. See `tests/test_rule_engine.py::test_mt_everest_veto_hypoxia`.
+---
+## 7. Reproducibility
+```bash
+# Full pipeline from scratch — works offline via the synthetic dataset.
+make install-dev
+make synth          # OR: download real data via scripts/1_download_dataset.py
+make preprocess
+make train
+make evaluate       # writes figures/*.png + figures/evaluation_summary.json
+```
+The seed is fixed (`random_state=42`) and figures are written to `figures/` so the thesis can pull them in directly.
+---
+## 8. Citation
+If you reference this model in academic work, please cite:
+> Li Zhenyue (KyoukoLi). *MicroClimate-X: A Hybrid Microclimate Risk Engine for Complex Terrain*. Bachelor's Thesis, Universiti Kebangsaan Malaysia, Faculty of Information Science & Technology, 2026. GitHub: <https://github.com/KyoukoLi/microclimate-x>

models/feature_columns.json ADDED Viewed

	@@ -0,0 +1,20 @@

+[
+  "elevation_m",
+  "temperature_c",
+  "humidity_pct",
+  "wind_speed_kmh",
+  "wind_direction_deg",
+  "wind_u",
+  "wind_v",
+  "pressure_hpa",
+  "pressure_change_3h",
+  "dew_point_c",
+  "dew_point_depression",
+  "cloud_cover_pct",
+  "cape_jkg",
+  "precipitation_lag_1h",
+  "hour_sin",
+  "hour_cos",
+  "month_sin",
+  "month_cos"
+]

models/training_report.json ADDED Viewed

	@@ -0,0 +1,82 @@

+{
+  "n_train": 140250,
+  "n_test": 35065,
+  "class_balance": 0.3082679747882383,
+  "cv_fold_metrics": [
+    {
+      "fold": 1,
+      "precision": 0.6098984999550885,
+      "recall": 0.8534439416792358,
+      "f1": 0.7114044737807114,
+      "f2": 0.7903252089298601,
+      "auc": 0.8658920922848545
+    },
+    {
+      "fold": 2,
+      "precision": 0.6706632265897708,
+      "recall": 0.6446389496717724,
+      "f1": 0.6573936328473668,
+      "f2": 0.6496809668029051,
+      "auc": 0.8450208663371146
+    },
+    {
+      "fold": 3,
+      "precision": 0.5280549297285699,
+      "recall": 0.7822631913541005,
+      "f1": 0.6305002241721642,
+      "f2": 0.7135608454869669,
+      "auc": 0.828111331389444
+    },
+    {
+      "fold": 4,
+      "precision": 0.5639066975855954,
+      "recall": 0.7033004423273223,
+      "f1": 0.6259368612309789,
+      "f2": 0.6701682715689136,
+      "auc": 0.8407467041985305
+    },
+    {
+      "fold": 5,
+      "precision": 0.7484357589783149,
+      "recall": 0.8668718356001192,
+      "f1": 0.803311867525299,
+      "f2": 0.8402779114301661,
+      "auc": 0.9082845804487562
+    }
+  ],
+  "test_metrics": {
+    "f1": 0.685783089546914,
+    "f2": 0.7235752465557479,
+    "auc": 0.8709626679626591,
+    "confusion_matrix": [
+      [
+        20330,
+        4499
+      ],
+      [
+        2547,
+        7689
+      ]
+    ]
+  },
+  "feature_importance": {
+    "precipitation_lag_1h": 0.37103009181018626,
+    "hour_cos": 0.11580750850535977,
+    "hour_sin": 0.07037540088518035,
+    "pressure_change_3h": 0.047174819845785594,
+    "wind_v": 0.041368375623903254,
+    "dew_point_c": 0.04043788445078633,
+    "dew_point_depression": 0.039252614064941044,
+    "temperature_c": 0.037485880642672,
+    "pressure_hpa": 0.0373177439776536,
+    "cloud_cover_pct": 0.03461861797659651,
+    "wind_u": 0.03413653721205715,
+    "humidity_pct": 0.033652723237235005,
+    "wind_direction_deg": 0.03199287061898489,
+    "wind_speed_kmh": 0.026890889422381343,
+    "month_cos": 0.013067682406623812,
+    "month_sin": 0.01302571181506734,
+    "elevation_m": 0.012364647504585904,
+    "cape_jkg": 0.0
+  }
+}

pyproject.toml ADDED Viewed

	@@ -0,0 +1,45 @@

+[project]
+name = "microclimate-x"
+version = "1.0.0"
+description = "Hybrid Microclimate Risk Engine for Complex Terrain — UKM FYP."
+readme = "README.md"
+requires-python = ">=3.9"
+license = { text = "MIT" }
+authors = [{ name = "Li Zhenyue (KyoukoLi)" }]
+[tool.ruff]
+line-length = 110
+target-version = "py39"
+extend-exclude = [".venv", "data", "models", "figures", "htmlcov"]
+[tool.ruff.lint]
+# E: pycodestyle errors    F: pyflakes    I: isort     UP: pyupgrade
+# B: flake8-bugbear        SIM: simplify  RUF: ruff-native
+# Not enabled in `select` below:  N: pep8-naming   ANN: annotations
+select = ["E", "F", "I", "UP", "B", "SIM", "RUF"]
+ignore = [
+    "E501",   # line-too-long — config.py has long comment citations on purpose
+    "B008",   # function calls in argument defaults — FastAPI Query(...) idiom
+    "UP007",  # `X | Y` syntax — pydantic on py3.9 needs eval_type_backport anyway
+    "UP045",  # same
+    "RUF001", # ambiguous unicode chars — bilingual EN/ZH strings legitimately use them
+    "RUF002", # docstring ambiguous unicode chars
+    "RUF003", # comment ambiguous unicode chars
+    "SIM117", # combined `with` — readability over compactness here
+]
+[tool.ruff.lint.per-file-ignores]
+"tests/*"   = ["E402", "F401"]  # tests sometimes reorder imports for env setup
+"scripts/*" = ["E402"]          # scripts often set up paths before importing
+[tool.ruff.format]
+quote-style = "double"
+indent-style = "space"
+[tool.pytest.ini_options]
+testpaths = ["tests"]
+addopts = "-ra --strict-markers"
+asyncio_mode = "auto"
+filterwarnings = [
+    "ignore::DeprecationWarning:pydantic.*",
+]

requirements-dev.txt ADDED Viewed

	@@ -0,0 +1,14 @@

+-r requirements.txt
+# Test infrastructure
+pytest>=7.4.0
+pytest-asyncio>=0.23.0
+pytest-cov>=4.1.0
+respx>=0.23.0
+httpx>=0.27.0
+# Linter / formatter — this is only a lower bound; pin an exact version (ruff==X.Y.Z) if CI must be reproducible
+ruff>=0.6.0
+# Plotting (for scripts/4_evaluate_model.py)
+matplotlib>=3.8.0

requirements.txt ADDED Viewed

	@@ -0,0 +1,17 @@

+# Backend
+fastapi>=0.110.0
+uvicorn[standard]>=0.27.0
+pydantic>=2.5.0
+httpx>=0.27.0
+tenacity>=8.2.3
+eval_type_backport>=0.2.0   # lets pydantic resolve `X | Y` on Python 3.9
+# Data & ML
+pandas>=2.1.0
+numpy>=1.26.0
+scikit-learn>=1.4.0
+joblib>=1.3.0
+# Testing
+pytest>=7.4.0
+pytest-asyncio>=0.23.0

scripts/1_download_dataset.py ADDED Viewed

	@@ -0,0 +1,138 @@

+"""
+Step 1 / Dataset Download
+==========================
+Downloads hourly historical weather data from Open-Meteo Historical Weather API
+(backed by ECMWF ERA5 reanalysis) for 5 Malaysian mountain locations,
+plus elevation data from Open-Topo-Data (SRTM DEM).
+Parameters as confirmed with supervisor:
+    - Location: Malaysia (mountain regions)
+    - Time range: 2020-01-01 to 2023-12-31
+    - Variables: temperature_2m, relative_humidity_2m, precipitation,
+                 wind_speed_10m, wind_direction_10m, surface_pressure
+                 (the script additionally requests dew_point_2m, cloud_cover
+                 and cape — see HOURLY_VARS below)
+Output: data/raw_<site>.csv  (one file per location)
+Run:  python scripts/1_download_dataset.py
+"""
+from __future__ import annotations
+import sys
+import time
+from pathlib import Path
+import httpx
+import pandas as pd
+ROOT = Path(__file__).resolve().parent.parent
+DATA_DIR = ROOT / "data"
+DATA_DIR.mkdir(exist_ok=True)
+# Malaysian mountain locations (lat, lon, name).
+# Chosen to span Peninsular Malaysia + Borneo and cover diverse terrain:
+# valleys, highlands, and one extreme peak for OOD reference.
+SITES = [
+    ("genting_highlands", 3.4225, 101.7935),
+    ("cameron_highlands", 4.4694, 101.3776),
+    ("frasers_hill",      3.7256, 101.7378),
+    ("klang_valley",      3.0738, 101.5183),
+    ("mt_kinabalu_base",  6.0535, 116.5586),
+]
+START_DATE = "2020-01-01"
+END_DATE   = "2023-12-31"
+HOURLY_VARS = [
+    "temperature_2m",
+    "relative_humidity_2m",
+    "precipitation",
+    "wind_speed_10m",
+    "wind_direction_10m",
+    "surface_pressure",
+    "dew_point_2m",
+    "cloud_cover",
+    "cape",
+]
+OPEN_METEO_URL = "https://archive-api.open-meteo.com/v1/archive"
+OPEN_TOPO_URL  = "https://api.opentopodata.org/v1/srtm30m"
+def fetch_elevation(lat: float, lon: float) -> float:
+    """Fetch ground elevation in meters from Open-Topo-Data (SRTM 30m)."""
+    resp = httpx.get(
+        OPEN_TOPO_URL,
+        params={"locations": f"{lat},{lon}"},
+        timeout=30.0,
+    )
+    resp.raise_for_status()
+    data = resp.json()
+    return float(data["results"][0]["elevation"])
+def fetch_hourly(lat: float, lon: float) -> pd.DataFrame:
+    """Fetch hourly historical weather data for the configured date range."""
+    resp = httpx.get(
+        OPEN_METEO_URL,
+        params={
+            "latitude":   lat,
+            "longitude":  lon,
+            "start_date": START_DATE,
+            "end_date":   END_DATE,
+            "hourly":     ",".join(HOURLY_VARS),
+            "timezone":   "Asia/Kuala_Lumpur",
+            "windspeed_unit": "kmh",
+        },
+        timeout=120.0,
+    )
+    resp.raise_for_status()
+    payload = resp.json()
+    df = pd.DataFrame(payload["hourly"])
+    df["time"] = pd.to_datetime(df["time"])
+    return df
+def download_site(name: str, lat: float, lon: float) -> Path:
+    out = DATA_DIR / f"raw_{name}.csv"
+    if out.exists():
+        print(f"  [skip] {name}: already exists at {out}")
+        return out
+    print(f"  [elev] fetching elevation for {name} ({lat}, {lon})…")
+    elev = fetch_elevation(lat, lon)
+    print(f"         elevation = {elev:.1f} m")
+    print(f"  [hourly] fetching weather time-series for {name}…")
+    df = fetch_hourly(lat, lon)
+    df.insert(0, "site",         name)
+    df.insert(1, "latitude",     lat)
+    df.insert(2, "longitude",    lon)
+    df.insert(3, "elevation_m",  elev)
+    df.to_csv(out, index=False)
+    print(f"  [save] {len(df):>6} rows → {out}")
+    return out
+def main() -> int:
+    print(f"Downloading {len(SITES)} sites from Open-Meteo + Open-Topo-Data…")
+    print(f"  date range: {START_DATE} → {END_DATE}")
+    print(f"  variables:  {', '.join(HOURLY_VARS)}\n")
+    for name, lat, lon in SITES:
+        print(f"[ {name} ]")
+        try:
+            download_site(name, lat, lon)
+        except httpx.HTTPError as exc:
+            print(f"  [error] {exc}", file=sys.stderr)
+            return 1
+        time.sleep(1.0)  # be polite to the public APIs
+    print("\nDone. Next step:")
+    print("  python scripts/2_preprocess.py")
+    return 0
+if __name__ == "__main__":
+    raise SystemExit(main())

scripts/1b_synth_dataset.py ADDED Viewed

	@@ -0,0 +1,168 @@

+"""
+Step 1B / Synthetic Dataset Generator  (offline fallback)
+==========================================================
+When the real Open-Meteo / Open-Topo-Data APIs are unreachable (e.g. behind
+a restrictive corporate proxy or in an offline classroom), this script
+generates a physically-plausible synthetic dataset with the *exact same
+schema* as scripts/1_download_dataset.py.
+This lets the end-to-end pipeline (preprocess + train + serve) be
+validated without network access. To switch back to real data later,
+delete data/raw_*.csv and run scripts/1_download_dataset.py.
+The synthetic generator encodes:
+    * Standard atmosphere lapse rate (≈ -6.5 °C / km)
+    * Hydrostatic pressure decay with altitude (~ -12 hPa / 100 m)
+    * Tropical diurnal temperature cycle (cooler at night, warmer mid-afternoon)
+    * Malaysia's bimodal monsoon precipitation seasonality (Apr-May, Oct-Nov peaks)
+    * Humidity inversely correlated with temperature, plus monsoon boost
+    * Heavy-tailed precipitation distribution (most hours dry, rare extremes)
+    * CAPE rising with humid afternoon convection
+    * Dew-point depression that shrinks toward saturation as humidity rises
+This is *NOT* a substitute for real ERA5 reanalysis data in the final
+thesis — its purpose is purely to exercise the ML pipeline end-to-end.
+Run:  python scripts/1b_synth_dataset.py
+"""
+from __future__ import annotations
+from pathlib import Path
+import numpy as np
+import pandas as pd
+ROOT = Path(__file__).resolve().parent.parent
+DATA_DIR = ROOT / "data"
+DATA_DIR.mkdir(exist_ok=True)
+# Site (name, lat, lon, approx elevation_m) — same as scripts/1_download_dataset.py
+SITES = [
+    ("genting_highlands", 3.4225, 101.7935, 1742.0),
+    ("cameron_highlands", 4.4694, 101.3776, 1500.0),
+    ("frasers_hill",      3.7256, 101.7378, 1300.0),
+    ("klang_valley",      3.0738, 101.5183,  120.0),
+    ("mt_kinabalu_base",  6.0535, 116.5586, 1800.0),
+]
+START = pd.Timestamp("2020-01-01 00:00:00")
+END   = pd.Timestamp("2023-12-31 23:00:00")
+def generate_site(name: str, lat: float, lon: float, elev: float,
+                  rng: np.random.Generator) -> pd.DataFrame:
+    """Generate hourly synthetic weather time-series for a single site."""
+    timestamps = pd.date_range(START, END, freq="h")
+    n = len(timestamps)
+    hour  = timestamps.hour.to_numpy()
+    doy   = timestamps.dayofyear.to_numpy()
+    # Temperature: tropical baseline 27 °C at sea level, lapse rate to altitude,
+    # plus diurnal swing (±4 °C) and seasonal (±1.5 °C).
+    sea_level_temp = 27.0
+    lapse = -6.5 * (elev / 1000.0)
+    diurnal  = -4.0 * np.cos(2 * np.pi * (hour - 3) / 24.0)
+    seasonal =  1.5 * np.cos(2 * np.pi * (doy - 60) / 365.25)
+    noise_T = rng.normal(0.0, 1.2, n)
+    temperature = sea_level_temp + lapse + diurnal + seasonal + noise_T
+    # Pressure: hydrostatic decay with altitude, plus Gaussian noise smoothed by a
+    # 3-sample (3-hour) rolling mean as a crude stand-in for synoptic variability.
+    sea_level_p = 1010.0
+    p_alt = sea_level_p - 12.0 * (elev / 100.0)
+    pressure = p_alt + rng.normal(0.0, 0.8, n)
+    pressure = pd.Series(pressure).rolling(3, min_periods=1).mean().to_numpy()
+    # Monsoon-driven rainy season: Apr-May and Oct-Nov are peak rainfall in
+    # Peninsular Malaysia; weight precipitation probability accordingly.
+    monsoon_weight = (
+        0.5 + 0.5 * np.cos(2 * np.pi * (doy - 305) / 365.25)       # NE monsoon
+        + 0.4 * np.exp(-0.5 * ((doy - 135) / 25.0) ** 2)            # SW pre-monsoon
+        + 0.4 * np.exp(-0.5 * ((doy - 305) / 30.0) ** 2)
+    )
+    # Humidity: anti-correlated with diurnal temperature; lifted by monsoon.
+    humidity_base = 78.0 + 4.0 * monsoon_weight
+    humidity = humidity_base - 0.9 * diurnal + rng.normal(0.0, 5.0, n)
+    humidity = np.clip(humidity, 30.0, 100.0)
+    # CAPE: builds with afternoon humid heat — peaks 13-16h on humid days.
+    afternoon = np.exp(-0.5 * ((hour - 14.5) / 2.5) ** 2)
+    cape = (
+        afternoon * (humidity - 60.0) * 25.0 * monsoon_weight
+        + rng.normal(0.0, 80.0, n)
+    )
+    cape = np.clip(cape, 0.0, 4500.0)
+    # Cloud cover: tied to humidity & monsoon.
+    cloud = np.clip(
+        0.55 * humidity + 25.0 * monsoon_weight + rng.normal(0.0, 8.0, n),
+        0.0, 100.0,
+    )
+    # Dew point depression shrinks at high humidity (saturation).
+    dew_dep = np.clip(36.0 - 0.32 * humidity + rng.normal(0.0, 1.4, n), 0.1, 30.0)
+    dew_point = temperature - dew_dep
+    # Wind: weak in tropics; daytime sea breeze in lowlands, slightly more wind aloft.
+    wind_base = 5.0 + 0.0025 * elev
+    wind_speed = np.clip(
+        wind_base + 2.5 * afternoon + np.abs(rng.normal(0.0, 2.5, n)),
+        0.0, 60.0,
+    )
+    # Direction: slow random walk so consecutive hours have correlated direction.
+    dir_steps = rng.normal(0.0, 25.0, n).cumsum()
+    wind_dir = (dir_steps % 360.0 + 180.0 * monsoon_weight) % 360.0
+    # Precipitation: zero-inflated; probability rises with humidity × monsoon × CAPE.
+    rain_prob = (
+        0.04
+        + 0.55 * monsoon_weight * (humidity > 80).astype(float)
+        + 0.0001 * cape
+        + 0.25 * afternoon * (humidity > 85).astype(float)
+    )
+    rain_prob = np.clip(rain_prob, 0.0, 0.85)
+    rain_event = rng.random(n) < rain_prob
+    # When it rains, amount follows an exponential distribution (heavy-tailed).
+    rain_amount = np.where(
+        rain_event,
+        rng.exponential(scale=2.8, size=n),  # mm/h
+        0.0,
+    )
+    df = pd.DataFrame({
+        "site":                 name,
+        "latitude":             lat,
+        "longitude":            lon,
+        "elevation_m":          elev,
+        "time":                 timestamps,
+        "temperature_2m":       np.round(temperature, 2),
+        "relative_humidity_2m": np.round(humidity, 1),
+        "precipitation":        np.round(rain_amount, 2),
+        "wind_speed_10m":       np.round(wind_speed, 2),
+        "wind_direction_10m":   np.round(wind_dir, 1),
+        "surface_pressure":     np.round(pressure, 1),
+        "dew_point_2m":         np.round(dew_point, 2),
+        "cloud_cover":          np.round(cloud, 1),
+        "cape":                 np.round(cape, 0),
+    })
+    return df
+def main() -> int:
+    rng = np.random.default_rng(seed=42)
+    print(f"Generating SYNTHETIC dataset for {len(SITES)} sites…")
+    print(f"  date range: {START.date()} → {END.date()}\n")
+    for name, lat, lon, elev in SITES:
+        out = DATA_DIR / f"raw_{name}.csv"
+        df = generate_site(name, lat, lon, elev, rng)
+        df.to_csv(out, index=False)
+        rain_pct = (df["precipitation"] > 0.1).mean() * 100.0
+        print(f"  [{name:<18}] {len(df):>6} rows  rain-hours={rain_pct:4.1f}%  → {out.name}")
+    print("\nDone (synthetic). Next:  python scripts/2_preprocess.py")
+    return 0
+if __name__ == "__main__":
+    raise SystemExit(main())

scripts/2_preprocess.py ADDED Viewed

	@@ -0,0 +1,160 @@

+"""
+Step 2 / Preprocessing & Feature Engineering
+=============================================
+Reads raw per-site CSVs, engineers ML-ready features, and derives the binary
+target `is_rain_event` from the raw `precipitation` column.
+Pipeline:
+    1. Load all data/raw_*.csv and concatenate.
+    2. Drop rows with NaN in critical fields.
+    3. Engineer features:
+         - wind_u, wind_v       (decompose circular wind direction)
+         - hour_sin, hour_cos   (cyclic time encoding)
+         - month_sin, month_cos (captures Malaysia's monsoon seasonality)
+         - precipitation_lag_1h (autocorrelation signal)
+         - dew_point_depression (T - T_dew, saturation proxy)
+         - pressure_change_3h   (storm-approaching signal)
+    4. Derive target:
+         is_rain_event(t) = 1 iff precipitation(t+1h) > RAIN_THRESHOLD_MM (WMO trace)
+    5. Save data/processed.csv
+Run:  python scripts/2_preprocess.py
+"""
+from __future__ import annotations
+from pathlib import Path
+import numpy as np
+import pandas as pd
+ROOT = Path(__file__).resolve().parent.parent
+DATA_DIR = ROOT / "data"
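+# Rain-event threshold in mm per hour (the 0.1 mm WMO-style cut-off). The label is built
+# with a strict `>` comparison, so exactly 0.1 mm does NOT count as a rain event.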
+RAIN_THRESHOLD_MM = 0.1
+def engineer_features(df: pd.DataFrame) -> pd.DataFrame:
+    """Add domain-informed derived features. Operates per site to avoid
+    cross-site leakage in lag/shift operations."""
+    out_frames: list[pd.DataFrame] = []
+    for _, g in df.groupby("site", sort=False):
+        g = g.sort_values("time").reset_index(drop=True).copy()
+        # Wind: decompose into u/v components. Raw degrees are circular and
+        # mathematically misleading to tree models (0° vs 360° look "far").
+        rad = np.deg2rad(g["wind_direction_10m"])
+        g["wind_u"] = g["wind_speed_10m"] * np.sin(rad)
+        g["wind_v"] = g["wind_speed_10m"] * np.cos(rad)
+        # Cyclic time encoding (avoids the 23→0 hour discontinuity).
+        h = g["time"].dt.hour
+        m = g["time"].dt.month
+        g["hour_sin"]  = np.sin(2 * np.pi * h / 24)
+        g["hour_cos"]  = np.cos(2 * np.pi * h / 24)
+        g["month_sin"] = np.sin(2 * np.pi * m / 12)
+        g["month_cos"] = np.cos(2 * np.pi * m / 12)
+        # Lag / tendency features (storm precursors).
+        g["precipitation_lag_1h"] = g["precipitation"].shift(1).fillna(0.0)
+        g["pressure_change_3h"]   = g["surface_pressure"] - g["surface_pressure"].shift(3)
+        g["pressure_change_3h"]   = g["pressure_change_3h"].fillna(0.0)
+        # Dew point depression: small value = atmosphere near saturation.
+        g["dew_point_depression"] = g["temperature_2m"] - g["dew_point_2m"]
+        # === Target: predict whether rain occurs in the NEXT hour ===
+        # Using shift(-1) explicitly to avoid temporal data leakage:
+        # features at time t pair with the rainfall outcome at t+1h.
+        next_hour_precip = g["precipitation"].shift(-1)
+        g["is_rain_event"] = (next_hour_precip > RAIN_THRESHOLD_MM).astype("Int64")
+        # Drop the final row of each site: it has no t+1h observation, and its label
+        # would otherwise silently be 0 because `NaN > threshold` evaluates to False.
+        g = g.iloc[:-1].copy()
+        out_frames.append(g)
+    return pd.concat(out_frames, ignore_index=True)
+def main() -> int:
+    raw_files = sorted(DATA_DIR.glob("raw_*.csv"))
+    if not raw_files:
+        print("ERROR: no data/raw_*.csv found. Run scripts/1_download_dataset.py first.")
+        return 1
+    print(f"Loading {len(raw_files)} raw site files…")
+    dfs = [pd.read_csv(p, parse_dates=["time"]) for p in raw_files]
+    df = pd.concat(dfs, ignore_index=True)
+    print(f"  rows total: {len(df):,}")
+    # Standardised column names (presentation-friendly + matches design doc).
+    df = df.rename(columns={
+        "temperature_2m":       "temperature_c",
+        "relative_humidity_2m": "humidity_pct",
+        "wind_speed_10m":       "wind_speed_kmh",
+        "wind_direction_10m":   "wind_direction_deg",
+        "surface_pressure":     "pressure_hpa",
+        "dew_point_2m":         "dew_point_c",
+        "cloud_cover":          "cloud_cover_pct",
+        "cape":                 "cape_jkg",
+    })
+    # Restore originals expected by engineer_features (it uses raw names for clarity).
+    df = df.rename(columns={
+        "temperature_c":       "temperature_2m",
+        "humidity_pct":        "relative_humidity_2m",
+        "wind_speed_kmh":      "wind_speed_10m",
+        "wind_direction_deg":  "wind_direction_10m",
+        "pressure_hpa":        "surface_pressure",
+        "dew_point_c":         "dew_point_2m",
+        "cloud_cover_pct":     "cloud_cover",
+        "cape_jkg":            "cape",
+    })
+    before = len(df)
+    df = df.dropna(subset=[
+        "temperature_2m", "relative_humidity_2m", "precipitation",
+        "wind_speed_10m", "wind_direction_10m", "surface_pressure",
+    ])
+    print(f"  rows after dropna: {len(df):,}  (dropped {before - len(df):,})")
+    print("Engineering features per site…")
+    df = engineer_features(df)
+    # Final renaming to the design-doc-friendly column names that the
+    # downstream training script and README expect.
+    df = df.rename(columns={
+        "temperature_2m":       "temperature_c",
+        "relative_humidity_2m": "humidity_pct",
+        "wind_speed_10m":       "wind_speed_kmh",
+        "wind_direction_10m":   "wind_direction_deg",
+        "surface_pressure":     "pressure_hpa",
+        "dew_point_2m":         "dew_point_c",
+        "cloud_cover":          "cloud_cover_pct",
+        "cape":                 "cape_jkg",
+    })
+    # Drop the one terminal row per site that lacks the t+1h label.
+    df = df.dropna(subset=["is_rain_event"]).copy()
+    df["is_rain_event"] = df["is_rain_event"].astype(int)
+    out = DATA_DIR / "processed.csv"
+    df.to_csv(out, index=False)
+    print("\n=== Processed dataset summary ===")
+    print(f"  total samples         : {len(df):,}")
+    print(f"  sites                 : {df['site'].nunique()}")
+    print(f"  date range            : {df['time'].min()} → {df['time'].max()}")
+    print(f"  class balance (Y=1)   : {df['is_rain_event'].mean():.1%}")
+    print(f"  saved to              : {out}")
+    print("\nFirst rows of (selected cols):")
+    cols = ["site", "time", "elevation_m", "temperature_c", "humidity_pct",
+            "wind_speed_kmh", "pressure_hpa", "is_rain_event"]
+    print(df[cols].head(10).to_string(index=False))
+    print("\nNext step:  python scripts/3_train_model.py")
+    return 0
+if __name__ == "__main__":
+    raise SystemExit(main())

scripts/3_train_model.py ADDED Viewed

	@@ -0,0 +1,183 @@

+"""
+Step 3 / Random Forest Training
+================================
+Trains a Random Forest classifier on the processed dataset using:
+    - Time-based CV (NOT random split — would leak temporal autocorrelation)
+    - class_weight='balanced' (rain is the minority class)
+    - Hold-out test = last 20 % of each site's time-ordered rows
+Outputs:
+    models/rf_model.pkl              — fitted estimator
+    models/feature_columns.json      — exact feature order used at train time
+    models/training_report.json      — metrics + feature importance + meta
+Run:  python scripts/3_train_model.py
+"""
+from __future__ import annotations
+import json
+from pathlib import Path
+import joblib
+import numpy as np
+import pandas as pd
+from sklearn.ensemble import RandomForestClassifier
+from sklearn.metrics import (
+    classification_report,
+    confusion_matrix,
+    f1_score,
+    fbeta_score,
+    precision_recall_fscore_support,
+    roc_auc_score,
+)
+from sklearn.model_selection import TimeSeriesSplit
+# Repository root: this script sits in <root>/scripts/, so go two levels up.
+ROOT = Path(__file__).resolve().parent.parent
+DATA_DIR  = ROOT / "data"
+MODEL_DIR = ROOT / "models"
+# Import-time side effect: create models/ if it is missing so the artefact
+# writes in main() have a destination.
+MODEL_DIR.mkdir(exist_ok=True)
+# Features fed to the model (X). Order matters — saved alongside the model.
+FEATURE_COLUMNS: list[str] = [
+    "elevation_m",
+    "temperature_c",
+    "humidity_pct",
+    "wind_speed_kmh",
+    "wind_direction_deg",   # kept for interpretability comparison
+    "wind_u", "wind_v",     # mathematically correct circular decomposition
+    "pressure_hpa",
+    "pressure_change_3h",
+    "dew_point_c",
+    "dew_point_depression",
+    "cloud_cover_pct",
+    "cape_jkg",
+    "precipitation_lag_1h",
+    "hour_sin", "hour_cos",
+    "month_sin", "month_cos",
+]
+# Name of the label column (y) read from data/processed.csv.
+TARGET = "is_rain_event"
+def load_dataset() -> pd.DataFrame:
+    p = DATA_DIR / "processed.csv"
+    if not p.exists():
+        raise SystemExit("ERROR: data/processed.csv not found. "
+                         "Run scripts/2_preprocess.py first.")
+    df = pd.read_csv(p, parse_dates=["time"])
+    df = df.sort_values(["site", "time"]).reset_index(drop=True)
+    return df
+def time_based_split(df: pd.DataFrame, test_frac: float = 0.2) -> tuple[pd.DataFrame, pd.DataFrame]:
+    """Last `test_frac` of the time-ordered data per site is held out."""
+    train_parts, test_parts = [], []
+    for _, g in df.groupby("site", sort=False):
+        cut = int(len(g) * (1.0 - test_frac))
+        train_parts.append(g.iloc[:cut])
+        test_parts.append(g.iloc[cut:])
+    return pd.concat(train_parts, ignore_index=True), pd.concat(test_parts, ignore_index=True)
+def crossval_score(X: np.ndarray, y: np.ndarray, n_splits: int = 5) -> list[dict]:
+    """TimeSeriesSplit gives a fair temporal-CV estimate."""
+    tscv = TimeSeriesSplit(n_splits=n_splits)
+    fold_metrics: list[dict] = []
+    for fold, (tr, va) in enumerate(tscv.split(X), start=1):
+        model = RandomForestClassifier(
+            n_estimators=200,
+            max_depth=15,
+            min_samples_leaf=20,
+            class_weight="balanced",
+            n_jobs=-1,
+            random_state=42,
+        )
+        model.fit(X[tr], y[tr])
+        proba = model.predict_proba(X[va])[:, 1]
+        pred  = (proba >= 0.5).astype(int)
+        p, r, f1, _ = precision_recall_fscore_support(y[va], pred, average="binary", zero_division=0)
+        try:
+            auc = roc_auc_score(y[va], proba)
+        except ValueError:
+            auc = float("nan")
+        f2 = fbeta_score(y[va], pred, beta=2.0, zero_division=0)
+        print(f"  fold {fold}: P={p:.3f}  R={r:.3f}  F1={f1:.3f}  F2={f2:.3f}  AUC={auc:.3f}")
+        fold_metrics.append({"fold": fold, "precision": p, "recall": r,
+                              "f1": f1, "f2": f2, "auc": auc})
+    return fold_metrics
+def main() -> int:
+    print("Loading processed dataset…")
+    df = load_dataset()
+    print(f"  rows: {len(df):,}   features: {len(FEATURE_COLUMNS)}")
+    print(f"  class balance (Y=1): {df[TARGET].mean():.1%}")
+    print("\nTime-based train/test split (last 20% per site held out)…")
+    train_df, test_df = time_based_split(df, test_frac=0.20)
+    print(f"  train: {len(train_df):,}   test: {len(test_df):,}")
+    X_train = train_df[FEATURE_COLUMNS].to_numpy()
+    y_train = train_df[TARGET].to_numpy()
+    X_test  = test_df[FEATURE_COLUMNS].to_numpy()
+    y_test  = test_df[TARGET].to_numpy()
+    print("\nTime-series cross-validation on training fold (5 splits)…")
+    fold_metrics = crossval_score(X_train, y_train, n_splits=5)
+    print("\nFitting final model on full training set…")
+    model = RandomForestClassifier(
+        n_estimators=300,
+        max_depth=20,
+        min_samples_leaf=10,
+        class_weight="balanced",
+        n_jobs=-1,
+        random_state=42,
+    )
+    model.fit(X_train, y_train)
+    print("\nEvaluating on held-out test set…")
+    proba = model.predict_proba(X_test)[:, 1]
+    pred  = (proba >= 0.5).astype(int)
+    print(classification_report(y_test, pred, target_names=["NoRain", "Rain"], digits=3))
+    cm = confusion_matrix(y_test, pred)
+    print("Confusion matrix:")
+    print(f"  [[TN={cm[0,0]:>6}  FP={cm[0,1]:>6}]")
+    print(f"   [FN={cm[1,0]:>6}  TP={cm[1,1]:>6}]]")
+    auc_test = roc_auc_score(y_test, proba)
+    f2_test  = fbeta_score(y_test, pred, beta=2.0, zero_division=0)
+    print(f"AUC = {auc_test:.3f}    F2 = {f2_test:.3f}")
+    print("\nFeature importances:")
+    fi = sorted(zip(FEATURE_COLUMNS, model.feature_importances_), key=lambda x: -x[1])
+    for name, imp in fi:
+        bar = "█" * int(imp * 200)
+        print(f"  {name:<24} {imp:.4f} {bar}")
+    print("\nSaving artefacts…")
+    joblib.dump(model, MODEL_DIR / "rf_model.pkl")
+    with open(MODEL_DIR / "feature_columns.json", "w") as f:
+        json.dump(FEATURE_COLUMNS, f, indent=2)
+    with open(MODEL_DIR / "training_report.json", "w") as f:
+        json.dump({
+            "n_train":        len(train_df),
+            "n_test":         len(test_df),
+            "class_balance":  float(df[TARGET].mean()),
+            "cv_fold_metrics": fold_metrics,
+            "test_metrics": {
+                "f1":  float(f1_score(y_test, pred, zero_division=0)),
+                "f2":  float(f2_test),
+                "auc": float(auc_test),
+                "confusion_matrix": cm.tolist(),
+            },
+            "feature_importance": {name: float(imp) for name, imp in fi},
+        }, f, indent=2)
+    print(f"  → {MODEL_DIR/'rf_model.pkl'}")
+    print(f"  → {MODEL_DIR/'feature_columns.json'}")
+    print(f"  → {MODEL_DIR/'training_report.json'}")
+    print("\nNext step:  uvicorn backend.main:app --reload --port 8000")
+    return 0
+if __name__ == "__main__":
+    raise SystemExit(main())

scripts/4_evaluate_model.py ADDED Viewed

	@@ -0,0 +1,272 @@

+"""
+Step 4 / Model Evaluation
+==========================
+Produces *publication-quality* figures that can be pasted directly into
+the thesis (Chapter 5 — Results / Discussion). Run AFTER 3_train_model.py.
+Inputs
+------
+    models/rf_model.pkl
+    models/feature_columns.json
+    data/processed.csv
+Outputs
+-------
+    figures/01_roc_curve.png            ROC + AUC
+    figures/02_pr_curve.png             Precision-Recall + AP
+    figures/03_calibration_curve.png    Reliability diagram + Brier score
+    figures/04_threshold_sweep.png      F1 / F2 / Precision / Recall vs threshold
+    figures/05_feature_importance.png   Top-20 features (horizontal bar)
+    figures/06_confusion_matrix.png     Confusion matrix at optimal F2 threshold
+    figures/threshold_sweep.csv         Same data as 04 in machine-readable form
+    figures/evaluation_summary.json     One-shot metrics blob for the thesis
+Run:  python scripts/4_evaluate_model.py
+"""
+from __future__ import annotations
+import json
+from datetime import datetime, timezone
+from pathlib import Path
+import joblib
+import matplotlib
+import numpy as np
+import pandas as pd
+matplotlib.use("Agg")
+import matplotlib.pyplot as plt
+from sklearn.calibration import calibration_curve
+from sklearn.metrics import (
+    auc,
+    average_precision_score,
+    brier_score_loss,
+    confusion_matrix,
+    f1_score,
+    fbeta_score,
+    precision_recall_curve,
+    precision_score,
+    recall_score,
+    roc_curve,
+)
+# Repository root: this script sits in <root>/scripts/, so go two levels up.
+ROOT = Path(__file__).resolve().parent.parent
+MODEL_DIR = ROOT / "models"
+DATA_DIR  = ROOT / "data"
+FIG_DIR   = ROOT / "figures"
+# Import-time side effect: make sure figures/ exists before any plot is saved.
+FIG_DIR.mkdir(exist_ok=True)
+# ── Matplotlib defaults — keep figures consistent across panels ──────────
+# Applied globally via rcParams, so every figure created below inherits them.
+plt.rcParams.update({
+    "figure.figsize":  (7.0, 4.5),
+    "figure.dpi":      120,
+    "savefig.dpi":     200,
+    "savefig.bbox":    "tight",
+    "font.size":       11,
+    "axes.titlesize":  13,
+    "axes.labelsize":  11,
+    "legend.fontsize": 10,
+    "axes.spines.top":   False,
+    "axes.spines.right": False,
+    "grid.alpha":        0.25,
+    "axes.axisbelow":    True,
+})
+# ── Load artefacts ───────────────────────────────────────────────────────
+def _load() -> tuple:
+    model_path = MODEL_DIR / "rf_model.pkl"
+    feats_path = MODEL_DIR / "feature_columns.json"
+    data_path  = DATA_DIR  / "processed.csv"
+    for p in (model_path, feats_path, data_path):
+        if not p.exists():
+            raise FileNotFoundError(
+                f"Missing artefact: {p}. Run scripts/3_train_model.py first."
+            )
+    model      = joblib.load(model_path)
+    feat_cols  = json.loads(feats_path.read_text())
+    df         = pd.read_csv(data_path)
+    df["time"] = pd.to_datetime(df["time"])
+    df = df.sort_values("time").reset_index(drop=True)
+    # Use the last 20% as test (same split as training).
+    cut = int(len(df) * 0.80)
+    test = df.iloc[cut:].reset_index(drop=True)
+    X = test[feat_cols].values
+    y = test["is_rain_event"].astype(int).values
+    proba = model.predict_proba(X)[:, 1]
+    return model, feat_cols, X, y, proba, test
+# ── Figure builders ──────────────────────────────────────────────────────
+def plot_roc(y, proba) -> dict:
+    fpr, tpr, _ = roc_curve(y, proba)
+    auc_v = auc(fpr, tpr)
+    fig, ax = plt.subplots()
+    ax.plot(fpr, tpr, color="#0ea5e9", linewidth=2.0, label=f"RF (AUC = {auc_v:.3f})")
+    ax.plot([0, 1], [0, 1], "--", color="#9ca3af", linewidth=1.0, label="Random baseline")
+    ax.set_xlabel("False Positive Rate")
+    ax.set_ylabel("True Positive Rate")
+    ax.set_title("ROC Curve — rain-event classifier")
+    ax.legend(loc="lower right")
+    ax.grid(True)
+    fig.savefig(FIG_DIR / "01_roc_curve.png")
+    plt.close(fig)
+    return {"auc": float(auc_v)}
+def plot_pr(y, proba) -> dict:
+    pr, rc, _ = precision_recall_curve(y, proba)
+    ap = average_precision_score(y, proba)
+    base_rate = float(y.mean())
+    fig, ax = plt.subplots()
+    ax.plot(rc, pr, color="#10b981", linewidth=2.0, label=f"RF (AP = {ap:.3f})")
+    ax.hlines(base_rate, 0, 1, colors="#9ca3af", linestyles="--",
+              label=f"Base rate = {base_rate:.3f}")
+    ax.set_xlabel("Recall")
+    ax.set_ylabel("Precision")
+    ax.set_title("Precision–Recall Curve")
+    ax.legend(loc="lower left")
+    ax.grid(True)
+    fig.savefig(FIG_DIR / "02_pr_curve.png")
+    plt.close(fig)
+    return {"average_precision": float(ap), "base_rate": base_rate}
+def plot_calibration(y, proba) -> dict:
+    frac_pos, mean_pred = calibration_curve(y, proba, n_bins=10, strategy="quantile")
+    brier = brier_score_loss(y, proba)
+    fig, ax = plt.subplots()
+    ax.plot([0, 1], [0, 1], "--", color="#9ca3af", linewidth=1.0,
+            label="Perfectly calibrated")
+    ax.plot(mean_pred, frac_pos, marker="o", color="#f59e0b", linewidth=2.0,
+            label=f"RF (Brier = {brier:.3f})")
+    ax.set_xlabel("Mean predicted probability")
+    ax.set_ylabel("Fraction of positives (observed)")
+    ax.set_title("Reliability Diagram — model calibration")
+    ax.legend(loc="upper left")
+    ax.grid(True)
+    fig.savefig(FIG_DIR / "03_calibration_curve.png")
+    plt.close(fig)
+    return {"brier_score": float(brier)}
+def plot_threshold_sweep(y, proba) -> dict:
+    thresholds = np.linspace(0.05, 0.95, 19)
+    rows = []
+    best_f2 = (-1.0, 0.5)
+    for thr in thresholds:
+        yp = (proba >= thr).astype(int)
+        f1   = f1_score(y, yp, zero_division=0)
+        f2   = fbeta_score(y, yp, beta=2.0, zero_division=0)
+        prec = precision_score(y, yp, zero_division=0)
+        rec  = recall_score(y, yp, zero_division=0)
+        rows.append({
+            "threshold": thr, "f1": f1, "f2": f2,
+            "precision": prec, "recall": rec,
+        })
+        if f2 > best_f2[0]:
+            best_f2 = (f2, thr)
+    sweep = pd.DataFrame(rows)
+    sweep.to_csv(FIG_DIR / "threshold_sweep.csv", index=False)
+    fig, ax = plt.subplots()
+    ax.plot(sweep.threshold, sweep.precision, label="Precision", color="#0ea5e9", linewidth=2.0)
+    ax.plot(sweep.threshold, sweep.recall,    label="Recall",    color="#10b981", linewidth=2.0)
+    ax.plot(sweep.threshold, sweep.f1,        label="F1",        color="#f59e0b", linewidth=1.4, linestyle="--")
+    ax.plot(sweep.threshold, sweep.f2,        label="F2",        color="#ef4444", linewidth=2.0)
+    ax.axvline(best_f2[1], color="#ef4444", alpha=0.25, linestyle=":")
+    ax.set_xlabel("Decision threshold")
+    ax.set_ylabel("Score")
+    ax.set_title(f"Threshold sweep — best F2 = {best_f2[0]:.3f} @ τ = {best_f2[1]:.2f}")
+    ax.legend(loc="lower left", ncols=4)
+    ax.grid(True)
+    fig.savefig(FIG_DIR / "04_threshold_sweep.png")
+    plt.close(fig)
+    return {"best_f2": float(best_f2[0]), "best_f2_threshold": float(best_f2[1])}
+def plot_feature_importance(model, feat_cols, top_n: int = 20) -> dict:
+    imp = pd.Series(model.feature_importances_, index=feat_cols)
+    imp = imp.sort_values(ascending=True).tail(top_n)
+    fig, ax = plt.subplots(figsize=(7.0, 0.32 * len(imp) + 1.2))
+    ax.barh(imp.index, imp.values, color="#6366f1")
+    ax.set_xlabel("Importance (mean decrease in impurity)")
+    ax.set_title(f"Top {len(imp)} feature importances")
+    ax.grid(True, axis="x")
+    fig.savefig(FIG_DIR / "05_feature_importance.png")
+    plt.close(fig)
+    return {"feature_importance": imp.sort_values(ascending=False).to_dict()}
+def plot_confusion(y, proba, threshold: float) -> dict:
+    yp = (proba >= threshold).astype(int)
+    cm = confusion_matrix(y, yp)
+    tn, fp, fn, tp = cm.ravel()
+    fig, ax = plt.subplots(figsize=(4.5, 4.0))
+    im = ax.imshow(cm, cmap="Blues")
+    for i in range(2):
+        for j in range(2):
+            ax.text(j, i, str(cm[i, j]), ha="center", va="center",
+                    color="black" if cm[i, j] < cm.max() / 2 else "white",
+                    fontsize=13, fontweight="bold")
+    ax.set_xticks([0, 1], ["No rain", "Rain"])
+    ax.set_yticks([0, 1], ["No rain", "Rain"])
+    ax.set_xlabel("Predicted label")
+    ax.set_ylabel("True label")
+    ax.set_title(f"Confusion matrix @ τ = {threshold:.2f}")
+    fig.colorbar(im, ax=ax, fraction=0.046, pad=0.04)
+    fig.savefig(FIG_DIR / "06_confusion_matrix.png")
+    plt.close(fig)
+    return {"tn": int(tn), "fp": int(fp), "fn": int(fn), "tp": int(tp)}
+# ── Main ─────────────────────────────────────────────────────────────────
+def main() -> None:
+    print(f"[eval] loading artefacts from {MODEL_DIR}")
+    model, feat_cols, _, y, proba, _test = _load()
+    print(f"[eval] test set: {len(y)} samples  ({int(y.sum())} positives, "
+          f"{(y.mean() * 100):.1f}% rain-event rate)")
+    summary = {
+        "generated_at":   datetime.now(timezone.utc).isoformat(),
+        "n_test":         len(y),
+        "n_positives":    int(y.sum()),
+        "positive_rate":  float(y.mean()),
+        "n_features":     len(feat_cols),
+    }
+    summary["roc"]        = plot_roc(y, proba)
+    summary["pr"]         = plot_pr(y, proba)
+    summary["calibration"] = plot_calibration(y, proba)
+    sweep = plot_threshold_sweep(y, proba)
+    summary["threshold_sweep"] = sweep
+    summary["confusion"]  = plot_confusion(y, proba, sweep["best_f2_threshold"])
+    top_importances = plot_feature_importance(model, feat_cols)
+    summary["top_features"] = list(top_importances["feature_importance"].keys())[:10]
+    out = FIG_DIR / "evaluation_summary.json"
+    out.write_text(json.dumps(summary, indent=2))
+    print(f"[eval] all figures written to {FIG_DIR}")
+    print(f"[eval] summary JSON: {out}")
+    print(f"[eval] best F2 = {sweep['best_f2']:.3f} at τ = {sweep['best_f2_threshold']:.2f}")
+    print(f"[eval] ROC AUC = {summary['roc']['auc']:.3f},  "
+          f"PR AP = {summary['pr']['average_precision']:.3f},  "
+          f"Brier = {summary['calibration']['brier_score']:.3f}")
+if __name__ == "__main__":
+    main()

scripts/deploy_hf.sh ADDED Viewed

	@@ -0,0 +1,135 @@

+#!/usr/bin/env bash
+# ──────────────────────────────────────────────────────────────────────────
+# scripts/deploy_hf.sh — fully-automated deploy to Hugging Face Spaces
+# ──────────────────────────────────────────────────────────────────────────
+#
+# Usage:
+#   HF_TOKEN="<your-hf-write-token>" ./scripts/deploy_hf.sh <hf-user>/<space-name>
+#
+# Example (token redacted — get yours at https://huggingface.co/settings/tokens):
+#   HF_TOKEN="$HF_TOKEN" ./scripts/deploy_hf.sh W1nd5pac/microclimate-x
+#
+# What it does (no manual steps):
+#   1. Ensures huggingface_hub CLI is installed in .venv/
+#   2. Authenticates with HF_TOKEN
+#   3. Creates the Space (Docker SDK) if it doesn't exist yet
+#   4. Uploads the whole repo (server-side LFS handles the 217 MB model)
+#   5. Prints the live URL when the build is queued
+#
+# Skips:
+#   data/   figures/   tests/   .venv/   .git/   *.sqlite3   __pycache__/
+#
+# Exit status: 0 on success, 1 on a failed precondition or unexpected CLI
+# response, 2 on bad usage.
+# ──────────────────────────────────────────────────────────────────────────
+set -euo pipefail
+if [[ $# -lt 1 ]]; then
+  echo "Usage: HF_TOKEN=hf_xxx $0 <hf-user>/<space-name>" >&2
+  echo "Example: HF_TOKEN=hf_xxx $0 W1nd5pac/microclimate-x" >&2
+  exit 2
+fi
+REPO_ID="$1"
+ROOT="$(cd "$(dirname "$0")/.." && pwd)"
+cd "$ROOT"
+# Clean env so other venvs / PYTHONPATH leaks don't break us.
+unset PYTHONPATH VIRTUAL_ENV PYTHONHOME
+# ── 1. ensure .venv has huggingface_hub ──────────────────────────────────
+if [[ ! -x ".venv/bin/hf" ]]; then
+  # Fail with a clear message instead of a bare "No such file or directory"
+  # when the virtualenv itself has not been created yet.
+  if [[ ! -x ".venv/bin/pip" ]]; then
+    echo "❌ .venv/bin/pip not found in $ROOT — create the virtualenv first (python3 -m venv .venv)." >&2
+    exit 1
+  fi
+  echo "▶ Installing huggingface_hub CLI into .venv/ …"
+  .venv/bin/pip install -q -U "huggingface_hub[cli,hf_transfer]"
+fi
+HF=".venv/bin/hf"
+# Speed-boost for the 217 MB model upload.
+export HF_HUB_ENABLE_HF_TRANSFER=1
+# ── 2. authenticate ──────────────────────────────────────────────────────
+if [[ -z "${HF_TOKEN:-}" ]]; then
+  if ! "$HF" auth whoami >/dev/null 2>&1; then
+    echo "❌ HF_TOKEN env not set and not already logged in." >&2
+    echo "   Get a Write token at https://huggingface.co/settings/tokens and run:" >&2
+    echo "     HF_TOKEN=hf_xxx $0 $REPO_ID" >&2
+    exit 1
+  fi
+fi
+if [[ -n "${HF_TOKEN:-}" ]]; then
+  # Re-login non-interactively so we use the supplied token (idempotent).
+  # Deliberately best-effort (|| true): a failed login surfaces below as
+  # "Logged in as: ?" and then as a failing 'hf repos create'.
+  # NOTE(review): --token puts the secret in argv, visible to `ps` — confirm
+  # this is acceptable on the machines this runs on.
+  echo "▶ Authenticating as the token's owner …"
+  echo "$HF_TOKEN" | "$HF" auth login --token "$HF_TOKEN" --add-to-git-credential >/dev/null 2>&1 || true
+fi
+WHOAMI=$("$HF" auth whoami 2>/dev/null | head -1 || echo "?")
+echo "  Logged in as: $WHOAMI"
+# ── 3. create the Space if missing (idempotent — 409 means "exists") ─────
+echo "▶ Ensuring Space $REPO_ID exists (Docker SDK) …"
+CREATE_OUTPUT=$("$HF" repos create "$REPO_ID" --repo-type space --space-sdk docker 2>&1 || true)
+# Here-strings instead of `echo … | grep -q`: under pipefail an early grep -q
+# exit can SIGPIPE the writer and turn a match into a false negative.
+# grep -E: `|` alternation is portable, `\|` in a basic regex is not.
+if grep -q "Successfully created" <<<"$CREATE_OUTPUT"; then
+  echo "  Created fresh Space."
+elif grep -Eqi "already created|409" <<<"$CREATE_OUTPUT"; then
+  echo "  Space already exists — will push to it."
+else
+  echo "$CREATE_OUTPUT" >&2
+  echo "❌ Unexpected response from 'hf repos create'. Aborting." >&2
+  exit 1
+fi
+# ── 4. sanity-check the model exists locally ─────────────────────────────
+MODEL="models/rf_model.pkl"
+if [[ ! -f "$MODEL" ]]; then
+  echo "⚠️  $MODEL not found — the Space will fall back to a heuristic predictor."
+  read -r -p "Continue without the trained model? [y/N] " ans
+  [[ "$ans" =~ ^[Yy]$ ]] || exit 1
+fi
+# ── 5. upload everything ─────────────────────────────────────────────────
+echo "▶ Uploading repo → spaces/$REPO_ID …"
+echo "  (217 MB rf_model.pkl uses HF's server-side Xet/LFS — no local LFS needed)"
+DEPLOY_MSG="Deploy $(date -u +%Y-%m-%dT%H:%M:%SZ) — $(git rev-parse --short HEAD 2>/dev/null || echo local)"
+# Pass 1: bulk-upload everything except the model. The model is excluded
+# explicitly rather than via .gitignore: huggingface_hub documents that
+# folder uploads do not take .gitignore into account, so every path that must
+# stay out of the Space has to be listed here.
+"$HF" upload \
+  "$REPO_ID" \
+  . \
+  . \
+  --repo-type=space \
+  --commit-message="$DEPLOY_MSG (code)" \
+  --exclude "$MODEL" \
+  --exclude "data/*" \
+  --exclude "figures/*" \
+  --exclude "tests/*" \
+  --exclude ".venv/*" \
+  --exclude ".local/*" \
+  --exclude ".pytest_cache/*" \
+  --exclude ".ruff_cache/*" \
+  --exclude ".mypy_cache/*" \
+  --exclude "**/__pycache__/*" \
+  --exclude "*.sqlite3" \
+  --exclude "*.sqlite3-*" \
+  --exclude "*.pyc" \
+  --exclude ".DS_Store" \
+  --exclude ".git/*" \
+  --exclude ".github/*"
+# Pass 2: push the 217 MB Random Forest model on its own (it was excluded
+# from pass 1) — without this step the Space falls back to the heuristic
+# predictor and the AUC=0.871 claim won't reproduce.
+if [[ -f "$MODEL" ]]; then
+  echo "▶ Uploading models/rf_model.pkl (217 MB) — bypassing .gitignore …"
+  "$HF" upload \
+    "$REPO_ID" \
+    "$MODEL" \
+    "models/rf_model.pkl" \
+    --repo-type=space \
+    --commit-message="$DEPLOY_MSG (model)"
+fi
+echo
+echo "✅ Upload complete. Space is rebuilding now."
+echo "   Status:    https://huggingface.co/spaces/$REPO_ID"
+echo "   Live URL:  https://huggingface.co/spaces/$REPO_ID  (≈ 3-5 min for first build)"
+echo
+echo "Tip: once the green Running badge shows, send the Live URL to your supervisor."

scripts/start_demo.sh ADDED Viewed

	@@ -0,0 +1,86 @@

+#!/usr/bin/env bash
+# ──────────────────────────────────────────────────────────────────────────
+# scripts/start_demo.sh — one-shot demo for supervisor showcase
+#
+# What it does:
+#   1. Kills any previous demo processes (uvicorn / cloudflared)
+#   2. Starts FastAPI on 127.0.0.1:8181  (clean env, isolated from other venvs)
+#   3. Waits until /api/health returns 200
+#   4. Starts a Cloudflare Quick Tunnel and prints the public URL
+#   5. On Ctrl-C, cleanly shuts down both processes
+#
+# Usage:
+#   ./scripts/start_demo.sh
+#
+# Environment:
+#   PORT    port for FastAPI and the tunnel target (default 8181)
+#   TMPDIR  directory for the two log files (default /tmp)
+#
+# Prereqs (already done by the agent on this machine):
+#   - .venv/  Python 3.9 venv with all deps installed
+#   - .local/bin/cloudflared  (macOS arm64, downloaded from GitHub releases)
+#   - models/rf_model.pkl  (217 MB, real ERA5-trained Random Forest)
+# ──────────────────────────────────────────────────────────────────────────
+set -euo pipefail
+PORT="${PORT:-8181}"
+ROOT="$(cd "$(dirname "$0")/.." && pwd)"
+LOG_DIR="${TMPDIR:-/tmp}"
+UVICORN_LOG="$LOG_DIR/mcx-uvicorn.log"
+TUNNEL_LOG="$LOG_DIR/mcx-tunnel.log"
+cd "$ROOT"
+# ── 1. Kill leftovers from a previous run ────────────────────────────────
+# pkill exits non-zero when nothing matched; that is the normal case here.
+pkill -f "uvicorn backend.main:app.*--port $PORT" 2>/dev/null || true
+pkill -f "cloudflared tunnel --url http://127.0.0.1:$PORT" 2>/dev/null || true
+sleep 1
+# ── 2. Start FastAPI in the background ───────────────────────────────────
+echo "▶ Starting FastAPI on http://127.0.0.1:$PORT …"
+env -u PYTHONPATH -u VIRTUAL_ENV -u PYTHONHOME \
+  ".venv/bin/python" -m uvicorn backend.main:app \
+  --host 127.0.0.1 --port "$PORT" \
+  > "$UVICORN_LOG" 2>&1 &
+UVICORN_PID=$!
+# Stop both background processes (if started) and report where the logs are.
+# Reads UVICORN_PID, CF_PID (may be unset), UVICORN_LOG and TUNNEL_LOG.
+cleanup() {
+  echo
+  echo "▶ Shutting down (uvicorn=$UVICORN_PID, cloudflared=${CF_PID:-n/a})…"
+  [[ -n "${CF_PID:-}" ]] && kill "$CF_PID" 2>/dev/null || true
+  kill "$UVICORN_PID" 2>/dev/null || true
+  wait 2>/dev/null || true
+  echo "✓ Stopped. Logs preserved at:"
+  echo "    $UVICORN_LOG"
+  echo "    $TUNNEL_LOG"
+}
+# Run cleanup exactly once, from the EXIT trap. INT/TERM only convert the
+# signal into an exit; trapping cleanup on them as well would run it twice
+# (once for the signal, once more on the exit that follows).
+trap cleanup EXIT
+trap 'exit 130' INT
+trap 'exit 143' TERM
+# ── 3. Wait for /api/health ──────────────────────────────────────────────
+printf "  waiting for ML model load "
+for _ in {1..40}; do
+  if curl -sf --max-time 1 --noproxy '*' "http://127.0.0.1:$PORT/api/health" >/dev/null 2>&1; then
+    echo " ✓"
+    break
+  fi
+  printf "."
+  sleep 1
+done
+# Re-probe once after the loop: this is what tells "became ready" apart from
+# "all 40 attempts used up".
+if ! curl -sf --max-time 1 --noproxy '*' "http://127.0.0.1:$PORT/api/health" >/dev/null 2>&1; then
+  echo
+  echo "❌ FastAPI did not become ready in 40 s. Last log lines:"
+  tail -20 "$UVICORN_LOG"
+  exit 1
+fi
+HEALTH=$(curl -s --noproxy '*' "http://127.0.0.1:$PORT/api/health")
+# Best-effort: show "?" if the response is not JSON or lacks "ml_loaded".
+ML_LOADED=$(echo "$HEALTH" | python3 -c 'import json,sys; print(json.load(sys.stdin)["ml_loaded"])' 2>/dev/null || echo "?")
+echo "  ML model loaded: $ML_LOADED   (response: ${HEALTH:0:80}…)"
+echo
+# ── 4. Start Cloudflare Quick Tunnel ─────────────────────────────────────
+echo "▶ Opening Cloudflare Quick Tunnel …"
+echo "  (your public URL will print below as 'https://*.trycloudflare.com')"
+echo "  ─────────────────────────────────────────────────────────────────"
+# Run cloudflared as a background job and block on it, so the user sees the
+# URL and can Ctrl-C. Its output goes through tee via process substitution
+# rather than a pipe: after `cloudflared … | tee … &`, $! would be tee's PID
+# and cleanup would never signal cloudflared itself.
+./.local/bin/cloudflared tunnel --url "http://127.0.0.1:$PORT" > >(tee "$TUNNEL_LOG") 2>&1 &
+CF_PID=$!
+wait "$CF_PID"