"""Placeholder hetero graph encoder.""" from __future__ import annotations import numpy as np from app.knowledge.ddi_knowledge import top_risky_pairs from app.knowledge.drug_catalog import DRUG_CLASSES from app.knowledge.side_effect_ontology import SIDE_EFFECT_TAGS def encode_regimen(drugs: list[str], dim: int = 24) -> np.ndarray: vec = np.zeros(dim, dtype=float) ordered = sorted(drugs) for idx, drug in enumerate(ordered[:12]): vec[idx] = (hash(drug) % 1000) / 1000.0 class_counts: dict[str, int] = {} for drug in ordered: cls = DRUG_CLASSES.get(drug, "unknown") class_counts[cls] = class_counts.get(cls, 0) + 1 class_values = sorted(class_counts.values(), reverse=True) for i, value in enumerate(class_values[:5], start=12): vec[i] = min(1.0, value / 4.0) side_effect_count = sum(len(SIDE_EFFECT_TAGS.get(drug, [])) for drug in ordered) vec[17] = min(1.0, side_effect_count / 20.0) vec[18] = min(1.0, len(ordered) / 12.0) vec[19] = min(1.0, len(top_risky_pairs(ordered)) / 4.0) vec[20] = float(any("sedative" == DRUG_CLASSES.get(drug) for drug in ordered)) vec[21] = float(any("anticoagulant" == DRUG_CLASSES.get(drug) for drug in ordered)) vec[22] = float(any("glucose_lowering" == DRUG_CLASSES.get(drug) for drug in ordered)) vec[23] = min(1.0, sum(ord(ch) for ch in "".join(ordered)) % 1000 / 1000.0) return vec