adithya9903's picture
Deploy PolyGuard HF training Space
fd0c71a verified
"""Placeholder hetero graph encoder."""
from __future__ import annotations
import numpy as np
from app.knowledge.ddi_knowledge import top_risky_pairs
from app.knowledge.drug_catalog import DRUG_CLASSES
from app.knowledge.side_effect_ontology import SIDE_EFFECT_TAGS
def encode_regimen(drugs: list[str], dim: int = 24) -> np.ndarray:
vec = np.zeros(dim, dtype=float)
ordered = sorted(drugs)
for idx, drug in enumerate(ordered[:12]):
vec[idx] = (hash(drug) % 1000) / 1000.0
class_counts: dict[str, int] = {}
for drug in ordered:
cls = DRUG_CLASSES.get(drug, "unknown")
class_counts[cls] = class_counts.get(cls, 0) + 1
class_values = sorted(class_counts.values(), reverse=True)
for i, value in enumerate(class_values[:5], start=12):
vec[i] = min(1.0, value / 4.0)
side_effect_count = sum(len(SIDE_EFFECT_TAGS.get(drug, [])) for drug in ordered)
vec[17] = min(1.0, side_effect_count / 20.0)
vec[18] = min(1.0, len(ordered) / 12.0)
vec[19] = min(1.0, len(top_risky_pairs(ordered)) / 4.0)
vec[20] = float(any("sedative" == DRUG_CLASSES.get(drug) for drug in ordered))
vec[21] = float(any("anticoagulant" == DRUG_CLASSES.get(drug) for drug in ordered))
vec[22] = float(any("glucose_lowering" == DRUG_CLASSES.get(drug) for drug in ordered))
vec[23] = min(1.0, sum(ord(ch) for ch in "".join(ordered)) % 1000 / 1000.0)
return vec