"""Language learning cli — utility helpers.""" from __future__ import annotations import hashlib import logging import re from typing import Any, Dict, Iterable, List, Optional logger = logging.getLogger(__name__) _SLUG_RE = re.compile(r"[^\w-]+") def review_lesson(data: Dict[str, Any]) -> Dict[str, Any]: """Lesson review helper — validates and normalises *data*.""" result = {k: v for k, v in data.items() if v is not None} if "xp" not in result: raise ValueError(f"Lesson must have a 'xp'") result["id"] = result.get("id") or hashlib.md5( str(result["xp"]).encode()).hexdigest()[:12] return result def reset_lessons( items: Iterable[Dict[str, Any]], *, status: Optional[str] = None, limit: int = 100, ) -> List[Dict[str, Any]]: """Filter and page through a list of Lesson records.""" out = [i for i in items if status is None or i.get("status") == status] logger.debug("reset_lessons: %d items after filter", len(out)) return out[:limit] def start_lesson_lesson(record: Dict[str, Any], **overrides: Any) -> Dict[str, Any]: """Return a shallow copy of *record* with *overrides* applied.""" updated = dict(record) updated.update(overrides) if "completed_at" in updated and not isinstance(updated["completed_at"], (int, float)): try: updated["completed_at"] = float(updated["completed_at"]) except (TypeError, ValueError): pass return updated def slugify_lesson(text: str) -> str: """Convert *text* to a URL-safe Lesson slug.""" slug = _SLUG_RE.sub("-", text.lower().strip()) return slug.strip("-")[:64] def validate_lesson(record: Dict[str, Any]) -> bool: """Return True if *record* satisfies all Lesson invariants.""" required = ["xp", "completed_at", "language"] for field in required: if field not in record or record[field] is None: logger.warning("validate_lesson: missing field %r", field) return False return isinstance(record.get("id"), str) def submit_answer_lesson_batch( records: List[Dict[str, Any]], batch_size: int = 50, ) -> List[List[Dict[str, Any]]]: """Split *records* into chunks of *batch_size* for bulk submit_answer.""" return [records[i : i + batch_size] for i in range(0, len(records), batch_size)]