surrogate-1 / agents /role-knowledge-map.json
Ashira Pitchayapakayakul
feat: +800 LLM-expanded SDLC keywords across 10 roles
d6ecdbd
{
"version": "1.0",
"description": "Per-role SDLC knowledge map. Drives hf-dataset-discoverer.py search queries. Each role has CORE skills (must master) and ADJACENT skills (should know); some roles also have an EXPANDED list of LLM-expanded keywords. Source: real job descriptions from FAANG / unicorns / OSS projects 2024-2026.",
"roles": {
"solution-architect": {
"core": [
"system design",
"domain driven design",
"bounded context",
"aggregate root",
"hexagonal architecture",
"clean architecture",
"onion architecture",
"adr architecture decision record",
"trade-off analysis",
"scalability pattern",
"consistency model",
"cap theorem",
"saga pattern",
"event sourcing",
"cqrs",
"microservices",
"monolith first",
"integration pattern",
"anti-corruption layer",
"bff backend for frontend"
],
"adjacent": [
"threat modeling stride",
"data modeling",
"api design rest graphql",
"monitoring strategy",
"capacity planning",
"cost optimization",
"non-functional requirements",
"service level objectives"
],
"expanded": [
"adr architecture decision record",
"anti-corruption layer",
"apache cassandra nosql",
"apache kafka streaming",
"api design graphql",
"api design rest",
"aws cdk",
"aws cloudformation",
"aws iam",
"aws saa certification",
"azure active directory",
"azure cdk",
"azure resource manager",
"azure well-architected framework",
"bff backend for frontend",
"bounded context",
"cap theorem",
"capacity planning",
"chaos engineering",
"ci/cd pipeline",
"cka certification",
"clean architecture",
"cloud development kit",
"consistency model",
"container security",
"cost optimization",
"cqrs",
"data modeling",
"datadog monitoring",
"devsecops practices",
"distributed tracing",
"docker containerization",
"domain driven design",
"envoy proxy",
"event sourcing",
"gitops workflow",
"google cloud architecture",
"google cloud cdk",
"google cloud deployment manager",
"google cloud iam",
"grafana visualization",
"grpc framework",
"hashicorp vault",
"hexagonal architecture",
"integration pattern",
"iso 27001 standard",
"istio service mesh",
"jenkins automation",
"jwt tokenization",
"kubernetes deployment",
"kubernetes security",
"linkerd service mesh",
"microservices architecture",
"mongodb nosql",
"monitoring strategy",
"monolith first",
"new relic monitoring",
"non-functional requirements",
"oauth authentication",
"observability platform",
"onion architecture",
"openid connect",
"opentelemetry standard",
"pki infrastructure",
"postgresql database",
"prometheus monitoring",
"protocol buffers",
"pulumi infrastructure",
"saga pattern",
"saml federation",
"scalability pattern",
"serverless architecture",
"service level objectives",
"service mesh architecture",
"sre engineering",
"terraform infrastructure",
"terraform state management",
"threat modeling stride",
"trade-off analysis",
"zero trust security"
]
},
"backend-engineer": {
"core": [
"rest api design",
"graphql schema",
"grpc protobuf",
"postgresql",
"mysql",
"mongodb",
"redis cache",
"authentication oauth jwt",
"authorization rbac abac",
"message queue kafka rabbitmq",
"background jobs celery sidekiq",
"error handling exception",
"structured logging traceid",
"unit test integration test",
"fastapi flask express spring",
"go fiber gin",
"rust axum actix",
"node nestjs",
"kotlin ktor"
],
"adjacent": [
"frontend api consumption",
"ci cd pipeline",
"docker container",
"owasp top 10",
"performance profiling pprof",
"n+1 query",
"circuit breaker",
"rate limiting",
"idempotency"
],
"expanded": [
"abac attribute checks",
"actix web actors",
"akka actor model",
"ansible configuration management",
"apache kafka streams",
"auth0 customization",
"aws lambda functions",
"azure functions",
"cassandra data modeling",
"celery task scheduling",
"ci cd pipeline configuration",
"circuit breaker pattern",
"confluent schema registry",
"consul service discovery",
"datadog monitoring",
"django rest framework",
"docker container orchestration",
"dynamodb partition keys",
"elasticsearch full text search",
"elk stack logging",
"envoy proxy sidecar",
"exception handling strategy",
"express middleware stack",
"fastapi dependency injection",
"flask blueprints",
"fluentd log forwarding",
"frontend api consumption",
"gin gonic handlers",
"go fiber router",
"google cloud run",
"grafana dashboarding",
"graphql schema definition",
"grpc protobuf contracts",
"helm chart templating",
"idempotency key enforcement",
"integration test automation",
"istio service mesh",
"jaeger distributed tracing",
"jedis connection pooling",
"jwt token validation",
"kafka message streaming",
"keycloak identity brokering",
"kibana visualization",
"kubernetes deployment manifests",
"laravel sanctum",
"logstash filters",
"mongodb aggregation pipeline",
"mongodb change streams",
"mysql gtid replication",
"mysql replication setup",
"n+1 query detection",
"nginx ingress controller",
"node nestjs modules",
"oauth 2.0 implementation",
"okta integration",
"opentelemetry tracing",
"owasp top 10 compliance",
"performance profiling with pprof",
"phoenix framework channels",
"postgresql logical replication",
"postgresql query optimization",
"prometheus metrics collection",
"quarkus native image",
"rabbitmq exchange routing",
"rate limiting algorithms",
"rbac policy enforcement",
"redis cache invalidation",
"redisson java client",
"rest api design",
"ruby on rails api mode",
"rust axum extractors",
"sentry error tracking",
"sidekiq background processing",
"spring boot starters",
"spring security oauth2",
"structured logging with traceid",
"terraform infrastructure as code",
"unit test coverage",
"vault secrets management",
"vertx reactive programming"
]
},
"frontend-engineer": {
"core": [
"react hooks suspense",
"next.js app router",
"vue composition api",
"svelte sveltekit",
"solid solidstart",
"typescript strict",
"tailwind css",
"css-in-js styled-components",
"shadcn radix headless",
"state management zustand jotai redux",
"tanstack react query",
"react testing library",
"playwright cypress e2e",
"wcag accessibility aria",
"web vitals lcp cls inp",
"bundle optimization code splitting tree shaking"
],
"adjacent": [
"backend api integration",
"design system tokens",
"seo meta tags structured data",
"a/b testing experiment",
"analytics events",
"feature flag",
"i18n localization",
"progressive web app",
"service worker"
],
"expanded": [
"a/b testing experiment",
"accessibility guidelines wcag 2.2",
"analytics events tracking",
"api gateway integration",
"aria authoring practices",
"aws lambda functions",
"babel transpilation",
"backend api integration",
"bundle optimization code splitting",
"chrome devtools performance",
"cloudflare workers",
"containerization docker",
"css flexbox layout",
"css grid layout",
"css-in-js styled-components",
"cypress end-to-end testing",
"design system tokens",
"eslint code linting",
"feature flag management",
"firefox developer edition",
"google cloud functions",
"graphql api schema",
"grpc protocol buffers",
"headless chrome testing",
"i18n localization",
"javascript es2025",
"jest testing framework",
"jotai redux",
"jwt token authentication",
"kubernetes deployment",
"lighthouse performance metrics",
"microsoft azure functions",
"microsoft edge devtools",
"next.js app router",
"oauth authentication",
"openapi specification",
"playwright cypress e2e",
"preact compatibility",
"progressive web app",
"puppeteer automation",
"pwa manifest file",
"radix ui components",
"react concurrent mode",
"react hooks suspense",
"react server components",
"react testing library",
"remix run",
"restful api design",
"rollup bundle optimization",
"safari web inspector",
"seo meta tags",
"serverless architecture",
"service worker registration",
"shadcn radix headless",
"shadcn theme builder",
"solid solidstart",
"solidstart adapter",
"state management zustand",
"structured data schema",
"svelte 4 compiler",
"svelte sveltekit",
"sveltekit adapter",
"tailwind css",
"tailwind css v4",
"tanstack react query",
"tree shaking",
"typescript 5",
"typescript strict",
"vite development server",
"vue 3 composition",
"vue composition api",
"wai-aria specification",
"wcag accessibility aria",
"web vitals lcp cls inp",
"webassembly binary format",
"webpack 5 module federation",
"webpack configuration",
"webpagetest performance testing",
"webrtc peer-to-peer connection",
"websockets realtime communication"
]
},
"mobile-engineer": {
"core": [
"swiftui combine",
"uikit lifecycle",
"kotlin jetpack compose",
"android navigation",
"react native expo",
"flutter dart",
"offline first cache realm room",
"push notification fcm apns",
"deep linking universal",
"app store optimization aso",
"app review guidelines",
"crash reporting sentry crashlytics",
"memory profiling",
"battery optimization"
],
"adjacent": [
"backend api consumption",
"graphql apollo",
"analytics amplitude mixpanel",
"feature flag",
"accessibility voiceover talkback",
"in app purchase store kit billing"
],
"expanded": [
"accessibility voiceover",
"agile development methodology",
"amplitude cohorts",
"analytics amplitude mixpanel",
"android 13 updates",
"android jetpack",
"android navigation",
"apns integration",
"app clips integration",
"app review guidelines",
"app store optimization aso",
"apple app analytics",
"aws saa certification",
"azure developer associate",
"azure functions integration",
"backend api consumption",
"battery optimization techniques",
"behavior driven development bdd",
"billing android",
"bitrise automation",
"circleci pipeline",
"cka certified kubernetes administrator",
"clean architecture pattern",
"cloud functions firebase",
"code refactoring techniques",
"code review process",
"code coverage analysis",
"continuous deployment cd",
"continuous integration ci",
"core data storage",
"crash reporting sentry",
"crashlytics crash reporting",
"crashlytics integration",
"datadog integration",
"deep linking universal",
"design patterns repository",
"docker containerization",
"event driven architecture",
"expo sdk 46",
"feature flag management",
"firebase cloud messaging",
"flutter 3.0 features",
"flutter dart",
"git version control",
"github actions workflow",
"google cloud ace",
"google firebase analytics",
"graphql apollo client",
"in app purchase storekit",
"ios 16 features",
"ios swiftui 4",
"iso 27001 certification",
"jenkins pipeline",
"jetpack compose 1.3",
"kanban board",
"keychain services",
"kotlin 1.8 features",
"kotlin jetpack compose",
"kubernetes cluster management",
"memory profiling tools",
"microservices architecture",
"mixpanel funnels",
"mvp design pattern",
"mvvm architecture",
"new relic monitoring",
"offline first cache realm",
"pair programming technique",
"push notification fcm",
"react native 0.71",
"react native expo",
"room persistence library",
"scrum framework",
"sentry error tracking",
"serverless computing aws lambda",
"swift 5.7 updates",
"swiftui combine",
"talkback integration",
"test driven development tdd",
"uikit lifecycle",
"user defaults management"
]
},
"devops-engineer": {
"core": [
"github actions workflow",
"gitlab ci",
"jenkins pipeline",
"circleci",
"argocd flux gitops",
"docker multi-stage",
"buildkit buildx",
"kubernetes deployment service ingress",
"helm chart kustomize",
"terraform module",
"pulumi cdk",
"ansible chef puppet",
"configuration management",
"vault secrets sealed-secrets sops",
"blue green canary deployment",
"feature flag rollout"
],
"adjacent": [
"networking vpc subnet",
"security scanning trivy snyk",
"observability prometheus grafana",
"finops cost",
"container runtime containerd cri-o"
],
"expanded": [
"12 factor app methodology",
"ansible tower",
"api gateway management",
"argocd flux gitops",
"audit logging compliance",
"automated testing framework",
"aws codepipeline",
"aws saa certification",
"azure devops services",
"backstage service catalog",
"blue green deployment",
"buildkit buildx",
"canary release strategy",
"capacity planning strategy",
"chaos engineering principles",
"chef infra",
"ci cd pipeline automation",
"circleci orb",
"cka certification",
"ckad certification",
"cloud agnostic deployment",
"cloud cost management",
"cloud native applications",
"compliance as code",
"container orchestration",
"container runtime containerd",
"continuous deployment strategy",
"continuous integration pipeline",
"cost estimation tooling",
"cri-o kubernetes",
"devsecops methodology",
"distributed tracing system",
"docker multi-stage build",
"edge computing use cases",
"feature flag rollout",
"finops cost optimization",
"github actions workflow",
"gitlab ci cd",
"gitops tooling",
"google cloud build",
"grafana dashboards",
"helm chart kustomize",
"hybrid cloud architecture",
"infrastructure as code",
"iso 27001 compliance",
"jenkins pipeline",
"knative eventing",
"kubernetes deployment yaml",
"kubernetes operator pattern",
"kustomize overlay",
"load balancing strategy",
"logging mechanism",
"microservices architecture",
"monitoring alerting system",
"multi cloud strategy",
"networking vpc subnet",
"observability prometheus",
"openshift container platform",
"performance monitoring metrics",
"policy as code",
"pulumi cdk typescript",
"puppet forge",
"rancher kubernetes management",
"reliability engineering practices",
"resource optimization techniques",
"sealed secrets",
"security scanning trivy",
"serverless computing architecture",
"serverless functions",
"service discovery mechanism",
"service mesh istio",
"shift left security",
"site reliability engineering",
"skaffold development",
"snyk vulnerability",
"sops encryption",
"tanzu kubernetes grid",
"tekton pipelines",
"terraform module registry",
"vault secrets engine"
]
},
"sre-engineer": {
"core": [
"service level indicator sli",
"service level objective slo",
"error budget",
"burn rate alert",
"multi window alerting",
"prometheus metrics",
"grafana dashboard",
"loki promtail fluentd logging",
"opentelemetry tracing",
"incident response runbook",
"blameless postmortem",
"five whys root cause",
"chaos engineering chaos-mesh litmus",
"capacity planning",
"load testing k6 locust",
"on-call rotation pagerduty"
],
"adjacent": [
"kubernetes deep",
"linux performance ebpf",
"networking troubleshooting",
"security incident",
"cost optimization",
"disaster recovery"
],
"expanded": [
"ansible automation",
"aws saa certification",
"aws well-architected framework",
"azure well-architected framework",
"backpressure management",
"blameless postmortem",
"bulkhead pattern",
"burn rate alerting",
"calico networking",
"capacity planning",
"chaos engineering",
"chaos-mesh",
"cilium networking",
"circuit breaker pattern",
"cka certification",
"ckad certification",
"cloud native computing",
"cloudevents specification",
"cncf certification",
"continuous deployment",
"continuous integration",
"continuous monitoring",
"cost optimization",
"dapr framework",
"devops practices",
"disaster recovery planning",
"distributed tracing",
"docker containerization",
"ebpf optimization",
"error budget management",
"event-driven architecture",
"five whys analysis",
"fluentd",
"gitops workflow",
"google cloud architecture",
"grafana dashboard",
"grpc protocol",
"horizontal pod autoscaling",
"http/2 protocol",
"incident response runbook",
"infrastructure as code",
"iso 20000 certification",
"iso 27001 compliance",
"istio service mesh",
"itil certification",
"k6 performance",
"knative platform",
"kubernetes autoscaling",
"kubernetes cluster management",
"kubernetes deployment",
"kubernetes networking",
"linkerd service mesh",
"linux kernel tuning",
"linux performance",
"litmus testing",
"load testing",
"locust testing",
"loki logging",
"microservices architecture",
"multi-window alerting",
"networking fundamentals",
"networking troubleshooting",
"on-call rotation",
"opentelemetry sdk",
"opentelemetry tracing",
"opentracing standard",
"pagerduty integration",
"prometheus metrics",
"promtail",
"quic protocol",
"security incident response",
"serverless computing",
"service level indicator",
"service level objective",
"sli monitoring",
"slo tracking",
"sre principles",
"tcp/ip protocol",
"terraform management",
"vertical pod autoscaling"
]
},
"cloud-engineer": {
"core": [
"aws ec2 s3 lambda dynamodb rds vpc iam",
"gcp gce gcs cloud-run firestore bigquery",
"azure aks cosmos blob",
"aws well-architected framework",
"multi-region active active passive",
"disaster recovery rpo rto",
"cost optimization spot reserved savings-plan",
"tagging strategy cost allocation",
"private subnet nat gateway vpc endpoint",
"iam policy least privilege",
"kms encryption"
],
"adjacent": [
"kubernetes eks gke aks",
"service mesh istio linkerd",
"compliance soc2 hipaa pci",
"cdn cloudfront cloudflare",
"edge computing lambda-edge"
],
"expanded": [
"aks policy addon",
"aks virtual node",
"ansible aws ssm",
"argo cd gitops",
"aurora serverless v2",
"aws config rules",
"aws control tower",
"aws dynamodb global tables",
"aws ec2 auto scaling",
"aws iam role chaining",
"aws kms envelope encryption",
"aws lambda cold start",
"aws rds multi az",
"aws s3 lifecycle policies",
"aws savings plans",
"aws security hub",
"aws vpc flow logs",
"aws well-architected review",
"azure aks node pools",
"azure blob immutable storage",
"azure cosmos db graph api",
"azure monitor insights",
"azure security center",
"cdn cache invalidation",
"chaos engineering gremlin",
"cloudflare zero trust",
"cloudformation drift detection",
"cloudtrail log integrity",
"compliance soc2 type ii",
"cost optimization reserved instances",
"datadog distributed tracing",
"disaster recovery runbook",
"documentdb change streams",
"edge computing iot edge",
"eks add ons",
"eks fargate profiles",
"elk stack ingestion",
"fluxcd helm operator",
"gcp audit logging",
"gcp bigquery slot commitments",
"gcp cloud run jobs",
"gcp firestore native mode",
"gcp folder hierarchy",
"gcp gce preemptible vms",
"gcp gcs signed urls",
"gcp security command center",
"github actions aws oidc",
"gitlab ci gcp auth",
"gke autopilot clusters",
"gke hub config sync",
"grafana mimir",
"hipaa eligible services",
"iam policy conditions",
"istio canary releases",
"istio traffic mirroring",
"kafka event streaming",
"kinesis data streams",
"kms key rotation",
"kubernetes cluster autoscaler",
"lambda edge viewer request",
"linkerd tap cli",
"memcached replication group",
"multi region active active",
"nat gateway failover",
"new relic apm",
"opensearch kibana dashboards",
"opensearch serverless",
"pci dss aws",
"private subnet egress",
"prometheus cloudwatch exporter",
"pub sub schema registry",
"pulumi aws provider",
"redis elasticache cluster",
"rpo rto metrics",
"sentry error tracking",
"service mesh sidecar injection",
"splunk hec",
"tagging strategy aws",
"terraform modules registry",
"vpc endpoint policies"
]
},
"devsecops-engineer": {
"core": [
"sast semgrep codeql bandit",
"dast zap burp",
"sca trivy grype snyk dependabot",
"secret scanning gitleaks trufflehog",
"container image scan trivy clair",
"sbom syft cyclonedx spdx",
"sigstore cosign attestation",
"slsa supply chain framework",
"opa rego conftest policy as code",
"shift left security",
"vulnerability management cvss epss kev"
],
"adjacent": [
"incident response forensics",
"compliance automation",
"threat intelligence mitre att&ck",
"zero trust mtls service mesh"
],
"expanded": [
"12 factor app",
"api security",
"policy as code shift left",
"att&ck zero trust",
"attestation slsa",
"aws iam",
"aws saa certified",
"azure ad",
"azure devops",
"burp suite",
"calico typha",
"ci cd pipeline",
"cilium hubble",
"cis benchmarks",
"cka certified",
"cloud native",
"cmmc level 3",
"cncf certified",
"codeql bandit",
"compliance automation",
"conftest policy",
"container image scan",
"cvss epss",
"cwe sans top 25",
"cyclonedx spdx",
"dast zap",
"dependabot github",
"devsecops framework",
"docker kubernetes",
"ebpf cilium",
"fedramp moderate",
"fluxcd kustomize",
"gcp iam",
"gitops argocd",
"google cloud",
"google workspace",
"grype snyk",
"incident response forensics",
"iso 27001 compliant",
"istio envoy",
"jira service desk",
"jwt json web token",
"kev cve",
"kubeflow tfx",
"kubernetes dashboard",
"linkerd buoyant",
"microsoft 365",
"mitre att&ck v10",
"mtls mutual auth",
"mtls service mesh",
"network policy",
"newman postman",
"nist cybersecurity",
"nist sp 800",
"oauth 2.0",
"opa rego",
"openid connect",
"owasp top 10",
"pci dss v3",
"prometheus grafana",
"saml 2.0",
"sast semgrep",
"sbom syft",
"sca trivy",
"scim 2.0",
"secret scanning gitleaks",
"security vulnerability management",
"service mesh istio",
"sigstore cosign",
"skaffold ko",
"slack ms teams",
"spinnaker armada",
"supply chain framework",
"tekton pipeline",
"terraform aws",
"threat intelligence mitre",
"tokenization encryption",
"trivy clair",
"trufflehog twilio",
"x509 certificates"
]
},
"cloud-security": {
"core": [
"cspm prowler scoutsuite steampipe",
"cis benchmark aws azure gcp",
"iam audit access analyzer",
"least privilege",
"encryption at rest in transit kms",
"envelope encryption",
"key rotation",
"waf shield guardduty",
"compliance pci-dss hipaa soc2 fedramp gdpr iso27001",
"siem splunk elastic security qradar",
"cloud detection response cdr",
"incident response cloud trail"
],
"adjacent": [
"network security firewall nsg",
"application security owasp",
"threat detection lateral movement",
"data loss prevention dlp"
],
"expanded": [
"access analyzer",
"ansible",
"application security",
"aws lambda security",
"aws saa",
"aws secrets manager",
"aws well-architected framework",
"azure functions security",
"azure key vault",
"azure security center",
"azure security engineer associate",
"casb",
"cdr",
"cis benchmark",
"cka",
"cloud access security broker",
"cloud detection response",
"cloud security gateway",
"cloud security posture management",
"cloudformation",
"cloudtrail",
"compliance as code",
"container security",
"cspm",
"data loss prevention",
"dlp",
"docker security",
"elastic security",
"encryption at rest",
"encryption in transit",
"envelope encryption",
"extended detection response",
"fedramp",
"firewall",
"gcp cloud functions security",
"gcp professional cloud security engineer",
"gcp security command center",
"gdpr",
"google cloud secret manager",
"guardduty",
"hashicorp vault",
"hipaa",
"iam",
"incident response",
"infrastructure as code",
"iso 27001",
"iso 27017",
"iso 27018",
"key rotation",
"kms",
"kubernetes security",
"lateral movement",
"least privilege",
"managed detection response",
"mdr",
"mitre att&ck",
"network security",
"nist cybersecurity framework",
"nsg",
"owasp",
"pci-dss",
"prowler",
"qradar",
"sase",
"scoutsuite",
"secret management",
"secure access service edge",
"security orchestration automation response",
"serverless security",
"shield",
"siem",
"soar",
"soc2",
"splunk",
"steampipe",
"terraform",
"threat detection",
"waf",
"xdr",
"zero trust architecture"
]
},
"data-engineer": {
"core": [
"airflow dag",
"dagster prefect",
"spark pyspark",
"flink streaming",
"kafka connect schema registry",
"delta lake iceberg hudi",
"lakehouse",
"snowflake bigquery redshift",
"dbt model test snapshot",
"schema evolution avro protobuf",
"great expectations dbt-tests data quality",
"openlineage data lineage",
"cdc debezium"
],
"adjacent": [
"ml pipeline kubeflow tfx",
"observability for data datadog metaflow",
"cost optimization warehouse"
],
"expanded": [
"airflow dag design",
"apache beam pipeline",
"apache flink sql",
"apache spark sql",
"avro data serialization",
"aws cloudformation template",
"aws saa certification",
"azure resource manager",
"batch processing workflow",
"bigquery data analytics",
"cdc debezium integration",
"change data capture",
"cka certified kubernetes",
"cloud-native design pattern",
"containerization using docker",
"cost optimization strategy",
"dagster prefect workflow",
"data anonymization technique",
"data architecture framework",
"data architecture pattern",
"data catalog management",
"data cataloging standard",
"data certification standard",
"data discovery protocol",
"data discovery tool",
"data encryption algorithm",
"data engineering framework",
"data engineering methodology",
"data governance framework",
"data integration pattern",
"data lakehouse implementation",
"data lineage analysis",
"data loading strategy",
"data masking method",
"data pipeline monitoring",
"data quality assurance",
"data quality metric",
"data replication technique",
"data roadmap creation",
"data strategy development",
"data technology stack",
"data transformation workflow",
"data validation rule",
"data versioning system",
"data warehouse optimization",
"datadog monitoring tool",
"dbt model development",
"dbt test automation",
"dbt-tests data validation",
"delta lake storage",
"event-driven architecture pattern",
"flink streaming architecture",
"gcp cloud deployment manager",
"great expectations testing",
"hudi data lake",
"iceberg table format",
"iso 27001 compliance",
"java data engineering",
"kafka connect schema",
"kubeflow workflow management",
"kubernetes cluster management",
"lakehouse architecture pattern",
"metaflow workflow automation",
"microservices architecture style",
"ml pipeline development",
"openlineage data lineage",
"protobuf data format",
"python data engineering",
"real-time data processing",
"redshift data engineering",
"scala data engineering",
"schema evolution management",
"serverless computing model",
"snapshot testing strategy",
"snowflake data warehousing",
"spark pyspark optimization",
"stream processing architecture",
"terraform infrastructure provisioning",
"tfx pipeline orchestration",
"warehouse cost management"
]
},
"ml-engineer": {
"core": [
"pytorch lightning",
"huggingface transformers",
"lora qlora peft fine-tuning",
"unsloth axolotl",
"deepspeed fsdp accelerate",
"vllm tgi triton inference",
"model serving",
"mlflow weights and biases",
"feature store feast tecton",
"data version control dvc",
"rag retrieval augmented generation",
"vector database faiss chroma weaviate qdrant",
"embedding nomic bge instructor",
"reranker cross-encoder bge mxbai",
"evaluation lm-eval-harness",
"prompt engineering chain of thought"
],
"adjacent": [
"devops kubernetes",
"data engineering",
"statistics distribution",
"rlhf dpo orpo preference learning",
"agent framework langgraph crew autogen"
]
},
"database-engineer": {
"core": [
"postgresql tuning",
"mysql innodb",
"explain analyze query plan",
"btree gin gist hash index",
"partial index expression index",
"table partition list range hash",
"vacuum autovacuum bloat",
"replication streaming logical",
"connection pool pgbouncer",
"schema migration sqitch flyway alembic liquibase",
"online ddl pt-online-schema-change",
"backup pitr point-in-time recovery"
],
"adjacent": [
"redis caching pattern",
"timescaledb timeseries",
"clickhouse olap",
"graph neo4j",
"search elasticsearch opensearch"
]
},
"qa-engineer": {
"core": [
"test pyramid",
"unit test mock stub",
"integration test database",
"playwright cypress webdriver e2e",
"rest assured supertest api test",
"property based testing fast-check hypothesis",
"fuzzing afl libfuzzer",
"mutation testing pitest stryker",
"snapshot test storybook",
"contract testing pact",
"test factory fixture builder pattern",
"coverage line branch path"
],
"adjacent": [
"ci cd pipeline test stage",
"performance testing k6 jmeter",
"security testing zap",
"accessibility testing axe pa11y",
"visual regression chromatic"
]
},
"performance-engineer": {
"core": [
"profiling pprof py-spy async-profiler",
"load testing k6 locust gatling",
"stress testing",
"soak test",
"p50 p95 p99 latency",
"throughput rps",
"flame graph",
"n+1 query elimination",
"caching l1 l2 cdn",
"connection pool sizing",
"async io goroutine coroutine",
"memory profiling heap allocation",
"garbage collection tuning"
],
"adjacent": [
"observability tracing",
"database tuning",
"kernel ebpf bpftrace",
"network latency rtt"
]
},
"tech-writer": {
"core": [
"diataxis framework tutorial how-to reference explanation",
"openapi swagger redoc",
"api design google api guidelines",
"readme structure",
"adr template",
"runbook structure",
"code documentation jsdoc rustdoc",
"tutorial step by step",
"style guide google microsoft chicago"
],
"adjacent": [
"code reading comprehension",
"user research empathy",
"i18n internationalization",
"screencast tutorial recording"
]
},
"platform-engineer": {
"core": [
"internal developer platform idp",
"backstage developer portal",
"golden path opinionated workflow",
"service catalog",
"shared ci cd template",
"observability infrastructure",
"secrets distribution",
"feature flag platform",
"multi-tenancy"
],
"adjacent": [
"all sre devops topics",
"developer experience dx",
"documentation platform"
]
},
"ai-agent-engineer": {
"core": [
"react agent reasoning acting",
"tool calling function calling",
"mcp model context protocol",
"agent orchestration langgraph crew autogen",
"agentic workflow",
"multi agent collaboration",
"self critique reflexion",
"voyager skill library",
"memory episodic procedural",
"rag retrieval augmented",
"vector search embedding rerank",
"prompt engineering xml structured",
"constitutional ai safety"
],
"adjacent": [
"all backend topics",
"ml engineering fine-tuning",
"evaluation benchmark swe-bench",
"cost optimization token budget"
]
}
},
"cross_cutting_topics": [
"system design interview",
"high scalability",
"distributed system consensus raft paxos",
"consistency strong eventual causal",
"caching strategy ttl invalidation",
"rate limiting algorithm token bucket leaky",
"load balancer round robin least connection",
"circuit breaker hystrix resilience4j",
"12 factor app",
"twelve factor",
"domain language ubiquitous",
"code review checklist",
"git workflow gitflow trunk-based",
"semver conventional commits",
"testing best practice",
"logging structured json",
"tracing opentelemetry w3c",
"metrics red use sli",
"observability three pillars",
"incident severity sev1 sev2",
"blameless culture",
"engineering excellence dora metrics"
]
}