"""
Personal Career Agent — LoRA SFT Training Script
Base: Qwen/Qwen2.5-1.5B-Instruct  |  Method: TRL SFTTrainer + LoRA

Run:
    pip install transformers trl datasets peft torch trackio
    python train.py

Requires: GPU with ≥16GB VRAM (T4 works at batch 2 + grad accum 4 + LoRA)
"""
import json, random
from datasets import load_dataset, Dataset, concatenate_datasets
from transformers import AutoTokenizer
from trl import SFTTrainer, SFTConfig
from peft import LoraConfig, TaskType

# Hugging Face Hub identifiers used by this script: the base checkpoint to
# fine-tune, the repo the trained model is pushed to, and the repo the
# assembled dataset is pushed to.
MODEL_ID = "Qwen/Qwen2.5-1.5B-Instruct"
OUTPUT_HUB = "Builder-Neekhil/career-agent-v1"
DATASET_HUB = "Builder-Neekhil/career-agent-dataset-v1"

# System prompt placed at the start of every training conversation.
# Written one sentence per entry; the sentences are joined by single spaces.
CAREER_SYSTEM = " ".join((
    "You are a seasoned career advising expert with 15 years of experience "
    "helping professionals navigate their careers.",
    "You excel at: reviewing and tailoring resumes, assessing job fit, "
    "generating interview questions, suggesting career paths, and optimizing "
    "for ATS keywords.",
    "Be specific, honest, actionable, and concise.",
    "When appropriate, provide structured JSON outputs.",
))

# ── DATA BUILDERS ─────────────────────────────────────────────────────

def build_resume_job_fit():
    """Build chat-format resume/job fit-assessment examples.

    Loads the ``train`` split of ``cnamuangtoun/resume-job-description-fit``
    and turns every row into a system/user/assistant conversation. The user
    turn contains the resume, the job description and a description of the
    expected JSON schema; the assistant turn is a pretty-printed JSON object.

    The gold label is deliberately kept out of the user turn: embedding it in
    the prompt would let the model copy the answer instead of learning to
    assess the fit.

    Only ``fit_assessment`` and ``score`` depend on the row's label; the
    ``strengths``, ``gaps`` and ``suggestions`` lists are fixed placeholder
    text shared by every example.

    Returns:
        Dataset: one row per source example, with a single ``messages`` column.
    """
    ds = load_dataset("cnamuangtoun/resume-job-description-fit", split="train")

    # NOTE(review): every label outside this set is collapsed to "No Fit"
    # (score 25). If the dataset has an intermediate class such as
    # "Potential Fit", confirm that this collapse is intended.
    positive_labels = {"Fit", "Good Fit", "Good"}

    # The task description is identical for every row, so build it once.
    task = (
        "Task: Assess how well this resume matches the job. Return a JSON with fields: "
        "'fit_assessment' ('Good Fit' or 'No Fit'), 'score' (0-100), 'strengths' (list), 'gaps' (list), "
        "'suggestions' (list of concrete improvements)."
    )

    out = []
    for ex in ds:
        resume, job = ex["resume_text"].strip(), ex["job_description_text"].strip()
        fit = "Good Fit" if ex["label"] in positive_labels else "No Fit"
        score = 75 if fit == "Good Fit" else 25
        prompt = f"Resume:\n{resume}\n\nJob Description:\n{job}\n\n{task}"
        answer = json.dumps({
            "fit_assessment": fit, "score": score,
            "strengths": ["Relevant experience present"],
            "gaps": ["Tailor keywords to job description"],
            "suggestions": ["Add measurable achievements", "Mirror JD language in skills section"]
        }, indent=2)
        out.append({"messages": [
            {"role": "system", "content": CAREER_SYSTEM},
            {"role": "user", "content": prompt},
            {"role": "assistant", "content": answer}
        ]})
    return Dataset.from_list(out)


def build_resume_review():
    """Build three templated coaching conversations for every resume.

    Reads the ``train`` split of ``opensporks/resumes`` and, for each row,
    emits (in this order) a resume-review example, an interview-question
    example and a career-path example. The assistant replies are fixed
    templates; only the ``Category`` value is substituted into them, and the
    stripped ``Resume_str`` text is appended to each user turn.

    Returns:
        Dataset: three rows per source resume, with a single ``messages``
        column.
    """
    def as_chat(question, reply):
        # One system/user/assistant conversation in the chat "messages" layout.
        return {"messages": [
            {"role": "system", "content": CAREER_SYSTEM},
            {"role": "user", "content": question},
            {"role": "assistant", "content": reply},
        ]}

    rows = []
    for record in load_dataset("opensporks/resumes", split="train"):
        text = record["Resume_str"].strip()
        category = record["Category"]

        review_reply = (
            f"## Resume Review Feedback ({category})\n\n"
            "**Strengths:**\n"
            "- Clear professional summary\n"
            "- Relevant work experience listed\n\n"
            "**Improvements:**\n"
            "1. Add quantifiable achievements (metrics, percentages)\n"
            "2. Tailor skills section to target roles\n"
            "3. Use active voice and strong action verbs\n"
            "4. Remove outdated or irrelevant experience\n\n"
            "**ATS Optimization:** Include keywords from job descriptions you're targeting."
        )
        interview_reply = (
            f"## Top 5 Interview Questions for {category} Role\n\n"
            "1. Walk me through your most impactful project and the measurable results.\n"
            "2. How do you handle conflicting priorities in a fast-paced environment?\n"
            "3. Describe a time you identified a process improvement and implemented it.\n"
            f"4. What tools and methodologies do you use to stay current in {category}?\n"
            "5. How do you collaborate with cross-functional teams to deliver outcomes?\n\n"
            "**Tip:** Use the STAR method (Situation, Task, Action, Result) for behavioral questions."
        )
        path_reply = (
            f"## Suggested Career Path from {category}\n\n"
            f"1. **Senior {category} Specialist** – deepen expertise, lead small projects\n"
            f"2. **{category} Manager / Team Lead** – transition to people leadership\n"
            "3. **Cross-functional Consultant** – leverage domain knowledge across teams\n"
            "4. **Product / Strategy** – pivot to business-facing roles\n"
            f"5. **Entrepreneurship / Freelance** – independent consulting in {category}\n\n"
            "**Next Action:** Identify which path aligns with your values and seek a mentor already in that role."
        )

        rows.extend([
            as_chat(
                f"Please review my resume and give me actionable feedback:\n\n{text}",
                review_reply,
            ),
            as_chat(
                f"Based on this {category} resume, generate 5 interview questions I should prepare for.\n\n{text}",
                interview_reply,
            ),
            as_chat(
                f"Given my background in {category}, what are 3-5 next career steps?\n\n{text}",
                path_reply,
            ),
        ])
    return Dataset.from_list(rows)


def build_resume_json():
    """Build resume-to-JSON parsing conversations.

    Reads the ``train`` split of ``sandeeppanem/resume-json-extraction-5k``
    and emits one conversation per row: a fixed user instruction followed by
    the row's ``text`` field, verbatim, as the assistant reply.

    NOTE(review): the user turn never includes the resume being parsed, and
    the whole ``text`` column is used as the target. Presumably ``text`` holds
    more than just the JSON answer (or the resume belongs in the prompt) —
    verify against the dataset schema before training on these rows.

    Returns:
        Dataset: one row per source example, with a single ``messages`` column.
    """
    records = load_dataset("sandeeppanem/resume-json-extraction-5k", split="train")
    conversations = [
        {"messages": [
            {"role": "system", "content": CAREER_SYSTEM},
            {"role": "user", "content": "Parse this resume into structured JSON."},
            {"role": "assistant", "content": record["text"]},
        ]}
        for record in records
    ]
    return Dataset.from_list(conversations)


def build_synthetic_coaching(n=600, seed=42):
    """Build ``n`` coaching conversations sampled from a fixed set of topics.

    Each example is drawn uniformly, with replacement, from five hand-written
    question/answer pairs, so for ``n`` > 5 the result necessarily contains
    exact duplicates.

    Args:
        n: Number of conversations to generate.
        seed: Seed for a private random generator, making the sample
            reproducible from run to run. Pass ``None`` to draw from the
            module-level ``random`` generator instead (the previous,
            non-reproducible behaviour).

    Returns:
        Dataset: ``n`` rows with a single ``messages`` column.
    """
    topics = [
        ("salary negotiation",
         "I'm about to negotiate my salary for a new offer. What strategies should I use?",
         "## Salary Negotiation Strategy\n\n1. **Research:** Know market rate for your role/location (Glassdoor, Levels.fyi)\n"
         "2. **Anchor high:** State a number 10-15% above your target\n"
         "3. **Total comp:** Consider base + bonus + equity + benefits\n"
         "4. **Leverage:** Have competing offers or clear business case\n"
         "5. **Practice:** Rehearse the conversation out loud\n\n"
         "**Script starter:** 'I'm excited about this role. Based on my research and the value I bring, I was expecting a base of $X. Is there flexibility?'"),
        ("career pivot",
         "I want to pivot from marketing to data science. What's my roadmap?",
         "## Career Pivot Roadmap: Marketing → Data Science\n\n"
         "**Phase 1 (0-3 mo):** Learn Python + pandas + SQL via online courses\n"
         "**Phase 2 (3-6 mo):** Build 3 portfolio projects with real datasets; blog your process\n"
         "**Phase 3 (6-9 mo):** Freelance / intern to get real experience on your resume\n"
         "**Phase 4 (9-12 mo):** Apply to hybrid roles (marketing analytics) as bridge\n\n"
         "**Leverage your marketing background:** A/B testing, customer segmentation, and ROI analysis are highly transferable."),
        ("networking",
         "How do I effectively network on LinkedIn without being awkward?",
         "## LinkedIn Networking Guide\n\n"
         "1. **Personalize every invite:** Mention a specific post, project, or shared interest\n"
         "2. **Give before asking:** Share their content, offer insight, or make an introduction\n"
         "3. **Follow up:** After connecting, send a brief thank-you + one thoughtful question\n"
         "4. **Consistency:** Comment on 3-5 posts weekly; post your own insights monthly\n"
         "5. **Informational calls:** Request 15-min chats; prepare 3 smart questions\n\n"
         "**Template:** 'Hi [Name], I enjoyed your post on X. I'm exploring Y and would love to learn from your experience. Would you be open to a brief chat?'"),
        ("resume gap",
         "I have a 2-year employment gap. How do I address it on my resume and in interviews?",
         "## Addressing Employment Gaps\n\n"
         "**On Resume:**\n- Use a functional or hybrid format emphasizing skills over chronology\n"
         "- Include any freelance, volunteer, or learning activities during the gap\n"
         "- Omit months if the gap is <2 years; list only years\n\n"
         "**In Interviews:**\n- Be honest but brief: 'I took time to care for family / upskill / relocate'\n"
         "- Pivot quickly to what you did: courses, certifications, side projects\n"
         "- Emphasize readiness: 'I'm energized and fully committed to returning at full capacity'\n\n"
         "**Mindset:** Gaps are common. How you frame them matters more than the gap itself."),
        ("promotion",
         "What should I do in the next 6 months to position myself for a promotion?",
         "## Promotion Strategy (6-Month Plan)\n\n"
         "**Month 1-2: Visibility**\n- Document your wins in a 'brag document' (metrics, impact, testimonials)\n"
         "- Volunteer for high-visibility projects aligned with company priorities\n\n"
         "**Month 3-4: Skill Gaps**\n- Identify the competencies of the next level; close 2-3 gaps\n"
         "- Seek cross-functional exposure\n\n"
         "**Month 5: Feedback Loop**\n- Request formal feedback from your manager and peers\n"
         "- Ask explicitly: 'What would it take for me to be ready for [next level]?'\n\n"
         "**Month 6: The Ask**\n- Present your documented impact, align with company goals, and make the request\n\n"
         "**Key Principle:** Promotions happen when you already perform at the next level."),
    ]

    # A private generator keeps the sample reproducible without reseeding the
    # process-wide RNG; with seed=None fall back to the shared module RNG.
    rng = random if seed is None else random.Random(seed)

    out = []
    for _ in range(n):
        # The first tuple element is only a human-readable topic label.
        _label, question, reply = rng.choice(topics)
        out.append({"messages": [
            {"role": "system", "content": CAREER_SYSTEM},
            {"role": "user", "content": question},
            {"role": "assistant", "content": reply}
        ]})
    return Dataset.from_list(out)


# ── MAIN ───────────────────────────────────────────────────────────────
def main():
    """Build the training set, publish it, then run LoRA SFT and push the model.

    Steps, in order: build the four component datasets, concatenate and
    shuffle them with a fixed seed, push the combined dataset to
    ``DATASET_HUB``, fine-tune ``MODEL_ID`` with LoRA via ``SFTTrainer``, and
    push the result to ``OUTPUT_HUB``.
    """
    # Imported here because torch is only needed to probe mixed-precision
    # support; the rest of the file does not use it directly.
    import torch

    print("Building datasets...")
    ds1 = build_resume_job_fit()
    ds2 = build_resume_review()
    ds3 = build_resume_json()
    ds4 = build_synthetic_coaching()

    full = concatenate_datasets([ds1, ds2, ds3, ds4]).shuffle(seed=42)
    print(f"Total examples: {len(full)}  (fit={len(ds1)}, review={len(ds2)}, json={len(ds3)}, synth={len(ds4)})")

    # Publishes the assembled dataset PUBLICLY (private=False) on every run;
    # comment this out to skip the upload.
    full.push_to_hub(DATASET_HUB, private=False)
    print(f"Dataset pushed to https://huggingface.co/datasets/{DATASET_HUB}")

    tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
    if tokenizer.pad_token is None:
        tokenizer.pad_token = tokenizer.eos_token

    peft_config = LoraConfig(
        r=16, lora_alpha=32, lora_dropout=0.05, bias="none",
        task_type=TaskType.CAUSAL_LM,
        target_modules=["q_proj", "k_proj", "v_proj", "o_proj", "gate_proj", "up_proj", "down_proj"],
    )

    # Requesting bf16 on a GPU without bf16 support makes the training
    # arguments fail validation, so probe the device and fall back to fp16.
    has_cuda = torch.cuda.is_available()
    use_bf16 = has_cuda and torch.cuda.is_bf16_supported()
    use_fp16 = has_cuda and not use_bf16

    # NOTE(review): assistant_only_loss relies on the tokenizer's chat template
    # producing assistant-token masks; confirm the template of MODEL_ID
    # supports this with the installed TRL version.
    args = SFTConfig(
        output_dir="./career-agent-output",
        hub_model_id=OUTPUT_HUB,
        push_to_hub=True,
        num_train_epochs=3,
        per_device_train_batch_size=2,
        gradient_accumulation_steps=4,
        learning_rate=2e-4,
        lr_scheduler_type="cosine",
        warmup_ratio=0.03,
        logging_steps=10,
        logging_first_step=True,
        save_steps=200,
        save_total_limit=2,
        max_length=2048,
        bf16=use_bf16,
        fp16=use_fp16,
        gradient_checkpointing=True,
        assistant_only_loss=True,
        remove_unused_columns=False,
        report_to=["trackio"],
    )

    # `processing_class` is the current SFTTrainer keyword for the tokenizer;
    # TRL releases that accept `max_length` / `assistant_only_loss` in
    # SFTConfig no longer take the legacy `tokenizer=` keyword.
    trainer = SFTTrainer(
        model=MODEL_ID,
        processing_class=tokenizer,
        train_dataset=full,
        args=args,
        peft_config=peft_config,
    )

    print("Training started...")
    trainer.train()
    trainer.save_model()
    trainer.push_to_hub()
    print(f"Done! Model at https://huggingface.co/{OUTPUT_HUB}")


if __name__ == "__main__":
    main()