# okto_version: "1.2"

# Test 5: Flan-T5 with INFERENCE, BEHAVIOR and GUARD
# Model: google/flan-t5-base
# Goal: test inference with behavior control

# Project identifier followed by a human-readable description of this test.
PROJECT "test_flan_t5_inference"
DESCRIPTION "Teste Flan-T5 com INFERENCE, BEHAVIOR e GUARD"

# Execution environment: GPU accelerator, 8GB minimum memory, fp16 precision,
# and the "oktoseek" backend.
# install_missing is enabled — presumably lets the runtime install missing
# dependencies automatically; confirm against the OktoScript reference.
# NOTE(review): T5-family checkpoints are reported to overflow (NaN loss)
# under fp16 in some frameworks; confirm fp16 is numerically stable for the
# base model used in this file on this backend.
ENV {
  accelerator: "gpu"
  min_memory: "8GB"
  precision: "fp16"
  backend: "oktoseek"
  install_missing: true
}

# Dataset locations: separate JSONL files for the training and validation
# splits. The relative paths are presumably resolved from the project root —
# TODO confirm.
DATASET {
  train: "dataset/train.jsonl"
  validation: "dataset/val.jsonl"
}

# Base model for this test: the google/flan-t5-base checkpoint.
# device is "auto", i.e. no device is pinned explicitly here.
MODEL {
  base: "google/flan-t5-base"
  device: "auto"
}

# Training hyperparameters: 3 epochs, batch size 16, learning rate 1e-4.
# device is "auto", the same value the MODEL block uses.
TRAIN {
  epochs: 3
  batch_size: 16
  learning_rate: 0.0001
  device: "auto"
}

# Behavior profile for the assistant: chat mode, friendly personality, medium
# verbosity, Brazilian Portuguese (pt-BR) as the response language.
# avoid lists the topics to stay away from; fallback is a pt-BR default reply
# (presumably used when no suitable answer is produced — TODO confirm).
# prompt_style is the prompt template, with {input} as the placeholder for the
# user's text; it is the same template string as INFERENCE.format.
BEHAVIOR {
  mode: "chat"
  personality: "friendly"
  verbosity: "medium"
  language: "pt-BR"
  avoid: ["violence", "hate", "politics"]
  fallback: "Como posso ajudar?"
  prompt_style: "User: {input}\nAssistant:"
}

# Safety guard configuration.
# prevent: the four violation categories to block (hallucination, toxicity,
#   bias, data_leak).
# detect_using: the detection mechanisms named for this guard (classifier,
#   regex, rule_engine).
# on_violation: REPLACE the output with a fixed pt-BR refusal message.
GUARD {
  prevent {
    hallucination
    toxicity
    bias
    data_leak
  }
  detect_using: ["classifier", "regex", "rule_engine"]
  on_violation {
    REPLACE with_message: "Desculpe, essa solicitação não é permitida."
  }
}

# Inference session settings.
# mode / format: chat mode using the same "User: {input}\nAssistant:" template
#   as BEHAVIOR.prompt_style; exit_command is the text "/exit".
# params: generation settings (max_length 120, temperature 0.7, top_p 0.9,
#   2 beams, sampling enabled).
#   NOTE(review): beams > 1 together with do_sample: true — if the backend
#   forwards these to a Hugging Face-style generate(), this selects
#   beam-search sampling rather than plain nucleus sampling; confirm intended.
# CONTROL: two runtime rules —
#   confidence below 0.3  -> RETRY, then log a message;
#   repetition above 3    -> REGENERATE, then log a message.
#   How "confidence" and "repetition" are measured is not shown in this file.
INFERENCE {
  mode: "chat"
  format: "User: {input}\nAssistant:"
  exit_command: "/exit"
  params {
    max_length: 120
    temperature: 0.7
    top_p: 0.9
    beams: 2
    do_sample: true
  }
  CONTROL {
    IF confidence < 0.3 {
      RETRY
      LOG "Low confidence - retrying"
    }
    
    IF repetition > 3 {
      REGENERATE
      LOG "High repetition detected - regenerating"
    }
  }
}

# Monitoring: the metrics to track (loss, val_loss, accuracy, confidence) and
# the log file they are written to.
MONITOR {
  metrics: ["loss", "val_loss", "accuracy", "confidence"]
  log_to: "logs/inference_test.log"
}

# Export settings: a single output format ("okm") written under "export/".
EXPORT {
  format: ["okm"]
  path: "export/"
}