# okto_version: "1.2"
# Test 5: Flan-T5 with INFERENCE and BEHAVIOR
# Model: google/flan-t5-base
# Objective: Test inference with behavior control

PROJECT "test_flan_t5_inference"
DESCRIPTION "Teste Flan-T5 com INFERENCE, BEHAVIOR e GUARD"

# Execution environment settings requested for this run.
ENV {
    accelerator: "gpu"
    min_memory: "8GB"
    precision: "fp16"
    backend: "oktoseek"
    install_missing: true
}

# Training and validation data files (paths as written; presumably resolved
# relative to the project root - confirm against the runner).
DATASET {
    train: "dataset/train.jsonl"
    validation: "dataset/val.jsonl"
}

# Base model to load.
MODEL {
    base: "google/flan-t5-base"
    device: "auto"
}

# Training hyperparameters.
TRAIN {
    epochs: 3
    batch_size: 16
    learning_rate: 0.0001
    device: "auto"
}

# Conversational behavior settings: persona, response language, topics to
# avoid, fallback reply, and the prompt template.
BEHAVIOR {
    mode: "chat"
    personality: "friendly"
    verbosity: "medium"
    language: "pt-BR"
    avoid: ["violence", "hate", "politics"]
    fallback: "Como posso ajudar?"
    # Same template string as INFERENCE.format below; keep the two in sync.
    prompt_style: "User: {input}\nAssistant:"
}

# Output guard: categories to prevent, detection methods, and the action
# taken on a violation.
GUARD {
    prevent {
        hallucination
        toxicity
        bias
        data_leak
    }
    detect_using: ["classifier", "regex", "rule_engine"]
    on_violation {
        REPLACE with_message: "Desculpe, essa solicitação não é permitida."
    }
}

# Interactive inference settings.
INFERENCE {
    mode: "chat"
    format: "User: {input}\nAssistant:"
    exit_command: "/exit"

    # Generation parameters.
    # NOTE(review): beams: 2 is combined with do_sample: true - confirm the
    # backend supports sampling together with beam search.
    params {
        max_length: 120
        temperature: 0.7
        top_p: 0.9
        beams: 2
        do_sample: true
    }

    # Conditional rules evaluated on the confidence and repetition values.
    CONTROL {
        IF confidence < 0.3 {
            RETRY
            LOG "Low confidence - retrying"
        }
        IF repetition > 3 {
            REGENERATE
            LOG "High repetition detected - regenerating"
        }
    }
}

# Metrics to track and the log file they are written to.
MONITOR {
    metrics: ["loss", "val_loss", "accuracy", "confidence"]
    log_to: "logs/inference_test.log"
}

# Export formats and output directory.
EXPORT {
    format: ["okm"]
    path: "export/"
}