| # okto_version: "1.2"
|
| # Project header: the project identifier followed by a one-line human-readable summary.
| PROJECT "DeployAPIExample"
|
| DESCRIPTION "Demonstrates DEPLOY block for API deployment"
|
|
|
| # ENV: environment settings for this project - accelerator "gpu", min_memory "8GB",
| # precision "fp16".
| # NOTE(review): presumably min_memory is a minimum requirement checked before the run
| # and "8GB" refers to system or accelerator memory - confirm which against the spec.
| ENV {
|
| accelerator: "gpu"
|
| min_memory: "8GB"
|
| precision: "fp16"
|
| }
|
|
|
| # DATASET: points at a single JSONL file declared as format "jsonl" and type "chat".
| # Only a `train` entry is declared here; no validation or test split is listed.
| # NOTE(review): the path is relative - presumably resolved from the project root; confirm.
| DATASET {
|
| train: "examples/datasets/demo_train.jsonl"
|
| format: "jsonl"
|
| type: "chat"
|
| }
|
|
|
| # MODEL: names the model "api-deploy-model", built on base "oktoseek/base-mini",
| # with device "cuda" (the same device value the TRAIN block uses).
| MODEL {
|
| name: "api-deploy-model"
|
| base: "oktoseek/base-mini"
|
| device: "cuda"
|
| }
|
|
|
| # TRAIN: 5 epochs at batch size 32 on device "cuda".
| # No learning rate, optimizer, or checkpoint settings are given in this block.
| # NOTE(review): presumably engine defaults apply for anything omitted - confirm.
| TRAIN {
|
| epochs: 5
|
| batch_size: 32
|
| device: "cuda"
|
| }
|
|
|
| # EXPORT: lists two export formats, "onnx" and "okm", with output path "export/".
| # The DEPLOY block in this file sets format "onnx", which is one of the formats listed here.
| EXPORT {
|
| format: ["onnx", "okm"]
|
| path: "export/"
|
| }
|
|
|
| # DEPLOY: API deployment settings - target "api", host "0.0.0.0", port 9000,
| # endpoint "/chatbot", protocol "http", format "onnx".
| # `format: "onnx"` matches one of the formats listed in this file's EXPORT block.
| # NOTE(review): host "0.0.0.0" conventionally means "listen on all interfaces", and
| # protocol is plain "http" while requires_auth is true - confirm that TLS is terminated
| # in front of this service so credentials are not sent in clear text.
| # NOTE(review): max_concurrent_requests (100) is set here while SECURITY.rate_limit sets
| # max_requests_per_minute (60); how the two limits interact is not shown - verify.
| DEPLOY {
|
| target: "api"
|
| host: "0.0.0.0"
|
| endpoint: "/chatbot"
|
| requires_auth: true
|
| port: 9000
|
| max_concurrent_requests: 100
|
| protocol: "http"
|
| format: "onnx"
|
| }
|
|
|
| # SECURITY: four sub-blocks.
| #   input_validation  - max_length 500 plus a disallow_patterns list of four strings.
| #   output_validation - prevent_data_leak and mask_personal_info, both true.
| #   rate_limit        - max_requests_per_minute 60.
| #   encryption        - algorithm "AES-256".
| # NOTE(review): whether disallow_patterns entries are matched as literal substrings or as
| # regular expressions, and whether matching is case-sensitive, is not shown here - confirm.
| # Short entries such as "sudo" could also match ordinary chat text that merely mentions
| # the word.
| # NOTE(review): the unit of max_length (characters vs. tokens) is not stated - confirm.
| # NOTE(review): the encryption block names only an algorithm; what is encrypted and where
| # the key comes from are not specified in this file - verify against the spec.
| SECURITY {
|
| input_validation {
|
| max_length: 500
|
| disallow_patterns: [
|
| "<script>",
|
| "DROP TABLE",
|
| "rm -rf",
|
| "sudo"
|
| ]
|
| }
|
|
|
| output_validation {
|
| prevent_data_leak: true
|
| mask_personal_info: true
|
| }
|
|
|
| rate_limit {
|
| max_requests_per_minute: 60
|
| }
|
|
|
| encryption {
|
| algorithm: "AES-256"
|
| }
|
| }
|
|
|
| # BEHAVIOR: conversational settings - mode "chat", personality "assistant",
| # verbosity "medium", language "en", and a fallback message string.
| # NOTE(review): presumably `fallback` is the reply used when no other response can be
| # produced - confirm the exact trigger condition against the spec.
| BEHAVIOR {
|
| mode: "chat"
|
| personality: "assistant"
|
| verbosity: "medium"
|
| language: "en"
|
| fallback: "How can I help you?"
|
| }
|
|
|
|
|