raazkumar committed on
Commit
838f982
·
verified ·
1 Parent(s): 33a1ae7

Upload production/helm/ml-intern/values.yaml

Browse files
Files changed (1) hide show
  1. production/helm/ml-intern/values.yaml +161 -0
production/helm/ml-intern/values.yaml ADDED
@@ -0,0 +1,161 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
# Static replica counts, keyed by component name (api, worker).
# NOTE(review): autoscaling.enabled is true further down in this file; whether
# the api count is still honoured in that case depends on the templates —
# confirm.
replicaCount: {api: 2, worker: 2}
# Container image coordinates.
image:
  repository: ml-intern
  # NOTE(review): IfNotPresent combined with the mutable "latest" tag means a
  # node that already has the image cached will not re-pull it, so replicas
  # can end up on different builds. Pin an immutable tag or digest for
  # releases.
  pullPolicy: IfNotPresent
  tag: latest
# Registry pull secrets and release-name overrides; all empty by default.
imagePullSecrets: []
nameOverride: ''
fullnameOverride: ''
# Service account settings.
serviceAccount:
  create: true
  annotations: {}
  # Left empty; presumably the templates derive a name when this is blank —
  # confirm against the chart helpers.
  name: ''
# Pod annotations in the prometheus.io/* scrape-hint convention.
# Annotation values must be strings, so "true" and "8000" stay quoted.
podAnnotations:
  prometheus.io/scrape: 'true'
  prometheus.io/port: '8000'
  prometheus.io/path: /metrics
# Pod-level security context: group ID applied to mounted volumes.
podSecurityContext: {fsGroup: 1000}
# Container-level security context: non-root UID 1000, every Linux capability
# dropped, read-only root filesystem, no privilege escalation.
# Nesting reconstructed from the Kubernetes SecurityContext schema: "drop"
# belongs to "capabilities"; the remaining keys are siblings of it.
securityContext:
  runAsNonRoot: true
  runAsUser: 1000
  capabilities:
    drop: [ALL]
  readOnlyRootFilesystem: true
  allowPrivilegeEscalation: false
# Service exposure: cluster-internal only, on port 8000 (the same number used
# by config.port and the prometheus.io/port annotation in this file).
service: {type: ClusterIP, port: 8000}
# Ingress settings; disabled by default.
ingress:
  enabled: false
  className: "nginx"
  annotations:
    # ingress-nginx defines no "rate-limit" or "rate-limit-window" annotation,
    # so the previous pair ("100" per "1m") was silently ignored. "limit-rpm"
    # is the supported per-client-IP requests-per-minute limit and expresses
    # the same intent.
    # Assumes the community ingress-nginx controller, which owns the
    # nginx.ingress.kubernetes.io/ annotation prefix — confirm.
    nginx.ingress.kubernetes.io/limit-rpm: "100"
  hosts:
    - host: ml-intern.local
      paths:
        - path: /
          pathType: Prefix
  tls: []
# CPU / memory requests and limits, keyed by component name (api, worker).
resources:
  api:
    requests: {cpu: 250m, memory: 512Mi}
    limits: {cpu: 2000m, memory: 2Gi}
  worker:
    requests: {cpu: 100m, memory: 256Mi}
    limits: {cpu: 1000m, memory: 1Gi}
# Autoscaling settings. Only an "api" entry is defined; there is no matching
# "worker" entry in this file.
# Key names follow HorizontalPodAutoscaler terminology; how the templates map
# them onto an HPA object is not visible here — confirm.
autoscaling:
  enabled: true
  api:
    # Replica bounds.
    minReplicas: 2
    maxReplicas: 20
    # Utilization targets, in percent.
    targetCPUUtilizationPercentage: 70
    targetMemoryUtilizationPercentage: 80
    # Stabilization windows, in seconds.
    scaleUpStabilizationWindowSeconds: 60
    scaleDownStabilizationWindowSeconds: 300
# Scheduling constraints; both empty by default.
nodeSelector: {}
tolerations: []
# Affinity rules, keyed by component name; only "api" is defined.
# Soft (preferred, weight 100) anti-affinity: avoid placing a pod on a node
# (topologyKey kubernetes.io/hostname) that already runs a pod labelled
# app.kubernetes.io/name=ml-intern.
# NOTE(review): the selector matches on the name label alone; if worker pods
# carry the same label they count towards the rule too — confirm against the
# chart's label helpers.
affinity:
  api:
    podAntiAffinity:
      preferredDuringSchedulingIgnoredDuringExecution:
        - weight: 100
          podAffinityTerm:
            topologyKey: kubernetes.io/hostname
            labelSelector:
              matchExpressions:
                - key: app.kubernetes.io/name
                  operator: In
                  values: [ml-intern]
# Application runtime settings.
# Units are only stated where the key name carries them (cacheTtlSeconds,
# budgetUsdPerSession); requestTimeout and recoveryTimeout are presumably
# seconds — confirm against the application.
config:
  port: 8000
  workers: 4
  maxConcurrentRequests: 200
  defaultRpmLimit: 40
  requestTimeout: 120
  cacheTtlSeconds: 300
  budgetUsdPerSession: 10.0
  circuitBreaker: {failureThreshold: 5, recoveryTimeout: 60}
  # Reconstructed as a direct child of "config" rather than of
  # "circuitBreaker" (the original indentation was lost) — confirm.
  logLevel: INFO
# Credential placeholders, all empty by default. Supply real values at install
# time (for example from a private values file) instead of committing them.
secrets:
  hfToken: ''
  anthropicApiKey: ''
  openaiApiKey: ''
  groqApiKey: ''
  nvidiaApiKey: ''
# Redis settings; presumably forwarded to a bundled Redis sub-chart — confirm
# against Chart.yaml.
redis:
  enabled: true
  architecture: standalone
  # NOTE(review): authentication is switched off, so any workload that can
  # reach the Redis service can read and write it. Confirm this is intended
  # outside of local development.
  auth: {enabled: false}
  master:
    persistence: {enabled: true, size: 5Gi}
    # Reconstructed as a child of "master" (the original indentation was
    # lost) — confirm.
    resources:
      requests: {memory: 256Mi, cpu: 100m}
      limits: {memory: 1Gi, cpu: 500m}
# PostgreSQL settings; presumably forwarded to a bundled PostgreSQL sub-chart
# — confirm against Chart.yaml.
postgresql:
  enabled: true
  auth:
    username: ml_intern
    # NOTE(review): the password is committed in plain text and equals the
    # username. Override it at install time or source it from a Secret before
    # any non-local deployment.
    password: ml_intern
    database: ml_intern
  primary:
    persistence: {enabled: true, size: 10Gi}
    # Reconstructed as a child of "primary" (the original indentation was
    # lost) — confirm.
    resources:
      requests: {memory: 256Mi, cpu: 100m}
      limits: {memory: 1Gi, cpu: 500m}
# Observability stack toggles (Prometheus, Grafana, Jaeger).
monitoring:
  enabled: true
  prometheus:
    enabled: true
    retention: 30d
  grafana:
    enabled: true
    # NOTE(review): well-known default credential committed in plain text;
    # override it before exposing Grafana beyond local use.
    adminPassword: admin
  jaeger:
    enabled: true