-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathdeployment.yaml
More file actions
84 lines (84 loc) · 2.02 KB
/
deployment.yaml
File metadata and controls
84 lines (84 loc) · 2.02 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
---
# Deployment for the diagnoai service: a single replica of one container that
# listens on port 8000, is configured from a ConfigMap plus a Secret, and
# mounts two PersistentVolumeClaim-backed volumes under /app/data.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: diagnoai
  namespace: diagnoai
  labels:
    app: diagnoai
spec:
  # NOTE(review): no `strategy` is set, so the Deployment default
  # (RollingUpdate) applies. If the PVCs referenced below are ReadWriteOnce
  # (their definitions are not visible here), a surge pod may be unable to
  # attach them during a rollout -- confirm, or consider `type: Recreate`.
  replicas: 1
  selector:
    # Must stay in sync with the pod template labels below.
    matchLabels:
      app: diagnoai
  template:
    metadata:
      labels:
        app: diagnoai
    spec:
      containers:
        - name: diagnoai
          # NOTE(review): `latest` is a mutable tag; together with
          # `imagePullPolicy: Always` each container start pulls whatever
          # the tag currently points at. Consider pinning a version/digest.
          image: bhupencod3/diagnoai:latest
          imagePullPolicy: Always
          ports:
            - containerPort: 8000
          # Every key in the diagnoai-config ConfigMap becomes an env var.
          envFrom:
            - configMapRef:
                name: diagnoai-config
          # API credentials are read from the diagnoai-secrets Secret rather
          # than being stored in this manifest.
          env:
            - name: OPENAI_API_KEY
              valueFrom:
                secretKeyRef:
                  name: diagnoai-secrets
                  key: openai-api-key
            - name: HF_TOKEN
              valueFrom:
                secretKeyRef:
                  name: diagnoai-secrets
                  key: hf-token
            - name: GROK_API_KEY
              valueFrom:
                secretKeyRef:
                  name: diagnoai-secrets
                  key: grok-api-key
            - name: REPLICATE_API_TOKEN
              valueFrom:
                secretKeyRef:
                  name: diagnoai-secrets
                  key: replicate-api-token
          resources:
            requests:
              memory: "4Gi"
              cpu: "1000m"
            limits:
              memory: "6Gi"
              cpu: "2000m"
          # Startup budget: failureThreshold x periodSeconds = 30 x 10 s,
          # i.e. up to 300 s before the container is restarted. Liveness and
          # readiness probes are held off until this probe succeeds.
          startupProbe:
            httpGet:
              path: /health
              port: 8000
            failureThreshold: 30
            periodSeconds: 10
          # Restarts the container when /health stops answering.
          livenessProbe:
            httpGet:
              path: /health
              port: 8000
            initialDelaySeconds: 60
            periodSeconds: 10
          # Gates Service traffic on /ready (a separate endpoint from /health).
          readinessProbe:
            httpGet:
              path: /ready
              port: 8000
            initialDelaySeconds: 30
            periodSeconds: 5
          # The vector-store mount is nested inside the /app/data mount, so
          # /app/data/vector_store is served by its own claim.
          volumeMounts:
            - name: vector-store-volume
              mountPath: /app/data/vector_store
            - name: data-volume
              mountPath: /app/data
      volumes:
        - name: vector-store-volume
          persistentVolumeClaim:
            claimName: vector-store-pvc
        - name: data-volume
          persistentVolumeClaim:
            claimName: data-pvc