Skip to content

Commit d48270f

Browse files
committed
examples(kubernetes): add nvidia example
Signed-off-by: Ettore Di Giacinto <[email protected]>
1 parent e5c6428 commit d48270f

File tree

1 file changed

+69
-0
lines changed

1 file changed

+69
-0
lines changed
Lines changed: 69 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,69 @@
---
# Namespace that groups the resources of this example; the claim, Deployment
# and Service in this file all set `namespace: local-ai`.
apiVersion: v1
kind: Namespace
metadata:
  name: local-ai
5+
---
# Storage claim referenced by the local-ai Deployment's `models-volume`
# (mounted in the container at /build/models).
apiVersion: v1
kind: PersistentVolumeClaim
metadata:
  namespace: local-ai
  name: models-pvc
spec:
  # No storageClassName is given, so provisioning depends on the cluster's
  # default StorageClass (if one is configured).
  resources:
    requests:
      storage: 50Gi
  # ReadWriteOnce: the volume can be mounted read-write by a single node.
  accessModes:
    - ReadWriteOnce
17+
---
# Single-replica Deployment that runs the local-ai container under the
# "nvidia" runtime class with one GPU and the models claim mounted.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: local-ai
  namespace: local-ai
  labels:
    app: local-ai
spec:
  replicas: 1
  # Recreate instead of the default RollingUpdate: a rolling update starts the
  # replacement pod before stopping the old one. Each pod needs a whole GPU
  # and the ReadWriteOnce models claim, so on a single-GPU cluster the new pod
  # would stay Pending and the rollout would never finish.
  strategy:
    type: Recreate
  selector:
    matchLabels:
      app: local-ai
  template:
    metadata:
      name: local-ai
      labels:
        # Must match spec.selector.matchLabels above (and the Service selector).
        app: local-ai
    spec:
      # Requires a RuntimeClass named "nvidia" to exist in the cluster.
      runtimeClassName: "nvidia"
      containers:
        - name: local-ai
          image: quay.io/go-skynet/local-ai:master-cublas-cuda12
          # NOTE(review): the tag looks like a moving branch build; with
          # IfNotPresent a node keeps using whatever copy it already cached.
          imagePullPolicy: IfNotPresent
          # Passed as the container's arguments; presumably the model to
          # load at startup - confirm against the image's entrypoint.
          args:
            - phi-2
          env:
            # Quoted on purpose: env values must be strings, not booleans.
            - name: DEBUG
              value: "true"
          resources:
            limits:
              # Extended resource; needs the NVIDIA device plugin on the node.
              nvidia.com/gpu: 1
          volumeMounts:
            - name: models-volume
              mountPath: /build/models
      volumes:
        - name: models-volume
          persistentVolumeClaim:
            claimName: models-pvc
56+
---
# Exposes the pods labelled `app: local-ai` on TCP port 8080.
apiVersion: v1
kind: Service
metadata:
  namespace: local-ai
  name: local-ai
spec:
  # NodePort with no explicit nodePort: the cluster allocates one from its
  # node-port range.
  type: NodePort
  selector:
    app: local-ai
  ports:
    - port: 8080
      targetPort: 8080
      protocol: TCP

0 commit comments

Comments
 (0)