# Diff summary: 1 file changed, 69 additions (+69) and 0 deletions (-0).
---
# Namespace that holds every other resource declared in this manifest.
apiVersion: v1
kind: Namespace
metadata:
  name: local-ai
---
# Claim for 50Gi of storage; the local-ai Deployment mounts it by the
# claim name `models-pvc`.
apiVersion: v1
kind: PersistentVolumeClaim
metadata:
  name: models-pvc
  namespace: local-ai
spec:
  # No storageClassName is set, so the cluster's default StorageClass
  # (if any) is used.
  accessModes:
    - ReadWriteOnce
  resources:
    requests:
      storage: 50Gi
---
# Single-replica Deployment that runs the local-ai container with one
# NVIDIA GPU and the models-pvc claim mounted at /build/models.
apiVersion: apps/v1
kind: Deployment
metadata:
  name: local-ai
  namespace: local-ai
  labels:
    app: local-ai
spec:
  selector:
    matchLabels:
      app: local-ai
  replicas: 1
  # NOTE(review): no `strategy` is set, so the default RollingUpdate
  # applies. The pod holds a ReadWriteOnce volume and a whole GPU, so a
  # replacement pod may be unable to start while the old one is running;
  # consider `strategy: {type: Recreate}` - confirm against the cluster.
  template:
    metadata:
      labels:
        app: local-ai
      # NOTE(review): nesting was reconstructed from a flattened source;
      # `name` is taken to be metadata.name, not a label - confirm.
      name: local-ai
    spec:
      # Must match the name of a RuntimeClass object exactly, so the
      # value carries no surrounding whitespace.
      runtimeClassName: "nvidia"
      containers:
        - args:
            # Passed to the image entrypoint; presumably the model to
            # load at start-up - confirm against the image docs.
            - phi-2
          env:
            - name: DEBUG
              # Env values must be strings, hence the quotes.
              value: "true"
          name: local-ai
          # NOTE(review): `master-...` looks like a moving tag; with
          # IfNotPresent a node that already has the image cached will
          # not pull a newer build. Consider pinning a version or digest.
          image: quay.io/go-skynet/local-ai:master-cublas-cuda12
          imagePullPolicy: IfNotPresent
          resources:
            limits:
              nvidia.com/gpu: 1
          volumeMounts:
            - name: models-volume
              mountPath: /build/models
      volumes:
        - name: models-volume
          persistentVolumeClaim:
            claimName: models-pvc
---
# NodePort Service that forwards TCP 8080 to port 8080 on pods labelled
# `app: local-ai`.
apiVersion: v1
kind: Service
metadata:
  name: local-ai
  namespace: local-ai
spec:
  selector:
    app: local-ai
  type: NodePort
  ports:
    # No `nodePort` is given, so Kubernetes allocates one from the
    # cluster's node-port range.
    - protocol: TCP
      targetPort: 8080
      port: 8080
# Page footer (not part of the manifest): "You can't perform that action
# at this time." - 0 commit comments.