# Source: github.com/1aal/kubeblocks@v0.0.0-20231107070852-e1c03e598921/deploy/llm/templates/clusterdefinition.yaml
#
# Helm template that renders two KubeBlocks ClusterDefinition objects:
#   * vllm - one stateful component started through /scripts/start.sh
#   * ggml - one stateful component with an emptyDir mounted at /models
# Both components expose a single port named "model" on 8000.
apiVersion: apps.kubeblocks.io/v1alpha1
kind: ClusterDefinition
metadata:
  name: vllm
  labels:
    {{- include "llm.labels" . | nindent 4 }}
spec:
  componentDefs:
    - name: vllm
      workloadType: Stateful
      characterType: vllm
      scriptSpecs:
        - name: vllm-scripts
          templateRef: vllm-scripts
          # Quoted so that an all-digit or boolean-looking namespace is still
          # parsed as a string.
          namespace: {{ .Release.Namespace | quote }}
          volumeName: scripts
          # 493 decimal == 0755 octal (rwxr-xr-x).
          defaultMode: 493
      service:
        ports:
          - name: model
            port: 8000
            targetPort: model
      podSpec:
        volumes:
          - name: model-store
            emptyDir: {}
        containers:
          - name: vllm
            # Sprig's `default` takes the fallback FIRST and the value to test
            # SECOND. The arguments were previously reversed, which made the
            # literal "IfNotPresent" the tested value, so the chart's
            # image.pullPolicy setting was never honoured.
            imagePullPolicy: {{ default "IfNotPresent" .Values.image.pullPolicy }}
            # NOTE(review): runs as root in privileged mode; presumably needed
            # for device access - confirm this is required.
            securityContext:
              runAsUser: 0
              privileged: true
              allowPrivilegeEscalation: true
            terminationMessagePath: /dev/termination-log
            terminationMessagePolicy: File
            volumeMounts:
              # NOTE(review): no volume named "config" is declared in this
              # file; presumably it is supplied elsewhere - confirm.
              - mountPath: /llm/config/
                name: config
              # Matches scriptSpecs[].volumeName above; presumably the volume
              # itself is created from that script spec - confirm.
              - name: scripts
                mountPath: /scripts
              - mountPath: /llm/storage
                name: model-store
            command:
              - /scripts/start.sh
            ports:
              - name: model
                containerPort: 8000
  connectionCredential:
    username: root
    password: ""

---
apiVersion: apps.kubeblocks.io/v1alpha1
kind: ClusterDefinition
metadata:
  name: ggml
  labels:
    {{- include "llm.labels" . | nindent 4 }}
spec:
  componentDefs:
    - name: ggml
      workloadType: Stateful
      characterType: ggml
      service:
        ports:
          - name: model
            port: 8000
            targetPort: model
      podSpec:
        volumes:
          - name: models
            emptyDir: {}
        containers:
          - name: ggml
            # Fallback first, value second (see Sprig `default`); the reversed
            # order used before always rendered "IfNotPresent" and ignored
            # imageDev.pullPolicy.
            imagePullPolicy: {{ default "IfNotPresent" .Values.imageDev.pullPolicy }}
            securityContext:
              runAsUser: 0
            terminationMessagePath: /dev/termination-log
            terminationMessagePolicy: File
            volumeMounts:
              - name: models
                mountPath: /models
            ports:
              - name: model
                containerPort: 8000
  connectionCredential:
    username: root
    password: ""