{{- /*
Cluster manifest template for the llm-cluster chart
(deploy/llm-cluster/templates/cluster.yaml).

All "kblib.*" named templates are defined outside this file. The
component-level includes are piped through "indent 6", so component fields
sit at column 6, list items at column 4 and the top-level keys of this file
at column 2. "kblib.clusterCommon" is therefore presumed to end inside an
open mapping (likely "spec:") -- TODO confirm against the kblib library chart.

.Values.cpuMode selects the serving engine:
  truthy -> clusterDefinition and component "ggml"; resources are rendered
            by "kblib.componentResources".
  falsy  -> clusterDefinition and component "vllm"; .Values.gpu is written
            as both the nvidia.com/gpu limit and request.

The if/else/end actions are left-trimmed so they do not leave whitespace-only
lines in the rendered manifest.
*/ -}}
{{- include "kblib.clusterCommon" . }}
  {{- if .Values.cpuMode }}
  clusterDefinitionRef: ggml  # ref clusterDefinition.name
  componentSpecs:
    - name: ggml
      componentDefRef: ggml  # ref clusterDefinition componentDefs.name
      {{- include "kblib.componentMonitor" . | indent 6 }}
      replicas: {{ .Values.replicas }}
      serviceAccountName: {{ include "kblib.serviceAccountName" . }}
      {{- include "kblib.componentResources" . | indent 6 }}
  {{- else }}
  clusterDefinitionRef: vllm  # ref clusterDefinition.name
  componentSpecs:
    - name: vllm
      componentDefRef: vllm  # ref clusterDefinition componentDefs.name
      {{- include "kblib.componentMonitor" . | indent 6 }}
      replicas: {{ .Values.replicas }}
      serviceAccountName: {{ include "kblib.serviceAccountName" . }}
      resources:
        limits:
          nvidia.com/gpu: {{ .Values.gpu }}
        requests:
          nvidia.com/gpu: {{ .Values.gpu }}
  {{- end }}