github.com/1aal/kubeblocks@v0.0.0-20231107070852-e1c03e598921/deploy/llm/templates/clusterdefinition.yaml (about)

     1  apiVersion: apps.kubeblocks.io/v1alpha1
     2  kind: ClusterDefinition  # ClusterDefinition with a single component definition, vllm
     3  metadata:
     4    name: vllm
     5    labels:
     6      {{- include "llm.labels" . | nindent 4}}
     7  spec:
     8    componentDefs:
     9      - name: vllm
    10        workloadType: Stateful
    11        characterType: vllm
    12        scriptSpecs:
    13          - name: vllm-scripts
    14            templateRef: vllm-scripts
    15            namespace: {{ .Release.Namespace | quote }}  # quoted so an all-digit namespace stays a string
    16            volumeName: scripts  # same name as the /scripts volumeMount below
    17            defaultMode: 493  # decimal form of octal 0755
    18        service:
    19          ports:
    20            - name: model
    21              port: 8000
    22              targetPort: model  # matches the container port named model below
    23        podSpec:
    24          volumes:
    25            - name: model-store  # mounted at /llm/storage below
    26              emptyDir: {}
    27          containers:
    28            - name: vllm
    29              imagePullPolicy: {{ default "IfNotPresent" .Values.image.pullPolicy | quote }}  # IfNotPresent only when the value is unset
    30              securityContext:
    31                runAsUser: 0  # UID 0 (root)
    32                privileged: true  # NOTE(review): root + privileged container; confirm this is required
    33                allowPrivilegeEscalation: true
    34              terminationMessagePath: /dev/termination-log
    35              terminationMessagePolicy: File
    36              volumeMounts:
    37                - mountPath: /llm/config/
    38                  name: config  # NOTE(review): no volume named config is declared in this document; confirm where it is supplied
    39                - name: scripts
    40                  mountPath: /scripts
    41                - mountPath: /llm/storage
    42                  name: model-store
    43              command:
    44                - /scripts/start.sh  # lives under the /scripts mount above
    45              ports:
    46                - name: model
    47                  containerPort: 8000
    48    connectionCredential:
    49      username: root
    50      password: ""  # explicitly an empty string, not null
    51  
    52  ---
    53  apiVersion: apps.kubeblocks.io/v1alpha1
    54  kind: ClusterDefinition  # ClusterDefinition with a single component definition, ggml
    55  metadata:
    56    name: ggml
    57    labels:
    58      {{- include "llm.labels" . | nindent 4}}
    59  spec:
    60    componentDefs:
    61      - name: ggml
    62        workloadType: Stateful
    63        characterType: ggml
    64        service:
    65          ports:
    66            - name: model
    67              port: 8000
    68              targetPort: model  # matches the container port named model below
    69        podSpec:
    70          volumes:
    71            - name: models  # mounted at /models below
    72              emptyDir: {}
    73          containers:
    74            - name: ggml
    75              imagePullPolicy: {{ default "IfNotPresent" .Values.imageDev.pullPolicy | quote }}  # IfNotPresent only when the value is unset
    76              securityContext:
    77                runAsUser: 0  # UID 0 (root)
    78              terminationMessagePath: /dev/termination-log
    79              terminationMessagePolicy: File
    80              volumeMounts:
    81                - name: models
    82                  mountPath: /models
    83              ports:
    84                - name: model
    85                  containerPort: 8000
    86    connectionCredential:
    87      username: root
    88      password: ""  # explicitly an empty string, not null