k8s.io/test-infra@v0.0.0-20240520184403-27c6b4c223d8/config/jobs/kubernetes/sig-cloud-provider/gcp/gpu/gpu-gce.yaml

k8s.io/test-infra@v0.0.0-20240520184403-27c6b4c223d8/config/jobs/kubernetes/sig-cloud-provider/gcp/gpu/gpu-gce.yaml (about)

     1  presets:  # Label-keyed bundles of environment variables.
     2  - labels:
     3      preset-ci-gce-device-plugin-gpu: "true"  # Same label is set on the ci-kubernetes-e2e-gce-device-plugin-gpu periodic in this file.
     4    env:
     5    - name: NODE_ACCELERATORS
     6      value: type=nvidia-tesla-t4,count=2  # Accelerator type and count; NOTE(review): presumably applied per node - confirm.
     7    - name: NODE_SIZE
     8      value: n1-standard-2
     9  - labels:
    10      preset-ci-gce-device-plugin-gpu-nvidia-t4: "true"  # No job visible in this listing sets this label; NOTE(review): presumably used by jobs defined elsewhere - confirm.
    11    env:
    12    - name: NODE_ACCELERATORS
    13      value: type=nvidia-tesla-t4,count=2  # Identical to the value in the first preset.
    14    - name: NODE_SIZE
    15      value: n1-standard-2  # Identical to the value in the first preset.
    16  
    17  periodics:  # Jobs triggered on a cron schedule.
    18  - name: ci-kubernetes-e2e-gce-device-plugin-gpu  # GPU device-plugin e2e job; see the description annotation for what it runs.
    19    cluster: k8s-infra-prow-build
    20    cron: "30 1-23/2 * * *"  # Minute 30 of every second hour from 01 through 23.
    21    labels:
    22      preset-service-account: "true"
    23      preset-k8s-ssh: "true"
    24      preset-ci-gce-device-plugin-gpu: "true"  # Matches the first entry under presets in this file.
    25    annotations:
    26      fork-per-release: "true"
    27      fork-per-release-replacements: "--extract=ci/fast/latest-fast -> --extract=ci/latest-{{.Version}}"
    28      fork-per-release-cron: 0 0-23/2 * * *, 0 3-23/6 * * *, 0 8-23/12 * * *, 0 8-23/24 * * *, 0 14-23/24 * * *
    29      testgrid-dashboards: sig-release-master-blocking, google-gce
    30      testgrid-tab-name: gce-device-plugin-gpu-master
    31      testgrid-alert-email: gke-kubernetes-accelerators-bugs@google.com
    32      description: "Uses kubetest to run e2e tests (+Feature:GPUDevicePlugin) against a cluster created with cluster/kube-up.sh"
    33      testgrid-num-failures-to-alert: '6'
    34      testgrid-alert-stale-results-hours: '24'
    35    decorate: true
    36    decoration_config:
    37      timeout: 300m  # Larger than the 180m passed via --timeout in args below.
    38    spec:
    39      containers:
    40      - command:
    41        - runner.sh
    42        - /workspace/scenarios/kubernetes_e2e.py
    43        args:
    44        - --check-leaked-resources
    45        - --extract=ci/fast/latest-fast  # This string is the left-hand side of fork-per-release-replacements above.
    46        - --extract-ci-bucket=k8s-release-dev
    47        # Note: The GCE node image used may depend on the nvidia-driver-installer image defined in https://github.com/kubernetes/kubernetes/blob/master/test/e2e/testing-manifests/scheduling/nvidia-driver-installer.yaml
    48        # If updating the image defined here, the cos-gpu-installer image may need to be updated to support the corresponding COS image.
    49        - --env=KUBE_GCE_NODE_IMAGE=cos-109-17800-147-22
    50        - --gcp-node-image=gci
    51        - --gcp-nodes=1
    52        - --gcp-project-type=gpu-project
    53        - --gcp-zone=us-west1-b
    54        - --provider=gce
    55        - --test_args=--ginkgo.focus=\[Feature:GPUDevicePlugin\] --minStartupPods=8
    56        - --timeout=180m  # Smaller than decoration_config.timeout (300m) above.
    57        image: gcr.io/k8s-staging-test-infra/kubekins-e2e:v20240515-17c6d50e24-master
    58        resources:
    59          limits:
    60            cpu: 1
    61            memory: 3Gi
    62          requests:  # Same cpu and memory values as limits.
    63            cpu: 1
    64            memory: 3Gi