github.com/kubeflow/training-operator@v1.7.0/scripts/setup-training-operator.sh (about)

     1  #!/bin/bash
     2  
     3  # Copyright 2021 The Kubernetes Authors.
     4  #
     5  # Licensed under the Apache License, Version 2.0 (the "License");
     6  # you may not use this file except in compliance with the License.
     7  # You may obtain a copy of the License at
     8  #
     9  #     http://www.apache.org/licenses/LICENSE-2.0
    10  #
    11  # Unless required by applicable law or agreed to in writing, software
    12  # distributed under the License is distributed on an "AS IS" BASIS,
    13  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    14  # See the License for the specific language governing permissions and
    15  # limitations under the License.
    16  
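# This shell script is run from our argo workflow. It configures kubeconfig
# for an existing EKS cluster, applies the standalone training operator
# manifests with the image under test, and waits for the operator pod to
# become ready.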
    19  
    20  
    21  set -o errexit
    22  set -o nounset
    23  set -o pipefail
    24  
    25  CLUSTER_NAME="${CLUSTER_NAME}"
    26  REGION="${AWS_REGION:-us-west-2}"
    27  REGISTRY="${ECR_REGISTRY:-public.ecr.aws/j1r0q0g6/training/training-operator}"
    28  VERSION="${PULL_BASE_SHA}"
    29  GO_DIR=${GOPATH}/src/github.com/${REPO_OWNER}/${REPO_NAME}
    30  
    31  echo "Configuring kubeconfig.."
    32  aws eks update-kubeconfig --region=${REGION} --name=${CLUSTER_NAME}
    33  
    34  echo "Update training operator manifest with new name $REGISTRY and tag $VERSION"
    35  cd manifests/overlays/standalone
    36  #kustomize edit set image public.ecr.aws/j1r0q0g6/training/training-operator=${REGISTRY}:${VERSION}
    37  kustomize edit set image kubeflow/training-operator=${REGISTRY}:${VERSION}
    38  
    39  echo "Installing training operator manifests"
    40  kustomize build . | kubectl apply -f -
    41  
    42  TIMEOUT=30
    43  until kubectl get pods -n kubeflow | grep training-operator | grep 1/1 || [[ $TIMEOUT -eq 1 ]]; do
    44    sleep 10
    45    TIMEOUT=$(( TIMEOUT - 1 ))
    46  done
    47  kubectl describe all -n kubeflow
    48  kubectl describe pods -n kubeflow