#!/bin/bash

# Copyright 2021 The Kubernetes Authors.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# This shell script is run from our argo workflow. It points kubectl at an
# existing EKS cluster, retags the training operator image in the standalone
# kustomize overlay, applies the manifests, and waits for the operator pod in
# the "kubeflow" namespace to report 1/1 ready.
#
# Must be run from the repository root (it cd's into
# manifests/overlays/standalone).
#
# Required environment:
#   CLUSTER_NAME   - name of the EKS cluster to configure kubeconfig for
#   PULL_BASE_SHA  - image tag to deploy
# Optional environment:
#   AWS_REGION     - AWS region of the cluster (default: us-west-2)
#   ECR_REGISTRY   - image repository to deploy from
#                    (default: public.ecr.aws/j1r0q0g6/training/training-operator)
#
# Exit status: 0 once the operator pod is ready; non-zero if any command fails
# or the pod is still not ready after the last poll.

set -o errexit
set -o nounset
set -o pipefail

# ":?" aborts with a descriptive message instead of a bare "unbound variable".
CLUSTER_NAME="${CLUSTER_NAME:?CLUSTER_NAME must be set to the EKS cluster name}"
REGION="${AWS_REGION:-us-west-2}"
REGISTRY="${ECR_REGISTRY:-public.ecr.aws/j1r0q0g6/training/training-operator}"
VERSION="${PULL_BASE_SHA:?PULL_BASE_SHA must be set to the image tag to deploy}"

# Polling budget for the readiness wait: up to MAX_ATTEMPTS checks,
# POLL_INTERVAL_SECONDS apart.
MAX_ATTEMPTS=30
POLL_INTERVAL_SECONDS=10

#######################################
# Check whether a training-operator pod reports 1/1 containers ready.
# Outputs:   the matching `kubectl get pods` line(s) on stdout
# Returns:   0 if a matching pod line was found, non-zero otherwise
#            (including when kubectl itself fails, because of pipefail)
#######################################
operator_ready() {
  kubectl get pods -n kubeflow | grep training-operator | grep '1/1'
}

echo "Configuring kubeconfig.."
aws eks update-kubeconfig --region="${REGION}" --name="${CLUSTER_NAME}"

echo "Update training operator manifest with new name $REGISTRY and tag $VERSION"
cd manifests/overlays/standalone
#kustomize edit set image public.ecr.aws/j1r0q0g6/training/training-operator=${REGISTRY}:${VERSION}
kustomize edit set image "kubeflow/training-operator=${REGISTRY}:${VERSION}"

echo "Installing training operator manifests"
kustomize build . | kubectl apply -f -

ready=false
for (( attempt = 1; attempt <= MAX_ATTEMPTS; attempt++ )); do
  if operator_ready; then
    ready=true
    break
  fi
  # No point sleeping after the final check.
  if (( attempt < MAX_ATTEMPTS )); then
    sleep "${POLL_INTERVAL_SECONDS}"
  fi
done

# Always dump cluster state: useful both on success and when diagnosing a
# timeout.
kubectl describe all -n kubeflow
kubectl describe pods -n kubeflow

if [[ "${ready}" != true ]]; then
  echo "Timed out waiting for training-operator pod to become ready" >&2
  exit 1
fi