diff --git a/Makefile b/Makefile index 41b0e3112d..6f935bdfcb 100644 --- a/Makefile +++ b/Makefile @@ -38,7 +38,7 @@ help: ## Display this help. ##@ Development manifests: controller-gen ## Generate WebhookConfiguration, ClusterRole and CustomResourceDefinition objects. - $(CONTROLLER_GEN) $(CRD_OPTIONS) rbac:roleName=manager-role webhook paths="./pkg/apis/..." output:crd:artifacts:config=config/crd/bases + $(CONTROLLER_GEN) $(CRD_OPTIONS) rbac:roleName=manager-role webhook paths="./pkg/apis/..." output:crd:artifacts:config=manifests/base generate: controller-gen ## Generate code containing DeepCopy, DeepCopyInto, and DeepCopyObject method implementations. $(CONTROLLER_GEN) object:headerFile="hack/boilerplate.go.txt" paths="./pkg/apis/..." diff --git a/config/crd/kustomization.yaml b/config/crd/kustomization.yaml deleted file mode 100644 index a590114997..0000000000 --- a/config/crd/kustomization.yaml +++ /dev/null @@ -1,13 +0,0 @@ -# This kustomization.yaml is not intended to be run by itself, -# since it depends on service name and namespace that are out of this kustomize package. -# It should be run by config/default -resources: -- bases/kubeflow.org_xgboostjobs.yaml -- bases/kubeflow.org_pytorchjobs.yaml -- bases/kubeflow.org_tfjobs.yaml -- bases/kubeflow.org_mxjobs.yaml -#+kubebuilder:scaffold:crdkustomizeresource - -# the following config is for teaching kustomize how to do kustomization for CRDs. 
-configurations: -- kustomizeconfig.yaml diff --git a/config/crd/kustomizeconfig.yaml b/config/crd/kustomizeconfig.yaml deleted file mode 100644 index 13425cc3c6..0000000000 --- a/config/crd/kustomizeconfig.yaml +++ /dev/null @@ -1,19 +0,0 @@ -# This file is for teaching kustomize how to substitute name and namespace reference in CRD -nameReference: - - kind: Service - version: v1 - fieldSpecs: - - kind: CustomResourceDefinition - version: v1 - group: apiextensions.k8s.io - path: spec/conversion/webhook/clientConfig/service/name - -namespace: - - kind: CustomResourceDefinition - version: v1 - group: apiextensions.k8s.io - path: spec/conversion/webhook/clientConfig/service/namespace - create: false - -varReference: - - path: metadata/annotations \ No newline at end of file diff --git a/config/manager/manager.yaml b/config/manager/manager.yaml deleted file mode 100644 index 1c018da451..0000000000 --- a/config/manager/manager.yaml +++ /dev/null @@ -1,57 +0,0 @@ -apiVersion: v1 -kind: Namespace -metadata: - labels: - control-plane: kubeflow-training-operator - name: kubeflow ---- -apiVersion: apps/v1 -kind: Deployment -metadata: - name: training-operator - namespace: system - labels: - control-plane: kubeflow-training-operator -spec: - selector: - matchLabels: - control-plane: kubeflow-training-operator - replicas: 1 - template: - metadata: - labels: - control-plane: kubeflow-training-operator - spec: -# securityContext: -# runAsNonRoot: true - containers: - - command: - - /manager -# disable leader-elect now -# args: -# - --leader-elect - image: kubeflow/training-operator:v1.0.0 - name: manager - securityContext: - allowPrivilegeEscalation: false - livenessProbe: - httpGet: - path: /healthz - port: 8081 - initialDelaySeconds: 15 - periodSeconds: 20 - readinessProbe: - httpGet: - path: /readyz - port: 8081 - initialDelaySeconds: 5 - periodSeconds: 10 - resources: - limits: - cpu: 100m - memory: 30Mi - requests: - cpu: 100m - memory: 20Mi - serviceAccountName: 
training-operator-service-account - terminationGracePeriodSeconds: 10 diff --git a/manifests/base/cluster-role-binding.yaml b/manifests/base/cluster-role-binding.yaml index e05aad7fc4..2e5b93dcb5 100644 --- a/manifests/base/cluster-role-binding.yaml +++ b/manifests/base/cluster-role-binding.yaml @@ -3,12 +3,12 @@ apiVersion: rbac.authorization.k8s.io/v1beta1 kind: ClusterRoleBinding metadata: labels: - app: tf-job-operator - name: tf-job-operator + app: training-operator + name: training-operator roleRef: apiGroup: rbac.authorization.k8s.io kind: ClusterRole - name: tf-job-operator + name: training-operator subjects: - kind: ServiceAccount - name: tf-job-operator + name: training-operator diff --git a/manifests/base/cluster-role.yaml b/manifests/base/cluster-role.yaml index 5e599a7831..702a3f8cd5 100644 --- a/manifests/base/cluster-role.yaml +++ b/manifests/base/cluster-role.yaml @@ -3,100 +3,47 @@ apiVersion: rbac.authorization.k8s.io/v1beta1 kind: ClusterRole metadata: labels: - app: tf-job-operator - name: tf-job-operator + app: training-operator + name: training-operator rules: -- apiGroups: - - kubeflow.org - resources: - - tfjobs - - tfjobs/status - - tfjobs/finalizers - verbs: - - '*' -- apiGroups: - - apiextensions.k8s.io - resources: - - customresourcedefinitions - verbs: - - '*' -- apiGroups: - - "" - resources: - - pods - - services - - endpoints - - events - verbs: - - '*' -- apiGroups: - - apps - - extensions - resources: - - deployments - verbs: - - '*' -- apiGroups: - - scheduling.volcano.sh - resources: - - podgroups - verbs: - - '*' - ---- - -apiVersion: rbac.authorization.k8s.io/v1 -kind: ClusterRole -metadata: - name: kubeflow-tfjobs-admin - labels: - rbac.authorization.kubeflow.org/aggregate-to-kubeflow-admin: "true" -aggregationRule: - clusterRoleSelectors: - - matchLabels: - rbac.authorization.kubeflow.org/aggregate-to-kubeflow-tfjobs-admin: "true" -rules: [] - ---- - -apiVersion: rbac.authorization.k8s.io/v1 -kind: ClusterRole -metadata: - 
name: kubeflow-tfjobs-edit - labels: - rbac.authorization.kubeflow.org/aggregate-to-kubeflow-edit: "true" - rbac.authorization.kubeflow.org/aggregate-to-kubeflow-tfjobs-admin: "true" -rules: -- apiGroups: - - kubeflow.org - resources: - - tfjobs - - tfjobs/status - verbs: - - get - - list - - watch - - create - - delete - - deletecollection - - patch - - update - ---- - -apiVersion: rbac.authorization.k8s.io/v1 -kind: ClusterRole -metadata: - name: kubeflow-tfjobs-view - labels: - rbac.authorization.kubeflow.org/aggregate-to-kubeflow-view: "true" -rules: -- apiGroups: - - kubeflow.org - resources: - - tfjobs - - tfjobs/status - verbs: - - get - - list - - watch + - apiGroups: + - kubeflow.org + resources: + - tfjobs + - mxjobs + - pytorchjobs + - xgboostjobs + - tfjobs/status + - pytorchjobs/status + - mxjobs/status + - xgboostjobs/status + verbs: + - "*" + - apiGroups: + - apiextensions.k8s.io + resources: + - customresourcedefinitions + verbs: + - "*" + - apiGroups: + - "" + resources: + - pods + - services + - endpoints + - events + verbs: + - "*" + - apiGroups: + - apps + - extensions + resources: + - deployments + verbs: + - "*" + - apiGroups: + - scheduling.volcano.sh + resources: + - podgroups + verbs: + - "*" diff --git a/manifests/base/crd.yaml b/manifests/base/crd.yaml deleted file mode 100644 index 71384fcfad..0000000000 --- a/manifests/base/crd.yaml +++ /dev/null @@ -1,52 +0,0 @@ -apiVersion: apiextensions.k8s.io/v1beta1 -kind: CustomResourceDefinition -metadata: - name: tfjobs.kubeflow.org -spec: - additionalPrinterColumns: - - JSONPath: .status.conditions[-1:].type - name: State - type: string - - JSONPath: .metadata.creationTimestamp - name: Age - type: date - group: kubeflow.org - names: - kind: TFJob - plural: tfjobs - singular: tfjob - scope: Namespaced - subresources: - status: {} - validation: - openAPIV3Schema: - properties: - spec: - properties: - tfReplicaSpecs: - properties: - Chief: - properties: - replicas: - maximum: 1 - minimum: 1 - 
type: integer - PS: - properties: - replicas: - minimum: 1 - type: integer - Worker: - properties: - replicas: - minimum: 1 - type: integer - Evaluator: - properties: - replicas: - minimum: 0 - type: integer - versions: - - name: v1 - served: true - storage: true diff --git a/manifests/base/deployment.yaml b/manifests/base/deployment.yaml deleted file mode 100644 index 346e36476d..0000000000 --- a/manifests/base/deployment.yaml +++ /dev/null @@ -1,29 +0,0 @@ ---- -apiVersion: apps/v1 -kind: Deployment -metadata: - name: tf-job-operator -spec: - replicas: 1 - template: - metadata: - labels: - name: tf-job-operator - annotations: - sidecar.istio.io/inject: "false" - spec: - containers: - - args: - - -monitoring-port=8443 - env: - - name: MY_POD_NAMESPACE - valueFrom: - fieldRef: - fieldPath: metadata.namespace - - name: MY_POD_NAME - valueFrom: - fieldRef: - fieldPath: metadata.name - image: public.ecr.aws/j1r0q0g6/training/tf-operator - name: tf-job-operator - serviceAccountName: tf-job-operator diff --git a/config/crd/bases/kubeflow.org_mxjobs.yaml b/manifests/base/kubeflow.org_mxjobs.yaml similarity index 100% rename from config/crd/bases/kubeflow.org_mxjobs.yaml rename to manifests/base/kubeflow.org_mxjobs.yaml diff --git a/config/crd/bases/kubeflow.org_pytorchjobs.yaml b/manifests/base/kubeflow.org_pytorchjobs.yaml similarity index 100% rename from config/crd/bases/kubeflow.org_pytorchjobs.yaml rename to manifests/base/kubeflow.org_pytorchjobs.yaml diff --git a/config/crd/bases/kubeflow.org_tfjobs.yaml b/manifests/base/kubeflow.org_tfjobs.yaml similarity index 100% rename from config/crd/bases/kubeflow.org_tfjobs.yaml rename to manifests/base/kubeflow.org_tfjobs.yaml diff --git a/config/crd/bases/kubeflow.org_xgboostjobs.yaml b/manifests/base/kubeflow.org_xgboostjobs.yaml similarity index 100% rename from config/crd/bases/kubeflow.org_xgboostjobs.yaml rename to manifests/base/kubeflow.org_xgboostjobs.yaml diff --git a/manifests/base/kustomization.yaml 
b/manifests/base/kustomization.yaml index c1b91df23a..f45174ffa4 100644 --- a/manifests/base/kustomization.yaml +++ b/manifests/base/kustomization.yaml @@ -2,14 +2,11 @@ apiVersion: kustomize.config.k8s.io/v1beta1 kind: Kustomization namespace: kubeflow resources: -- crd.yaml -- cluster-role-binding.yaml -- cluster-role.yaml -- deployment.yaml -- service-account.yaml -- service.yaml -commonLabels: - app: tf-job-operator - kustomize.component: tf-job-operator - app.kubernetes.io/component: tfjob - app.kubernetes.io/name: tf-job-operator + - kubeflow.org_tfjobs.yaml + - kubeflow.org_mxjobs.yaml + - kubeflow.org_pytorchjobs.yaml + - kubeflow.org_xgboostjobs.yaml + - cluster-role-binding.yaml + - cluster-role.yaml + - service-account.yaml + - service.yaml diff --git a/manifests/base/service-account.yaml b/manifests/base/service-account.yaml index 2ea6a87d29..e6f10afc28 100644 --- a/manifests/base/service-account.yaml +++ b/manifests/base/service-account.yaml @@ -2,5 +2,5 @@ apiVersion: v1 kind: ServiceAccount metadata: labels: - app: tf-job-operator - name: tf-job-operator + app: training-operator + name: training-operator diff --git a/manifests/base/service.yaml b/manifests/base/service.yaml index 97f92e3ea1..e95f9f4727 100644 --- a/manifests/base/service.yaml +++ b/manifests/base/service.yaml @@ -7,13 +7,13 @@ metadata: prometheus.io/scrape: "true" prometheus.io/port: "8443" labels: - app: tf-job-operator - name: tf-job-operator + app: training-operator + name: training-operator spec: ports: - name: monitoring-port port: 8443 targetPort: 8443 selector: - name: tf-job-operator + control-plane: kubeflow-training-operator type: ClusterIP diff --git a/config/default/kustomization.yaml b/manifests/default/kustomization.yaml similarity index 100% rename from config/default/kustomization.yaml rename to manifests/default/kustomization.yaml diff --git a/config/default/manager_config_patch.yaml b/manifests/default/manager_config_patch.yaml similarity index 100% rename from 
config/default/manager_config_patch.yaml rename to manifests/default/manager_config_patch.yaml diff --git a/config/manager/controller_manager_config.yaml b/manifests/manager/controller_manager_config.yaml similarity index 100% rename from config/manager/controller_manager_config.yaml rename to manifests/manager/controller_manager_config.yaml diff --git a/config/manager/kustomization.yaml b/manifests/manager/kustomization.yaml similarity index 65% rename from config/manager/kustomization.yaml rename to manifests/manager/kustomization.yaml index 1d1341d9b5..638fcb401e 100644 --- a/config/manager/kustomization.yaml +++ b/manifests/manager/kustomization.yaml @@ -1,5 +1,5 @@ resources: -- manager.yaml + - manager.yaml #generatorOptions: # disableNameSuffixHash: true @@ -10,7 +10,3 @@ resources: # name: manager-config apiVersion: kustomize.config.k8s.io/v1beta1 kind: Kustomization -images: -- name: kubeflow/training-operator - newName: kubeflow/training-operator - newTag: latest diff --git a/manifests/manager/manager.yaml b/manifests/manager/manager.yaml new file mode 100644 index 0000000000..129776ad72 --- /dev/null +++ b/manifests/manager/manager.yaml @@ -0,0 +1,50 @@ +apiVersion: apps/v1 +kind: Deployment +metadata: + name: training-operator + namespace: system + labels: + control-plane: kubeflow-training-operator +spec: + selector: + matchLabels: + control-plane: kubeflow-training-operator + replicas: 1 + template: + metadata: + labels: + control-plane: kubeflow-training-operator + spec: + # securityContext: + # runAsNonRoot: true + containers: + - command: + - /manager + # disable leader-elect now + # args: + # - --leader-elect + image: kubeflow/training-operator:v1.0.0 + name: manager + securityContext: + allowPrivilegeEscalation: false + livenessProbe: + httpGet: + path: /healthz + port: 8081 + initialDelaySeconds: 15 + periodSeconds: 20 + readinessProbe: + httpGet: + path: /readyz + port: 8081 + initialDelaySeconds: 5 + periodSeconds: 10 + resources: + limits: + 
cpu: 100m + memory: 30Mi + requests: + cpu: 100m + memory: 20Mi + serviceAccountName: training-operator-service-account + terminationGracePeriodSeconds: 10 diff --git a/manifests/overlays/kubeflow/kubeflow-training-roles.yaml b/manifests/overlays/kubeflow/kubeflow-training-roles.yaml new file mode 100644 index 0000000000..05cd2ab778 --- /dev/null +++ b/manifests/overlays/kubeflow/kubeflow-training-roles.yaml @@ -0,0 +1,53 @@ +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRole +metadata: + name: kubeflow-training-admin + labels: + rbac.authorization.kubeflow.org/aggregate-to-kubeflow-admin: "true" +aggregationRule: + clusterRoleSelectors: + - matchLabels: + rbac.authorization.kubeflow.org/aggregate-to-kubeflow-training-admin: "true" +rules: [] + +--- +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRole +metadata: + name: kubeflow-training-edit + labels: + rbac.authorization.kubeflow.org/aggregate-to-kubeflow-edit: "true" + rbac.authorization.kubeflow.org/aggregate-to-kubeflow-training-admin: "true" +rules: + - apiGroups: + - kubeflow.org + resources: + - tfjobs + - tfjobs/status + verbs: + - get + - list + - watch + - create + - delete + - deletecollection + - patch + - update + +--- +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRole +metadata: + name: kubeflow-training-view + labels: + rbac.authorization.kubeflow.org/aggregate-to-kubeflow-view: "true" +rules: + - apiGroups: + - kubeflow.org + resources: + - tfjobs + - tfjobs/status + verbs: + - get + - list + - watch diff --git a/manifests/overlays/kubeflow/kustomization.yaml b/manifests/overlays/kubeflow/kustomization.yaml index 380504ca89..7c5e9c1ff6 100644 --- a/manifests/overlays/kubeflow/kustomization.yaml +++ b/manifests/overlays/kubeflow/kustomization.yaml @@ -2,13 +2,11 @@ apiVersion: kustomize.config.k8s.io/v1beta1 kind: Kustomization namespace: kubeflow resources: -- ../../base -commonLabels: - app: tf-job-operator - kustomize.component: tf-job-operator - 
app.kubernetes.io/component: tfjob - app.kubernetes.io/name: tf-job-operator + - ../../base + - ../../manager + - ../../rbac + - kubeflow-training-roles.yaml images: -- name: public.ecr.aws/j1r0q0g6/training/tf-operator - newTag: 47a74b738920edbf4207160cec7e1dff9cdab3f2 - + - name: kubeflow/training-operator + newName: deepakmuley/kubeflow-training-operator + newTag: "1" diff --git a/manifests/overlays/standalone/kustomization.yaml b/manifests/overlays/standalone/kustomization.yaml index a37f068715..7eda9f927f 100644 --- a/manifests/overlays/standalone/kustomization.yaml +++ b/manifests/overlays/standalone/kustomization.yaml @@ -2,14 +2,11 @@ apiVersion: kustomize.config.k8s.io/v1beta1 kind: Kustomization namespace: kubeflow resources: -- ../../base -- namespace.yaml -commonLabels: - app: tf-job-operator - kustomize.component: tf-job-operator - app.kubernetes.io/component: tfjob - app.kubernetes.io/name: tf-job-operator + - ../../base + - ../../manager + - ../../rbac + - namespace.yaml images: -- name: public.ecr.aws/j1r0q0g6/training/tf-operator - newTag: 47a74b738920edbf4207160cec7e1dff9cdab3f2 - + - name: kubeflow/training-operator + newName: deepakmuley/kubeflow-training-operator + newTag: "1" diff --git a/manifests/overlays/standalone_v2/kustomization.yaml b/manifests/overlays/standalone_v2/kustomization.yaml deleted file mode 100644 index 475f3b162b..0000000000 --- a/manifests/overlays/standalone_v2/kustomization.yaml +++ /dev/null @@ -1,15 +0,0 @@ -apiVersion: kustomize.config.k8s.io/v1beta1 -kind: Kustomization -namespace: kubeflow -resources: -- ../../base_v2 -- namespace.yaml -commonLabels: - app: training-operator - kustomize.component: training-operator - app.kubernetes.io/component: kubeflow-training - app.kubernetes.io/name: training-operator -images: -- name: public.ecr.aws/j1r0q0g6/training/training-operator - newTag: cd2fc1ff397b1f349f68524f4abd5013a32e3033 - diff --git a/manifests/overlays/standalone_v2/namespace.yaml 
b/manifests/overlays/standalone_v2/namespace.yaml deleted file mode 100644 index 7a940e4673..0000000000 --- a/manifests/overlays/standalone_v2/namespace.yaml +++ /dev/null @@ -1,4 +0,0 @@ -apiVersion: v1 -kind: Namespace -metadata: - name: kubeflow diff --git a/config/prometheus/kustomization.yaml b/manifests/prometheus/kustomization.yaml similarity index 100% rename from config/prometheus/kustomization.yaml rename to manifests/prometheus/kustomization.yaml diff --git a/config/prometheus/monitor.yaml b/manifests/prometheus/monitor.yaml similarity index 100% rename from config/prometheus/monitor.yaml rename to manifests/prometheus/monitor.yaml diff --git a/config/rbac/auth_proxy_client_clusterrole.yaml b/manifests/rbac/auth_proxy_client_clusterrole.yaml similarity index 100% rename from config/rbac/auth_proxy_client_clusterrole.yaml rename to manifests/rbac/auth_proxy_client_clusterrole.yaml diff --git a/config/rbac/auth_proxy_role.yaml b/manifests/rbac/auth_proxy_role.yaml similarity index 100% rename from config/rbac/auth_proxy_role.yaml rename to manifests/rbac/auth_proxy_role.yaml diff --git a/config/rbac/auth_proxy_role_binding.yaml b/manifests/rbac/auth_proxy_role_binding.yaml similarity index 100% rename from config/rbac/auth_proxy_role_binding.yaml rename to manifests/rbac/auth_proxy_role_binding.yaml diff --git a/config/rbac/auth_proxy_service.yaml b/manifests/rbac/auth_proxy_service.yaml similarity index 100% rename from config/rbac/auth_proxy_service.yaml rename to manifests/rbac/auth_proxy_service.yaml diff --git a/config/rbac/kustomization.yaml b/manifests/rbac/kustomization.yaml similarity index 100% rename from config/rbac/kustomization.yaml rename to manifests/rbac/kustomization.yaml diff --git a/config/rbac/leader_election_role.yaml b/manifests/rbac/leader_election_role.yaml similarity index 100% rename from config/rbac/leader_election_role.yaml rename to manifests/rbac/leader_election_role.yaml diff --git 
a/config/rbac/leader_election_role_binding.yaml b/manifests/rbac/leader_election_role_binding.yaml similarity index 100% rename from config/rbac/leader_election_role_binding.yaml rename to manifests/rbac/leader_election_role_binding.yaml diff --git a/config/rbac/mxjob_editor_role.yaml b/manifests/rbac/mxjob_editor_role.yaml similarity index 100% rename from config/rbac/mxjob_editor_role.yaml rename to manifests/rbac/mxjob_editor_role.yaml diff --git a/config/rbac/mxjob_viewer_role.yaml b/manifests/rbac/mxjob_viewer_role.yaml similarity index 100% rename from config/rbac/mxjob_viewer_role.yaml rename to manifests/rbac/mxjob_viewer_role.yaml diff --git a/config/rbac/pytorchjob_editor_role.yaml b/manifests/rbac/pytorchjob_editor_role.yaml similarity index 100% rename from config/rbac/pytorchjob_editor_role.yaml rename to manifests/rbac/pytorchjob_editor_role.yaml diff --git a/config/rbac/pytorchjob_viewer_role.yaml b/manifests/rbac/pytorchjob_viewer_role.yaml similarity index 100% rename from config/rbac/pytorchjob_viewer_role.yaml rename to manifests/rbac/pytorchjob_viewer_role.yaml diff --git a/config/rbac/role.yaml b/manifests/rbac/role.yaml similarity index 100% rename from config/rbac/role.yaml rename to manifests/rbac/role.yaml diff --git a/config/rbac/role_binding.yaml b/manifests/rbac/role_binding.yaml similarity index 100% rename from config/rbac/role_binding.yaml rename to manifests/rbac/role_binding.yaml diff --git a/config/rbac/service_account.yaml b/manifests/rbac/service_account.yaml similarity index 100% rename from config/rbac/service_account.yaml rename to manifests/rbac/service_account.yaml diff --git a/config/rbac/tfjob_editor_role.yaml b/manifests/rbac/tfjob_editor_role.yaml similarity index 100% rename from config/rbac/tfjob_editor_role.yaml rename to manifests/rbac/tfjob_editor_role.yaml diff --git a/config/rbac/tfjob_viewer_role.yaml b/manifests/rbac/tfjob_viewer_role.yaml similarity index 100% rename from config/rbac/tfjob_viewer_role.yaml 
rename to manifests/rbac/tfjob_viewer_role.yaml diff --git a/config/rbac/xgboostjob_editor_role.yaml b/manifests/rbac/xgboostjob_editor_role.yaml similarity index 100% rename from config/rbac/xgboostjob_editor_role.yaml rename to manifests/rbac/xgboostjob_editor_role.yaml diff --git a/config/rbac/xgboostjob_viewer_role.yaml b/manifests/rbac/xgboostjob_viewer_role.yaml similarity index 100% rename from config/rbac/xgboostjob_viewer_role.yaml rename to manifests/rbac/xgboostjob_viewer_role.yaml diff --git a/scripts/setup-training-operator.sh b/scripts/setup-training-operator.sh index d310cce152..7f9c8b5deb 100755 --- a/scripts/setup-training-operator.sh +++ b/scripts/setup-training-operator.sh @@ -32,7 +32,7 @@ echo "Configuring kubeconfig.." aws eks update-kubeconfig --region=${REGION} --name=${CLUSTER_NAME} echo "Update training operator manifest with new name $REGISTRY and tag $VERSION" -cd config/default +cd manifests/overlays/standalone #kustomize edit set image public.ecr.aws/j1r0q0g6/training/training-operator=${REGISTRY}:${VERSION} kustomize edit set image kubeflow/training-operator=${REGISTRY}:${VERSION}