From 65f12184a57c5901646f3c5ce507685e6b8c8f39 Mon Sep 17 00:00:00 2001 From: Xin Wang Date: Mon, 15 Sep 2025 04:47:02 +0000 Subject: [PATCH] Revert "Add cert mgr installation which is required by HPTO (#180)" This reverts commit a4f0465ce01e656a23b5920ce58dda9966aaff1b. --- helm_chart/HyperPodHelmChart/Chart.yaml | 4 ---- helm_chart/HyperPodHelmChart/values.yaml | 9 --------- helm_chart/readme.md | 15 --------------- 3 files changed, 28 deletions(-) diff --git a/helm_chart/HyperPodHelmChart/Chart.yaml b/helm_chart/HyperPodHelmChart/Chart.yaml index 31d37bfa..97e3c4e9 100644 --- a/helm_chart/HyperPodHelmChart/Chart.yaml +++ b/helm_chart/HyperPodHelmChart/Chart.yaml @@ -24,10 +24,6 @@ version: 0.1.0 appVersion: "1.16.0" dependencies: - - name: cert-manager - version: "v1.18.2" - repository: oci://quay.io/jetstack/charts - condition: cert-manager.enabled - name: training-operators version: "0.1.0" repository: "file://charts/training-operators" diff --git a/helm_chart/HyperPodHelmChart/values.yaml b/helm_chart/HyperPodHelmChart/values.yaml index 7628c91c..264e16a8 100644 --- a/helm_chart/HyperPodHelmChart/values.yaml +++ b/helm_chart/HyperPodHelmChart/values.yaml @@ -115,15 +115,6 @@ namespace: create: true name: aws-hyperpod -cert-manager: - enabled: false - namespace: cert-manager - global: - leaderElection: - namespace: cert-manager - crds: - enabled: true - mlflow: enabled: false diff --git a/helm_chart/readme.md b/helm_chart/readme.md index 15f1ba61..77ff1c05 100644 --- a/helm_chart/readme.md +++ b/helm_chart/readme.md @@ -33,7 +33,6 @@ More information about orchestration features for cluster admins [here](https:// | [Kubeflow Training Operator](https://www.kubeflow.org/docs/components/trainer/legacy-v1/overview/) | Installs operators for managing various machine learning training jobs, such as TensorFlow, PyTorch, and MXNet, providing native Kubernetes support for distributed training workloads. | | Yes | | HyperPod patching | Deploys the RBAC and controller resources needed for orchestrating rolling updates and patching workflows in SageMaker HyperPod clusters. Includes pod eviction and node monitoring. | HyperPod Resiliency | Yes | | hyperpod-inference-operator | Installs the HyperPod Inference Operator and its dependencies to the cluster, allowing cluster deployment and inferencing of JumpStart, s3-hosted, and FSx-hosted models | No | -| [cert-manager](https://github.com/cert-manager/cert-manager) | Automatically provisions and manages TLS certificates in Kubernetes clusters. Provides certificate lifecycle management including issuance, renewal, and revocation for secure communications. | [Hyperpod training operator](https://docs.aws.amazon.com/sagemaker/latest/dg/sagemaker-eks-operator.html) | No | > **_Note_** The `mpijob` scheme is disabled in the Training Operator helm chart to avoid conflicting with the MPI Operator. @@ -49,20 +48,6 @@ storage: enabled: true ``` -To enable cert-manager for TLS certificate management, pass in `--set cert-manager.enabled=true` when installing or upgrading the main chart or set the following in the values.yaml file: -``` -cert-manager: - enabled: true - namespace: cert-manager - global: - leaderElection: - namespace: cert-manager - crds: - enabled: true -``` -namespace specifies which name space cert-manager should be installed - - --- The following plugins are only required for HyperPod Resiliency if you are using the following supported devices, such as GPU/Neuron instances, unless you install these plugins on your own.