Skip to content

Commit 839f0e2

Browse files
committed
[Test] In test_ultraserver, remove the compute node custom action in favor of the cookbook attribute to force IMEX configuration.
1 parent d891cdc commit 839f0e2

File tree

3 files changed

+10
-291
lines changed

3 files changed

+10
-291
lines changed

tests/integration-tests/tests/ultraserver/test_gb200.py

Lines changed: 4 additions & 9 deletions
Original file line numberDiff line numberDiff line change
@@ -28,9 +28,9 @@
2828
# hardwiring the reservation id here when we need it.
2929
CAPACITY_BLOCK_RESERVATION_ID = "cr-123456789"
3030

31-
# We use 0.0.0.0 as placeholder IPs just to get IMEX started.
31+
# We use placeholder IPs just to get IMEX started.
3232
# These values are hardwired in the cookbook.
33-
FAKE_IPS = ["0.0.0.0", "0.0.0.0"]
33+
FAKE_IPS = ["172.31.51.93", "172.31.48.43"]
3434

3535

3636
def submit_job_imex_status(rce: RemoteCommandExecutor, queue: str, max_nodes: int = 1):
@@ -52,7 +52,8 @@ def assert_imex_nodes_config_is_correct(rce: RemoteCommandExecutor, launch_templ
5252
logging.info(f"Checking IMEX nodes config contains the expected nodes: {expected_ips}")
5353
imex_nodes_config_file = f"/opt/parallelcluster/shared/nvidia-imex/nodes_config_{launch_template_id}.cfg"
5454
imex_config_content = read_remote_file(rce, imex_nodes_config_file)
55-
actual_ips = [ip.strip() for ip in imex_config_content.strip().split("\n")]
55+
imex_config_content_clean = [line for line in imex_config_content.split("\n") if not line.strip().startswith("#")]
56+
actual_ips = [ip.strip() for ip in imex_config_content_clean]
5657
assert_that(actual_ips).contains_only(*expected_ips)
5758
logging.info(f"IMEX nodes config {imex_nodes_config_file} contains the expected nodes: {expected_ips}")
5859

@@ -263,11 +264,6 @@ def test_gb200(
263264
)
264265
bucket.upload_file(head_node_start_script_rendered, headnode_start_filename)
265266

266-
# TODO: Remove after testing: BEGIN: added compute custom action to force the configuration of IMEX
267-
compute_configured_filename = "compute_node_configured.sh"
268-
bucket.upload_file(str(test_datadir / compute_configured_filename), compute_configured_filename)
269-
# TODO: Remove after testing: END
270-
271267
queue_with_imex = "q1"
272268
compute_resource_with_imex = "cr1"
273269
queue_without_imex = "q2"
@@ -276,7 +272,6 @@ def test_gb200(
276272
cluster_config = pcluster_config_reader(
277273
bucket_name=bucket_name,
278274
head_node_start_script=headnode_start_filename,
279-
compute_node_configured_script=compute_configured_filename,
280275
max_queue_size=max_queue_size,
281276
queue_with_imex=queue_with_imex,
282277
compute_resource_with_imex=compute_resource_with_imex,

tests/integration-tests/tests/ultraserver/test_gb200/test_gb200/compute_node_configured.sh

Lines changed: 0 additions & 264 deletions
This file was deleted.

tests/integration-tests/tests/ultraserver/test_gb200/test_gb200/pcluster.config.yaml

Lines changed: 6 additions & 18 deletions
Original file line numberDiff line numberDiff line change
@@ -33,12 +33,6 @@ Scheduling:
3333
Networking:
3434
SubnetIds:
3535
- {{ private_subnet_id }}
36-
CustomActions:
37-
OnNodeConfigured:
38-
Script: s3://{{ bucket_name }}/{{ compute_node_configured_script }}
39-
Iam:
40-
S3Access:
41-
- BucketName: {{ bucket_name }}
4236
- Name: {{ queue_without_imex }}
4337
ComputeResources:
4438
- Name: {{ compute_resource_without_imex }}
@@ -49,18 +43,12 @@ Scheduling:
4943
Networking:
5044
SubnetIds:
5145
- {{ private_subnet_id }}
52-
CustomActions:
53-
OnNodeConfigured:
54-
Script: s3://{{ bucket_name }}/{{ compute_node_configured_script }}
55-
Iam:
56-
S3Access:
57-
- BucketName: {{ bucket_name }}
5846

5947
# The DevSettings section below forces the configuration of NVIDIA IMEX on instances that are not GB200.
6048
# We do it to simulate the behavior of GB200 instances.
61-
#{% if instance != "p6e-gb200.36xlarge" %}
62-
#DevSettings:
63-
# Cookbook:
64-
# ExtraChefAttributes: |
65-
# { "cluster": { "nvidia": { "imex": { "force_configuration": "true" } } }
66-
#{% endif %}
49+
{% if instance != "p6e-gb200.36xlarge" %}
50+
DevSettings:
51+
Cookbook:
52+
ExtraChefAttributes: |
53+
{ "cluster": { "nvidia": { "imex": { "force_configuration": "true" } } } }
54+
{% endif %}

0 commit comments

Comments
 (0)