Skip to content

Commit 881d029

Browse files
committed
Fix unit tests
1 parent 88e708e commit 881d029

File tree

2 files changed

26 additions and 11 deletions (lines changed)

2 files changed

+26
-11
lines changed

src/slurm_plugin/instance_manager.py

Lines changed: 13 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -848,7 +848,11 @@ def _best_effort_node_assignment(
848848
# No instances launched at all, e.g. CreateFleet API returns no EC2 instances,
849849
# or no left instances available from a best-effort EC2 launch
850850
logger.info("No launched instances found for nodes %s", print_with_count(nodes_resume_list))
851-
self._update_failed_nodes(set(nodes_resume_list), "InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)", override=False)
851+
self._update_failed_nodes(
852+
set(nodes_resume_list),
853+
"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)",
854+
override=False,
855+
)
852856

853857
def _all_or_nothing_node_assignment(
854858
self,
@@ -903,7 +907,11 @@ def _all_or_nothing_node_assignment(
903907
# No instances launched at all, e.g. CreateFleet API returns no EC2 instances,
904908
# or no left instances available from a best-effort EC2 launch
905909
logger.info("No launched instances found for nodes %s", print_with_count(nodes_resume_list))
906-
self._update_failed_nodes(set(nodes_resume_list), "InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)", override=False)
910+
self._update_failed_nodes(
911+
set(nodes_resume_list),
912+
"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)",
913+
override=False,
914+
)
907915

908916
def _launch_instances( # noqa: C901
909917
self,
@@ -986,7 +994,9 @@ def _launch_ec2_instances(self, batch_nodes, compute_resource, fleet_manager, in
986994
# queue_2: {cr_3: list[EC2Instance]}
987995
# }
988996
else:
989-
self._update_failed_nodes(set(batch_nodes), "InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)")
997+
self._update_failed_nodes(
998+
set(batch_nodes), "InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)"
999+
)
9901000
return launched_ec2_instances
9911001

9921002
def _get_fleet_manager(self, all_or_nothing_batch, compute_resource, queue):

tests/slurm_plugin/test_instance_manager.py

Lines changed: 13 additions & 8 deletions
Original file line number | Diff line number | Diff line change
@@ -3195,7 +3195,7 @@ def test_update_slurm_node_addrs(
31953195
{},
31963196
False,
31973197
None,
3198-
{"InsufficientInstanceCapacity": {"queue4-st-c5xlarge-1"}},
3198+
{"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {"queue4-st-c5xlarge-1"}},
31993199
),
32003200
(
32013201
SlurmResumeJob(140819, "queue4-st-c5xlarge-1", "queue4-st-c5xlarge-1", "NO"),
@@ -3210,7 +3210,7 @@ def test_update_slurm_node_addrs(
32103210
{},
32113211
False,
32123212
None,
3213-
{"InsufficientInstanceCapacity": {"queue4-st-c5xlarge-1"}},
3213+
{"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {"queue4-st-c5xlarge-1"}},
32143214
),
32153215
(
32163216
SlurmResumeJob(140819, "queue4-st-c5xlarge-1", "queue4-st-c5xlarge-1", "NO"),
@@ -3328,7 +3328,12 @@ def test_update_slurm_node_addrs(
33283328
{},
33293329
False,
33303330
None,
3331-
{"InsufficientInstanceCapacity": {"queue1-st-c5xlarge-1", "queue4-st-c5xlarge-1"}},
3331+
{
3332+
"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {
3333+
"queue1-st-c5xlarge-1",
3334+
"queue4-st-c5xlarge-1",
3335+
}
3336+
},
33323337
),
33333338
(
33343339
SlurmResumeJob(
@@ -3348,7 +3353,7 @@ def test_update_slurm_node_addrs(
33483353
{},
33493354
False,
33503355
None,
3351-
{"InsufficientInstanceCapacity": {"queue1-st-c5xlarge-1"}},
3356+
{"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {"queue1-st-c5xlarge-1"}},
33523357
),
33533358
(
33543359
SlurmResumeJob(
@@ -3915,7 +3920,7 @@ def test_node_assignment_by_scaling_strategy(
39153920
{},
39163921
[{"Instances": []}],
39173922
{},
3918-
{"InsufficientInstanceCapacity": {"queue4-st-c5xlarge-1"}},
3923+
{"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {"queue4-st-c5xlarge-1"}},
39193924
),
39203925
(
39213926
None,
@@ -4719,7 +4724,7 @@ def test_update_dict(self, instance_manager, target_dict, update, expected_dict)
47194724
{"q1": {"c1": ["q1-dy-c1-1"], "c2": ["q1-dy-c2-1"]}},
47204725
[],
47214726
True,
4722-
{"InsufficientInstanceCapacity": {"q1-dy-c1-1", "q1-dy-c2-1"}},
4727+
{"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {"q1-dy-c1-1", "q1-dy-c2-1"}},
47234728
),
47244729
],
47254730
)
@@ -4898,7 +4903,7 @@ def test_best_effort_node_assignment(
48984903
{"q1": {"c1": ["q1-dy-c1-1"], "c2": ["q1-dy-c2-1"]}},
48994904
[],
49004905
True,
4901-
{"InsufficientInstanceCapacity": {"q1-dy-c1-1", "q1-dy-c2-1"}},
4906+
{"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {"q1-dy-c1-1", "q1-dy-c2-1"}},
49024907
None,
49034908
{},
49044909
{},
@@ -5590,7 +5595,7 @@ def test_add_instances(
55905595
{},
55915596
False,
55925597
{
5593-
"InsufficientInstanceCapacity": {
5598+
"InsufficientInstanceCapacity(Check slurm_resume log for ec2 error codes)": {
55945599
"queue2-st-c5xlarge-1",
55955600
"queue2-dy-c5xlarge-1",
55965601
"queue1-st-c5xlarge-2",

0 commit comments

Comments
 (0)