Skip to content

Commit d27eaa2

Browse files
author
Theofilos Manitaras
authored
Pin version of NGC Pytorch image to 25.06-py3 (#386)
Signed-off-by: Theofilos Manitaras <[email protected]>
1 parent 89b3036 commit d27eaa2

File tree

2 files changed

+28
-20
lines changed

2 files changed

+28
-20
lines changed

checks/apps/pytorch/pytorch_allreduce.py

Lines changed: 15 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
# SPDX-License-Identifier: BSD-3-Clause
55

66
import pathlib
7-
import re
7+
import re # noqa: F401
88
import sys
99

1010
import reframe as rfm
@@ -26,22 +26,27 @@ class PyTorchNCCLAllReduce(rfm.RunOnlyRegressionTest, ContainerEngineMixin):
2626
valid_prog_environs = ['builtin']
2727
num_nodes = variable(int, value=8)
2828
sourcesdir = None
29-
curated_images = ['nvcr.io#nvidia/pytorch:24.12-py3']
29+
curated_images = ['nvcr.io#nvidia/pytorch:25.06-py3']
3030

3131
# NOTE: only the "-py3" image is supported by the test
3232
supported_flavors = ["-py3"]
3333

34+
3435
pytorch_tags = nvidia_image_tags('pytorch')
3536
latest_tags = []
3637

37-
for flavor in supported_flavors:
38-
versions = []
39-
for tag in pytorch_tags:
40-
if re.match(rf'^\d+\.\d+{flavor}$', tag):
41-
versions.append(tag[:-len(flavor)])
42-
if versions:
43-
latest_version = max(versions)
44-
latest_tags += [f'{latest_version+flavor}']
38+
# FIXME: versions 25.08-py3 and above use CUDA 13; see:
39+
# https://jira.cscs.ch/browse/VCUE-1039
40+
41+
# for flavor in supported_flavors:
42+
# versions = []
43+
# for tag in pytorch_tags:
44+
# if re.match(rf'^\d+\.\d+{flavor}$', tag):
45+
# versions.append(tag[:-len(flavor)])
46+
# if versions:
47+
# versions.sort(reverse=True)
48+
# for v in versions:
49+
# latest_tags += [f'{latest_version+flavor}']
4550

4651
latest_images = [f'nvcr.io#nvidia/pytorch:{tag}' for tag in latest_tags]
4752
image = parameter(curated_images + latest_images)

checks/apps/pytorch/pytorch_nvidia.py

Lines changed: 13 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
import re
1+
import re # noqa: F401
22
import sys
33
import pathlib
44
import reframe as rfm
@@ -38,23 +38,26 @@ class PyTorchDdpCeNv(PyTorchTestBase, ContainerEngineMixin):
3838
'NVIDIA NGC')
3939
valid_systems = ['+ce +nvgpu']
4040
aws_ofi_nccl = parameter([True])
41-
curated_images = ['nvcr.io#nvidia/pytorch:24.01-py3']
41+
curated_images = ['nvcr.io#nvidia/pytorch:25.06-py3']
4242

4343
# NOTE: only the "-py3" image is supported by the test
4444
supported_flavors = ["-py3"]
4545

4646
pytorch_tags = nvidia_image_tags('pytorch')
4747
latest_tags = []
4848

49-
for flavor in supported_flavors:
50-
versions = []
51-
for tag in pytorch_tags:
52-
if re.match(rf'^\d+\.\d+{flavor}$', tag):
53-
versions.append(tag[:-len(flavor)])
49+
# FIXME: versions 25.08-py3 and above use CUDA 13; see:
50+
# https://jira.cscs.ch/browse/VCUE-1039
5451

55-
if versions:
56-
latest_version = max(versions)
57-
latest_tags += [f'{latest_version}{flavor}']
52+
# for flavor in supported_flavors:
53+
# versions = []
54+
# for tag in pytorch_tags:
55+
# if re.match(rf'^\d+\.\d+{flavor}$', tag):
56+
# versions.append(tag[:-len(flavor)])
57+
58+
# if versions:
59+
# latest_version = max(versions)
60+
# latest_tags += [f'{latest_version}{flavor}']
5861

5962
latest_images = [f'nvcr.io#nvidia/pytorch:{tag}' for tag in latest_tags]
6063
image = parameter(curated_images + latest_images)

0 commit comments

Comments
 (0)