Skip to content

Commit 02d2fc8

Browse files
committed
Move the restartPolicy setting (restart config for the auto-resume policy) under the Worker key to align with the Kubeflow docs
1 parent aa1b5b8 commit 02d2fc8

File tree

3 files changed

+3
-3
lines changed

3 files changed

+3
-3
lines changed

launcher/nemo/k8s_templates/training/training.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,7 @@ spec:
2525
pytorchReplicaSpecs:
2626
Worker:
2727
replicas: {{ $config.nodes }}
28+
restartPolicy: {{ $config.restartPolicy }}
2829
template:
2930
{{- if $config.customLabels }}
3031
metadata:
@@ -101,7 +102,6 @@ spec:
101102
- mountPath: /var/log/aws/clusters
102103
name: aws-clusters-logs
103104
readOnly: true
104-
restartPolicy: {{ $config.restartPolicy }}
105105

106106
{{- if (or $config.labelSelector.required $config.labelSelector.preferred) }}
107107
affinity:

tests/k8s_workflow/k8s_baseline_artifacts/llama-8b/k8s_template/templates/training.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,7 @@ spec:
2525
pytorchReplicaSpecs:
2626
Worker:
2727
replicas: {{ $config.nodes }}
28+
restartPolicy: {{ $config.restartPolicy }}
2829
template:
2930
{{- if $config.customLabels }}
3031
metadata:
@@ -101,7 +102,6 @@ spec:
101102
- mountPath: /var/log/aws/clusters
102103
name: aws-clusters-logs
103104
readOnly: true
104-
restartPolicy: {{ $config.restartPolicy }}
105105

106106
{{- if (or $config.labelSelector.required $config.labelSelector.preferred) }}
107107
affinity:

tests/k8s_workflow/k8s_baseline_artifacts/test_custom/k8s_template/templates/training.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -25,6 +25,7 @@ spec:
2525
pytorchReplicaSpecs:
2626
Worker:
2727
replicas: {{ $config.nodes }}
28+
restartPolicy: {{ $config.restartPolicy }}
2829
template:
2930
{{- if $config.customLabels }}
3031
metadata:
@@ -101,7 +102,6 @@ spec:
101102
- mountPath: /var/log/aws/clusters
102103
name: aws-clusters-logs
103104
readOnly: true
104-
restartPolicy: {{ $config.restartPolicy }}
105105

106106
{{- if (or $config.labelSelector.required $config.labelSelector.preferred) }}
107107
affinity:

0 commit comments

Comments
 (0)