Skip to content

Commit

Permalink
Add retries for ocp4_workload_habana_gaudi_gpu_setup (#9014)
Browse files Browse the repository at this point in the history
  • Loading branch information
jkupferer authored Jan 23, 2025
1 parent 5d2f688 commit b87f6f5
Showing 1 changed file with 8 additions and 1 deletion.
Original file line number Diff line number Diff line change
Expand Up @@ -5,13 +5,17 @@
api_version: v1
kind: Namespace
name: "{{ habana_gaudi_operator_namespace }}"
register: r_habana_gpu_operator_namespace
until: r_habana_gpu_operator_namespace is successful
retries: 10
delay: 5

# Apply the operator group definition rendered from the role's Jinja2
# template. The result is registered so the task can be retried until the
# k8s call succeeds (25 retries, 5 seconds apart).
- name: Create Habana Gaudi GPU operatorgroup
  kubernetes.core.k8s:
    state: present
    definition: "{{ lookup('template', 'habana-gaudi/habana_gaudi_operatorgroup.yaml.j2') | from_yaml }}"
  register: operatorgroup_result
  until: operatorgroup_result is successful
  retries: 25
  delay: 5

Expand All @@ -20,6 +24,7 @@
state: present
definition: "{{ lookup('template', 'habana-gaudi/habana_gaudi_sub.yaml.j2') | from_yaml }}"
register: subscription_result
until: subscription_result is successful
retries: 50
delay: 5

Expand All @@ -32,4 +37,6 @@
state: present
definition: "{{ lookup('template', 'habana-gaudi/habana_gpu_deviceconfig.yaml.j2') | from_yaml }}"
register: devconfig_result
# Retry until the registered result reports success: 30 retries, 5 seconds apart.
until: devconfig_result is successful
retries: 30
delay: 5

0 comments on commit b87f6f5

Please sign in to comment.