Add fallback to node drain using --disable-eviction flag (#8094)
* Add fallback to node drain using --disable-eviction flag Signed-off-by: Utku Ozdemir <uoz@protonmail.com> * Move drain fallback tasks to separate file Signed-off-by: Utku Ozdemir <uoz@protonmail.com> * Add delegate_facts to fix the drain fallback Signed-off-by: Utku Ozdemir <uoz@protonmail.com> * Fix ansible-lint error Signed-off-by: Utku Ozdemir <uoz@protonmail.com> * Move drain fallback into block Signed-off-by: Utku Ozdemir <uoz@protonmail.com>
This commit is contained in:
parent
84b56d23a4
commit
10c30ea5b1
2 changed files with 41 additions and 2 deletions
|
@ -6,6 +6,12 @@ drain_nodes: true
|
||||||
drain_retries: 3
|
drain_retries: 3
|
||||||
drain_retry_delay_seconds: 10
|
drain_retry_delay_seconds: 10
|
||||||
|
|
||||||
|
drain_fallback_enabled: false
|
||||||
|
drain_fallback_grace_period: 300
|
||||||
|
drain_fallback_timeout: 360s
|
||||||
|
drain_fallback_retries: 0
|
||||||
|
drain_fallback_retry_delay_seconds: 10
|
||||||
|
|
||||||
upgrade_node_always_cordon: false
|
upgrade_node_always_cordon: false
|
||||||
upgrade_node_uncordon_after_drain_failure: true
|
upgrade_node_uncordon_after_drain_failure: true
|
||||||
upgrade_node_fail_if_drain_fails: true
|
upgrade_node_fail_if_drain_fails: true
|
||||||
|
|
|
@ -73,15 +73,48 @@
|
||||||
{{ bin_dir }}/kubectl drain
|
{{ bin_dir }}/kubectl drain
|
||||||
--force
|
--force
|
||||||
--ignore-daemonsets
|
--ignore-daemonsets
|
||||||
--grace-period {{ drain_grace_period }}
|
--grace-period {{ hostvars['localhost']['drain_grace_period_after_failure'] | default(drain_grace_period) }}
|
||||||
--timeout {{ drain_timeout }}
|
--timeout {{ hostvars['localhost']['drain_timeout_after_failure'] | default(drain_timeout) }}
|
||||||
--delete-emptydir-data {{ kube_override_hostname|default(inventory_hostname) }}
|
--delete-emptydir-data {{ kube_override_hostname|default(inventory_hostname) }}
|
||||||
{% if drain_pod_selector %}--pod-selector '{{ drain_pod_selector }}'{% endif %}
|
{% if drain_pod_selector %}--pod-selector '{{ drain_pod_selector }}'{% endif %}
|
||||||
when: drain_nodes
|
when: drain_nodes
|
||||||
register: result
|
register: result
|
||||||
|
failed_when:
|
||||||
|
- result.rc != 0
|
||||||
|
- not drain_fallback_enabled
|
||||||
until: result.rc == 0
|
until: result.rc == 0
|
||||||
retries: "{{ drain_retries }}"
|
retries: "{{ drain_retries }}"
|
||||||
delay: "{{ drain_retry_delay_seconds }}"
|
delay: "{{ drain_retry_delay_seconds }}"
|
||||||
|
|
||||||
|
- name: Drain fallback
|
||||||
|
block:
|
||||||
|
- name: Set facts after regular drain has failed
|
||||||
|
set_fact:
|
||||||
|
drain_grace_period_after_failure: "{{ drain_fallback_grace_period }}"
|
||||||
|
drain_timeout_after_failure: "{{ drain_fallback_timeout }}"
|
||||||
|
delegate_to: localhost
|
||||||
|
delegate_facts: yes
|
||||||
|
run_once: yes
|
||||||
|
|
||||||
|
- name: Drain node - fallback with disabled eviction
|
||||||
|
command: >-
|
||||||
|
{{ bin_dir }}/kubectl drain
|
||||||
|
--force
|
||||||
|
--ignore-daemonsets
|
||||||
|
--grace-period {{ drain_fallback_grace_period }}
|
||||||
|
--timeout {{ drain_fallback_timeout }}
|
||||||
|
--delete-emptydir-data {{ kube_override_hostname|default(inventory_hostname) }}
|
||||||
|
{% if drain_pod_selector %}--pod-selector '{{ drain_pod_selector }}'{% endif %}
|
||||||
|
--disable-eviction
|
||||||
|
register: drain_fallback_result
|
||||||
|
until: drain_fallback_result.rc == 0
|
||||||
|
retries: "{{ drain_fallback_retries }}"
|
||||||
|
delay: "{{ drain_fallback_retry_delay_seconds }}"
|
||||||
|
when:
|
||||||
|
- drain_nodes
|
||||||
|
- drain_fallback_enabled
|
||||||
|
- result.rc != 0
|
||||||
|
|
||||||
rescue:
|
rescue:
|
||||||
- name: Set node back to schedulable
|
- name: Set node back to schedulable
|
||||||
command: "{{ bin_dir }}/kubectl --kubeconfig {{ kube_config_dir }}/admin.conf uncordon {{ inventory_hostname }}"
|
command: "{{ bin_dir }}/kubectl --kubeconfig {{ kube_config_dir }}/admin.conf uncordon {{ inventory_hostname }}"
|
||||||
|
|
Loading…
Reference in a new issue