Skip to content
main.yml 10.3 KiB
Newer Older
---
- name: reset | stop services
  service:
    name: "{{ item }}"
    state: stopped
  with_items:
    - kubelet
  failed_when: false

- name: reset | remove services
    path: "/etc/systemd/system/{{ item }}"
    state: absent
    - kubelet.service
    - calico-node.service
    - containerd.service.d/http-proxy.conf
    - crio.service.d/http-proxy.conf
    - k8s-certs-renew.service
    - k8s-certs-renew.timer
  register: services_removed
    - containerd
    - crio
- name: reset | remove docker dropins
  file:
    path: "/etc/systemd/system/docker.service.d/{{ item }}"
    state: absent
  with_items:
    - docker-dns.conf
    - docker-options.conf
zhengchuan hu's avatar
zhengchuan hu committed
    - http-proxy.conf
    - docker-orphan-cleanup.conf
- name: reset | systemctl daemon-reload  # noqa 503
  when: services_removed.changed or docker_dropins_removed.changed
- name: reset | remove all containers
  shell: "set -o pipefail && {{ docker_bin_dir }}/docker ps -aq | xargs -r docker rm -fv"
  args:
    executable: /bin/bash
  register: remove_all_containers
  retries: 4
  until: remove_all_containers.rc == 0
  delay: 5
okamototk's avatar
okamototk committed
  when: container_manager == "docker"
- name: reset | restart docker if needed  # noqa 503
  service:
    name: docker
    state: restarted
okamototk's avatar
okamototk committed
  when: docker_dropins_removed.changed and container_manager == "docker"
- name: reset | check if crictl is present
  stat:
    path: "{{ bin_dir }}/crictl"
    get_attributes: no
    get_checksum: no
    get_mime: no
  register: crictl

- name: reset | stop all cri containers
  shell: "set -o pipefail && {{ bin_dir }}/crictl ps -q | xargs -r {{ bin_dir }}/crictl -t 60s stop"
  args:
    executable: /bin/bash
okamototk's avatar
okamototk committed
  register: remove_all_cri_containers
  retries: 5
  until: remove_all_cri_containers.rc == 0
okamototk's avatar
okamototk committed
    - containerd
  when:
    - crictl.stat.exists
    - container_manager in ["crio", "containerd"]
  ignore_errors: true  # noqa ignore-errors
- name: reset | force remove all cri containers
  command: "{{ bin_dir }}/crictl rm -a -f"
okamototk's avatar
okamototk committed
  register: remove_all_cri_containers
  retries: 5
  until: remove_all_cri_containers.rc == 0
okamototk's avatar
okamototk committed
    - containerd
  when:
    - crictl.stat.exists
    - container_manager in ["crio", "containerd"]
    - deploy_container_engine
- name: reset | stop and disable crio service
  service:
    name: crio
    state: stopped
    enabled: false
  failed_when: false
  tags: [ crio ]
  when: container_manager == "crio"

- name: reset | forcefully wipe CRI-O's container and image storage
  command: "crio wipe -f"
  failed_when: false
  tags: [ crio ]
  when: container_manager == "crio"

- name: reset | stop all cri pods
  shell: "set -o pipefail && {{ bin_dir }}/crictl pods -q | xargs -r {{ bin_dir }}/crictl -t 60s stopp"
  args:
    executable: /bin/bash
okamototk's avatar
okamototk committed
  register: remove_all_cri_containers
  retries: 5
  until: remove_all_cri_containers.rc == 0
  tags: [ containerd ]
  when:
    - crictl.stat.exists
    - container_manager == "containerd"
  ignore_errors: true  # noqa ignore-errors
- block:
    - name: reset | force remove all cri pods
      command: "{{ bin_dir }}/crictl rmp -a -f"
      register: remove_all_cri_containers
      retries: 5
      until: remove_all_cri_containers.rc == 0
      delay: 5
      tags: [ containerd ]
      when:
        - crictl.stat.exists
        - container_manager == "containerd"

  rescue:
    - name: reset | force remove all cri pods (rescue)
      shell: "ip netns list | cut -d' ' -f 1 | xargs -n1 ip netns delete && {{ bin_dir }}/crictl rmp -a -f"
okamototk's avatar
okamototk committed

- name: reset | stop etcd services
  service:
    name: "{{ item }}"
    state: stopped
  with_items:
    - etcd
    - etcd-events
  failed_when: false
  tags:
    - services

- name: reset | remove etcd services
  file:
    path: "/etc/systemd/system/{{ item }}.service"
    state: absent
  with_items:
    - etcd
    - etcd-events
  register: services_removed
  tags:
    - services

- name: reset | remove containerd
  when: container_manager == 'containerd'
  block:
    - name: reset | stop containerd service
      service:
        name: containerd
        state: stopped
      failed_when: false
      tags:
        - services

    - name: reset | remove containerd service
      file:
        path: /etc/systemd/system/containerd.service
        state: absent
      register: services_removed
      tags:
        - services

- name: reset | gather mounted kubelet dirs  # noqa 301
  shell: set -o pipefail && mount | grep /var/lib/kubelet/ | awk '{print $3}' | tac
    executable: /bin/bash
  register: mounted_dirs
  failed_when: false
- name: reset | unmount kubelet dirs  # noqa 301
  command: umount -f {{ item }}
  with_items: "{{ mounted_dirs.stdout_lines }}"
  register: umount_dir
  when: mounted_dirs
  retries: 4
  until: umount_dir.rc == 0
  delay: 5
- name: flush iptables
  iptables:
    flush: yes
- name: Clear IPVS virtual server table
  command: "ipvsadm -C"
  ignore_errors: true  # noqa ignore-errors
    - kube_proxy_mode == 'ipvs' and inventory_hostname in groups['k8s_cluster']
- name: reset | check kube-ipvs0 network device
  stat:
    path: /sys/class/net/kube-ipvs0
    get_attributes: no
    get_checksum: no
    get_mime: no
- name: reset | Remove kube-ipvs0
  command: "ip link del kube-ipvs0"
  when:
    - kube_proxy_mode == 'ipvs'
- name: reset | check nodelocaldns network device
  stat:
    path: /sys/class/net/nodelocaldns
    get_attributes: no
    get_checksum: no
    get_mime: no
  register: nodelocaldns_device

- name: reset | Remove nodelocaldns
  command: "ip link del nodelocaldns"
  when:
    - enable_nodelocaldns|default(false)|bool
    - nodelocaldns_device.stat.exists

- name: reset | delete some files and directories
  file:
    path: "{{ item }}"
    state: absent
    - /var/lib/kubelet
    - "{{ containerd_storage_dir }}"
    - "{{ ansible_env.HOME | default('/root') }}/.kube"
    - "{{ ansible_env.HOME | default('/root') }}/.helm"
    - "{{ etcd_data_dir }}"
    - "{{ etcd_events_data_dir }}"
    - "{{ etcd_config_dir }}"
    - /var/log/calico
    - /etc/cni
    - /etc/nerdctl
    - "{{ nginx_config_dir }}"
    - /etc/dnsmasq.d
    - /etc/dnsmasq.conf
    - /etc/dnsmasq.d-available
    - /etc/etcd.env
    - /etc/calico
    - /etc/NetworkManager/conf.d/calico.conf
    - /etc/NetworkManager/conf.d/k8s.conf
jwfang's avatar
jwfang committed
    - /etc/weave.env
    - /opt/cni
    - /etc/dhcp/dhclient.d/zdnsupdate.sh
    - /etc/dhcp/dhclient-exit-hooks.d/zdnsupdate
tanshanshan's avatar
tanshanshan committed
    - /run/flannel
    - /etc/flannel
    - /run/kubernetes
    - /usr/local/share/ca-certificates/etcd-ca.crt
tanshanshan's avatar
tanshanshan committed
    - /etc/ssl/certs/etcd-ca.pem
    - /etc/ssl/certs/kube-ca.pem
    - /etc/pki/ca-trust/source/anchors/etcd-ca.crt
    - /etc/pki/ca-trust/source/anchors/kube-ca.crt
tanshanshan's avatar
tanshanshan committed
    - /var/log/pods/
jwfang's avatar
jwfang committed
    - "{{ bin_dir }}/kubelet"
    - "{{ bin_dir }}/etcd-scripts"
    - "{{ bin_dir }}/etcd"
    - "{{ bin_dir }}/etcd-events"
jwfang's avatar
jwfang committed
    - "{{ bin_dir }}/etcdctl"
jwfang's avatar
jwfang committed
    - "{{ bin_dir }}/kubernetes-scripts"
    - "{{ bin_dir }}/kubectl"
    - "{{ bin_dir }}/kubeadm"
jwfang's avatar
jwfang committed
    - "{{ bin_dir }}/helm"
    - "{{ bin_dir }}/calicoctl"
    - "{{ bin_dir }}/calicoctl.sh"
    - "{{ bin_dir }}/calico-upgrade"
jwfang's avatar
jwfang committed
    - "{{ bin_dir }}/weave"
    - "{{ bin_dir }}/nerdctl"
    - "{{ bin_dir }}/k8s-certs-renew.sh"
    - /var/lib/cni
Erwan Miran's avatar
Erwan Miran committed
    - /etc/openvswitch
    - /run/openvswitch
    - /var/lib/kube-router
    - /var/lib/calico
    - /etc/cilium
    - /run/calico
    - /etc/bash_completion.d/kubectl.sh
    - /etc/bash_completion.d/crictl
    - /etc/bash_completion.d/nerdctl
    - /etc/bash_completion.d/krew
    - /etc/bash_completion.d/krew.sh
    - "{{ krew_root_dir }}"
    - /etc/modules-load.d/kube_proxy-ipvs.conf
    - /etc/modules-load.d/kubespray-br_netfilter.conf
    - /etc/modules-load.d/kubespray-kata-containers.conf
    - /usr/libexec/kubernetes
    - /etc/origin/openvswitch
    - /etc/origin/ovn
    - /etc/crictl.yaml
  ignore_errors: true  # noqa ignore-errors
- name: reset | remove containerd binary files
  file:
    path: "{{ containerd_bin_dir }}/{{ item }}"
    state: absent
  with_items:
    - containerd
    - containerd-shim
    - containerd-shim-runc-v1
    - containerd-shim-runc-v2
    - containerd-stress
    - crictl
    - critest
    - ctd-decoder
    - ctr
    - runc
  ignore_errors: true  # noqa ignore-errors
  when: container_manager == 'containerd'
  tags:
    - files

- name: reset | remove dns settings from dhclient.conf
  blockinfile:
    state: absent
    marker: "# Ansible entries {mark}"
  failed_when: false
  with_items:
    - /etc/dhclient.conf
    - /etc/dhcp/dhclient.conf

- name: reset | remove host entries from /etc/hosts
  blockinfile:
    state: absent
    marker: "# Ansible inventory hosts {mark}"
- name: reset | include file with reset tasks specific to the network_plugin if exists
  include_tasks: "{{ (role_path,'../network_plugin',kube_network_plugin,'tasks/reset.yml') | community.general.path_join | realpath  }}"
    - kube_network_plugin in ['flannel', 'cilium', 'kube-router', 'calico']
- name: reset | Restart network
  service:
    name: >-
      {% if ansible_os_family == "RedHat" -%}
Cristian Calin's avatar
Cristian Calin committed
      {%- if ansible_distribution_major_version|int == 8 or is_fedora_coreos or ansible_distribution == "Fedora" -%}
      NetworkManager
      {%- else -%}
      {%- endif -%}
      {%- elif ansible_distribution == "Ubuntu" and ansible_distribution_release in ["hirsute","bionic", "focal"] -%}
      {%- elif ansible_os_family == "Debian" -%}
      networking
      {%- endif %}
    state: restarted
    - ansible_os_family not in ["Flatcar", "Flatcar Container Linux by Kinvolk"]
    - reset_restart_network