ceph-ansible/infrastructure-playbooks/rolling_update.yml

---
# This playbook does a rolling update for all the Ceph services
#
# The value of 'serial:' adjusts the number of servers to be updated simultaneously.
# We recommend a value of 1, which means hosts of a group (e.g: monitor) will be
# upgraded one by one. It is really crucial for the update process to happen
# in a serialized fashion. DO NOT CHANGE THIS VALUE.
#
#
# If you run a Ceph community version, you have to change the variable: ceph_stable_release to the new release
#
# If you run Red Hat Ceph Storage and are doing a **major** update (e.g: from 2 to 3), you have two options:
#   - if you use a CDN, you have to change the ceph_rhcs_version to a newer one
#   - if you use an ISO, you have to change the ceph_rhcs_iso_path to the directory containing the new Ceph version
#

# Safety gate, executed on the control node only: asks the operator to confirm
# the upgrade and validates the inventory before any cluster host is touched.
- name: confirm whether user really meant to upgrade the cluster
  hosts: localhost
  become: false
  # Play vars are declared as a plain mapping (the list-of-dicts form is
  # deprecated by Ansible).
  vars:
    mgr_group_name: mgrs
    jewel_minor_update: false

  vars_prompt:
    - name: ireallymeanit
      prompt: Are you sure you want to upgrade the cluster?
      default: 'no'
      private: false

  tasks:
    - name: exit playbook, if user did not mean to upgrade cluster
      fail:
        msg: >
          "Exiting rolling_update.yml playbook, cluster was NOT upgraded.
           To upgrade the cluster, either say 'yes' on the prompt or
           use `-e ireallymeanit=yes` on the command line when
           invoking the playbook"
      when: ireallymeanit != 'yes'

    - name: fail if no mgr host is present in the inventory
      fail:
        msg: "Please add a mgr host to your inventory."
      when:
        # '| bool' is required: a value passed as '-e jewel_minor_update=false'
        # arrives as the non-empty string "false", which is truthy without it.
        - not jewel_minor_update | bool
        - groups.get(mgr_group_name, []) | length == 0


# Collects facts for the whole inventory up front so that later plays can read
# hostvars[...] of hosts outside their own group, then flags the run as a
# rolling update.
- name: gather facts and check the init system

  hosts:
    - "{{ mon_group_name|default('mons') }}"
    - "{{ osd_group_name|default('osds') }}"
    - "{{ mds_group_name|default('mdss') }}"
    - "{{ rgw_group_name|default('rgws') }}"
    - "{{ mgr_group_name|default('mgrs') }}"
    - "{{ rbd_mirror_group_name|default('rbdmirrors') }}"
    - "{{ nfs_group_name|default('nfss') }}"
    - "{{ client_group_name|default('clients') }}"

  become: True
  gather_facts: False
  vars:
    delegate_facts_host: True
  tasks:
    - debug:
        msg: "gather facts on all Ceph hosts for following reference"

    # Plain per-host gathering, used only when delegation is switched off.
    - name: gather facts
      setup:
      when:
        - not delegate_facts_host | bool

    # delegate_facts stores each result under the delegated host, so a single
    # pass over groups['all'] is enough; without run_once every play host would
    # repeat the full loop (hosts x inventory setup runs) for the same outcome.
    - name: gather and delegate facts
      setup:
      delegate_to: "{{ item }}"
      delegate_facts: True
      with_items: "{{ groups['all'] }}"
      run_once: true
      when:
        - delegate_facts_host | bool

    # Read by the ceph-mgr and ceph-nfs role conditions later in this playbook.
    - name: set_fact rolling_update
      set_fact:
        rolling_update: true

# Upgrades the monitors one host at a time (serial: 1): stop the daemon, apply
# the roles, start it again, wait until THIS monitor is back in the quorum and
# finally set the OSD flags that stay in place for the OSD upgrade.
- name: upgrade ceph mon cluster

  vars:
    health_mon_check_retries: 5
    health_mon_check_delay: 15
    upgrade_ceph_packages: True

  hosts:
    - "{{ mon_group_name|default('mons') }}"

  serial: 1
  become: True

  pre_tasks:
    - name: set mon_host_count
      set_fact:
        mon_host_count: "{{ groups[mon_group_name] | length }}"

    - debug:
        msg: "WARNING - upgrading a ceph cluster with only one monitor node ({{ inventory_hostname }})"
      when: mon_host_count | int == 1

    - name: fail when single containerized monitor
      fail:
        msg: "Upgrades of a single monitor are not supported, also running 1 monitor is not recommended always use 3."
      when:
        - containerized_deployment
        - mon_host_count | int == 1

    - name: stop ceph mon
      systemd:
        name: ceph-mon@{{ ansible_hostname }}
        state: stopped
        enabled: yes
      when:
        - not containerized_deployment

  roles:
    - ceph-defaults
    - { role: ceph-common, when: not containerized_deployment }
    - { role: ceph-docker-common, when: containerized_deployment }
    - ceph-config
    - ceph-mon

  post_tasks:
    - name: start ceph mon
      systemd:
        name: ceph-mon@{{ ansible_hostname }}
        state: started
        enabled: yes
      when:
        - not containerized_deployment

    - name: restart containerized ceph mon
      systemd:
        name: ceph-mon@{{ ansible_hostname }}
        state: restarted
        enabled: yes
        daemon_reload: yes
      when:
        - containerized_deployment

    - name: set mon_host_count
      set_fact:
        mon_host_count: "{{ groups[mon_group_name] | length }}"

    # mon_host is the monitor the health commands are delegated to: another
    # monitor when there are several (the last one in the group that is not
    # the current host), otherwise the only monitor.
    - name: select a running monitor if multiple monitors
      set_fact:
        mon_host: "{{ item }}"
      with_items: "{{ groups[mon_group_name] }}"
      when:
        - mon_host_count | int > 1
        - item != inventory_hostname

    - name: select first monitor if only one monitor
      set_fact:
        mon_host: "{{ item }}"
      with_items: "{{ groups[mon_group_name][0] }}"
      when:
        - mon_host_count | int == 1

    # The status is queried through mon_host, but the name looked up in
    # quorum_names must be the monitor that was just restarted (the current
    # play host). Checking mon_host itself would succeed immediately, because
    # that monitor never left the quorum. The rc guard keeps a failed query
    # (empty stdout) from reaching from_json, so the attempt is retried.
    - name: non container | waiting for the monitor to join the quorum...
      command: ceph --cluster "{{ cluster }}" -s --format json
      register: ceph_health_raw
      until: >
        ceph_health_raw.rc == 0 and
        (hostvars[inventory_hostname]['ansible_hostname'] in (ceph_health_raw.stdout | from_json)["quorum_names"] or
        hostvars[inventory_hostname]['ansible_fqdn'] in (ceph_health_raw.stdout | from_json)["quorum_names"])
      retries: "{{ health_mon_check_retries }}"
      delay: "{{ health_mon_check_delay }}"
      delegate_to: "{{ mon_host }}"
      when:
        - not containerized_deployment

    # Same check as above, executed inside mon_host's monitor container.
    - name: container | waiting for the containerized monitor to join the quorum...
      command: docker exec ceph-mon-{{ hostvars[mon_host]['ansible_hostname'] }} ceph --cluster "{{ cluster }}" -s --format json
      register: ceph_health_raw
      until: >
        ceph_health_raw.rc == 0 and
        (hostvars[inventory_hostname]['ansible_hostname'] in (ceph_health_raw.stdout | from_json)["quorum_names"] or
        hostvars[inventory_hostname]['ansible_fqdn'] in (ceph_health_raw.stdout | from_json)["quorum_names"])
      retries: "{{ health_mon_check_retries }}"
      delay: "{{ health_mon_check_delay }}"
      delegate_to: "{{ mon_host }}"
      when:
        - containerized_deployment

    # These flags are cleared again by the "unset osd flags" play.
    - name: set osd flags
      command: ceph --cluster {{ cluster }} osd set {{ item }}
      with_items:
        - noout
        - noscrub
        - nodeep-scrub
      delegate_to: "{{ mon_host }}"
      when: not containerized_deployment

    - name: set containerized osd flags
      command: |
        docker exec ceph-mon-{{ hostvars[mon_host]['ansible_hostname'] }} ceph --cluster {{ cluster }} osd set {{ item }}
      with_items:
        - noout
        - noscrub
        - nodeep-scrub
      delegate_to: "{{ mon_host }}"
      when: containerized_deployment


# Upgrades the manager daemons one host at a time. Before the roles run, the
# mgr keyrings are created on the first monitor and fetched to the control
# node under fetch_directory/<fsid>/.
- name: upgrade ceph mgr node

  vars:
    upgrade_ceph_packages: True

  hosts:
    - "{{ mgr_group_name|default('mgrs') }}"

  serial: 1
  become: True

  pre_tasks:
    - name: non container - get current fsid
      command: "ceph --cluster {{ cluster }} fsid"
      register: cluster_uuid_non_container
      delegate_to: "{{ groups[mon_group_name][0] }}"
      when:
        - not containerized_deployment

    - name: container - get current fsid
      command: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }} ceph --cluster {{ cluster }} fsid"
      register: cluster_uuid_container
      delegate_to: "{{ groups[mon_group_name][0] }}"
      when:
        - containerized_deployment

    # Only one of the two registers above carries stdout; pick the one whose
    # task actually ran.
    - name: set_fact ceph_cluster_fsid
      set_fact:
        ceph_cluster_fsid: "{{ cluster_uuid_container.stdout if containerized_deployment else cluster_uuid_non_container.stdout }}"

    # NOTE(review): the keyring is written under /etc/ceph while 'creates'
    # checks ceph_conf_key_directory; the two only agree when that variable
    # points at /etc/ceph - confirm.
    # 'when' entries are raw Jinja expressions: wrapping them in {{ }} makes
    # Ansible template them twice and emit a warning, so no delimiters here.
    - name: non container | create ceph mgr keyring(s)
      command: "ceph --cluster {{ cluster }} auth get-or-create mgr.{{ hostvars[item]['ansible_hostname'] }} mon 'allow profile mgr' osd 'allow *' mds 'allow *' -o /etc/ceph/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
      args:
        creates: "{{ ceph_conf_key_directory }}/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
      changed_when: false
      delegate_to: "{{ groups[mon_group_name][0] }}"
      with_items:
        - "{{ groups.get(mgr_group_name, []) }}"
      when:
        - not containerized_deployment
        - groups.get(mgr_group_name, []) | length > 0

    - name: container | create ceph mgr keyring(s)
      command: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }} ceph --cluster {{ cluster }} auth get-or-create mgr.{{ hostvars[item]['ansible_hostname'] }} mon 'allow profile mgr' osd 'allow *' mds 'allow *' -o /etc/ceph/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
      args:
        creates: "{{ ceph_conf_key_directory }}/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
      changed_when: false
      delegate_to: "{{ groups[mon_group_name][0] }}"
      with_items:
        - "{{ groups.get(mgr_group_name, []) }}"
      when:
        - containerized_deployment
        - groups.get(mgr_group_name, []) | length > 0

    - name: fetch ceph mgr key(s)
      fetch:
        src: "{{ ceph_conf_key_directory }}/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
        dest: "{{ fetch_directory }}/{{ ceph_cluster_fsid }}/{{ ceph_conf_key_directory }}/"
        flat: yes
        fail_on_missing: no
      delegate_to: "{{ groups[mon_group_name][0] }}"
      with_items:
        - "{{ groups.get(mgr_group_name, []) }}"

    # The following task has a failed_when: false
    # to handle the scenario where no mgr existed before the upgrade
    # or if we run a Ceph cluster before Luminous
    - name: stop ceph mgr
      systemd:
        name: ceph-mgr@{{ ansible_hostname }}
        state: stopped
        enabled: yes
      failed_when: false
      when:
        - not containerized_deployment

  roles:
    - ceph-defaults
    - { role: ceph-common, when: not containerized_deployment }
    - { role: ceph-docker-common, when: containerized_deployment }
    - ceph-config
    - { role: ceph-mgr,
        when: "(ceph_release_num[ceph_release] >= ceph_release_num.luminous) or
               (ceph_release_num[ceph_release] < ceph_release_num.luminous and rolling_update)" }

  post_tasks:
    - name: start ceph mgr
      systemd:
        name: ceph-mgr@{{ ansible_hostname }}
        state: started
        enabled: yes
      when:
        - not containerized_deployment

    - name: restart containerized ceph mgr
      systemd:
        name: ceph-mgr@{{ ansible_hostname }}
        state: restarted
        enabled: yes
        daemon_reload: yes
      when:
        - containerized_deployment


# OSD upgrade, one host per batch: stop the local OSD units, apply the roles,
# bring the OSDs back and hold the batch until the placement groups are clean.
- name: upgrade ceph osds cluster
  hosts:
    - "{{ osd_group_name|default('osds') }}"
  become: true
  serial: 1

  vars:
    upgrade_ceph_packages: true
    # Polling budget for the "waiting for clean pgs..." task.
    health_osd_check_retries: 40
    health_osd_check_delay: 30

  pre_tasks:
    # The OSD id is whatever follows the last '-' in each entry of
    # /var/lib/ceph/osd; nothing is listed when the directory is missing.
    - name: get osd numbers
      shell: "if [ -d /var/lib/ceph/osd ] ; then ls /var/lib/ceph/osd | sed 's/.*-//' ; fi"
      changed_when: false
      register: osd_ids
      when: not containerized_deployment

    - name: stop ceph osd
      systemd:
        name: "ceph-osd@{{ item }}"
        enabled: true
        state: stopped
      with_items: "{{ osd_ids.stdout_lines }}"
      when: not containerized_deployment

  roles:
    - role: ceph-defaults
    - role: ceph-common
      when: not containerized_deployment
    - role: ceph-docker-common
      when: containerized_deployment
    - role: ceph-config
    - role: ceph-osd

  post_tasks:
    # Listed again after the roles have run, before the units are started.
    - name: get osd numbers
      shell: "if [ -d /var/lib/ceph/osd ] ; then ls /var/lib/ceph/osd | sed 's/.*-//' ; fi"
      changed_when: false
      register: osd_ids
      when: not containerized_deployment

    - name: start ceph osd
      systemd:
        name: "ceph-osd@{{ item }}"
        enabled: true
        state: started
      with_items: "{{ osd_ids.stdout_lines }}"
      when: not containerized_deployment

    # Containerized OSD units are named after the basename of each entry in
    # 'devices'.
    - name: restart containerized ceph osd
      systemd:
        name: "ceph-osd@{{ item | basename }}"
        enabled: true
        state: restarted
        daemon_reload: true
      with_items: "{{ devices }}"
      when: containerized_deployment

    # Prefix that runs ceph commands inside the first monitor's container;
    # left undefined (and defaulted to '') for non-containerized deployments.
    - name: set_fact docker_exec_cmd_osd
      set_fact:
        docker_exec_cmd_update_osd: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }}"
      when: containerized_deployment

    - name: get num_pgs - non container
      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} -s --format json"
      delegate_to: "{{ groups[mon_group_name][0] }}"
      register: ceph_pgs

    # Clean means: exactly one entry in pgs_by_state and that entry is
    # "active+clean". Skipped when the cluster reports zero PGs.
    - name: waiting for clean pgs...
      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} -s --format json"
      delegate_to: "{{ groups[mon_group_name][0] }}"
      register: ceph_health_post
      retries: "{{ health_osd_check_retries }}"
      delay: "{{ health_osd_check_delay }}"
      until: >
        ((ceph_health_post.stdout | from_json).pgmap.pgs_by_state | length) == 1
        and
        (ceph_health_post.stdout | from_json).pgmap.pgs_by_state.0.state_name == "active+clean"
      when: (ceph_pgs.stdout | from_json).pgmap.num_pgs != 0


# Clears the flags set during the monitor upgrade and, unless this is a Jewel
# minor update, finalizes the move to Luminous once every OSD reports the same
# 12.x version.
- name: unset osd flags
  # Plain mapping; the list-of-dicts form of play vars is deprecated.
  vars:
    jewel_minor_update: false

  hosts:
    - "{{ mon_group_name|default('mons') }}"

  become: True

  roles:
    - ceph-defaults

  tasks:
    # Prefix that runs ceph commands inside the first monitor's container;
    # left undefined (and defaulted to '') for non-containerized deployments.
    - name: set_fact docker_exec_cmd_osd
      set_fact:
        docker_exec_cmd_update_osd: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }}"
      when:
        - containerized_deployment

    - name: unset osd flags
      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph osd unset {{ item }} --cluster {{ cluster }}"
      with_items:
        - noout
        - noscrub
        - nodeep-scrub
      delegate_to: "{{ groups[mon_group_name][0] }}"

    # '| bool' on jewel_minor_update: a value passed with '-e' is a string and
    # "false" would otherwise count as true.
    - name: get osd versions
      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} versions"
      register: ceph_versions
      delegate_to: "{{ groups[mon_group_name][0] }}"
      when:
        - not jewel_minor_update | bool

    - name: set_fact ceph_versions_osd
      set_fact:
        ceph_versions_osd: "{{ (ceph_versions.stdout|from_json).osd }}"
      delegate_to: "{{ groups[mon_group_name][0] }}"
      when:
        - not jewel_minor_update | bool

    # length == 1 means there is a single osds versions entry
    # thus all the osds are running the same version
    # 'search' is a Jinja test and is applied with 'is'; using it as a filter
    # ('| search') is deprecated. The jewel_minor_update guard comes first so
    # the remaining conditions are never evaluated against a skipped register.
    - name: complete osds upgrade
      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} osd require-osd-release luminous"
      delegate_to: "{{ groups[mon_group_name][0] }}"
      when:
        - not jewel_minor_update | bool
        - (ceph_versions.get('stdout', '{}')|from_json).get('osd', {}) | length == 1
        - (ceph_versions_osd | string) is search("ceph version 12")


# Metadata servers, one host per batch: stop the unit (non-container only),
# apply the roles, then start or restart the service.
- name: upgrade ceph mdss cluster
  hosts:
    - "{{ mds_group_name|default('mdss') }}"
  become: true
  serial: 1

  vars:
    upgrade_ceph_packages: true

  pre_tasks:
    - name: stop ceph mds
      systemd:
        name: "ceph-mds@{{ ansible_hostname }}"
        enabled: true
        state: stopped
      when: not containerized_deployment

  roles:
    - role: ceph-defaults
    - role: ceph-common
      when: not containerized_deployment
    - role: ceph-docker-common
      when: containerized_deployment
    - role: ceph-config
    - role: ceph-mds

  post_tasks:
    # Exactly one of the two tasks below runs, depending on the deployment type.
    - name: start ceph mds
      systemd:
        name: "ceph-mds@{{ ansible_hostname }}"
        enabled: true
        state: started
      when: not containerized_deployment

    - name: restart ceph mds
      systemd:
        name: "ceph-mds@{{ ansible_hostname }}"
        enabled: true
        state: restarted
        daemon_reload: true
      when: containerized_deployment


# Rados gateways, one host per batch: stop the unit (non-container only),
# apply the roles, then start or restart the service.
- name: upgrade ceph rgws cluster
  hosts:
    - "{{ rgw_group_name|default('rgws') }}"
  become: true
  serial: 1

  vars:
    upgrade_ceph_packages: true

  pre_tasks:
    - name: stop ceph rgw
      systemd:
        name: "ceph-radosgw@rgw.{{ ansible_hostname }}"
        enabled: true
        state: stopped
      when: not containerized_deployment

  roles:
    - role: ceph-defaults
    - role: ceph-common
      when: not containerized_deployment
    - role: ceph-docker-common
      when: containerized_deployment
    - role: ceph-config
    - role: ceph-rgw

  post_tasks:
    # Exactly one of the two tasks below runs, depending on the deployment type.
    - name: start ceph rgw
      systemd:
        name: "ceph-radosgw@rgw.{{ ansible_hostname }}"
        enabled: true
        state: started
      when: not containerized_deployment

    - name: restart containerized ceph rgw
      systemd:
        name: "ceph-radosgw@rgw.{{ ansible_hostname }}"
        enabled: true
        state: restarted
        daemon_reload: true
      when: containerized_deployment


# rbd-mirror daemons, one host per batch. Two unit names are stopped (and any
# failure ignored) before the roles run; afterwards only the
# rbd-mirror.<hostname> unit is started or restarted.
- name: upgrade ceph rbd mirror node
  hosts:
    - "{{ rbd_mirror_group_name|default('rbdmirrors') }}"
  become: true
  serial: 1

  vars:
    upgrade_ceph_packages: true

  pre_tasks:
    # NOTE(leseb): these tasks have a 'failed_when: false'
    # in case we run before luminous or after
    # Unit named after the local user; it is also disabled here.
    - name: stop ceph rbd mirror before luminous
      systemd:
        name: "ceph-rbd-mirror@{{ ceph_rbd_mirror_local_user }}"
        enabled: false
        state: stopped
      failed_when: false

    - name: stop ceph rbd mirror for and after luminous
      systemd:
        name: "ceph-rbd-mirror@rbd-mirror.{{ ansible_hostname }}"
        enabled: true
        state: stopped
      failed_when: false

  roles:
    - role: ceph-defaults
    - role: ceph-common
      when: not containerized_deployment
    - role: ceph-docker-common
      when: containerized_deployment
    - role: ceph-config
    - role: ceph-rbd-mirror

  post_tasks:
    # Exactly one of the two tasks below runs, depending on the deployment type.
    - name: start ceph rbd mirror
      systemd:
        name: "ceph-rbd-mirror@rbd-mirror.{{ ansible_hostname }}"
        enabled: true
        state: started
      when: not containerized_deployment

    - name: restart containerized ceph rbd mirror
      systemd:
        name: "ceph-rbd-mirror@rbd-mirror.{{ ansible_hostname }}"
        enabled: true
        state: restarted
        daemon_reload: true
      when: containerized_deployment


# NFS gateways, one host per batch: stop nfs-ganesha (non-container only),
# apply the roles, then bring the service back if ceph_nfs_enable_service is
# set.
- name: upgrade ceph nfs node
  hosts:
    - "{{ nfs_group_name|default('nfss') }}"
  become: true
  serial: 1

  vars:
    upgrade_ceph_packages: true

  pre_tasks:
    # failed_when: false is here so that if we upgrade
    # from a version of ceph that does not have nfs-ganesha
    # then this task will not fail
    - name: stop ceph nfs
      systemd:
        name: nfs-ganesha
        enabled: true
        state: stopped
      failed_when: false
      when: not containerized_deployment

  roles:
    - role: ceph-defaults
    - role: ceph-common
      when: not containerized_deployment
    - role: ceph-docker-common
      when: containerized_deployment
    - role: ceph-config
    # Applied from Luminous onwards, or on an older release when the run is
    # flagged as a rolling update.
    - role: ceph-nfs
      when: >-
        (ceph_release_num[ceph_release] >= ceph_release_num.luminous) or
        (ceph_release_num[ceph_release] < ceph_release_num.luminous and rolling_update)

  post_tasks:
    - name: start nfs gateway
      systemd:
        name: nfs-ganesha
        enabled: true
        state: started
      when:
        - not containerized_deployment
        - ceph_nfs_enable_service

    # The unit suffix falls back to the short hostname when
    # ceph_nfs_service_suffix is not defined.
    - name: systemd restart nfs container
      systemd:
        name: "ceph-nfs@{{ ceph_nfs_service_suffix | default(ansible_hostname) }}"
        enabled: true
        state: restarted
        daemon_reload: true
      when:
        - ceph_nfs_enable_service
        - containerized_deployment


# Client nodes, one host per batch: only the roles are applied, no service is
# stopped or started by this play.
- name: upgrade ceph client node
  hosts:
    - "{{ client_group_name|default('clients') }}"
  become: true
  serial: 1

  vars:
    upgrade_ceph_packages: true

  roles:
    - role: ceph-defaults
    - role: ceph-common
      when: not containerized_deployment
    - role: ceph-docker-common
      when: containerized_deployment
    - role: ceph-config
    - role: ceph-client


# Final play: runs 'ceph -s' through the first monitor of the group.
- name: show ceph status
  hosts:
    - "{{ mon_group_name|default('mons') }}"
  become: true

  roles:
    - role: ceph-defaults

  tasks:
    # Prefix that runs the command inside the first monitor's container; left
    # undefined (and defaulted to '') for non-containerized deployments.
    - name: set_fact docker_exec_cmd_status
      set_fact:
        docker_exec_cmd_status: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }}"
      when: containerized_deployment

    - name: show ceph status
      command: "{{ docker_exec_cmd_status|default('') }} ceph --cluster {{ cluster }} -s"
      delegate_to: "{{ groups[mon_group_name][0] }}"
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								---
 								# This playbook does a rolling update for all the Ceph services
-												rolling_update: clarify "serial" usage

Prior to this commit the serial variable was poorly documented. Now we
are making clear that this value should be left untouched as the rolling
update mechanism should happen serially.

Solves: bz-1396742
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-11-21 18:29:05 +08:00
+								#
 								# The value of 'serial:' adjusts the number of servers to be updated simultaneously.
 								# We recommend a value of 1, which means hosts of a group (e.g: monitor) will be
 								# upgraded one by one. It is really crucial for the update process to happen
 								# in a serialized fashion. DO NOT CHANGE THIS VALUE.
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								#
 								#
-												rolling_update: clarify update doc

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1490188
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-14 05:46:29 +08:00
+								# If you run a Ceph community version, you have to change the variable: ceph_stable_release to the new release
 								#
 								# If you run Red Hat Ceph Storage and are doing a **major** update (e.g: from 2 to 3), you have two options:
 								#   - if you use a CDN, you have to change the ceph_rhcs_version to a newer one
 								#   - if you use an ISO, you have to change the ceph_rhcs_iso_path to the directory containing the new Ceph version
 								#
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
-												rolling-upgrade: cleanup and cosmetic

refactoring the current code to apply the default syntax style that is
used in the entire playbook.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-01 00:13:47 +08:00
+								- name: confirm whether user really meant to upgrade the cluster
 								  hosts: localhost
-												rolling_update: do not require root to answer question

There is no need to ask for root on the local action. This will prompt
for a password the current user is not part of sudoers. That's
  unnecessary anyways.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1516947
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-12-16 00:39:32 +08:00
+								  become: false
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								  vars:
 								    - mgr_group_name: mgrs
-												rolling update: add mgr exception for jewel minor updates

When update from a minor Jewel version to another, the playbook will
fail on the task "fail if no mgr host is present in the inventory".
This now can be worked around by running Ansible with_items

-e jewel_minor_update=true

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1535382
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-01-17 22:18:11 +08:00
+								    - jewel_minor_update: False
-												rolling-upgrade: cleanup and cosmetic

refactoring the current code to apply the default syntax style that is
used in the entire playbook.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-01 00:13:47 +08:00
 								  vars_prompt:
 								    - name: ireallymeanit
 								      prompt: Are you sure you want to upgrade the cluster?
 								      default: 'no'
 								      private: no
 								  tasks:
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - name: exit playbook, if user did not mean to upgrade cluster
 								      fail:
 								        msg: >
 								          "Exiting rolling_update.yml playbook, cluster was NOT upgraded.
 								           To upgrade the cluster, either say 'yes' on the prompt or
 								           use `-e ireallymeanit=yes` on the command line when
 								           invoking the playbook"
 								      when: ireallymeanit != 'yes'
 								    - name: fail if no mgr host is present in the inventory
 								      fail:
 								        msg: "Please add a mgr host to your inventory."
 								      when:
-												rolling update: add mgr exception for jewel minor updates

When update from a minor Jewel version to another, the playbook will
fail on the task "fail if no mgr host is present in the inventory".
This now can be worked around by running Ansible with_items

-e jewel_minor_update=true

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1535382
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-01-17 22:18:11 +08:00
+								        - not jewel_minor_update
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								        - groups.get(mgr_group_name, []) | length == 0
-												rolling-upgrade: cleanup and cosmetic

refactoring the current code to apply the default syntax style that is
used in the entire playbook.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-01 00:13:47 +08:00
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
-												infrastructure-playbooks: fix syntax errors in all playbooks

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2016-10-26 05:56:58 +08:00
+								- name: gather facts and check the init system
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
-												infrastructure-playbooks: fix syntax errors in all playbooks

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2016-10-26 05:56:58 +08:00
+								  hosts:
-												rolling-update: do not set group name vars at playbook level

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2017-03-08 03:16:12 +08:00
+								    - "{{ mon_group_name|default('mons') }}"
 								    - "{{ osd_group_name|default('osds') }}"
 								    - "{{ mds_group_name|default('mdss') }}"
 								    - "{{ rgw_group_name|default('rgws') }}"
-												test: add mgr section to the host inventory file

Without this, we don't test the mgr role so we need to add it.

Co-Authored-by: Guillaume Abrioux <gabrioux@redhat.com>
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-04-11 20:20:11 +08:00
+								    - "{{ mgr_group_name|default('mgrs') }}"
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurence)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - "{{ rbd_mirror_group_name|default('rbdmirrors') }}"
 								    - "{{ nfs_group_name|default('nfss') }}"
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
+								    - "{{ client_group_name|default('clients') }}"
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
 								  become: True
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								  gather_facts: False
 								  vars:
 								    delegate_facts_host: True
-												gather facts first

there are vars like hostvars["rgws"]["ansible_hostname"] under
ceph-common

											
										
										
											2015-04-15 03:50:39 +08:00
+								  tasks:
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								    - debug: msg="gather facts on all Ceph hosts for following reference"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - name: gather facts
 								      # Runs the setup module against the current host only; skipped when
 								      # delegate_facts_host is true.
 								      setup:
 								      when:
 								        - not delegate_facts_host | bool
 								    - name: gather and delegate facts
 								      # Runs setup once per host in groups['all'], delegating each run to
 								      # that host; delegate_facts assigns the gathered facts to the
 								      # delegated host. Runs only when delegate_facts_host is true.
 								      setup:
 								      delegate_to: "{{ item }}"
 								      delegate_facts: True
 								      with_items: "{{ groups['all'] }}"
 								      when:
 								        - delegate_facts_host | bool
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								    - set_fact: rolling_update=true
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
+								- name: upgrade ceph mon cluster
-												Control when ceph packages get updated

Currently, all the ceph package installation resources use
"state=latest", which means subsequent runs of the ceph playbooks
could result in ceph being upgraded if there are package updates
available in the selected repo.

This commit adds a new variable to ceph-common called
'upgrade_ceph_packages' which defaults to False.  This variable is used
in the package installation resources for ceph packages to determine if
the resource should use "state=present" or "state=latest".  If the
variable gets set to True, "state=latest" will be used.

Additionally, we update rolling_update.yml to override
upgrade_ceph_packages to true to permit package upgrades in this
context specifically.

Closes issue #506

											
										
										
											2016-01-29 23:54:59 +08:00
+								  vars:
-												upgrade: add custom timeout options

This commit introduces the ability to configure delays and retries for
cluster health checks, for both monitors and OSDs.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-03 17:24:59 +08:00
+								    health_mon_check_retries: 5
-												rolling_update: set health_mon_check_delay to 15

The old value of 10 did not give enough time for a containerized mon to
pass the health check.

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2017-06-13 05:07:52 +08:00
+								    health_mon_check_delay: 15
-												rolling_update: add variable to upgrade ceph

My stupid self removed this crucial variable here: 217ce3ca thinking it
was another hard coded variable import where this is actually the
trigger for the upgrade.

Closes: #1071

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-11-05 00:31:02 +08:00
+								    upgrade_ceph_packages: True
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
+								  hosts:
-												rolling-update: do not set group name vars at playbook level

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2017-03-08 03:16:12 +08:00
+								    - "{{ mon_group_name|default('mons') }}"
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
 								  serial: 1
 								  become: True
-												rolling update: stop MONs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:40:31 +08:00
+								  pre_tasks:
-												Warn user when upgrading cluster with only one mon

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-15 03:04:43 +08:00
+								    - name: set mon_host_count
-												Resolve issues when groups names not in default value.

											
										
										
											2017-03-24 14:40:15 +08:00
+								      set_fact: mon_host_count={{ groups[mon_group_name] | length }}
-												Warn user when upgrading cluster with only one mon

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-15 03:04:43 +08:00
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								    - debug: msg="WARNING - upgrading a ceph cluster with only one monitor node ({{ inventory_hostname }})"
-												Warn user when upgrading cluster with only one mon

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-15 03:04:43 +08:00
+								      when: mon_host_count | int == 1
-												rolling update: stop MONs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:40:31 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: fail when single containerized monitor
 								      fail:
 								        msg: "Upgrades of a single monitor are not supported, also running 1 monitor is not recommended always use 3."
 								      when:
 								        - containerized_deployment
 								        - mon_host_count | int == 1
-												rolling update: stop MONs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:40:31 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: stop ceph mon
 								      systemd:
-												rolling update: stop MONs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:40:31 +08:00
+								        name: ceph-mon@{{ ansible_hostname }}
 								        state: stopped
 								        enabled: yes
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												rolling update: stop MONs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:40:31 +08:00
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								  roles:
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
+								    - ceph-defaults
-												Move role dependencies in site.yml/site-docker.yml

This will give us more flexibility and avoid a lot of useless when
skipping all tasks from a non-desired role.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:48:13 +08:00
+								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - ceph-config
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
+								    - ceph-mon
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								  post_tasks:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: start ceph mon
 								      systemd:
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								        name: ceph-mon@{{ ansible_hostname }}
-												rolling update: stop MONs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:40:31 +08:00
+								        state: started
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								        enabled: yes
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: restart containerized ceph mon
 								      systemd:
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								        name: ceph-mon@{{ ansible_hostname }}
 								        state: restarted
 								        enabled: yes
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								        daemon_reload: yes
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - containerized_deployment
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								    - name: set mon_host_count
-												Resolve issues when groups names not in default value.

											
										
										
											2017-03-24 14:40:15 +08:00
+								      set_fact: mon_host_count={{ groups[mon_group_name] | length }}
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								    - name: select a running monitor if multiple monitors
-												make sure a running mon to check when upgrade mon

											
										
										
											2015-04-17 10:04:52 +08:00
+								      set_fact: mon_host={{ item }}
-												Resolve issues when groups names not in default value.

											
										
										
											2017-03-24 14:40:15 +08:00
+								      with_items: "{{ groups[mon_group_name] }}"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      when:
 								        - mon_host_count | int > 1
 								        - item != inventory_hostname
 								    - name: select first monitor if only one monitor
 								      set_fact: mon_host={{ item }}
-												Resolve issues when groups names not in default value.

											
										
										
											2017-03-24 14:40:15 +08:00
+								      with_items: "{{ groups[mon_group_name][0] }}"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      when:
 								        - mon_host_count | int == 1
-												make sure a running mon to check when upgrade mon

											
										
										
											2015-04-17 10:04:52 +08:00
-												rolling_update: perform pg check when pgs_num > 0

If num_pgs = 0 the check will never return 0.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-07 06:46:46 +08:00
+								    - name: non container | waiting for the monitor to join the quorum...
-												rolling_update: clarify mon quorum command

Cleaner.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 06:10:57 +08:00
+								      command: ceph --cluster "{{ cluster }}" -s --format json
 								      register: ceph_health_raw
 								      until: >
-												update: look for short and fqdn in ceph_health_raw

According to hostname configuration, the task waiting for mons to be in
quorum might fail.
The idea here is to look for both shortname and fqdn in
`ceph_health_raw` instead of just `ansible_hostname`

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1546127

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-02-16 20:45:26 +08:00
+								        hostvars[mon_host]['ansible_hostname'] in (ceph_health_raw.stdout | from_json)["quorum_names"] or
 								        hostvars[mon_host]['ansible_fqdn'] in (ceph_health_raw.stdout | from_json)["quorum_names"]
-												upgrade: add custom timeout options

This commit introduces the ability to configure delays and retries for
cluster health checks, for both monitors and OSDs.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-03 17:24:59 +08:00
+								      retries: "{{ health_mon_check_retries }}"
 								      delay: "{{ health_mon_check_delay }}"
-												make sure a running mon to check when upgrade mon

											
										
										
											2015-04-17 10:04:52 +08:00
+								      delegate_to: "{{ mon_host }}"
-												rolling_update: clarify mon quorum command

Cleaner.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 06:10:57 +08:00
+								      when:
 								        - not containerized_deployment
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
-												rolling_update: perform pg check when pgs_num > 0

If num_pgs = 0 the check will never return 0.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-07 06:46:46 +08:00
+								    - name: container | waiting for the containerized monitor to join the quorum...
-												rolling_update: clarify mon quorum command

Cleaner.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 06:10:57 +08:00
+								      command: docker exec ceph-mon-{{ hostvars[mon_host]['ansible_hostname'] }} ceph --cluster "{{ cluster }}" -s --format json
 								      register: ceph_health_raw
 								      until: >
-												update: look for short and fqdn in ceph_health_raw

According to hostname configuration, the task waiting for mons to be in
quorum might fail.
The idea here is to look for both shortname and fqdn in
`ceph_health_raw` instead of just `ansible_hostname`

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1546127

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-02-16 20:45:26 +08:00
+								        hostvars[mon_host]['ansible_hostname'] in (ceph_health_raw.stdout | from_json)["quorum_names"] or
 								        hostvars[mon_host]['ansible_fqdn'] in (ceph_health_raw.stdout | from_json)["quorum_names"]
-												upgrade: add custom timeout options

This commit introduces the ability to configure delays and retries for
cluster health checks, for both monitors and OSDs.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-03 17:24:59 +08:00
+								      retries: "{{ health_mon_check_retries }}"
 								      delay: "{{ health_mon_check_delay }}"
-												make sure a running mon to check when upgrade mon

											
										
										
											2015-04-17 10:04:52 +08:00
+								      delegate_to: "{{ mon_host }}"
-												rolling_update: clarify mon quorum command

Cleaner.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 06:10:57 +08:00
+								      when:
 								        - containerized_deployment
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												rolling_update: move osd flag section

During a minor update from a jewel to a higher jewel version (10.2.9 to
10.2.10 for example) osd flags don't get applied because they were done
in the mgr section which is skipped in jewel since this daemon does not
exist.
Moving the set flag section after all the mons have been updated solves
that problem.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1548071
Co-authored-by: Tomas Petr <tpetr@redhat.com>
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-05-16 22:02:41 +08:00
+								    - name: set osd flags
 								      # Non-containerized path: runs `ceph osd set` once for each of
 								      # noout, noscrub and nodeep-scrub, delegated to mon_host.
 								      command: ceph --cluster {{ cluster }} osd set {{ item }}
 								      with_items:
 								        - noout
 								        - noscrub
 								        - nodeep-scrub
 								      delegate_to: "{{ mon_host }}"
 								      when: not containerized_deployment
 								    - name: set containerized osd flags
 								      # Containerized path: sets the same three flags, but runs the ceph
 								      # CLI through `docker exec` in the ceph-mon-<hostname> container
 								      # on mon_host.
 								      command: |
 								        docker exec ceph-mon-{{ hostvars[mon_host]['ansible_hostname'] }} ceph --cluster {{ cluster }} osd set {{ item }}
 								      with_items:
 								        - noout
 								        - noscrub
 								        - nodeep-scrub
 								      delegate_to: "{{ mon_host }}"
 								      when: containerized_deployment
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurence)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
 								- name: upgrade ceph mgr node
 								  vars:
 								    upgrade_ceph_packages: True
 								  hosts:
 								    - "{{ mgr_group_name|default('mgrs') }}"
 								  serial: 1
 								  become: True
 								  pre_tasks:
-												rolling_update: fix get fsid for containers

When running ansible2.4-update_docker_cluster there is an issue on the
"get current fsid" task. The current task only works for
non-containerized deployment but will run all the time (even for
containerized). This currently results in the following error:

TASK [get current fsid] ********************************************************
task path: /home/jenkins-build/build/workspace/ceph-ansible-prs-luminous-ansible2.4-update_docker_cluster/rolling_update.yml:214
Tuesday 22 May 2018  22:48:32 +0000 (0:00:02.615)       0:11:01.035 ***********
fatal: [mgr0 -> mon0]: FAILED! => {
    "changed": true,
    "cmd": [
        "ceph",
        "--cluster",
        "test",
        "fsid"
    ],
    "delta": "0:05:00.260674",
    "end": "2018-05-22 22:53:34.555743",
    "rc": 1,
    "start": "2018-05-22 22:48:34.295069"
}

STDERR:

2018-05-22 22:48:34.495651 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).connect protocol feature mismatch, my 83ffffffffffff < peer 481dff8eea4fffb missing 400000000000000
2018-05-22 22:48:34.495684 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).fault

This is not really representative of the real error since the 'ceph' cli is available on that machine.
On other environments we will have something like "command not found: ceph".

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-05-23 07:52:40 +08:00
+								    - name: non container - get current fsid
-												rolling_update: get fsid in mgr pre_task

{{ fsid }} points to {{ cluster_uuid.stdout }} which is not defined in
this part of the rolling_update playbook.
Since we need to call {{ fsid }} we must get the fsid and register it to
`cluster_uuid`.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-05-11 14:05:11 +08:00
+								      command: "ceph --cluster {{ cluster }} fsid"
-												rolling_update: fix get fsid for containers

When running ansible2.4-update_docker_cluster there is an issue on the
"get current fsid" task. The current task only works for
non-containerized deployment but will run all the time (even for
containerized). This currently results in the following error:

TASK [get current fsid] ********************************************************
task path: /home/jenkins-build/build/workspace/ceph-ansible-prs-luminous-ansible2.4-update_docker_cluster/rolling_update.yml:214
Tuesday 22 May 2018  22:48:32 +0000 (0:00:02.615)       0:11:01.035 ***********
fatal: [mgr0 -> mon0]: FAILED! => {
    "changed": true,
    "cmd": [
        "ceph",
        "--cluster",
        "test",
        "fsid"
    ],
    "delta": "0:05:00.260674",
    "end": "2018-05-22 22:53:34.555743",
    "rc": 1,
    "start": "2018-05-22 22:48:34.295069"
}

STDERR:

2018-05-22 22:48:34.495651 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).connect protocol feature mismatch, my 83ffffffffffff < peer 481dff8eea4fffb missing 400000000000000
2018-05-22 22:48:34.495684 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).fault

This is not really representative of the real error since the 'ceph' cli is available on that machine.
On other environments we will have something like "command not found: ceph".

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-05-23 07:52:40 +08:00
+								      register: cluster_uuid_non_container
-												rolling_update: get fsid in mgr pre_task

{{ fsid }} points to {{ cluster_uuid.stdout }} which is not defined in
this part of the rolling_update playbook.
Since we need to call {{ fsid }} we must get the fsid and register it to
`cluster_uuid`.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-05-11 14:05:11 +08:00
+								      delegate_to: "{{ groups[mon_group_name][0] }}"
-												rolling_update: fix get fsid for containers

When running ansible2.4-update_docker_cluster there is an issue on the
"get current fsid" task. The current task only works for
non-containerized deployment but will run all the time (even for
containerized). This currently results in the following error:

TASK [get current fsid] ********************************************************
task path: /home/jenkins-build/build/workspace/ceph-ansible-prs-luminous-ansible2.4-update_docker_cluster/rolling_update.yml:214
Tuesday 22 May 2018  22:48:32 +0000 (0:00:02.615)       0:11:01.035 ***********
fatal: [mgr0 -> mon0]: FAILED! => {
    "changed": true,
    "cmd": [
        "ceph",
        "--cluster",
        "test",
        "fsid"
    ],
    "delta": "0:05:00.260674",
    "end": "2018-05-22 22:53:34.555743",
    "rc": 1,
    "start": "2018-05-22 22:48:34.295069"
}

STDERR:

2018-05-22 22:48:34.495651 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).connect protocol feature mismatch, my 83ffffffffffff < peer 481dff8eea4fffb missing 400000000000000
2018-05-22 22:48:34.495684 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).fault

This is not really representative of the real error since the 'ceph' cli is available on that machine.
On other environments we will have something like "command not found: ceph".

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-05-23 07:52:40 +08:00
+								      when:
 								        - not containerized_deployment
 								    # Containerized variant of the fsid lookup: the query is executed inside
 								    # the first monitor's container via `docker exec` instead of calling the
 								    # `ceph` CLI directly on the host.
 								    - name: container - get current fsid
 								      command: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }} ceph --cluster {{ cluster }} fsid"
 								      register: cluster_uuid_container
 								      # Read-only query: never report this task as "changed".
 								      changed_when: false
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
 								      when:
 								        - containerized_deployment
 								    # Expose the fsid under a single fact name regardless of deployment type:
 								    # take the output of the container lookup when containerized_deployment
 								    # is set, otherwise the output of the non-container lookup.
 								    - name: set_fact ceph_cluster_fsid
 								      set_fact:
 								        ceph_cluster_fsid: "{{ cluster_uuid_container.stdout if containerized_deployment else cluster_uuid_non_container.stdout }}"
-												rolling_update: get fsid in mgr pre_task

{{ fsid }} points to {{ cluster_uuid.stdout }} which is not defined in
this part of the rolling_update playbook.
Since we need to call {{ fsid }} we must get the fsid and register it to
`cluster_uuid`.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-05-11 14:05:11 +08:00
-												rolling_update: move mgr key creation

Until all the mons have been updated to Luminous, there is no way to
create a key. So we should do the key creation in the mon role only if
we are not part of an update.
If we are then the key creation is done after the mons upgrade to
Luminous.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1574995
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-05-11 01:38:55 +08:00
+								    - name: non container | create ceph mgr keyring(s)
 								      # Runs on the first monitor, once per host of the mgr group. `creates`
 								      # makes the command a no-op when the keyring file is already present.
 								      command: "ceph --cluster {{ cluster }} auth get-or-create mgr.{{ hostvars[item]['ansible_hostname'] }} mon 'allow profile mgr' osd 'allow *' mds 'allow *' -o /etc/ceph/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
 								      args:
 								        creates: "{{ ceph_conf_key_directory }}/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
 								      changed_when: false
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
 								      with_items:
 								        - "{{ groups.get(mgr_group_name, []) }}"
 								      # `when` entries are already evaluated as Jinja2 expressions, so they
 								      # are written bare (no {{ }}) to avoid Ansible's templating warning.
 								      when:
 								        - not containerized_deployment
 								        - groups.get(mgr_group_name, []) | length > 0
 								    - name: container | create ceph mgr keyring(s)
 								      # Same keyring creation as the non-container task, but the `ceph`
 								      # command is executed inside the first monitor's container.
 								      command: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }} ceph --cluster {{ cluster }} auth get-or-create mgr.{{ hostvars[item]['ansible_hostname'] }} mon 'allow profile mgr' osd 'allow *' mds 'allow *' -o /etc/ceph/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
 								      args:
 								        creates: "{{ ceph_conf_key_directory }}/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
 								      changed_when: false
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
 								      with_items:
 								        - "{{ groups.get(mgr_group_name, []) }}"
 								      # `when` entries are already evaluated as Jinja2 expressions, so they
 								      # are written bare (no {{ }}) to avoid Ansible's templating warning.
 								      when:
 								        - containerized_deployment
 								        - groups.get(mgr_group_name, []) | length > 0
 								    - name: fetch ceph mgr key(s)
 								      fetch:
 								        src: "{{ ceph_conf_key_directory }}/{{ cluster }}.mgr.{{ hostvars[item]['ansible_hostname'] }}.keyring"
-												rolling_update: fix get fsid for containers

When running ansible2.4-update_docker_cluster there is an issue on the
"get current fsid" task. The current task only works for
non-containerized deployment but will run all the time (even for
containerized). This currently results in the following error:

TASK [get current fsid] ********************************************************
task path: /home/jenkins-build/build/workspace/ceph-ansible-prs-luminous-ansible2.4-update_docker_cluster/rolling_update.yml:214
Tuesday 22 May 2018  22:48:32 +0000 (0:00:02.615)       0:11:01.035 ***********
fatal: [mgr0 -> mon0]: FAILED! => {
    "changed": true,
    "cmd": [
        "ceph",
        "--cluster",
        "test",
        "fsid"
    ],
    "delta": "0:05:00.260674",
    "end": "2018-05-22 22:53:34.555743",
    "rc": 1,
    "start": "2018-05-22 22:48:34.295069"
}

STDERR:

2018-05-22 22:48:34.495651 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).connect protocol feature mismatch, my 83ffffffffffff < peer 481dff8eea4fffb missing 400000000000000
2018-05-22 22:48:34.495684 7f89482c6700  0 -- 192.168.17.10:0/1022712 >> 192.168.17.12:6789/0 pipe(0x7f8944067010 sd=4 :42654 s=1 pgs=0 cs=0 l=1 c=0x7f894405d510).fault

This is not really representative of the real error since the 'ceph' cli is available on that machine.
On other environments we will have something like "command not found: ceph".

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-05-23 07:52:40 +08:00
+								        dest: "{{ fetch_directory }}/{{ ceph_cluster_fsid }}/{{ ceph_conf_key_directory }}/"
-												rolling_update: move mgr key creation

Until all the mons have been updated to Luminous, there is no way to
create a key. So we should do the key creation in the mon role only if
we are not part of an update.
If we are then the key creation is done after the mons upgrade to
Luminous.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1574995
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2018-05-11 01:38:55 +08:00
+								        flat: yes
 								        fail_on_missing: no
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
 								      with_items:
 								        - "{{ groups.get(mgr_group_name, []) }}"
 								    # The following task has a failed_when: false
 								    # to handle the scenario where no mgr existed before the upgrade
 								    # or if we run a Ceph cluster before Luminous
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: stop ceph mgr
 								      # Host-managed (non-container) deployments only. Failures are ignored
 								      # on purpose so a host without a running mgr unit does not abort the play.
 								      when: not containerized_deployment
 								      failed_when: false
 								      systemd:
 								        state: stopped
 								        enabled: yes
 								        name: "ceph-mgr@{{ ansible_hostname }}"
 								  roles:
 								    - ceph-defaults
 								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												upgrade: fix upgrade jewel to luminous for mgr nodes

mgr nodes can't be upgraded from jewel to luminous because ceph-mgr role
is skipped because of the condition `when:
"ceph_release_num[ceph_release] >= ceph_release_num.luminous"`. Indeed,
ceph-mgr package is upgraded in `ceph-mgr` role, therefore,
`ceph_release` is still set to the old version. It means the when can't
be satisfied.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>
(cherry picked from commit 302e563601cd6820b1ae44fabdfb1506688c7c9b)

											
										
										
											2017-10-19 21:07:58 +08:00
+								    - ceph-config
 								    - { role: ceph-mgr,
 								        when: "(ceph_release_num[ceph_release] >= ceph_release_num.luminous) or
 								               (ceph_release_num[ceph_release] < ceph_release_num.luminous and rolling_update)" }
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
 								  post_tasks:
 								    - name: start ceph mgr
 								      # Non-container deployments: bring the mgr unit back up and keep it
 								      # enabled at boot.
 								      when: not containerized_deployment
 								      systemd:
 								        state: started
 								        enabled: yes
 								        name: "ceph-mgr@{{ ansible_hostname }}"
 								    - name: restart containerized ceph mgr
 								      # Container deployments: reload systemd's unit definitions, then
 								      # restart the mgr unit and keep it enabled at boot.
 								      when: containerized_deployment
 								      systemd:
 								        daemon_reload: yes
 								        state: restarted
 								        enabled: yes
 								        name: "ceph-mgr@{{ ansible_hostname }}"
-												rolling_update: nicer way to set osd flags

Prior to this patch, we were applying the osd flags like this:

"
General pre tasks
Set flags
Upgrade OSDs on a host
Unset flags <-- this triggers pending scrub to start
Set flags
Upgrade OSDs on a hosts
Unset flags <-- this triggers pending scrub to start
.
.
.
General post tasks
"

Now instead, we apply the flag once before starting the OSD update and
unset them once the last OSD is finished.

"
General pre tasks
Set flags and wait for any scrubs to finish
Upgrade OSDs on a host
Upgrade OSDs on a host
.
.
.
Unset flags
General post tasks
"

Fixes: https://bugzilla.redhat.com/show_bug.cgi?id=1450754
Signed-off-by: Sébastien Han <seb@redhat.com>
Co-Authored-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-05-12 21:59:52 +08:00
 								- name: upgrade ceph osds cluster
 								  vars:
 								    health_osd_check_retries: 40
 								    health_osd_check_delay: 30
 								    upgrade_ceph_packages: True
 								  hosts:
 								    - "{{ osd_group_name|default('osds') }}"
 								  serial: 1
 								  become: True
 								  pre_tasks:
-												rolling update: stop OSDs before upgrading

This avoids a bug where OSDs are sometimes restarted twice on
upgrades which leaves the OSD process running but not marked up.

See:

https://bugzilla.redhat.com/show_bug.cgi?id=1394928
https://bugzilla.redhat.com/show_bug.cgi?id=1391675
https://bugzilla.redhat.com/show_bug.cgi?id=1394929

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:25:46 +08:00
+								    - name: get osd numbers
-												playbook: homogenize the way list osd ids

Problem: too many different commands to do the same thing. The 'cut'
command on infrastructure-playbooks/purge-cluster.yml was also wrong.
This sed command from osixia in ceph-docker
https://github.com/ceph/ceph-docker/pull/580/ addresses all the
scenarios.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-03-30 17:51:38 +08:00
+								      shell: "if [ -d /var/lib/ceph/osd ] ; then ls /var/lib/ceph/osd | sed 's/.*-//' ; fi"
-												rolling update: stop OSDs before upgrading

This avoids a bug where OSDs are sometimes restarted twice on
upgrades which leaves the OSD process running but not marked up.

See:

https://bugzilla.redhat.com/show_bug.cgi?id=1394928
https://bugzilla.redhat.com/show_bug.cgi?id=1391675
https://bugzilla.redhat.com/show_bug.cgi?id=1394929

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:25:46 +08:00
+								      register: osd_ids
 								      changed_when: false
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								      when: not containerized_deployment
-												rolling update: stop OSDs before upgrading

This avoids a bug where OSDs are sometimes restarted twice on
upgrades which leaves the OSD process running but not marked up.

See:

https://bugzilla.redhat.com/show_bug.cgi?id=1394928
https://bugzilla.redhat.com/show_bug.cgi?id=1391675
https://bugzilla.redhat.com/show_bug.cgi?id=1394929

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:25:46 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: stop ceph osd
 								      systemd:
 								        name: ceph-osd@{{ item }}
-												rolling update: stop OSDs before upgrading

This avoids a bug where OSDs are sometimes restarted twice on
upgrades which leaves the OSD process running but not marked up.

See:

https://bugzilla.redhat.com/show_bug.cgi?id=1394928
https://bugzilla.redhat.com/show_bug.cgi?id=1391675
https://bugzilla.redhat.com/show_bug.cgi?id=1394929

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:25:46 +08:00
+								        state: stopped
 								        enabled: yes
 								      with_items: "{{ osd_ids.stdout_lines }}"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												rolling update: stop OSDs before upgrading

This avoids a bug where OSDs are sometimes restarted twice on
upgrades which leaves the OSD process running but not marked up.

See:

https://bugzilla.redhat.com/show_bug.cgi?id=1394928
https://bugzilla.redhat.com/show_bug.cgi?id=1391675
https://bugzilla.redhat.com/show_bug.cgi?id=1394929

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:25:46 +08:00
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								  roles:
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
+								    - ceph-defaults
-												Move role dependencies in site.yml/site-docker.yml

This will give us more flexibility and avoid a lot of useless when
skipping all tasks from a non-desired role.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:48:13 +08:00
+								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - ceph-config
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
+								    - ceph-osd
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								  post_tasks:
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								    - name: get osd numbers
-												playbook: homogenize the way list osd ids

Problem: too many different commands to do the same thing. The 'cut'
command on infrastructure-playbooks/purge-cluster.yml was also wrong.
This sed command from osixia in ceph-docker
https://github.com/ceph/ceph-docker/pull/580/ addresses all the
scenarios.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-03-30 17:51:38 +08:00
+								      shell: "if [ -d /var/lib/ceph/osd ] ; then ls /var/lib/ceph/osd | sed 's/.*-//' ; fi"
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								      register: osd_ids
 								      changed_when: false
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								      when: not containerized_deployment
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: start ceph osd
 								      systemd:
 								        name: ceph-osd@{{ item }}
-												rolling update: stop OSDs before upgrading

This avoids a bug where OSDs are sometimes restarted twice on
upgrades which leaves the OSD process running but not marked up.

See:

https://bugzilla.redhat.com/show_bug.cgi?id=1394928
https://bugzilla.redhat.com/show_bug.cgi?id=1391675
https://bugzilla.redhat.com/show_bug.cgi?id=1394929

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:25:46 +08:00
+								        state: started
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								        enabled: yes
 								      with_items: "{{ osd_ids.stdout_lines }}"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: restart containerized ceph osd
 								      systemd:
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								        name: ceph-osd@{{ item | basename }}
 								        state: restarted
 								        enabled: yes
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								        daemon_reload: yes
-												osd: allow multi dedicated journals for containers

Fix: https://bugzilla.redhat.com/show_bug.cgi?id=1475820
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-07-25 23:54:26 +08:00
+								      with_items: "{{ devices }}"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - containerized_deployment
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												infra: use the pg check in the right place

Use the pg check before doing the pg check, not on the quorum check.
Also never quote int when doing comparison.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-08 20:45:48 +08:00
+								    - name: set_fact docker_exec_cmd_osd
 								      set_fact:
 								        docker_exec_cmd_update_osd: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }}"
-												rolling update: skip pg check if num_pgs = 0

In our test case we don't have any pgs, thus the check fails. The check
always returns an empty array, which makes the comparison fail.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-08-23 18:31:15 +08:00
+								      when:
-												infra: use the pg check in the right place

Use the pg check before doing the pg check, not on the quorum check.
Also never quote int when doing comparison.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-08 20:45:48 +08:00
+								        - containerized_deployment
 								    - name: get num_pgs - non container
 								      # NOTE: despite the "non container" label, the command is prefixed with
 								      # docker_exec_cmd_update_osd when that fact is set (empty otherwise).
 								      # The cluster status JSON is queried on the first monitor.
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
 								      register: ceph_pgs
 								      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} -s --format json"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
-												infra: use the pg check in the right place

Use the pg check before doing the pg check, not on the quorum check.
Also never quote int when doing comparison.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-08 20:45:48 +08:00
+								    - name: waiting for clean pgs...
 								      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} -s --format json"
-												update: nicer way to wait for clean pgs

More comprehensive and friendly to read.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 20:46:26 +08:00
+								      register: ceph_health_post
 								      until: >
 								        ((ceph_health_post.stdout | from_json).pgmap.pgs_by_state | length) == 1
 								        and
 								        (ceph_health_post.stdout | from_json).pgmap.pgs_by_state.0.state_name == "active+clean"
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      retries: "{{ health_osd_check_retries }}"
 								      delay: "{{ health_osd_check_delay }}"
-												rolling update: skip pg check if num_pgs = 0

In our test case we don't have any pgs, thus the check fails. The check
always returns an empty array, which makes the comparison fail.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-08-23 18:31:15 +08:00
+								      when:
-												infra: use the pg check in the right place

Use the pg check before doing the pg check, not on the quorum check.
Also never quote int when doing comparison.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-08 20:45:48 +08:00
+								        - (ceph_pgs.stdout | from_json).pgmap.num_pgs != 0
-												rolling_update: nicer way to set osd flags

Prior to this patch, we were applying the osd flags like this:

"
General pre tasks
Set flags
Upgrade OSDs on a host
Unset flags <-- this triggers pending scrub to start
Set flags
Upgrade OSDs on a host
Unset flags <-- this triggers pending scrub to start
.
.
.
General post tasks
"

Now instead, we apply the flag once before starting the OSD update and
unset them once the last OSD is finished.

"
General pre tasks
Set flags and wait for any scrubs to finish
Upgrade OSDs on a host
Upgrade OSDs on a host
.
.
.
Unset flags
General post tasks
"

Fixes: https://bugzilla.redhat.com/show_bug.cgi?id=1450754
Signed-off-by: Sébastien Han <seb@redhat.com>
Co-Authored-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-05-12 21:59:52 +08:00
 								- name: unset osd flags
-												rolling update: fix undefined jewel_minor_update failure

Variables set at the play level with ``vars`` do
not carry over into the next play in the playbook.

The var jewel_minor_update was set in a previous play but
used in this one and was failing because it was not defined.

Resolves: https://bugzilla.redhat.com/show_bug.cgi?id=1544029

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2018-02-13 04:52:27 +08:00
+								  vars:
 								    - jewel_minor_update: False
-												rolling_update: nicer way to set osd flags

Prior to this patch, we were applying the osd flags like this:

"
General pre tasks
Set flags
Upgrade OSDs on a host
Unset flags <-- this triggers pending scrub to start
Set flags
Upgrade OSDs on a host
Unset flags <-- this triggers pending scrub to start
.
.
.
General post tasks
"

Now instead, we apply the flag once before starting the OSD update and
unset them once the last OSD is finished.

"
General pre tasks
Set flags and wait for any scrubs to finish
Upgrade OSDs on a host
Upgrade OSDs on a host
.
.
.
Unset flags
General post tasks
"

Fixes: https://bugzilla.redhat.com/show_bug.cgi?id=1450754
Signed-off-by: Sébastien Han <seb@redhat.com>
Co-Authored-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-05-12 21:59:52 +08:00
 								  hosts:
 								    - "{{ mon_group_name|default('mons') }}"
 								  become: True
 								  roles:
 								    - ceph-defaults
 								  tasks:
-												update: fix var register

Even if the task is skipped, ansible registers the var as 'skipped' so
this breaks the task using this variable on its next usage.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 18:05:43 +08:00
+								    - name: set_fact docker_exec_cmd_osd
 								      set_fact:
 								        docker_exec_cmd_update_osd: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }}"
 								      when:
 								        - containerized_deployment
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
-												update: fix var register

Even if the task is skipped, ansible registers the var as 'skipped' so
this breaks the task using this variable on its next usage.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 18:05:43 +08:00
+								    - name: unset osd flags
 								      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph osd unset {{ item }} --cluster {{ cluster }}"
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      with_items:
 								        - noout
 								        - noscrub
 								        - nodeep-scrub
-												Resolve issues when groups names not in default value.

											
										
										
											2017-03-24 14:40:15 +08:00
+								      delegate_to: "{{ groups[mon_group_name][0] }}"
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												update: complete luminous upgrade

Once we complete the upgrade to Luminous, we must issue a specific
command. For more info read:
http://ceph.com/community/new-luminous-upgrade-complete/

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 21:27:27 +08:00
+								    - name: get osd versions
-												update: fix var register

Even if the task is skipped, ansible registers the var as 'skipped' so
this breaks the task using this variable on its next usage.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 18:05:43 +08:00
+								      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} versions"
-												update: complete luminous upgrade

Once we complete the upgrade to Luminous, we must issue a specific
command. For more info read:
http://ceph.com/community/new-luminous-upgrade-complete/

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 21:27:27 +08:00
+								      register: ceph_versions
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
-												upgrade: skip luminous tasks for jewel minor update

These tasks are needed only when upgrading to luminous.
They are not needed in Jewel minor upgrade and by the way, they fail because
`ceph versions` command doesn't exist.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-01-25 23:57:45 +08:00
+								      when:
 								        - not jewel_minor_update
-												update: complete luminous upgrade

Once we complete the upgrade to Luminous, we must issue a specific
command. For more info read:
http://ceph.com/community/new-luminous-upgrade-complete/

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 21:27:27 +08:00
 								    - name: set_fact ceph_versions_osd
 								      set_fact:
 								        ceph_versions_osd: "{{ (ceph_versions.stdout|from_json).osd }}"
 								      delegate_to: "{{ groups[mon_group_name][0] }}"
-												upgrade: skip luminous tasks for jewel minor update

These tasks are needed only when upgrading to luminous.
They are not needed in Jewel minor upgrade and by the way, they fail because
`ceph versions` command doesn't exist.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-01-25 23:57:45 +08:00
+								      when:
 								        - not jewel_minor_update
-												update: complete luminous upgrade

Once we complete the upgrade to Luminous, we must issue a specific
command. For more info read:
http://ceph.com/community/new-luminous-upgrade-complete/

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 21:27:27 +08:00
 								    # length == 1 means there is a single osds versions entry
 								    # thus all the osds are running the same version
 								    - name: complete osds upgrade
-												update: fix var register

Even if the task is skipped, ansible registers the var as 'skipped' so
this breaks the task using this variable on its next usage.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-29 18:05:43 +08:00
+								      command: "{{ docker_exec_cmd_update_osd|default('') }} ceph --cluster {{ cluster }} osd require-osd-release luminous"
-												update: complete luminous upgrade

Once we complete the upgrade to Luminous, we must issue a specific
command. For more info read:
http://ceph.com/community/new-luminous-upgrade-complete/

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 21:27:27 +08:00
+								      delegate_to: "{{ groups[mon_group_name][0] }}"
 								      when:
-												upgrade: skip luminous tasks for jewel minor update

These tasks are needed only when upgrading to luminous.
They are not needed in Jewel minor upgrade and by the way, they fail because
`ceph versions` command doesn't exist.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-01-25 23:57:45 +08:00
+								        - (ceph_versions.get('stdout', '{}')|from_json).get('osd', {}) | length == 1
-												update: complete luminous upgrade

Once we complete the upgrade to Luminous, we must issue a specific
command. For more info read:
http://ceph.com/community/new-luminous-upgrade-complete/

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 21:27:27 +08:00
+								        - ceph_versions_osd | string | search("ceph version 12")
-												upgrade: skip luminous tasks for jewel minor update

These tasks are needed only when upgrading to luminous.
They are not needed in Jewel minor upgrade and by the way, they fail because
`ceph versions` command doesn't exist.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2018-01-25 23:57:45 +08:00
+								        - not jewel_minor_update
-												update: complete luminous upgrade

Once we complete the upgrade to Luminous, we must issue a specific
command. For more info read:
http://ceph.com/community/new-luminous-upgrade-complete/

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-09-28 21:27:27 +08:00
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
+								- name: upgrade ceph mdss cluster
-												Control when ceph packages get updated

Currently, all the ceph package installation resources use
"state=latest", which means subsequent runs of the ceph playbooks
could result in ceph being upgraded if there are package updates
available in the selected repo.

This commit adds a new variable to ceph-common called
'upgrade_ceph_packages' which defaults to False.  This variable is used
in the package installation resources for ceph packages to determine if
the resource should use "state=present" or "state=latest".  If the
variable gets set to True, "state=latest" will be used.

Additionally, we update rolling_update.yml to override
upgrade_ceph_packages to true to permit package upgrades in this
context specifically.

Closes issue #506

											
										
										
											2016-01-29 23:54:59 +08:00
+								  vars:
-												rolling_update: add variable to upgrade ceph

My stupid self removed this crucial variable here: 217ce3ca thinking it
was another hard coded variable import where this is actually the
trigger for the upgrade.

Closes: #1071

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-11-05 00:31:02 +08:00
+								    upgrade_ceph_packages: True
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
+								  hosts:
-												rolling-update: do not set group name vars at playbook level

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2017-03-08 03:16:12 +08:00
+								    - "{{ mds_group_name|default('mdss') }}"
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
 								  serial: 1
 								  become: True
-												rolling update: stop MDSs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:42:52 +08:00
+								  pre_tasks:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: stop ceph mds
 								      systemd:
-												rolling update: stop MDSs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:42:52 +08:00
+								        name: ceph-mds@{{ ansible_hostname }}
 								        state: stopped
 								        enabled: yes
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												rolling update: stop MDSs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:42:52 +08:00
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								  roles:
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
+								    - ceph-defaults
-												Move role dependencies in site.yml/site-docker.yml

This will give us more flexibility and avoid a lot of useless when
skipping all tasks from a non-desired role.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:48:13 +08:00
+								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 but keeps its groups_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - ceph-config
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
+								    - ceph-mds
-												Add Ceph Playbook

Initial commit.

Signed-off-by: Sébastien Han <sebastien.han@enovance.com>

											
										
										
											2014-03-04 02:08:51 +08:00
+								  post_tasks:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: start ceph mds
 								      systemd:
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								        name: ceph-mds@{{ ansible_hostname }}
-												rolling update: stop MDSs before upgrading and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:42:52 +08:00
+								        state: started
-												rolling update: add systemd support

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-06-15 23:08:15 +08:00
+								        enabled: yes
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: restart ceph mds
 								      systemd:
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								        name: ceph-mds@{{ ansible_hostname }}
 								        state: restarted
 								        enabled: yes
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurence)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								        daemon_reload: yes
-												Rolling update changes for containerized deployments

Separate out systemd restart tasks for containerized and
non-containerized deployments

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-16 16:35:09 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - containerized_deployment
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
 								- name: upgrade ceph rgws cluster
-												Control when ceph packages get updated

Currently, all the ceph package installation resources use
"state=latest", which means subsequent runs of the ceph playbooks
could result in ceph being upgraded if there are package updates
available in the selected repo.

This commit adds a new variable to ceph-common called
'upgrade_ceph_packages' which defaults to False.  This variable is used
in the package installation resources for ceph packages to determine if
the resource should use "state=present" or "state=latest".  If the
variable gets set to True, "state=latest" will be used.

Additionally, we update rolling_update.yml to override
upgrade_ceph_packages to true to permit package upgrades in this
context specifically.

Closes issue #506

											
										
										
											2016-01-29 23:54:59 +08:00
+								  vars:
-												rolling_update: add variable to upgrade ceph

My stupid self removed this crucial variable here: 217ce3ca thinking it
was another hard coded variable import where this is actually the
trigger for the upgrade.

Closes: #1071

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-11-05 00:31:02 +08:00
+								    upgrade_ceph_packages: True
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
+								  hosts:
-												rolling-update: do not set group name vars at playbook level

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2017-03-08 03:16:12 +08:00
+								    - "{{ rgw_group_name|default('rgws') }}"
-												rolling_update: improve variables import

we now have pointer to default role so we don't miss any of the
variables defined.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2016-10-06 19:56:37 +08:00
 								  serial: 1
 								  become: True
-												rolling update: stop RGWs before upgrade and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:44:55 +08:00
+								  pre_tasks:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: stop ceph rgw
 								      systemd:
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								        name: ceph-radosgw@rgw.{{ ansible_hostname }}
-												rolling update: stop RGWs before upgrade and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:44:55 +08:00
+								        state: stopped
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								        enabled: yes
 								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there is a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												rolling update: stop RGWs before upgrade and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:44:55 +08:00
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
+								  roles:
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
+								    - ceph-defaults
-												Move role dependencies in site.yml/site-docker.yml

This will give us more flexibility and avoid a lot of useless `when`
conditions for skipping all tasks from a non-desired role.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:48:13 +08:00
+								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 while keeping their group_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - ceph-config
-												Modify the repo to host reoles on the galaxy

Signed-off-by: leseb <seb@redhat.com>

											
										
										
											2015-07-25 00:14:59 +08:00
+								    - ceph-rgw
-												Merge branch 'master' of https://github.com/ceph/ceph-ansible into improve-rolling-upgrade

											
										
										
											2015-03-27 01:51:11 +08:00
 								  post_tasks:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: start ceph rgw
 								      systemd:
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								        name: ceph-radosgw@rgw.{{ ansible_hostname }}
-												rolling update: stop RGWs before upgrade and start afterwards

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

Resolves: rhbz#1394929

											
										
										
											2016-11-15 04:44:55 +08:00
+								        state: started
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								        enabled: yes
 								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there are a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

Duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - not containerized_deployment
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: restart containerized ceph rgw
 								      systemd:
-												update: update rgw systemd unit name

The old name is used in `rolling_update.yml` and
`purge-docker-cluster.yml`, it breaks the
`test_rgw_service_is_running()` test.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-09-24 10:52:51 +08:00
+								        name: ceph-radosgw@rgw.{{ ansible_hostname }}
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								        state: restarted
 								        enabled: yes
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								        daemon_reload: yes
-												Support containerized rolling update

- Update rolling update playbook to support containerized deployments
  for mons, osds, mdss, and rgws
- Skip checking if existing cluster is running when performing a rolling
  update
- Fixed bug where we were failing to start the mds container because it
  was missing the admin keyring. The admin keyring was missing because
  it was not being pushed from the mon host to the ansible host due to
  the keyring not being available before running the copy_configs.yml
  task include file. Now we forcefully wait for the admin keyring to be
  generated before continuing with the copy_configs.yml task include file
- Skip pre_requisite.yml when running on atomic host. This technically
  no longer requires specifying to skip tasks containing the with_pkg tag
- Add missing variables to all.docker.sample
- Misc. cleanup

Signed-off-by: Ivan Font <ifont@redhat.com>

											
										
										
											2016-11-06 12:15:26 +08:00
+								      when:
-												Refact code

`ceph-docker-common`:
  At the moment there are a lot of duplicated tasks in each
  `./roles/ceph-<role>/tasks/docker/main.yml` that could be refactored in
  `./roles/ceph-docker-common/tasks/main.yml`.

`*_containerized_deployment` variables:
  All `*_containerized_deployment` have been refactored to a single
  variable `containerized_deployment`

Duplicate `cephx` variables in `group_vars/*` have been removed.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-04-13 01:57:33 +08:00
+								        - containerized_deployment
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								- name: upgrade ceph rbd mirror node
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
 								  vars:
 								    upgrade_ceph_packages: True
 								  hosts:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - "{{ rbd_mirror_group_name|default('rbdmirrors') }}"
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
 								  serial: 1
 								  become: True
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								  pre_tasks:
 								    # NOTE(leseb): these tasks have a 'failed_when: false'
 								    # in case we run before luminous or after
 								    - name: stop ceph rbd mirror before luminous
 								      systemd:
 								        name: "ceph-rbd-mirror@{{ ceph_rbd_mirror_local_user }}"
 								        state: stopped
 								        enabled: no
 								      failed_when: false
 								    - name: stop ceph rbd mirror for and after luminous
 								      systemd:
 								        name: "ceph-rbd-mirror@rbd-mirror.{{ ansible_hostname }}"
 								        state: stopped
 								        enabled: yes
 								      failed_when: false
-												rolling_update: refact code

Refact rolling_update playbook.
Add ceph-client upgrade.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-07-29 04:27:02 +08:00
+								  roles:
 								    - ceph-defaults
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 while keeping their group_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - ceph-config
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - ceph-rbd-mirror
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								  post_tasks:
 								    - name: start ceph rbd mirror
 								      systemd:
 								        name: "ceph-rbd-mirror@rbd-mirror.{{ ansible_hostname }}"
 								        state: started
 								        enabled: yes
 								      when:
 								        - not containerized_deployment
 								    - name: restart containerized ceph rbd mirror
 								      systemd:
 								        name: ceph-rbd-mirror@rbd-mirror.{{ ansible_hostname }}
 								        state: restarted
 								        enabled: yes
 								        daemon_reload: yes
 								      when:
 								        - containerized_deployment
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
 								- name: upgrade ceph nfs node
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
 								  vars:
 								    upgrade_ceph_packages: True
 								  hosts:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - "{{ nfs_group_name|default('nfss') }}"
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
 								  serial: 1
 								  become: True
 								  pre_tasks:
-												rolling_update: do not fail the playbook if nfs-ganesha is not present

The rolling update playbook was attempting to stop the
nfs-ganesha service on nodes where jewel is still installed.
The nfs-ganesha service did not exist in jewel so the task fails.

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2018-01-06 00:06:53 +08:00
+								    # failed_when: false is here so that if we upgrade
 								    # from a version of ceph that does not have nfs-ganesha
 								    # then this task will not fail
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: stop ceph nfs
 								      systemd:
 								        name: nfs-ganesha
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								        state: stopped
 								        enabled: yes
-												rolling_update: do not fail the playbook if nfs-ganesha is not present

The rolling update playbook was attempting to stop the
nfs-ganesha service on nodes where jewel is still installed.
The nfs-ganesha service did not exist in jewel so the task fails.

Signed-off-by: Andrew Schoen <aschoen@redhat.com>

											
										
										
											2018-01-06 00:06:53 +08:00
+								      failed_when: false
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								      when:
 								        - not containerized_deployment
 								  roles:
 								    - ceph-defaults
 								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												upgrade: fix upgrade jewel to luminous for nfs nodes

nfs nodes can't be upgraded from jewel to luminous because ceph-nfs role
is skipped because of the condition `when:
"ceph_release_num[ceph_release] >= ceph_release_num.luminous"`. Indeed,
package is upgraded in `ceph-nfs` role, therefore,
`ceph_release` is still set to the old version. It means the when can't
be satisfied.

Signed-off-by: Guillaume Abrioux <gabrioux@redhat.com>

											
										
										
											2017-10-20 00:30:08 +08:00
+								    - ceph-config
 								    - { role: ceph-nfs,
 								        when: "(ceph_release_num[ceph_release] >= ceph_release_num.luminous) or
 								               (ceph_release_num[ceph_release] < ceph_release_num.luminous and rolling_update)" }
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
 								  post_tasks:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: start nfs gateway
 								      systemd:
 								        name: nfs-ganesha
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								        state: started
 								        enabled: yes
 								      when:
 								        - not containerized_deployment
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								        - ceph_nfs_enable_service
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - name: systemd restart nfs container
 								      systemd:
 								        name: ceph-nfs@{{ ceph_nfs_service_suffix | default(ansible_hostname) }}
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								        state: restarted
 								        enabled: yes
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								        daemon_reload: yes
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								      when:
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								        - ceph_nfs_enable_service
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								        - containerized_deployment
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								- name: upgrade ceph client node
 								  vars:
 								    upgrade_ceph_packages: True
 								  hosts:
 								    - "{{ client_group_name|default('clients') }}"
 								  serial: 1
 								  become: True
 								  roles:
 								    - ceph-defaults
 								    - { role: ceph-common, when: not containerized_deployment }
 								    - { role: ceph-docker-common, when: containerized_deployment }
-												all: backward compatibility between stable-2.2 and 3.0

stable-3.0 brought numerous changes in ceph-ansible variables, this PR
aims to maintain backward compatibility for someone running stable-2.2
upgrading to stable-3.0 while keeping their group_vars untouched.
We will then determine the right options to make sure the upgrade works
but we are expecting that new variables should be used.

We will drop this in a near future, maybe 3.1 or 3.2.

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-19 00:03:30 +08:00
+								    - ceph-config
-												upgrade: support for rbd mirror and nfs

- Add upgrade support for rbd mirror and nfs daemons.
- Only works with systemd (remove sysvinit and upstart occurrences)
- A bit of cleanup

Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-16 20:15:43 +08:00
+								    - ceph-client
-												upgrade: a support for mgrs

Also we now play ceph-config to have everything being generated for new
daemons bootstrap during upgrade.

Closes: https://bugzilla.redhat.com/show_bug.cgi?id=1497959
Signed-off-by: Sébastien Han <seb@redhat.com>

											
										
										
											2017-10-03 18:25:12 +08:00
+								- name: show ceph status
 								  hosts:
 								    - "{{ mon_group_name|default('mons') }}"
 								  become: True
 								  roles:
 								    - ceph-defaults
 								  tasks:
 								    - name: set_fact docker_exec_cmd_status
 								      set_fact:
 								        docker_exec_cmd_status: "docker exec ceph-mon-{{ hostvars[groups[mon_group_name][0]]['ansible_hostname'] }}"
 								      when:
 								        - containerized_deployment
 								    - name: show ceph status
 								      command: "{{ docker_exec_cmd_status|default('') }} ceph --cluster {{ cluster }} -s"
 								      delegate_to: "{{ groups[mon_group_name][0] }}"