[ceph-osd] Remove wait for misplaced objects during OSD restarts
The wait for misplaced objects during the ceph-osd post-apply job was added to prevent I/O disruption in the case where misplaced objects cause multiple replicas in common failure domains. This concern is only valid before OSD restarts begin because OSD failures during the restart process won't cause replicas that violate replication rules to appear elsewhere. This change keeps the wait for misplaced objects prior to beginning OSD restarts and removes it during those restarts. The wait during OSD restarts now only waits for degraded objects to be recovered before proceeding to the next failure domain. Change-Id: Ic82c67b43089c7a2b45995d1fd9c285d5c0e7cbc
This commit is contained in:
parent
4665ebd35f
commit
cb73c61b4e
@ -15,6 +15,6 @@ apiVersion: v1
|
|||||||
appVersion: v1.0.0
|
appVersion: v1.0.0
|
||||||
description: OpenStack-Helm Ceph OSD
|
description: OpenStack-Helm Ceph OSD
|
||||||
name: ceph-osd
|
name: ceph-osd
|
||||||
version: 0.1.33
|
version: 0.1.34
|
||||||
home: https://github.com/ceph/ceph
|
home: https://github.com/ceph/ceph
|
||||||
...
|
...
|
||||||
|
@ -115,10 +115,21 @@ function wait_for_pgs () {
|
|||||||
done
|
done
|
||||||
}
|
}
|
||||||
|
|
||||||
|
function wait_for_degraded_objects () {
|
||||||
|
echo "#### Start: Checking for degraded objects ####"
|
||||||
|
|
||||||
|
# Loop until no degraded objects
|
||||||
|
while [[ ! -z "`ceph --cluster ${CLUSTER} -s | grep 'degraded'`" ]]
|
||||||
|
do
|
||||||
|
sleep 3
|
||||||
|
ceph -s
|
||||||
|
done
|
||||||
|
}
|
||||||
|
|
||||||
function wait_for_degraded_and_misplaced_objects () {
|
function wait_for_degraded_and_misplaced_objects () {
|
||||||
echo "#### Start: Checking for degraded and misplaced objects ####"
|
echo "#### Start: Checking for degraded and misplaced objects ####"
|
||||||
|
|
||||||
# Loop until no degraded objects
|
# Loop until no degraded or misplaced objects
|
||||||
while [[ ! -z "`ceph --cluster ${CLUSTER} -s | grep 'degraded\|misplaced'`" ]]
|
while [[ ! -z "`ceph --cluster ${CLUSTER} -s | grep 'degraded\|misplaced'`" ]]
|
||||||
do
|
do
|
||||||
sleep 3
|
sleep 3
|
||||||
@ -150,7 +161,7 @@ function restart_by_rack() {
|
|||||||
sleep 60
|
sleep 60
|
||||||
# Degraded objects won't recover with noout set unless pods come back and
|
# Degraded objects won't recover with noout set unless pods come back and
|
||||||
# PGs become healthy, so simply wait for 0 degraded objects
|
# PGs become healthy, so simply wait for 0 degraded objects
|
||||||
wait_for_degraded_and_misplaced_objects
|
wait_for_degraded_objects
|
||||||
ceph -s
|
ceph -s
|
||||||
done
|
done
|
||||||
}
|
}
|
||||||
@ -177,7 +188,7 @@ echo "Latest revision of the helm chart(s) is : $max_release"
|
|||||||
|
|
||||||
if [[ $max_release -gt 1 ]]; then
|
if [[ $max_release -gt 1 ]]; then
|
||||||
if [[ $require_upgrade -gt 0 ]]; then
|
if [[ $require_upgrade -gt 0 ]]; then
|
||||||
echo "waiting for inactive pgs and degraded obejcts before upgrade"
|
echo "waiting for inactive pgs and degraded objects before upgrade"
|
||||||
wait_for_pgs
|
wait_for_pgs
|
||||||
wait_for_degraded_and_misplaced_objects
|
wait_for_degraded_and_misplaced_objects
|
||||||
ceph -s
|
ceph -s
|
||||||
|
@ -34,4 +34,5 @@ ceph-osd:
|
|||||||
- 0.1.31 Helm 3 - Fix Job labels
|
- 0.1.31 Helm 3 - Fix Job labels
|
||||||
- 0.1.32 Update htk requirements
|
- 0.1.32 Update htk requirements
|
||||||
- 0.1.33 Update log-runner container for MAC
|
- 0.1.33 Update log-runner container for MAC
|
||||||
|
- 0.1.34 Remove wait for misplaced objects during OSD restarts
|
||||||
...
|
...
|
||||||
|
Loading…
x
Reference in New Issue
Block a user