Merge "swift-ring-builder can't remove a device with zero weight"

This commit is contained in:
Jenkins 2015-11-02 14:37:33 +00:00 committed by Gerrit Code Review
commit e1910dff17
5 changed files with 50 additions and 15 deletions

View File

@ -306,18 +306,20 @@ def run_scenario(scenario):
command_f(*command) command_f(*command)
rebalance_number = 1 rebalance_number = 1
parts_moved, old_balance = rb.rebalance(seed=seed) parts_moved, old_balance, removed_devs = rb.rebalance(seed=seed)
rb.pretend_min_part_hours_passed() rb.pretend_min_part_hours_passed()
print "\tRebalance 1: moved %d parts, balance is %.6f" % ( print "\tRebalance 1: moved %d parts, balance is %.6f, \
parts_moved, old_balance) %d removed devs" % (
parts_moved, old_balance, removed_devs)
while True: while True:
rebalance_number += 1 rebalance_number += 1
parts_moved, new_balance = rb.rebalance(seed=seed) parts_moved, new_balance, removed_devs = rb.rebalance(seed=seed)
rb.pretend_min_part_hours_passed() rb.pretend_min_part_hours_passed()
print "\tRebalance %d: moved %d parts, balance is %.6f" % ( print "\tRebalance %d: moved %d parts, balance is %.6f, \
rebalance_number, parts_moved, new_balance) %d removed devs" % (
if parts_moved == 0: rebalance_number, parts_moved, new_balance, removed_devs)
if parts_moved == 0 and removed_devs == 0:
break break
if abs(new_balance - old_balance) < 1 and not ( if abs(new_balance - old_balance) < 1 and not (
old_balance == builder.MAX_BALANCE and old_balance == builder.MAX_BALANCE and

View File

@ -797,7 +797,7 @@ swift-ring-builder <builder_file> rebalance [options]
devs_changed = builder.devs_changed devs_changed = builder.devs_changed
try: try:
last_balance = builder.get_balance() last_balance = builder.get_balance()
parts, balance = builder.rebalance(seed=get_seed(3)) parts, balance, removed_devs = builder.rebalance(seed=get_seed(3))
except exceptions.RingBuilderError as e: except exceptions.RingBuilderError as e:
print('-' * 79) print('-' * 79)
print("An error has occurred during ring validation. Common\n" print("An error has occurred during ring validation. Common\n"
@ -807,7 +807,7 @@ swift-ring-builder <builder_file> rebalance [options]
(e,)) (e,))
print('-' * 79) print('-' * 79)
exit(EXIT_ERROR) exit(EXIT_ERROR)
if not (parts or options.force): if not (parts or options.force or removed_devs):
print('No partitions could be reassigned.') print('No partitions could be reassigned.')
print('Either none need to be or none can be due to ' print('Either none need to be or none can be due to '
'min_part_hours [%s].' % builder.min_part_hours) 'min_part_hours [%s].' % builder.min_part_hours)

View File

@ -425,7 +425,7 @@ class RingBuilder(object):
self._initial_balance() self._initial_balance()
self.devs_changed = False self.devs_changed = False
self._build_dispersion_graph() self._build_dispersion_graph()
return self.parts, self.get_balance() return self.parts, self.get_balance(), 0
changed_parts = 0 changed_parts = 0
self._update_last_part_moves() self._update_last_part_moves()
last_balance = 0 last_balance = 0
@ -437,6 +437,7 @@ class RingBuilder(object):
self._set_parts_wanted() self._set_parts_wanted()
self._reassign_parts(new_parts) self._reassign_parts(new_parts)
changed_parts += len(new_parts) changed_parts += len(new_parts)
removed_devs = 0
while True: while True:
reassign_parts = self._gather_reassign_parts() reassign_parts = self._gather_reassign_parts()
changed_parts += len(reassign_parts) changed_parts += len(reassign_parts)
@ -448,6 +449,7 @@ class RingBuilder(object):
remove_dev_id = self._remove_devs.pop()['id'] remove_dev_id = self._remove_devs.pop()['id']
self.logger.debug("Removing dev %d", remove_dev_id) self.logger.debug("Removing dev %d", remove_dev_id)
self.devs[remove_dev_id] = None self.devs[remove_dev_id] = None
removed_devs += 1
balance = self.get_balance() balance = self.get_balance()
if balance < 1 or abs(last_balance - balance) < 1 or \ if balance < 1 or abs(last_balance - balance) < 1 or \
changed_parts == self.parts: changed_parts == self.parts:
@ -457,7 +459,7 @@ class RingBuilder(object):
self.version += 1 self.version += 1
changed_parts = self._build_dispersion_graph(old_replica2part2dev) changed_parts = self._build_dispersion_graph(old_replica2part2dev)
return changed_parts, balance return changed_parts, balance, removed_devs
def _build_dispersion_graph(self, old_replica2part2dev=None): def _build_dispersion_graph(self, old_replica2part2dev=None):
""" """

View File

@ -1696,6 +1696,21 @@ class TestCommands(unittest.TestCase, RunSwiftRingBuilderMixin):
err = e err = e
self.assertEqual(err.code, 2) self.assertEqual(err.code, 2)
def test_rebalance_remove_zero_weighted_device(self):
self.create_sample_ring()
ring = RingBuilder.load(self.tmpfile)
ring.set_dev_weight(3, 0.0)
ring.rebalance()
ring.remove_dev(3)
ring.save(self.tmpfile)
# Test rebalance after remove 0 weighted device
argv = ["", self.tmpfile, "rebalance", "3"]
self.assertRaises(SystemExit, ringbuilder.main, argv)
ring = RingBuilder.load(self.tmpfile)
self.assertTrue(ring.validate())
self.assertEqual(ring.devs[3], None)
def test_write_ring(self): def test_write_ring(self):
self.create_sample_ring() self.create_sample_ring()
argv = ["", self.tmpfile, "rebalance"] argv = ["", self.tmpfile, "rebalance"]

View File

@ -309,6 +309,22 @@ class TestRingBuilder(unittest.TestCase):
rb.rebalance() rb.rebalance()
rb.validate() rb.validate()
def test_remove_zero_weighted(self):
rb = ring.RingBuilder(8, 3, 0)
rb.add_dev({'id': 0, 'device': 'd0', 'ip': '10.0.0.1',
'port': 6002, 'weight': 1000.0, 'region': 0, 'zone': 1})
rb.add_dev({'id': 1, 'device': 'd1', 'ip': '10.0.0.2',
'port': 6002, 'weight': 0.0, 'region': 0, 'zone': 2})
rb.add_dev({'id': 2, 'device': 'd2', 'ip': '10.0.0.3',
'port': 6002, 'weight': 1000.0, 'region': 0, 'zone': 3})
rb.add_dev({'id': 3, 'device': 'd3', 'ip': '10.0.0.1',
'port': 6002, 'weight': 1000.0, 'region': 0, 'zone': 1})
rb.rebalance()
rb.remove_dev(1)
parts, balance, removed = rb.rebalance()
self.assertEqual(removed, 1)
def test_shuffled_gather(self): def test_shuffled_gather(self):
if self._shuffled_gather_helper() and \ if self._shuffled_gather_helper() and \
self._shuffled_gather_helper(): self._shuffled_gather_helper():
@ -366,7 +382,7 @@ class TestRingBuilder(unittest.TestCase):
rb.add_dev({'region': 1, 'zone': 2, 'weight': 4000.0, rb.add_dev({'region': 1, 'zone': 2, 'weight': 4000.0,
'ip': '10.1.1.3', 'port': 10000, 'device': 'sdb'}) 'ip': '10.1.1.3', 'port': 10000, 'device': 'sdb'})
_, balance = rb.rebalance(seed=2) _, balance, _ = rb.rebalance(seed=2)
# maybe not *perfect*, but should be close # maybe not *perfect*, but should be close
self.assertTrue(balance <= 1) self.assertTrue(balance <= 1)
@ -795,7 +811,7 @@ class TestRingBuilder(unittest.TestCase):
# it's as balanced as it gets, so nothing moves anymore # it's as balanced as it gets, so nothing moves anymore
rb.pretend_min_part_hours_passed() rb.pretend_min_part_hours_passed()
parts_moved, _balance = rb.rebalance(seed=1) parts_moved, _balance, _removed = rb.rebalance(seed=1)
self.assertEqual(parts_moved, 0) self.assertEqual(parts_moved, 0)
def test_region_fullness_with_balanceable_ring(self): def test_region_fullness_with_balanceable_ring(self):
@ -867,7 +883,7 @@ class TestRingBuilder(unittest.TestCase):
rb.add_dev({'id': 3, 'region': 1, 'zone': 1, 'weight': 0.25, rb.add_dev({'id': 3, 'region': 1, 'zone': 1, 'weight': 0.25,
'ip': '127.0.0.1', 'port': 10004, 'device': 'sda1'}) 'ip': '127.0.0.1', 'port': 10004, 'device': 'sda1'})
rb.pretend_min_part_hours_passed() rb.pretend_min_part_hours_passed()
changed_parts, _balance = rb.rebalance(seed=2) changed_parts, _balance, _removed = rb.rebalance(seed=2)
# there's not enough room in r1 for every partition to have a replica # there's not enough room in r1 for every partition to have a replica
# in it, so only 86 assignments occur in r1 (that's ~1/5 of the total, # in it, so only 86 assignments occur in r1 (that's ~1/5 of the total,
@ -920,7 +936,7 @@ class TestRingBuilder(unittest.TestCase):
for weight in range(0, 101, 10): for weight in range(0, 101, 10):
rb.set_dev_weight(5, weight) rb.set_dev_weight(5, weight)
rb.pretend_min_part_hours_passed() rb.pretend_min_part_hours_passed()
changed_parts, _balance = rb.rebalance(seed=2) changed_parts, _balance, _removed = rb.rebalance(seed=2)
rb.validate() rb.validate()
moved_partitions.append(changed_parts) moved_partitions.append(changed_parts)
# Ensure that the second region has enough partitions # Ensure that the second region has enough partitions