Conditional creation of RAIDed ESP for UEFI Software RAID

Rebuilding an instance on a RAIDed ESPs will fail due to sgdisk
running against an non-clean disk and bailing out. Check if there
is a RAIDed ESP already and skip creation if it exists.

Change-Id: I13617ae77515a9d34bc4bb3caf9fae73d5e4e578
(cherry picked from commit 286d66709a1b2f2068360db641079c67197b21b6)
This commit is contained in:
Arne Wiebalck 2023-08-16 15:51:59 +02:00
parent 0b31c4cb75
commit 031b54b10a
4 changed files with 120 additions and 41 deletions

View File

@ -12,6 +12,7 @@
import copy import copy
import re import re
import shlex
from ironic_lib import disk_utils from ironic_lib import disk_utils
from ironic_lib import utils as il_utils from ironic_lib import utils as il_utils
@ -342,50 +343,58 @@ def prepare_boot_partitions_for_softraid(device, holders, efi_part,
if efi_part: if efi_part:
efi_part = '{}p{}'.format(device, efi_part['number']) efi_part = '{}p{}'.format(device, efi_part['number'])
LOG.info("Creating EFI partitions on software RAID holder disks") # check if we have a RAIDed ESP already
# We know that we kept this space when configuring raid,see md_device = find_esp_raid()
# hardware.GenericHardwareManager.create_configuration. if md_device:
# We could also directly get the EFI partition size. LOG.info("Found RAIDed ESP %s, skip creation", md_device)
partsize_mib = ESP_SIZE_MIB else:
partlabel_prefix = 'uefi-holder-' LOG.info("Creating EFI partitions on software RAID holder disks")
efi_partitions = [] # We know that we kept this space when configuring raid,see
for number, holder in enumerate(holders): # hardware.GenericHardwareManager.create_configuration.
# NOTE: see utils.get_partition_table_type_from_specs # We could also directly get the EFI partition size.
# for uefi we know that we have setup a gpt partition table, partsize_mib = ESP_SIZE_MIB
# sgdisk can be used to edit table, more user friendly partlabel_prefix = 'uefi-holder-'
# for alignment and relative offsets efi_partitions = []
partlabel = '{}{}'.format(partlabel_prefix, number) for number, holder in enumerate(holders):
out, _u = utils.execute('sgdisk', '-F', holder) # NOTE: see utils.get_partition_table_type_from_specs
start_sector = '{}s'.format(out.splitlines()[-1].strip()) # for uefi we know that we have setup a gpt partition table,
out, _u = utils.execute( # sgdisk can be used to edit table, more user friendly
'sgdisk', '-n', '0:{}:+{}MiB'.format(start_sector, # for alignment and relative offsets
partsize_mib), partlabel = '{}{}'.format(partlabel_prefix, number)
'-t', '0:ef00', '-c', '0:{}'.format(partlabel), holder) out, _u = utils.execute('sgdisk', '-F', holder)
start_sector = '{}s'.format(out.splitlines()[-1].strip())
out, _u = utils.execute(
'sgdisk', '-n', '0:{}:+{}MiB'.format(start_sector,
partsize_mib),
'-t', '0:ef00', '-c', '0:{}'.format(partlabel), holder)
# Refresh part table # Refresh part table
utils.execute("partprobe") utils.execute("partprobe")
utils.execute("blkid") utils.execute("blkid")
target_part, _u = utils.execute( target_part, _u = utils.execute(
"blkid", "-l", "-t", "PARTLABEL={}".format(partlabel), holder) "blkid", "-l", "-t", "PARTLABEL={}".format(partlabel),
holder)
target_part = target_part.splitlines()[-1].split(':', 1)[0] target_part = target_part.splitlines()[-1].split(':', 1)[0]
efi_partitions.append(target_part) efi_partitions.append(target_part)
LOG.debug("EFI partition %s created on holder disk %s", LOG.debug("EFI partition %s created on holder disk %s",
target_part, holder) target_part, holder)
# RAID the ESPs, metadata=1.0 is mandatory to be able to boot # RAID the ESPs, metadata=1.0 is mandatory to be able to boot
md_device = get_next_free_raid_device() md_device = get_next_free_raid_device()
LOG.debug("Creating md device %(md_device)s for the ESPs " LOG.debug("Creating md device %(md_device)s for the ESPs "
"on %(efi_partitions)s", "on %(efi_partitions)s",
{'md_device': md_device, 'efi_partitions': efi_partitions}) {'md_device': md_device,
utils.execute('mdadm', '--create', md_device, '--force', 'efi_partitions': efi_partitions})
'--run', '--metadata=1.0', '--level', '1', utils.execute('mdadm', '--create', md_device, '--force',
'--name', 'esp', '--raid-devices', len(efi_partitions), '--run', '--metadata=1.0', '--level', '1',
*efi_partitions) '--name', 'esp', '--raid-devices',
len(efi_partitions),
*efi_partitions)
disk_utils.trigger_device_rescan(md_device) disk_utils.trigger_device_rescan(md_device)
if efi_part: if efi_part:
# Blockdev copy the source ESP and erase it # Blockdev copy the source ESP and erase it
@ -420,3 +429,18 @@ def prepare_boot_partitions_for_softraid(device, holders, efi_part,
# disk, as in virtual disk, where to load the data from. # disk, as in virtual disk, where to load the data from.
# Since there is a structural difference, this means it will # Since there is a structural difference, this means it will
# fail. # fail.
def find_esp_raid():
"""Find the ESP md device in case of a rebuild."""
# find devices of type 'RAID1' and fstype 'VFAT'
lsblk = utils.execute('lsblk', '-PbioNAME,TYPE,FSTYPE')
report = lsblk[0]
for line in report.split('\n'):
dev = {}
vals = shlex.split(line)
for key, val in (v.split('=', 1) for v in vals):
dev[key] = val.strip()
if dev.get('TYPE') == 'raid1' and dev.get('FSTYPE') == 'vfat':
return '/dev/' + dev.get('NAME')

View File

@ -1769,3 +1769,33 @@ MULTIPATH_LINKS_DM = (
' `-+- policy=\'service-time 0\' prio=1 status=active\n' ' `-+- policy=\'service-time 0\' prio=1 status=active\n'
' `- 0:0:0:0 device s 8:0 active ready running\n' ' `- 0:0:0:0 device s 8:0 active ready running\n'
) )
LSBLK_OUPUT = ("""
NAME="sda" TYPE="disk" FSTYPE=""
NAME="sdb" TYPE="disk" FSTYPE=""
""")
LSBLK_OUPUT_ESP_RAID = ("""
NAME="sda" TYPE="disk" FSTYPE=""
NAME="sda1" TYPE="part" FSTYPE="linux_raid_member"
NAME="md127" TYPE="raid1" FSTYPE=""
NAME="md127p1" TYPE="md" FSTYPE="xfs"
NAME="md127p2" TYPE="md" FSTYPE="iso9660"
NAME="md127p14" TYPE="md" FSTYPE=""
NAME="md127p15" TYPE="md" FSTYPE=""
NAME="sda2" TYPE="part" FSTYPE="linux_raid_member"
NAME="md126" TYPE="raid0" FSTYPE=""
NAME="sda3" TYPE="part" FSTYPE="linux_raid_member"
NAME="md125" TYPE="raid1" FSTYPE="vfat"
NAME="sdb" TYPE="disk" FSTYPE=""
NAME="sdb1" TYPE="part" FSTYPE="linux_raid_member"
NAME="md127" TYPE="raid1" FSTYPE=""
NAME="md127p1" TYPE="md" FSTYPE="xfs"
NAME="md127p2" TYPE="md" FSTYPE="iso9660"
NAME="md127p14" TYPE="md" FSTYPE=""
NAME="md127p15" TYPE="md" FSTYPE=""
NAME="sdb2" TYPE="part" FSTYPE="linux_raid_member"
NAME="md126" TYPE="raid0" FSTYPE=""
NAME="sdb3" TYPE="part" FSTYPE="linux_raid_member"
NAME="md125" TYPE="raid1" FSTYPE="vfat"
""")

View File

@ -153,6 +153,7 @@ class TestRaidUtils(base.IronicAgentTest):
volume_name = raid_utils.get_volume_name_of_raid_device('/dev/md0') volume_name = raid_utils.get_volume_name_of_raid_device('/dev/md0')
self.assertIsNone(volume_name) self.assertIsNone(volume_name)
@mock.patch.object(raid_utils, 'find_esp_raid', autospec=True)
@mock.patch.object(disk_utils, 'trigger_device_rescan', autospec=True) @mock.patch.object(disk_utils, 'trigger_device_rescan', autospec=True)
@mock.patch.object(raid_utils, 'get_next_free_raid_device', autospec=True, @mock.patch.object(raid_utils, 'get_next_free_raid_device', autospec=True,
return_value='/dev/md42') return_value='/dev/md42')
@ -161,7 +162,7 @@ class TestRaidUtils(base.IronicAgentTest):
@mock.patch.object(disk_utils, 'find_efi_partition', autospec=True) @mock.patch.object(disk_utils, 'find_efi_partition', autospec=True)
def test_prepare_boot_partitions_for_softraid_uefi_gpt( def test_prepare_boot_partitions_for_softraid_uefi_gpt(
self, mock_efi_part, mock_execute, mock_dispatch, self, mock_efi_part, mock_execute, mock_dispatch,
mock_free_raid_device, mock_rescan): mock_free_raid_device, mock_rescan, mock_find_esp):
mock_efi_part.return_value = {'number': '12'} mock_efi_part.return_value = {'number': '12'}
mock_execute.side_effect = [ mock_execute.side_effect = [
('451', None), # sgdisk -F ('451', None), # sgdisk -F
@ -178,6 +179,7 @@ class TestRaidUtils(base.IronicAgentTest):
(None, None), # cp (None, None), # cp
(None, None), # wipefs (None, None), # wipefs
] ]
mock_find_esp.return_value = None
efi_part = raid_utils.prepare_boot_partitions_for_softraid( efi_part = raid_utils.prepare_boot_partitions_for_softraid(
'/dev/md0', ['/dev/sda', '/dev/sdb'], None, '/dev/md0', ['/dev/sda', '/dev/sdb'], None,
@ -209,6 +211,7 @@ class TestRaidUtils(base.IronicAgentTest):
self.assertEqual(efi_part, '/dev/md42') self.assertEqual(efi_part, '/dev/md42')
mock_rescan.assert_called_once_with('/dev/md42') mock_rescan.assert_called_once_with('/dev/md42')
@mock.patch.object(raid_utils, 'find_esp_raid', autospec=True)
@mock.patch.object(disk_utils, 'trigger_device_rescan', autospec=True) @mock.patch.object(disk_utils, 'trigger_device_rescan', autospec=True)
@mock.patch.object(raid_utils, 'get_next_free_raid_device', autospec=True, @mock.patch.object(raid_utils, 'get_next_free_raid_device', autospec=True,
return_value='/dev/md42') return_value='/dev/md42')
@ -218,7 +221,7 @@ class TestRaidUtils(base.IronicAgentTest):
@mock.patch.object(ilib_utils, 'mkfs', autospec=True) @mock.patch.object(ilib_utils, 'mkfs', autospec=True)
def test_prepare_boot_partitions_for_softraid_uefi_gpt_esp_not_found( def test_prepare_boot_partitions_for_softraid_uefi_gpt_esp_not_found(
self, mock_mkfs, mock_efi_part, mock_execute, mock_dispatch, self, mock_mkfs, mock_efi_part, mock_execute, mock_dispatch,
mock_free_raid_device, mock_rescan): mock_free_raid_device, mock_rescan, mock_find_esp):
mock_efi_part.return_value = None mock_efi_part.return_value = None
mock_execute.side_effect = [ mock_execute.side_effect = [
('451', None), # sgdisk -F ('451', None), # sgdisk -F
@ -233,6 +236,7 @@ class TestRaidUtils(base.IronicAgentTest):
('/dev/sdb14: whatever', None), # blkid ('/dev/sdb14: whatever', None), # blkid
(None, None), # mdadm (None, None), # mdadm
] ]
mock_find_esp.return_value = None
efi_part = raid_utils.prepare_boot_partitions_for_softraid( efi_part = raid_utils.prepare_boot_partitions_for_softraid(
'/dev/md0', ['/dev/sda', '/dev/sdb'], None, '/dev/md0', ['/dev/sda', '/dev/sdb'], None,
@ -262,6 +266,7 @@ class TestRaidUtils(base.IronicAgentTest):
self.assertEqual(efi_part, '/dev/md42') self.assertEqual(efi_part, '/dev/md42')
mock_rescan.assert_called_once_with('/dev/md42') mock_rescan.assert_called_once_with('/dev/md42')
@mock.patch.object(raid_utils, 'find_esp_raid', autospec=True)
@mock.patch.object(disk_utils, 'trigger_device_rescan', autospec=True) @mock.patch.object(disk_utils, 'trigger_device_rescan', autospec=True)
@mock.patch.object(raid_utils, 'get_next_free_raid_device', autospec=True, @mock.patch.object(raid_utils, 'get_next_free_raid_device', autospec=True,
return_value='/dev/md42') return_value='/dev/md42')
@ -269,7 +274,7 @@ class TestRaidUtils(base.IronicAgentTest):
@mock.patch.object(ilib_utils, 'execute', autospec=True) @mock.patch.object(ilib_utils, 'execute', autospec=True)
def test_prepare_boot_partitions_for_softraid_uefi_gpt_efi_provided( def test_prepare_boot_partitions_for_softraid_uefi_gpt_efi_provided(
self, mock_execute, mock_dispatch, mock_free_raid_device, self, mock_execute, mock_dispatch, mock_free_raid_device,
mock_rescan): mock_rescan, mock_find_esp):
mock_execute.side_effect = [ mock_execute.side_effect = [
('451', None), # sgdisk -F ('451', None), # sgdisk -F
(None, None), # sgdisk create part (None, None), # sgdisk create part
@ -285,6 +290,7 @@ class TestRaidUtils(base.IronicAgentTest):
(None, None), # cp (None, None), # cp
(None, None), # wipefs (None, None), # wipefs
] ]
mock_find_esp.return_value = None
efi_part = raid_utils.prepare_boot_partitions_for_softraid( efi_part = raid_utils.prepare_boot_partitions_for_softraid(
'/dev/md0', ['/dev/sda', '/dev/sdb'], '/dev/md0p15', '/dev/md0', ['/dev/sda', '/dev/sdb'], '/dev/md0p15',
@ -389,3 +395,17 @@ class TestGetNextFreeRaidDevice(base.IronicAgentTest):
] ]
self.assertRaises(errors.SoftwareRAIDError, self.assertRaises(errors.SoftwareRAIDError,
raid_utils.get_next_free_raid_device) raid_utils.get_next_free_raid_device)
@mock.patch.object(utils, 'execute', autospec=True)
class TestFindESPRAID(base.IronicAgentTest):
def test_no_esp_raid(self, mock_execute):
mock_execute.side_effect = [(hws.LSBLK_OUPUT, '')]
result = raid_utils.find_esp_raid()
self.assertIsNone(result)
def test_esp_raid(self, mock_execute):
mock_execute.side_effect = [(hws.LSBLK_OUPUT_ESP_RAID, '')]
result = raid_utils.find_esp_raid()
self.assertEqual('/dev/md125', result)

View File

@ -0,0 +1,5 @@
---
fixes:
- |
Fixes an issue with rebuilding instances on Software RAID with
RAIDed ESP partitions.