reconstructor: silence traceback when purging

Catch DiskFileNotExist exceptions when attempting to purge files. The file may have passed its reclaim age since being reverted and will be cleaned up when the reconstructor opens it for purging, raising a DiskFileNotExist. The exception is OK - the diskfile was about to be purged. Change-Id: I5dfdf5950c6bd7fb130ab557347fbe959270c6e9
2021-11-19 12:55:59 +00:00 · 2021-11-19 12:55:59 +00:00 · 092d409c4b
parent 4c84f615a1
commit 092d409c4b
2 changed files with 61 additions and 1 deletions
--- a/swift/obj/reconstructor.py
+++ b/swift/obj/reconstructor.py
@ -47,7 +47,7 @@ from swift.obj.diskfile import DiskFileRouter, get_data_dir, \
    get_tmp_dir, DEFAULT_RECLAIM_AGE
 from swift.common.storage_policy import POLICIES, EC_POLICY
 from swift.common.exceptions import ConnectionTimeout, DiskFileError, \
-    SuffixSyncError, PartitionLockTimeout
+    SuffixSyncError, PartitionLockTimeout, DiskFileNotExist

 SYNC, REVERT = ('sync_only', 'sync_revert')
 UNKNOWN_RESPONSE_STATUS = 0  # used as response status for timeouts, exceptions
@ -988,6 +988,10 @@ class ObjectReconstructor(Daemon):
                                          else df_mgr.commit_window)
                df.purge(timestamps['ts_data'], frag_index,
                         nondurable_purge_delay)
+            except DiskFileNotExist:
+                # may have passed reclaim age since being reverted, or may have
+                # raced with another reconstructor process trying the same
+                pass
            except DiskFileError:
                self.logger.exception(
                    'Unable to purge DiskFile (%r %r %r)',
--- a/test/unit/obj/test_reconstructor.py
+++ b/test/unit/obj/test_reconstructor.py
@ -4666,6 +4666,62 @@ class TestObjectReconstructor(BaseTestObjectReconstructor):

        self.assertEqual(self.reconstructor.handoffs_remaining, 0)

+    def test_process_job_revert_cleanup_but_already_reclaimed(self):
+        frag_index = random.randint(
+            0, self.policy.ec_n_unique_fragments - 1)
+        sync_to = [random.choice([n for n in self.policy.object_ring.devs
+                                  if n != self.local_dev])]
+        sync_to[0]['index'] = frag_index
+        partition = 0
+
+        part_path = os.path.join(self.devices, self.local_dev['device'],
+                                 diskfile.get_data_dir(self.policy),
+                                 str(partition))
+        os.makedirs(part_path)
+        df_mgr = self.reconstructor._df_router[self.policy]
+        df = df_mgr.get_diskfile(self.local_dev['device'], partition, 'a',
+                                 'c', 'data-obj', policy=self.policy)
+        ts_delete = self.ts()
+        df.delete(ts_delete)
+        ohash = os.path.basename(df._datadir)
+        suffix = os.path.basename(os.path.dirname(df._datadir))
+
+        job = {
+            'job_type': object_reconstructor.REVERT,
+            'frag_index': frag_index,
+            'suffixes': [suffix],
+            'sync_to': sync_to,
+            'partition': partition,
+            'path': part_path,
+            'hashes': {},
+            'policy': self.policy,
+            'local_dev': self.local_dev,
+            'device': self.local_dev['device'],
+        }
+
+        fake_time = [float(ts_delete) + df_mgr.reclaim_age - 100]
+
+        def mock_time():
+            return fake_time[0]
+
+        def ssync_response_callback(*args):
+            # pretend ssync completed and time has moved just beyonf the
+            # reclaim age for the tombstone
+            fake_time[0] = float(ts_delete) + df_mgr.reclaim_age + 1
+            return True, {ohash: {'ts_data': ts_delete}}
+
+        ssync_calls = []
+        with mock.patch('swift.obj.diskfile.time.time', mock_time):
+            with mock_ssync_sender(ssync_calls,
+                                   response_callback=ssync_response_callback):
+                self.reconstructor.process_job(job)
+
+        self.assertFalse(os.path.exists(df._datadir))
+        self.assertEqual(self.reconstructor.handoffs_remaining, 0)
+        # check there's no tracebacks for opening the reclaimed tombstone
+        self.assertEqual(
+            [], self.reconstructor.logger.logger.get_lines_for_level('error'))
+
    def test_process_job_revert_cleanup_tombstone(self):
        partition = 0
        sync_to = [random.choice([