openstack
diff --git a/‎doc/manpages/object-server.conf.5
Lines changed: 3 additions & 6 deletions b/‎doc/manpages/object-server.conf.5
Lines changed: 3 additions & 6 deletions
diff --git a/‎doc/source/deployment_guide.rst
Lines changed: 16 additions & 8 deletions b/‎doc/source/deployment_guide.rst
Lines changed: 16 additions & 8 deletions
diff --git a/‎etc/object-server.conf-sample
Lines changed: 6 additions & 4 deletions b/‎etc/object-server.conf-sample
Lines changed: 6 additions & 4 deletions
diff --git a/‎swift/container/reconciler.py
Lines changed: 3 additions & 0 deletions b/‎swift/container/reconciler.py
Lines changed: 3 additions & 0 deletions
diff --git a/‎swift/obj/diskfile.py
Lines changed: 18 additions & 27 deletions b/‎swift/obj/diskfile.py
Lines changed: 18 additions & 27 deletions
diff --git a/‎swift/obj/expirer.py
Lines changed: 4 additions & 1 deletion b/‎swift/obj/expirer.py
Lines changed: 4 additions & 1 deletion
diff --git a/‎swift/obj/reconstructor.py
Lines changed: 2 additions & 3 deletions b/‎swift/obj/reconstructor.py
Lines changed: 2 additions & 3 deletions
@@ -142,6 +142,9 @@ backend node. The default is 60.
 The default is 65536.
 .IP \fBdisk_chunk_size\fR
 The default is 65536.
+.IP \fBreclaim_age\fR
+Time elapsed in seconds before an object can be reclaimed. The default is
+604800 seconds.
 .IP \fBnice_priority\fR
 Modify scheduling priority of server processes. Niceness values range from -20
 (most favorable to the process) to 19 (least favorable to the process).
@@ -394,9 +397,6 @@ default is 1800 seconds.
 The default is 15.
 .IP \fBrsync_error_log_line_length\fR
 Limits how long rsync error log lines are. 0 (default) means to log the entire line.
-.IP \fBreclaim_age\fR
-Time elapsed in seconds before an object can be reclaimed. The default is
-604800 seconds.
 .IP "\fBrecon_cache_path\fR"
 The recon_cache_path simply sets the directory where stats for a few items will be stored.
 Depending on the method of deployment you may need to create this directory manually
@@ -468,9 +468,6 @@ Attempts to kill all workers if nothing replicates for lockup_timeout seconds. T
 default is 1800 seconds.
 .IP \fBring_check_interval\fR
 The default is 15.
-.IP \fBreclaim_age\fR
-Time elapsed in seconds before an object can be reclaimed. The default is
-604800 seconds.
 .IP "\fBrecon_cache_path\fR"
 The recon_cache_path simply sets the directory where stats for a few items will be stored.
 Depending on the method of deployment you may need to create this directory manually
 
@@ -228,10 +228,11 @@ service trying to start is missing there will be an error.  The sections not
 used by the service are ignored.
 
 Consider the example of an object storage node.  By convention, configuration
-for the object-server, object-updater, object-replicator, and object-auditor
-exist in a single file ``/etc/swift/object-server.conf``::
+for the object-server, object-updater, object-replicator, object-auditor, and
+object-reconstructor exist in a single file ``/etc/swift/object-server.conf``::
 
     [DEFAULT]
+    reclaim_age = 604800
 
     [pipeline:main]
     pipeline = object-server
@@ -240,7 +241,6 @@ exist in a single file ``/etc/swift/object-server.conf``::
     use = egg:swift#object
 
     [object-replicator]
-    reclaim_age = 259200
 
     [object-updater]
 
@@ -417,9 +417,9 @@ The following configuration options are available:
 
 [DEFAULT]
 
-================================ ==========  ==========================================
+================================ ==========  ============================================
 Option                           Default     Description
--------------------------------- ----------  ------------------------------------------
+-------------------------------- ----------  --------------------------------------------
 swift_dir                        /etc/swift  Swift configuration directory
 devices                          /srv/node   Parent directory of where devices are
                                              mounted
@@ -515,6 +515,16 @@ network_chunk_size               65536       Size of chunks to read/write over t
 disk_chunk_size                  65536       Size of chunks to read/write to disk
 container_update_timeout         1           Time to wait while sending a container
                                              update on object update.
+reclaim_age                      604800      Time elapsed in seconds before the tombstone
+                                             file representing a deleted object can be
+                                             reclaimed.  This is the maximum window for
+                                             your consistency engine.  If a node that was
+                                             disconnected from the cluster because of a
+                                             fault is reintroduced into the cluster after
+                                             this window without having its data purged,
+                                             it will result in dark data.  This setting
+                                             should be consistent across all object
+                                             services.
 nice_priority                    None        Scheduling priority of server processes.
                                              Niceness values range from -20 (most
                                              favorable to the process) to 19 (least
@@ -536,7 +546,7 @@ ionice_priority                  None        I/O scheduling priority of server
                                              priority of the process. Work only with
                                              ionice_class.
                                              Ignored if IOPRIO_CLASS_IDLE is set.
-================================ ==========  ==========================================
+================================ ==========  ============================================
 
 .. _object-server-options:
 
@@ -685,8 +695,6 @@ rsync_compress               no                        Allow rsync to compress d
                                                        process.
 stats_interval               300                       Interval in seconds between
                                                        logging replication statistics
-reclaim_age                  604800                    Time elapsed in seconds before an
-                                                       object can be reclaimed
 handoffs_first               false                     If set to True, partitions that
                                                        are not supposed to be on the
                                                        node will be replicated first.
 
@@ -69,6 +69,12 @@ bind_port = 6200
 # network_chunk_size = 65536
 # disk_chunk_size = 65536
 #
+# Reclamation of tombstone files is performed primarily by the replicator and
+# the reconstructor, but the object-server and object-auditor also reference
+# this value - it should be the same for all object services in the cluster,
+# and not greater than the container services' reclaim_age.
+# reclaim_age = 604800
+#
 # You can set scheduling priority of processes. Niceness values range from -20
 # (most favorable to the process) to 19 (least favorable to the process).
 # nice_priority =
@@ -229,9 +235,6 @@ use = egg:swift#recon
 # attempts to kill all workers if nothing replicates for lockup_timeout seconds
 # lockup_timeout = 1800
 #
-# The replicator also performs reclamation
-# reclaim_age = 604800
-#
 # ring_check_interval = 15
 # recon_cache_path = /var/cache/swift
 #
@@ -293,7 +296,6 @@ use = egg:swift#recon
 # node_timeout = 10
 # http_timeout = 60
 # lockup_timeout = 1800
-# reclaim_age = 604800
 # ring_check_interval = 15
 # recon_cache_path = /var/cache/swift
 # handoffs_first = False
 
@@ -337,6 +337,9 @@ class ContainerReconciler(Daemon):
 
     def __init__(self, conf):
         self.conf = conf
+        # This option defines how long an un-processable misplaced object
+        # marker will be retried before it is abandoned.  It is not coupled
+        # with the tombstone reclaim age in the consistency engine.
         self.reclaim_age = int(conf.get('reclaim_age', 86400 * 7))
         self.interval = int(conf.get('interval', 30))
         conf_path = conf.get('__file__') or \
 
@@ -47,6 +47,7 @@
 from tempfile import mkstemp
 from contextlib import contextmanager
 from collections import defaultdict
+from datetime import timedelta
 
 from eventlet import Timeout
 from eventlet.hubs import trampoline
@@ -77,7 +78,7 @@
 
 
 PICKLE_PROTOCOL = 2
-ONE_WEEK = 604800
+DEFAULT_RECLAIM_AGE = timedelta(weeks=1).total_seconds()
 HASH_FILE = 'hashes.pkl'
 HASH_INVALIDATIONS_FILE = 'hashes.invalid'
 METADATA_KEY = 'user.swift.metadata'
@@ -557,7 +558,7 @@ def __init__(self, conf, logger):
         self.keep_cache_size = int(conf.get('keep_cache_size', 5242880))
         self.bytes_per_sync = int(conf.get('mb_per_sync', 512)) * 1024 * 1024
         self.mount_check = config_true_value(conf.get('mount_check', 'true'))
-        self.reclaim_age = int(conf.get('reclaim_age', ONE_WEEK))
+        self.reclaim_age = int(conf.get('reclaim_age', DEFAULT_RECLAIM_AGE))
         self.replication_one_per_device = config_true_value(
             conf.get('replication_one_per_device', 'true'))
         self.replication_lock_timeout = int(conf.get(
@@ -886,13 +887,12 @@ def get_ondisk_files(self, files, datadir, verify=True, **kwargs):
 
         return results
 
-    def cleanup_ondisk_files(self, hsh_path, reclaim_age=ONE_WEEK, **kwargs):
+    def cleanup_ondisk_files(self, hsh_path, **kwargs):
         """
         Clean up on-disk files that are obsolete and gather the set of valid
         on-disk files for an object.
 
         :param hsh_path: object hash path
-        :param reclaim_age: age in seconds at which to remove tombstones
         :param frag_index: if set, search for a specific fragment index .data
                            file, otherwise accept the first valid .data file
         :returns: a dict that may contain: valid on disk files keyed by their
@@ -901,7 +901,7 @@ def cleanup_ondisk_files(self, hsh_path, reclaim_age=ONE_WEEK, **kwargs):
                   reverse sorted, stored under the key 'files'.
         """
         def is_reclaimable(timestamp):
-            return (time.time() - float(timestamp)) > reclaim_age
+            return (time.time() - float(timestamp)) > self.reclaim_age
 
         files = listdir(hsh_path)
         files.sort(reverse=True)
@@ -932,11 +932,10 @@ def _update_suffix_hashes(self, hashes, ondisk_info):
         """
         raise NotImplementedError
 
-    def _hash_suffix_dir(self, path, reclaim_age):
+    def _hash_suffix_dir(self, path):
         """
 
         :param path: full path to directory
-        :param reclaim_age: age in seconds at which to remove tombstones
         """
         hashes = defaultdict(hashlib.md5)
         try:
@@ -948,7 +947,7 @@ def _hash_suffix_dir(self, path, reclaim_age):
         for hsh in path_contents:
             hsh_path = join(path, hsh)
             try:
-                ondisk_info = self.cleanup_ondisk_files(hsh_path, reclaim_age)
+                ondisk_info = self.cleanup_ondisk_files(hsh_path)
             except OSError as err:
                 if err.errno == errno.ENOTDIR:
                     partition_path = dirname(path)
@@ -1006,34 +1005,30 @@ def _hash_suffix_dir(self, path, reclaim_age):
             raise PathNotDir()
         return hashes
 
-    def _hash_suffix(self, path, reclaim_age):
+    def _hash_suffix(self, path):
         """
         Performs reclamation and returns an md5 of all (remaining) files.
 
         :param path: full path to directory
-        :param reclaim_age: age in seconds at which to remove tombstones
         :raises PathNotDir: if given path is not a valid directory
         :raises OSError: for non-ENOTDIR errors
         """
         raise NotImplementedError
 
-    def _get_hashes(self, partition_path, recalculate=None, do_listdir=False,
-                    reclaim_age=None):
+    def _get_hashes(self, partition_path, recalculate=None, do_listdir=False):
         """
         Get hashes for each suffix dir in a partition.  do_listdir causes it to
         mistrust the hash cache for suffix existence at the (unexpectedly high)
-        cost of a listdir.  reclaim_age is just passed on to hash_suffix.
+        cost of a listdir.
 
         :param partition_path: absolute path of partition to get hashes for
         :param recalculate: list of suffixes which should be recalculated when
                             got
         :param do_listdir: force existence check for all hashes in the
                            partition
-        :param reclaim_age: age at which to remove tombstones
 
         :returns: tuple of (number of suffix dirs hashed, dictionary of hashes)
         """
-        reclaim_age = reclaim_age or self.reclaim_age
         hashed = 0
         hashes_file = join(partition_path, HASH_FILE)
         modified = False
@@ -1072,7 +1067,7 @@ def _get_hashes(self, partition_path, recalculate=None, do_listdir=False,
             if not hash_:
                 suffix_dir = join(partition_path, suffix)
                 try:
-                    hashes[suffix] = self._hash_suffix(suffix_dir, reclaim_age)
+                    hashes[suffix] = self._hash_suffix(suffix_dir)
                     hashed += 1
                 except PathNotDir:
                     del hashes[suffix]
@@ -1086,8 +1081,7 @@ def _get_hashes(self, partition_path, recalculate=None, do_listdir=False,
                     write_pickle(
                         hashes, hashes_file, partition_path, PICKLE_PROTOCOL)
                     return hashed, hashes
-            return self._get_hashes(partition_path, recalculate, do_listdir,
-                                    reclaim_age)
+            return self._get_hashes(partition_path, recalculate, do_listdir)
         else:
             return hashed, hashes
 
@@ -1237,8 +1231,7 @@ def get_diskfile_from_hash(self, device, partition, object_hash,
             dev_path, get_data_dir(policy), str(partition), object_hash[-3:],
             object_hash)
         try:
-            filenames = self.cleanup_ondisk_files(object_path,
-                                                  self.reclaim_age)['files']
+            filenames = self.cleanup_ondisk_files(object_path)['files']
         except OSError as err:
             if err.errno == errno.ENOTDIR:
                 quar_path = self.quarantine_renamer(dev_path, object_path)
@@ -1369,7 +1362,7 @@ def yield_hashes(self, device, partition, policy,
                 object_path = os.path.join(suffix_path, object_hash)
                 try:
                     results = self.cleanup_ondisk_files(
-                        object_path, self.reclaim_age, **kwargs)
+                        object_path, **kwargs)
                     timestamps = {}
                     for ts_key, info_key, info_ts_key in key_preference:
                         if info_key not in results:
@@ -2581,17 +2574,16 @@ def _update_suffix_hashes(self, hashes, ondisk_info):
             hashes[None].update(
                 file_info['timestamp'].internal + file_info['ext'])
 
-    def _hash_suffix(self, path, reclaim_age):
+    def _hash_suffix(self, path):
         """
         Performs reclamation and returns an md5 of all (remaining) files.
 
         :param path: full path to directory
-        :param reclaim_age: age in seconds at which to remove tombstones
         :raises PathNotDir: if given path is not a valid directory
         :raises OSError: for non-ENOTDIR errors
         :returns: md5 of files in suffix
         """
-        hashes = self._hash_suffix_dir(path, reclaim_age)
+        hashes = self._hash_suffix_dir(path)
         return hashes[None].hexdigest()
 
 
@@ -3197,12 +3189,11 @@ def _update_suffix_hashes(self, hashes, ondisk_info):
             file_info = ondisk_info['durable_frag_set'][0]
             hashes[None].update(file_info['timestamp'].internal + '.durable')
 
-    def _hash_suffix(self, path, reclaim_age):
+    def _hash_suffix(self, path):
         """
         Performs reclamation and returns an md5 of all (remaining) files.
 
         :param path: full path to directory
-        :param reclaim_age: age in seconds at which to remove tombstones
         :raises PathNotDir: if given path is not a valid directory
         :raises OSError: for non-ENOTDIR errors
         :returns: dict of md5 hex digests
@@ -3211,5 +3202,5 @@ def _hash_suffix(self, path, reclaim_age):
         # here we flatten out the hashers hexdigest into a dictionary instead
         # of just returning the one hexdigest for the whole suffix
 
-        hash_per_fi = self._hash_suffix_dir(path, reclaim_age)
+        hash_per_fi = self._hash_suffix_dir(path)
         return dict((fi, md5.hexdigest()) for fi, md5 in hash_per_fi.items())
@@ -65,7 +65,10 @@ def __init__(self, conf, logger=None, swift=None):
             raise ValueError("concurrency must be set to at least 1")
         self.processes = int(self.conf.get('processes', 0))
         self.process = int(self.conf.get('process', 0))
-        self.reclaim_age = int(conf.get('reclaim_age', 86400 * 7))
+        # This option defines how long an un-processable expired object
+        # marker will be retried before it is abandoned.  It is not coupled
+        # with the tombstone reclaim age in the consistency engine.
+        self.reclaim_age = int(conf.get('reclaim_age', 604800))
 
     def report(self, final=False):
         """
 
@@ -132,7 +132,6 @@ def __init__(self, conf, logger=None):
         self.stats_interval = int(conf.get('stats_interval', '300'))
         self.ring_check_interval = int(conf.get('ring_check_interval', 15))
         self.next_check = time.time() + self.ring_check_interval
-        self.reclaim_age = int(conf.get('reclaim_age', 86400 * 7))
         self.partition_times = []
         self.interval = int(conf.get('interval') or
                             conf.get('run_pause') or 30)
@@ -431,7 +430,7 @@ def _get_hashes(self, policy, path, recalculate=None, do_listdir=False):
         df_mgr = self._df_router[policy]
         hashed, suffix_hashes = tpool_reraise(
             df_mgr._get_hashes, path, recalculate=recalculate,
-            do_listdir=do_listdir, reclaim_age=self.reclaim_age)
+            do_listdir=do_listdir)
         self.logger.update_stats('suffix.hashes', hashed)
         return suffix_hashes
 
@@ -834,7 +833,7 @@ def collect_parts(self, override_devices=None,
                 obj_path = join(dev_path, data_dir)
                 tmp_path = join(dev_path, get_tmp_dir(int(policy)))
                 unlink_older_than(tmp_path, time.time() -
-                                  self.reclaim_age)
+                                  df_mgr.reclaim_age)
                 if not os.path.exists(obj_path):
                     try:
                         mkdirs(obj_path)