Blame SOURCES/sos-bz1789049-since-option-improved.patch

30a705
From 71cdbde72f81d586da37a9e108868d6aa1b4ef69 Mon Sep 17 00:00:00 2001
30a705
From: Pavel Moravec <pmoravec@redhat.com>
30a705
Date: Thu, 5 Dec 2019 14:26:03 +0100
30a705
Subject: [PATCH] [plugins] improve heuristic for applying --since to
30a705
 logarchives
30a705
30a705
logarchive_pattern treats some configs (e.g. /etc/dbus-1) as log
30a705
archives, causing the --since option to skip collecting them.
30a705
30a705
This patch just improves the heuristic by claiming nothing under /etc
30a705
is a logarchive, and adds a warning to sosreport help.
30a705
30a705
Improves: #1847
30a705
30a705
Signed-off-by: Pavel Moravec <pmoravec@redhat.com>
30a705
---
30a705
 man/en/sosreport.1      | 5 ++++-
30a705
 sos/plugins/__init__.py | 5 ++++-
30a705
 2 files changed, 8 insertions(+), 2 deletions(-)
30a705
30a705
diff --git a/man/en/sosreport.1 b/man/en/sosreport.1
30a705
index a885d5630..f63b8deab 100644
30a705
--- a/man/en/sosreport.1
30a705
+++ b/man/en/sosreport.1
30a705
@@ -158,8 +158,11 @@ and including logs in non-default locations. This option may significantly
30a705
 increase the size of reports.
30a705
 .TP
30a705
 .B \--since YYYYMMDD[HHMMSS]
30a705
-Limits the collection to logs newer than this date.
30a705
+Limits the collection of log archives(*) to those newer than this date.
30a705
 This also affects \--all-logs. Will pad with 0s if HHMMSS isn't specified.
30a705
+(*) Sos interprets as a log archive any file not found in /etc, that has
30a705
+either a numeric or compression-type extension (for example '.zip', '.1', '.gz',
30a705
+etc.).
30a705
 .TP
30a705
 .B \--allow-system-changes
30a705
 Run commands even if they can change the system (e.g. load kernel modules).
30a705
diff --git a/sos/plugins/__init__.py b/sos/plugins/__init__.py
30a705
index b7a47b6a4..44ae413d0 100644
30a705
--- a/sos/plugins/__init__.py
30a705
+++ b/sos/plugins/__init__.py
30a705
@@ -917,6 +917,7 @@ def add_copy_spec(self, copyspecs, sizelimit=None, maxage=None,
30a705
             since = self.get_option('since')
30a705
 
30a705
         logarchive_pattern = re.compile(r'.*((\.(zip|gz|bz2|xz))|[-.][\d]+)$')
30a705
+        configfile_pattern = re.compile(r"^%s/*" % self.join_sysroot("etc"))
30a705
 
30a705
         if not self.test_predicate(pred=pred):
30a705
             self._log_info("skipped copy spec '%s' due to predicate (%s)" %
30a705
@@ -962,7 +963,9 @@ def time_filter(path):
30a705
                 """ When --since is passed, or maxage is coming from the
30a705
                 plugin, we need to filter out older files """
30a705
 
30a705
-                if logarchive_pattern.search(path) is None:
30a705
+                # skip config files or not-logarchive files from the filter
30a705
+                if ((logarchive_pattern.search(path) is None) or
30a705
+                   (configfile_pattern.search(path) is not None)):
30a705
                     return True
30a705
                 filetime = datetime.fromtimestamp(getmtime(path))
30a705
                 if ((since and filetime < since) or