Merge "Report tool support for subcloud collect bundles"

Zuul 2023-06-14 18:18:58 +00:00 committed by Gerrit Code Review
commit d56d82ce4c
5 changed files with 723 additions and 283 deletions

View File

@@ -3188,7 +3188,7 @@ if [ "${SUBCLOUD_COLLECT}" = false ] ; then
    echo ""
    echo "------------- Collect Report ------------------"
    # run the report tool
    ${COLLECT_DIR}/report/report.py -b ${COLLECT_DIR}
    echo "-----------------------------------------------"
    echo ""

View File

@@ -1,95 +1,212 @@
The Report tool is used to gather relevant logs, events
and information about the system from a collect bundle
and present that data for quick / easy issue analysis.
Report can be run directly from a cloned StarlingX utilities git
${MY_REPO}/stx/utilities/tools/collector/debian-scripts/report/report.py {options}
Report is installed and can be run on any 22.12 POSTGA system node.
/usr/local/bin/report/report.py --directory /scratch
Report can also be commanded to automatically run during a collect operation
collect all --report
See Report's --help option for additional command line arguments.
report.py --help
Selecting the right command option for your collect bundle:

Report is designed to analyze a host or subcloud 'collect bundle'.
Report needs to be told where to find the collect bundle to analyze
using one of three options:
Analyze Host Bundle: --bundle or -b option
-------------------
    Use this option to point to a 'directory' that 'contains'
host tarball files.
report.py --bundle /scratch/ALL_NODES_YYYYMMDD_hhmmss
Point to a directory containing host tarballs.
Such a directory contains each hostname's tarball, ending in .tgz

/scratch/ALL_NODES_YYYYMMDD_hhmmss
├── controller-0_YYYYMMDD_hhmmss.tgz
└── controller-1_YYYYMMDD_hhmmss.tgz
    This is the option collect uses to auto analyze a freshly
collected bundle when the collect --report option is specified.
Analyze Directory: --directory or -d option
-----------------
    Use this option when a collect bundle 'tar file' is in a
specific 'directory'. If there are multiple collect
bundles in that directory then the tool will prompt the
user to select one from a list.
report.py --directory /scratch
0 - exit
1 - ALL_NODES_20230608.235225
2 - ALL_NODES_20230609.004604
Please select bundle to analyze:
    Analysis proceeds automatically if there is only a
single collect bundle found.
Analyze Specific Collect Bundle tar file: --file or -f option
----------------------------------------
Use this option to point to a specific collect bundle
tar file to analyze.
report.py --file /scratch/ALL_NODES_YYYYMMDD_hhmmss.tar
Host vs Subcloud Collect Bundles:

Expected Host Bundle Format:

├── SELECT_NODES_YYYYMMDD.hhmmss.tar
└── SELECT_NODES_YYYYMMDD.hhmmss
    ├── controller-0_YYYYMMDD.hhmmss
    ├── controller-0_YYYYMMDD.hhmmss.tgz
    ├── controller-1_YYYYMMDD.hhmmss
    ├── controller-1_YYYYMMDD.hhmmss.tgz
    ├── worker-0_YYYYMMDD.hhmmss
    └── worker-1_YYYYMMDD.hhmmss.tgz

Expected Subcloud Bundle Format:

├── SELECT_SUBCLOUDS_YYYYMMDD.hhmmss.tar
└── SELECT_SUBCLOUDS_YYYYMMDD.hhmmss
    ├── subcloudX_YYYYMMDD.hhmmss.tar
    ├── subcloudX_YYYYMMDD.hhmmss
    │   ├── controller-0_YYYYMMDD.hhmmss
    │   ├── controller-0_YYYYMMDD.hhmmss.tgz
    │   ├── report_analysis
    │   └── report_tool.tgz
    ├── subcloudY_YYYYMMDD.hhmmss.tar
    ├── subcloudY_YYYYMMDD.hhmmss
    │   ├── controller-0_YYYYMMDD.hhmmss
    │   ├── controller-0_YYYYMMDD.hhmmss.tgz
    │   ├── report_analysis
    │   └── report_tool.tgz
    ├── subcloudZ_YYYYMMDD.hhmmss.tar
    └── subcloudZ_YYYYMMDD.hhmmss
        ├── controller-0_YYYYMMDD.hhmmss
        └── controller-0_YYYYMMDD.hhmmss.tgz
If there are multiple bundles found at the specified --directory
then the list is displayed and the user is prompted to select a
bundle from the list.
This would be typical when analyzing a selected subcloud collect
bundle, as in the example below.
$ report -d /localdisk/issues/SELECT_SUBCLOUDS_YYYYMMDD.hhmmss.tar
Report will extract the subcloud tar file and, if it contains
more than one subcloud tar file, prompt the user to select
which one to analyze:
0 - exit
1 - subcloudX_YYYYMMDD.hhmmss
2 - subcloudY_YYYYMMDD.hhmmss
3 - subcloudZ_YYYYMMDD.hhmmss
Please select the bundle to analyze:
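The selection prompt above can be sketched as a small function. `select_bundle` and its parameters are hypothetical names chosen for illustration, not the tool's actual internals; the real tool reads the choice from stdin and re-prompts on invalid input.

```python
def select_bundle(bundle_names, choice):
    """Return the chosen bundle name, or None when the user selects 0 (exit).

    bundle_names: list of bundle names presented in the menu
    choice: the user's selection as an integer (1-based; 0 means exit)
    """
    if choice == 0:
        return None                      # 0 - exit
    if 1 <= choice <= len(bundle_names):
        return bundle_names[choice - 1]  # valid 1-based selection
    raise ValueError("invalid selection")


names = ["subcloudX_YYYYMMDD.hhmmss", "subcloudY_YYYYMMDD.hhmmss"]
selected = select_bundle(names, 1)
```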
Refer to report.py file header for a description of the tool

Report places the report analysis in the bundle itself.
Consider the following collect bundle structure and notice
the 'report_analysis' folder which contains the Report analysis.

SELECT_NODES_20220527.193605
├── controller-0_20220527.193605
│  ├── etc
│  ├── root
│  └── var
├── controller-1_20220527.193605
│  ├── etc
│  ├── root
│  └── var
└── report_analysis (where the output files will be placed)

Pass a collect bundle to Report's CLI for two phases of processing ...

Phase 1: Process algorithm specific plugins to collect plugin
         specific 'report logs'. Basically fault, event,
         alarm and state change logs.

Phase 2: Run the correlator against the plugin found 'report logs'
         to produce descriptive strings that represent failures
         that were found in the collect bundle and to summarize
         the events, alarms and state change data.

Report then produces a report analysis that gets stored with
the original bundle.

Example Analysis:

$ report -d /localdisk/CGTS-44887

extracting /localdisk/CGTS-44887/ALL_NODES_20230307.183540.tar

Report: /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis

extracting : /localdisk/CGTS-44887/ALL_NODES_20230307.183540/controller-1_20230307.183540.tgz
extracting : /localdisk/CGTS-44887/ALL_NODES_20230307.183540/compute-0_20230307.183540.tgz
extracting : /localdisk/CGTS-44887/ALL_NODES_20230307.183540/controller-0_20230307.183540.tgz
extracting : /localdisk/CGTS-44887/ALL_NODES_20230307.183540/compute-1_20230307.183540.tgz

Active Ctrl: controller-1
System Type: All-in-one
S/W Version: 22.12
System Mode: duplex
DC Role    : systemcontroller
Node Type  : controller
subfunction: controller,worker
Mgmt Iface : vlan809
Clstr Iface: vlan909
OAM Iface  : eno8403
OS Release : Debian GNU/Linux 11 (bullseye)
Build Type : Formal
Build Date : 2023-03-01 23:00:06 +0000
controllers: controller-1,controller-0
workers    : compute-1,compute-0

Plugin Results:

  621 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/log
  221 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/swact_activity
  132 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/alarm
   85 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/substring_controller-0
   60 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/system_info
   54 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/maintenance_errors
   36 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/heartbeat_loss
   26 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/process_failures
   16 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/state_changes
   13 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/substring_controller-1
    2 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/plugins/puppet_errors

... nothing found by plugins: daemon_failures

Correlated Results:

Events       :  8 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/events
Alarms       : 26 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/alarms
State Changes: 16 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/state_changes
Failures     :  4 /localdisk/CGTS-44887/ALL_NODES_20230307.183540/report_analysis/failures

2023-03-07T05:00:11 controller-0 uncontrolled swact
2023-03-07T05:01:52 controller-0 heartbeat loss failure
2023-03-07T17:42:35 controller-0 configuration failure
2023-03-07T17:58:06 controller-0 goenabled failure

Inspect the Correlated and Plugin results files for failures,
alarms, events and state changes.

View File

@@ -52,6 +52,7 @@ logger = logging.getLogger(__name__)

# regex expression used to get the hostname from the host dir name
# eg: chops '_20221201.213332' off of controller-0_20221201.213332
regex_chop_bundle_date = r"_\d{8}\.\d{6}"
regex_get_bundle_date = r".*_\d{8}\.\d{6}$"


class ExecutionEngine:

@@ -82,14 +83,18 @@ class ExecutionEngine:

        # Uncompresses host tar files if not already done
        with open(os.path.join(output_dir, "untar.log"), "a") as logfile:

            # Now extract the tarballs
            for obj in (os.scandir(self.input_dir)):

                # files to ignore
                if obj.name == "report_tool.tgz":
                    continue

                info = os.path.splitext(obj.name)
                if (obj.is_file() and tarfile.is_tarfile(obj.path) and not
                        os.path.isdir(os.path.join(self.input_dir, info[0]))):
                    try:
                        logger.info("extracting : %s", obj.path)
                        subprocess.run(["tar", "xzfC", obj.path,
                                        self.input_dir],
                                       stderr=logfile, check=True)
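The two regexes introduced in this hunk can be exercised on their own; the sample directory names below are hypothetical:

```python
import re

# Regexes from the change above
regex_chop_bundle_date = r"_\d{8}\.\d{6}"
regex_get_bundle_date = r".*_\d{8}\.\d{6}$"

# Chop the date suffix off a host dir name to recover the hostname
hostname = re.sub(regex_chop_bundle_date, "", "controller-0_20221201.213332")

# Only properly dated names qualify as collect dirs
is_bundle = bool(re.match(regex_get_bundle_date, "controller-0_20221201.213332"))
is_other = bool(re.match(regex_get_bundle_date, "report_analysis"))
```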
@@ -97,44 +102,30 @@ class ExecutionEngine:
                        logger.error(e)

        # Determine the active controller and load system info from it.
        for folder in (f.path for f in os.scandir(self.input_dir)):
            basename = os.path.basename(folder)

            # Ignore all directories that are not a properly dated
            # collect file
            if not re.match(regex_get_bundle_date, basename):
                continue

            # skip over files (the tarballs)
            if not os.path.isdir(folder):
                continue

            logger.debug("base folder: %s", os.path.basename(folder))

            # Get the hostname from the host folder
            hostname = re.sub(regex_chop_bundle_date, "", basename)
            self.hostnames.append(hostname)

            host_dir = folder
            self.host_dirs.append(host_dir)
            logger.debug("Host Dirs: %s", self.host_dirs)

            # build up a list of hosts. save host folder path based on nodetype
            hostinfo_path = os.path.join(host_dir, "var/extra/host.info")
            if os.path.exists(hostinfo_path):
                hostname, subfunction = self._extract_subfunction(
                    hostinfo_path)
@@ -145,8 +136,39 @@ class ExecutionEngine:
                elif "storage" in subfunction:
                    self.hosts["storages"][hostname] = folder

            # skip non controller hosts since that could not be active
            if hostname[0:10] != "controller":
                continue

            logger.debug("searching for active controller: %s" % hostname)

            if os.path.isdir(host_dir):
                logger.debug("... checking %s" % hostname)
                extra_path = os.path.join(host_dir, "var/extra")
                # don't analyse a directory that doesn't contain
                # a 'var/extra' dir.
                if not os.path.exists(extra_path):
                    logger.warning("%s is missing var/extra" % hostname)
                    continue

                database_path = os.path.join(host_dir, "var/extra/database")
                if os.path.exists(database_path):
                    if os.listdir(database_path):
                        logger.info("Active Ctrl: %s" % hostname)
                        self.active_controller_directory = folder
                        self.active_controller_hostname = hostname

        if not len(self.host_dirs):
            logger.error("Error: No host bundles found in %s" % input_dir)
            files = []
            for folder in (f.path for f in os.scandir(input_dir)):
                files.append(os.path.basename(folder))
            if files:
                logger.error("... content: %s" % files)
            sys.exit("")

        if not self.active_controller_directory:
            logger.warning("Active Ctrl: NOT FOUND")

    def execute(self, plugins, output_dir):
        """Run a list of plugins
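The active-controller heuristic above (a controller host dir whose var/extra/database directory exists and is non-empty) can be sketched standalone. `find_active_controller` is a hypothetical helper, and the temp directories stand in for extracted host dirs:

```python
import os
import tempfile


def find_active_controller(host_dirs):
    """Return the first controller dir whose var/extra/database is non-empty."""
    for host_dir in host_dirs:
        hostname = os.path.basename(host_dir)
        if not hostname.startswith("controller"):
            continue  # non-controller hosts cannot be active
        database_path = os.path.join(host_dir, "var/extra/database")
        if os.path.isdir(database_path) and os.listdir(database_path):
            return host_dir
    return None


root = tempfile.mkdtemp()
standby = os.path.join(root, "controller-0")
active = os.path.join(root, "controller-1")
os.makedirs(os.path.join(standby, "var", "extra", "database"))  # empty database
os.makedirs(os.path.join(active, "var", "extra", "database"))
open(os.path.join(active, "var", "extra", "database", "db.dump"), "w").close()

result = find_active_controller([standby, active])
```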
@@ -373,7 +395,10 @@ class ExecutionEngine:

            # Print a summary of the logs/data gathered by the plugins
            empty_files = ""

            logger.info("")
            logger.info("Plugin Results:")
            logger.info("")
            lines = []
            for fn in os.listdir(plugin_output_dir):
                filename = os.path.join(plugin_output_dir, fn)
                with open(filename, "r+") as f:

@@ -384,17 +409,23 @@ class ExecutionEngine:
                        readline = buf.readline
                        while readline():
                            entries += 1
                        lines.append("%5d %s" % (entries, filename))
                    else:
                        empty_files += fn + " "

            # Sort the lines based on the numeric value
            sorted_lines = sorted(lines, key=lambda x: int(x.split()[0]),
                                  reverse=True)
            for line in sorted_lines:
                logger.info(line)

            if empty_files:
                logger.info("")
                logger.info("... nothing found by plugins: %s" % empty_files)
        else:
            logger.error("Error: Plugin output dir missing: %s" %
                         plugin_output_dir)
            sys.exit("... exiting")

        # Running the correlator and printing the output from it

@@ -426,8 +457,9 @@ class ExecutionEngine:
        alarms.append("\nTotal alarms found: " + str(alarms_len) + "\n")
        state_changes.append("\nTotal state changes found: " +
                             str(state_changes_len) + "\n")

        logger.info("")
        logger.info("Correlated Results:")
        logger.info("")

        self._create_output_file("failures", output_dir,
                                 failures, "")
        self._create_output_file("events", output_dir,
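The numeric sort of the "&lt;count&gt; &lt;file&gt;" summary lines above works as in this minimal sketch (sample lines are hypothetical):

```python
# Each summary line starts with an entry count; sort largest-first on it.
lines = [
    "   13 plugins/substring_controller-1",
    "  621 plugins/log",
    "  132 plugins/alarm",
]
sorted_lines = sorted(lines, key=lambda x: int(x.split()[0]), reverse=True)
```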

View File

@@ -120,9 +120,4 @@ def system_info(hostname, host_dir, output_dir, hosts, loud=False):
            file.write(f"{k}: {','.join(v.keys())}\n")
            if loud is True:
                print(f"{k}: {','.join(v.keys())}")
    return

View File

@@ -90,7 +90,9 @@
# command line functionality
# ------------------------------- ----------------------------------
# > report.py --help                  - help message
# > report.py -b /path/to/bundle      - path to dir containing host tarballs
# > report.py -d /path/to/bundle      - path to dir containing tar bundle(s)
# > report.py -f /path/to/bundle.tar  - specify path to a bundle tar file
# > report.py -d <dir> [plugin ...]   - Run only specified plugins
# > report.py -d <dir> <algs> [labels]- Run algorithm with labels
# > report.py <algorithm> --help      - algorithm specific help

@@ -98,7 +100,6 @@
# See --help output for a complete list of full and abbreviated
# command line options and examples of plugins.
#
# Refer to README file for more usage and output examples
#######################################################################
@@ -108,30 +109,32 @@ from datetime import timedelta
from datetime import timezone
import logging
import os
import re
import shutil
import subprocess
import sys
import tarfile
import tempfile
import time

from execution_engine import ExecutionEngine
from plugin import Plugin

# Globals
now = datetime.now(timezone.utc)
report_dir = os.path.dirname(os.path.realpath(__file__))
analysis_folder_name = "report_analysis"
bundle_name = None
plugins = []
output_dir = None
tmp_report_log = tempfile.mkstemp()
clean = True

# TODO: rework this description
parser = argparse.ArgumentParser(
    description="Report Tool:",
    epilog="Analyzes data collected by the plugins and produces a "
           "report_analysis stored with the collect bundle. The report tool "
           "can be run either on or off system by specifying the bundle to "
           "analyze using the --directory, --bundle or --file command options.",
)
parser.add_argument( parser.add_argument(
@@ -141,17 +144,20 @@ parser.add_argument(
)

parser.add_argument(
    "--bundle", "-b",
    default="",
    required=False,
    help="Specify the full path to a directory containing a collect "
         "bundle to analyze. Use this option when pointing to a directory "
         "with host .tgz files that are already extracted from a tar file.",
)

parser.add_argument(
    "--directory", "-d",
    default="",
    required=False,
    help="Specify the full path to a directory containing collect "
         "bundles to analyze.",
)
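A condensed sketch of the three bundle-source options this change introduces; only the flags shown in the diff are reproduced, and the exact definition of --file elsewhere in report.py is assumed:

```python
import argparse

parser = argparse.ArgumentParser(description="Report Tool:")
parser.add_argument("--bundle", "-b", default="", required=False,
                    help="dir containing already-extracted host .tgz files")
parser.add_argument("--directory", "-d", default="", required=False,
                    help="dir containing one or more collect bundles")
parser.add_argument("--file", "-f", default="", required=False,
                    help="path to a specific collect bundle .tar file")

# Only one source option is given per run; the others keep their defaults.
args = parser.parse_args(["--bundle", "/scratch/ALL_NODES_20230607.120000"])
```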
parser.add_argument( parser.add_argument(
@@ -190,6 +196,12 @@ parser.add_argument(
    "(default:20000101)",
)

parser.add_argument(
    "--state",
    action="store_true",
    help="Debug option to dump object state during execution",
)

parser.add_argument(
    "--verbose", "-v",
    action="store_true",
@@ -352,12 +364,14 @@ parser_audit.add_argument(
    "(not required, default: today)"
)

args = parser.parse_args()

args.start = datetime.strptime(args.start, "%Y%m%d").strftime(
    "%Y-%m-%dT%H:%M:%S")
args.end = datetime.strptime(args.end, "%Y%m%d").strftime("%Y-%m-%dT%H:%M:%S")

###########################################################
# Args error checking
###########################################################
if args.file:
    if not os.path.exists(args.file):
        exit_msg = "Error: Specified file (" + args.file + ") does not exist."
@@ -374,61 +388,70 @@ if args.file:
        sys.exit(exit_msg)
    else:
        try:
            input_dir = os.path.dirname(args.file)
            output_dir = os.path.join(input_dir, analysis_folder_name)
            subprocess.run(["tar", "xfC", args.file, input_dir], check=True)
        except subprocess.CalledProcessError as e:
            print(e)
        except PermissionError as e:
            print(e)
            sys.exit("Permission Error: Unable to extract bundle")

elif args.directory:
    # Get the bundle input and report output dirs
    output_dir = os.path.join(args.directory, analysis_folder_name)
    input_dir = os.path.join(args.directory)
    if not os.path.isdir(input_dir):
        sys.exit("Error: Specified input directory is not a directory")

elif args.bundle:
    output_dir = os.path.join(args.bundle, analysis_folder_name)
    input_dir = os.path.join(args.bundle)

else:
    exit_msg = "Error: Please use either the --file or --directory option to "
    exit_msg += "specify a\ncollect bundle file or directory containing a "
    exit_msg += "collect bundle file to analyze."
    sys.exit(exit_msg)

# TODO: date current analysis if there rather than remove
if args.clean and not clean:
    clean = True
if clean is True and os.path.exists(output_dir):
    shutil.rmtree(output_dir)

os.makedirs(output_dir, exist_ok=True)

###########################################################
# Setup logging
###########################################################

logger = logging.getLogger()


def remove_logging():
    """Move logging to a different location ; from /tmp to the bundle"""
    logger = logging.getLogger()
    for handler in logger.handlers[:]:
        logger.removeHandler(handler)


def setup_logging(logfile):
    """Setup logging"""
    # setting up logger
    formatter = logging.Formatter("%(message)s")
    logging.basicConfig(
        filename=logfile,
        level=logging.DEBUG if args.debug else logging.INFO,
        format="%(asctime)s %(levelname)s: %(message)s",
        datefmt="%Y-%m-%dT%H:%M:%S",
    )
    logging.Formatter.converter = time.gmtime

    console_handler = logging.StreamHandler()
    if args.debug:
        console_handler.setLevel(logging.DEBUG)
    else:
        console_handler.setLevel(logging.INFO)
    console_handler.setFormatter(formatter)
    logger.addHandler(console_handler)


setup_logging(tmp_report_log[1])

if args.debug:
    logger.debug("Arguments : %s", args)
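The log-to-tmp-then-relocate flow above (log to a temp file until the bundle location is known, then tear down the handlers and re-point at the bundle's report.log) can be sketched as below. `setup_logging`/`remove_logging` here are simplified stand-ins, not the tool's exact functions; `force=True` (Python 3.8+) replaces the handler bookkeeping:

```python
import logging
import os
import tempfile


def setup_logging(logfile):
    # force=True drops any existing root handlers before reconfiguring
    logging.basicConfig(filename=logfile, level=logging.INFO,
                        format="%(message)s", force=True)


def remove_logging():
    # detach and close all root handlers so the log file can be switched
    root = logging.getLogger()
    for handler in root.handlers[:]:
        handler.close()
        root.removeHandler(handler)


tmp_log = tempfile.mkstemp()[1]
setup_logging(tmp_log)
logging.info("started before the bundle dir is known")

remove_logging()
final_log = os.path.join(tempfile.mkdtemp(), "report.log")
setup_logging(final_log)
logging.info("continued in the bundle")
logging.shutdown()
```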
@ -436,140 +459,413 @@ if args.debug:
logger.debug("Input Dir: %s", input_dir) logger.debug("Input Dir: %s", input_dir)
logger.debug("Output Dir: %s", output_dir) logger.debug("Output Dir: %s", output_dir)
if not os.path.isdir(input_dir): ###########################################################
sys.exit("Error: Specified input directory is not a directory") # Find and extract the bundle to analyze
###########################################################
# Search 'input_dir' for bundles.
bundle_tar_file_found = False # List of directories to ignore
bundle_name = None
bundle_names = []
bundles = []
ignore_list = [analysis_folder_name] ignore_list = [analysis_folder_name]
ignore_list += ["apps", "horizon", "lighttpd", "lost+found", "sysinv-tmpdir"] ignore_list += ["apps", "horizon", "lighttpd", "lost+found", "sysinv-tmpdir"]
ignore_list += ["patch-api-proxy-tmpdir", "platform-api-proxy-tmpdir"] ignore_list += ["patch-api-proxy-tmpdir", "platform-api-proxy-tmpdir"]
regex_get_bundle_date = r".*_\d{8}\.\d{6}$"
with open(os.path.join(output_dir, "untar.log"), "a") as logfile:
for obj in (os.scandir(input_dir)):
# Don't display dirs from the ignore list.
# This makes the bundle selection list cleaner when
# report is run against /scratch
ignored = False
for ignore in ignore_list:
if obj.name == ignore:
ignored = True
if ignored is True:
continue
if obj.is_dir(follow_symlinks=False): class BundleObject:
date_time = obj.name[-15:] def __init__(self, input_dir):
if args.debug: self.input_base_dir = input_dir # the first specified input dir
logger.debug("Found Dir : %s : %s", obj.name, date_time) self.input_dir = input_dir # current input_dir ; can change
elif os.path.islink(obj.path): self.tar_file_found = False # True if <bundle>.tar file present
# ignore sym links self.subcloud_bundle = False # host vs subcloud bundle
continue self.bundle_name = None # full path of current bundle
self.bundle_names = [] # list of bundle names
self.bundle_info = ["", []] # tarfile bundle info [name,[files]]
self.bundles = [] # list of bundles
self.tars = 0 # number of tar files found
self.tgzs = 0 # number of host tgz files found
def debug_state(self, func):
if args.state:
logger.debug("State:%10s: input_base_dir : %s",
func, self.input_base_dir)
logger.debug("State:%10s: input_dir : %s",
func, self.input_dir)
logger.debug("State:%10s: output_dir : %s",
func, output_dir)
logger.debug("State:%10s: tar_file_found : %s",
func, self.tar_file_found)
logger.debug("State:%10s: subcloud_bundle: %s",
func, self.subcloud_bundle)
logger.debug("State:%10s: bundle_name : %s",
func, self.bundle_name)
logger.debug("State:%10s: bundle_names : %s",
func, self.bundle_names)
logger.debug("State:%10s: bundle_info : %s",
func, self.bundle_info)
logger.debug("State:%10s: bundles : %s",
func, self.bundles)
logger.debug("State:%10s: tars-n-tgzs : %s:%s",
func, self.tars, self.tgzs)
def update_io_dirs(self, new_dir):
"""Update the input_dir and output_dir dirs
Parameters:
new_dir (string): path to change input_dir to
"""
self.debug_state("get_bundles")
global output_dir
if self.input_dir != new_dir:
str1 = "input_dir change: " + self.input_dir + " -> " + new_dir
self.input_dir = new_dir
old_output_dir = output_dir
output_dir = os.path.join(self.input_dir, analysis_folder_name)
str2 = "output_dir change: " + old_output_dir + " -> " + output_dir
else: else:
if not tarfile.is_tarfile(obj.path): str1 = "input_dir change is null"
str2 = "output_dir change is null"
logger.debug(str1)
logger.debug(str2)
self.debug_state("update_io_dirs")
def get_bundles(self):
"""Get a list of all collect bundle from input_dir"""
self.debug_state("get_bundles")
logger.debug("get_bundles: %s", self.input_dir)
for obj in (os.scandir(self.input_dir)):
# Don't display dirs from the ignore list.
# This makes the bundle selection list cleaner when
# report is run against /scratch
ignored = False
for ignore in ignore_list:
if obj.name == ignore:
ignored = True
break
if ignored is True:
            continue

            if obj.is_dir(follow_symlinks=False):
                date_time = obj.name[-15:]
                if args.debug:
                    logger.debug("found dir : %s : %s", obj.name, date_time)
            elif os.path.islink(obj.path):
                # ignore sym links
                continue
            else:
                if not tarfile.is_tarfile(obj.path):
                    continue
                filename = os.path.splitext(obj.name)[0]
                date_time = filename[-15:]
                if args.debug:
                    logger.debug("found file: %s : %s", obj.name, date_time)
# Add this bundle to the list. Avoid duplicates
found = False
name = obj.name
if obj.name.endswith('.tar'):
self.tar_file_found = True
name = os.path.splitext(obj.name)[0]
if obj.name.endswith('.tgz'):
continue
for bundle in self.bundles:
if bundle == name:
found = True
break
if found is False:
if re.match(regex_get_bundle_date, name):
self.bundles.append(name)
self.bundle_names.append(name)
elif not obj.is_dir(follow_symlinks=False):
logger.info("unexpected bundle name '%s'", name)
logger.info("... collect bundles name should include "
"'_YYYYMMDD.HHMMSS'")
select = str(input('accept as bundle (Y/N): '))
if select[0] == 'Y' or select[0] == 'y':
self.bundles.append(name)
self.bundle_names.append(name)
else:
logger.warning("not a bundle")
if args.debug:
logger.debug("bundles %2d: %s", len(self.bundles), self.bundles)
logger.debug("bundle sel: %s", self.bundle_names)
self.debug_state("get_bundles")
def get_bundle(self):
"""Get a list of all collect bundles from input_dir
Parameters:
input_dir (string): path to the directory to analyze
"""
self.debug_state("get_bundle")
logger.debug("get_bundle %s", self.input_dir)
if self.tar_file_found is False:
# If a collect bundle .tar file is not found then treat this
# case as though the input_dir is a hosts tarball directory
# like would be seen when running report on the system during
# the collect operation.
logger.debug("get_bundle tar file not found")
self.bundle_name = self.input_dir
elif len(self.bundles) > 1:
retry = True
while retry is True:
logger.info("0 - exit")
idx = 1
for bundle in self.bundle_names:
if bundle.endswith(('.tar', '.tgz', '.gz')):
logger.info("%d - %s",
idx, os.path.splitext(bundle)[0])
else:
logger.info("%d - %s", idx, bundle)
idx += 1
try:
select = int(input('Please select bundle to analyze: '))
except ValueError:
logger.info("Invalid input; integer between 1 "
"and %d required", len(self.bundles))
continue
if not select:
sys.exit()
if select <= len(self.bundles):
idx = 0
for bundle in self.bundle_names:
if idx == select-1:
logger.info("%s selected", bundle)
self.bundle_name = bundle
break
else:
idx += 1
retry = False
else:
logger.info("Invalid selection (%s) idx=%d",
select, idx)
# single bundle found
else:
self.bundle_name = self.bundle_names[0]
logger.debug("bundle name: %s", self.bundle_name)
self.debug_state("get_bundle")
def get_bundle_info(self, bundle):
"""Returns a list containing the tar file content
This is required for cases where the name of the supplied
tar file extracts its contents to a directory that is not
the same (without the extension) as the original tar file
Returns:
bundle_info (list): the bundle info [ "dir", [ files ]]
bundle_info[0] ( string) 'directory' found in tar file
bundle_info[1] (list) a list of files found in 'directory'
"""
self.debug_state("get_bundle_info")
bundle_tar = os.path.join(self.input_dir, self.bundle_name) + ".tar"
logger.debug("get_bundle_info %s", bundle_tar)
if not os.path.exists(bundle_tar):
logger.error("Error: No collect tar bundle found: %s", bundle_tar)
sys.exit()
        output = []
        try:
            result = subprocess.run(["tar", "tf", bundle_tar],
                                    check=True, stdout=subprocess.PIPE)
            output = result.stdout.decode('utf-8').splitlines()
            logger.debug("... bundle info: %s", output)
        except subprocess.CalledProcessError as e:
            logger.error(e)
        except PermissionError as e:
            logger.error(e)
if output != []:
for item in output:
dir, file = item.split("/", 1)
if dir is None:
continue
if self.bundle_info[0] == "":
self.bundle_info[0] = dir
if self.bundle_info[0] != dir:
logger.warning("ignoring unexpected extra directory "
"only one directory permitted in a "
"collect bundle ; %s is != %s",
self.bundle_info[0], dir)
continue
elif file.endswith(('.tar')):
logger.debug("tar contains tar: %s", file)
self.bundle_info[1].append(file)
elif file.endswith(('.tgz')):
logger.debug("tar contains tgz: %s", file)
if self.bundle_info[0] is None:
self.bundle_info[0] = dir
self.bundle_info[1].append(file)
else:
if self.bundle_info[0] is None:
self.bundle_info[0] = dir
if file:
self.bundle_info[1].append(file)
self.debug_state("get_bundle_info")
def extract_bundle(self):
"""Extract bundle if not already extracted"""
logger.debug("bundle name: %s", self.bundle_name)
# extract the bundle if not already extracted
bundle_tar = os.path.join(self.input_dir, self.bundle_name) + ".tar"
if os.path.exists(bundle_tar):
if not os.access(self.input_dir, os.W_OK):
logger.error("Permission Error: Bundle dir not writable: %s",
self.input_dir)
sys.exit("Collect bundle must be writable for analysis.")
try:
logger.info("extracting %s", bundle_tar)
untar_data = subprocess.run(
["tar", "xfC", bundle_tar, self.input_dir],
check=True, stdout=subprocess.PIPE)
logger.debug(untar_data)
except subprocess.CalledProcessError as e:
logger.error(e)
except PermissionError as e:
logger.error(e)
sys.exit("Permission Error: Unable to extract bundle")
elif args.debug:
logger.debug("already extracted: %s", bundle_tar)
def get_bundle_type(self):
"""Determine the bundle type ; host or subcloud
Subcloud bundles contain one or more tar files rather
than tgz files ; at this level.
However rather than fail the report if both are found,
which is unlikely, the code favors treating as a normal
host bundle with the tgz check first.
"""
if self.tgzs:
self.extract_bundle()
self.bundle_name = os.path.join(self.input_dir,
self.bundle_info[0])
logger.debug("Host bundle: %s", self.bundle_name)
elif self.tars:
self.extract_bundle()
self.bundle_name = os.path.join(self.input_dir,
self.bundle_info[0])
self.subcloud_bundle = True
logger.debug("Subcloud bundle: %s", self.bundle_name)
else:
sys.exit("Error: bundle contains no .tar files")
self.update_io_dirs(self.bundle_name)
if self.subcloud_bundle is True:
# clear current bundle lists, etc. in prep for the
# selected subcloud bundle
self.bundle_names = []
self.bundles = []
self.bundle_name = None
self.tar_file_found = False
# get the subcloud bundle(s) and select one
# if more than one is present.
self.get_bundles()
if self.bundles:
self.get_bundle()
# handle the no bundles found case ; unlikely
if self.bundle_name is None:
sys.exit("No valid collect subcloud bundles found.")
# extract the subcloud bundle if needed
self.extract_bundle()
# add the full path to the bundle name.
            # can't use self.bundle_info[0] because that is the
            # bundle name that contains the subcloud tars
            self.bundle_name = os.path.join(self.input_dir, self.bundle_name)

            # update the input directory to point to the subcloud folder
self.update_io_dirs(self.bundle_name)
self.debug_state("get_bundle_type")
# Initialize the Bundle Object. Logging starts in /tmp
obj = BundleObject(input_dir)
obj.debug_state("init")
if args.bundle:
logger.info("Bundle: %s", args.bundle)
obj.input_dir = input_dir
elif args.file:
# Note: The args.file has already been validated at this point.
basename = os.path.splitext(os.path.basename(args.file))
if re.match(regex_get_bundle_date, basename[0]):
obj.bundles.append(basename[0])
obj.bundle_names.append(basename[0])
obj.tar_file_found = True
else:
logger.info("unexpected bundle name '%s'", basename[0])
logger.info("... collect bundles name should include "
"'_YYYYMMDD.HHMMSS'")
select = str(input('accept as bundle (Y/N): '))
if select[0] == 'Y' or select[0] == 'y':
obj.bundles.append(basename[0])
obj.bundle_names.append(basename[0])
obj.tar_file_found = True
else:
sys.exit("rejected ; exiting ...")
else:
    # get the bundles
    obj.get_bundles()

if not args.bundle:
    if obj.bundles:
        obj.get_bundle()

    # handle the no bundles found case
    if obj.bundle_name is None:
        sys.exit("No valid collect host bundles found.")

obj.get_bundle_info(obj.bundle_name)
logger.debug("bundle info: %s", obj.bundle_info)
for file in obj.bundle_info[1]:
if file.endswith(('.tar')):
logger.debug("bundle tar file: %s", file)
obj.tars += 1
elif file.endswith(('.tgz')):
logger.debug("bundle tgz file: %s", file)
obj.tgzs += 1
if not args.bundle:
    obj.get_bundle_type()

# now that the output directory is established create the analysis
# folder, move the existing log files there and record the untar data
if not os.path.exists(output_dir):
    try:
        os.makedirs(output_dir, exist_ok=True)
except PermissionError as e:
logger.error(e)
sys.exit("Permission Error: Unable to create report")
# relocate logging to the selected bundle directory
remove_logging()
new_log_file = output_dir + "/report.log"
shutil.move(tmp_report_log[1], new_log_file)
setup_logging(new_log_file)
logger.info("")
logger.info("Report: %s ", output_dir)
logger.info("")
# initialize the execution engine
try:
    engine = ExecutionEngine(args, obj.input_dir, output_dir)
except ValueError as e:
    logger.error(str(e))
    logger.error("Confirm you are running the report tool on a collect bundle")