cloud-bulldozer · jtaleric · Mar 20, 2024 · Feb 5, 2024 · Mar 19, 2024
diff --git a/.github/workflows/pylint.yml b/.github/workflows/pylint.yml
@@ -22,4 +22,4 @@ jobs:
         pip install .
     - name: Analysing the code with pylint
       run: |
-        pylint -d C0103 $(git ls-files '*.py')
+        pylint -d C0103 -d R0912 $(git ls-files '*/*.py' '*.py')
diff --git a/README.md b/README.md
@@ -97,3 +97,19 @@ Additionally, users can specify a custom path for the output CSV file using the
 Orion's seamless integration with metadata and hunter ensures a robust regression detection tool for perf-scale CPT runs.
 
 
+```--uuid``` : If you have a specific uuid in mind (maybe a current run), you can bypass the metadata configuration portion of the config file and use this paraemter. You will still need to specify a config file that contains a metrics section for the metrics you want to collect on the current uuid and uuids that match the metadata of the uuid configuration
+
+```
+tests :
+  - name : current-uuid-etcd-duration
+    metrics : 
+    - name:  etcdDisck
+      metricName : 99thEtcdDiskBackendCommitDurationSeconds
+      metric_of_interest: value
+      agg:
+        value: duration
+        agg_type: avg
+```
+
+Orion provides flexibility if you know the comparison uuid you want to compare among, use the ```--baseline``` flag. This should only be used in conjunction when setting uuid. Similar to the uuid section mentioned above, you'll have to set a metrics section to specify the data points you want to collect on
+
diff --git a/orion.py b/orion.py
@@ -6,13 +6,13 @@
 from functools import reduce
 import logging
 import os
+import re
 
 import click
 import pandas as pd
 
 from fmatch.matcher import Matcher
-from utils.orion_funcs import run_hunter_analyze, get_metadata, \
-                                set_logging, load_config, get_metric_data
+from utils import orion_funcs
 
 
 @click.group()
@@ -24,24 +24,29 @@ def cli(max_content_width=120):
 
 # pylint: disable=too-many-locals
 @click.command()
+@click.option("--uuid", default="", help="UUID to use as base for comparisons")
+@click.option("--baseline", default="", help="Baseline UUID(s) to to compare against uuid")
 @click.option("--config", default="config.yaml", help="Path to the configuration file")
 @click.option("--output", default="output.csv", help="Path to save the output csv file")
 @click.option("--debug", is_flag=True, help="log level ")
 @click.option("--hunter-analyze",is_flag=True, help="run hunter analyze")
-def orion(config, debug, output,hunter_analyze):
-    """
-    Orion is the cli tool to detect regressions over the runs
+def orion(**kwargs):
+    """Orion is the cli tool to detect regressions over the runs
 
     \b
     Args:
+        uuid (str): gather metrics based on uuid
+        baseline (str): baseline uuid to compare against uuid (uuid must be set when using baseline)
         config (str): path to the config file
         debug (bool): lets you log debug mode
         output (str): path to the output csv file
+        hunter_analyze (bool): turns on hunter analysis of gathered uuid(s) data
     """
-    level = logging.DEBUG if debug else logging.INFO
+
+    level = logging.DEBUG if kwargs["debug"] else logging.INFO
     logger = logging.getLogger("Orion")
-    logger = set_logging(level, logger)
-    data = load_config(config,logger)
+    logger = orion_funcs.set_logging(level, logger)
+    data = orion_funcs.load_config(kwargs["config"],logger)
     ES_URL=None
 
     if "ES_SERVER" in data.keys():
@@ -54,14 +59,23 @@ def orion(config, debug, output,hunter_analyze):
             sys.exit(1)
 
     for test in data["tests"]:
-        metadata = get_metadata(test, logger)
-        logger.info("The test %s has started", test["name"])
+        uuid = kwargs["uuid"]
+        baseline = kwargs["baseline"]
         match = Matcher(index="perf_scale_ci", level=level, ES_URL=ES_URL)
-        uuids = match.get_uuid_by_metadata(metadata)
-        if len(uuids) == 0:
-            print("No UUID present for given metadata")
-            sys.exit()
+        if uuid == "":
+            metadata = orion_funcs.get_metadata(test, logger)
+        else:
+            metadata = orion_funcs.filter_metadata(uuid,match,logger)
 
+        logger.info("The test %s has started", test["name"])
+        if baseline == "":
+            uuids = match.get_uuid_by_metadata(metadata)
+            if len(uuids) == 0:
+                logging.info("No UUID present for given metadata")
+                sys.exit()
+        else:
+            uuids = re.split(' |,',baseline)
+            uuids.append(uuid)
         if metadata["benchmark.keyword"] == "k8s-netperf" :
             index = "k8s-netperf"
             ids = uuids
@@ -70,22 +84,27 @@ def orion(config, debug, output,hunter_analyze):
             ids = uuids
         else:
             index = "ripsaw-kube-burner"
-            runs = match.match_kube_burner(uuids)
-            ids = match.filter_runs(runs, runs)
+            if baseline == "":
+                runs = match.match_kube_burner(uuids)
+                ids = match.filter_runs(runs, runs)
+            else:
+                ids = uuids
 
         metrics = test["metrics"]
-        dataframe_list = get_metric_data(ids, index, metrics, match, logger)
+        dataframe_list = orion_funcs.get_metric_data(ids, index, metrics, match, logger)
 
         merged_df = reduce(
             lambda left, right: pd.merge(left, right, on="uuid", how="inner"),
             dataframe_list,
         )
-        match.save_results(merged_df, csv_file_path=output.split(".")[0]+"-"+test['name']+".csv")
-
-        if hunter_analyze:
-            run_hunter_analyze(merged_df,test)
 
+        csv_name = kwargs["output"].split(".")[0]+"-"+test['name']+".csv"
+        match.save_results(
+            merged_df, csv_file_path=csv_name
+        )
 
+        if kwargs["hunter_analyze"]:
+            orion_funcs.run_hunter_analyze(merged_df,test)
 
 
 if __name__ == "__main__":

diff --git a/utils/orion_funcs.py b/utils/orion_funcs.py
@@ -116,6 +116,51 @@ def get_metadata(test,logger):
     return metadata
 
 
+def filter_metadata(uuid,match,logger):
+    """Gets metadata of the run from each test
+
+    Args:
+        uuid (str): str of uuid ot find metadata of
+        match: the fmatch instance
+
+
+    Returns:
+        dict: dictionary of the metadata
+    """
+
+    test = match.get_metadata_by_uuid(uuid)
+    metadata = {
+        'platform': '', 
+        'clusterType': '', 
+        'masterNodesCount': 0,
+        'workerNodesCount': 0,
+        'infraNodesCount': 0,
+        'masterNodesType': '',
+        'workerNodesType': '',
+        'infraNodesType': '',
+        'totalNodesCount': 0,
+        'ocpVersion': '',
+        'networkType': '',
+        'ipsec': '',
+        'fips': '',
+        'encrypted': '',
+        'publish': '',
+        'computeArch': '', 
+        'controlPlaneArch': ''
+    }
+    for k,v in test.items():
+        if k not in metadata:
+            continue
+        metadata[k] = v
+    metadata['benchmark.keyword'] = test['benchmark']
+    metadata["ocpVersion"] = str(metadata["ocpVersion"])
+
+    #Remove any keys that have blank values
+    no_blank_meta = {k: v for k, v in metadata.items() if v}
+    logger.debug('No blank metadata dict: ' + str(no_blank_meta))
+    return no_blank_meta
+
+
 
 def set_logging(level, logger):
     """sets log level and format