WayScience · axiomcura · May 9, 2023 · Mar 14, 2023 · Mar 28, 2023 · Apr 12, 2023
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
@@ -1,10 +1,12 @@
 ---
 repos:
   # remove unused imports
+  # additional configs are in the pyproject.toml file
   - repo: https://github.com/hadialqattan/pycln.git
     rev: v2.1.3
     hooks:
       - id: pycln
+        args: [--config=pyproject.toml]
 
   # import formatter with black configurations
   - repo: https://github.com/pycqa/isort
@@ -17,28 +19,36 @@ repos:
   # Code formatter for both python files and jupyter notebooks
   # support pep 8 standards
   - repo: https://github.com/psf/black
-    rev: 22.10.0
+    rev: 23.3.0
     hooks:
       - id: black-jupyter
       - id: black
         language_version: python3.10
 
   # AI based formatter to improve readability
   - repo: https://github.com/sourcery-ai/sourcery
-    rev: v1.1.0
+    rev: v1.2.0
     hooks:
       - id: sourcery
         args: [--diff=git diff HEAD, --fix, --no-summary]
 
+  # adding ruff with auto fix on
+  # additional configs are in the pyproject.toml file
+  - repo: https://github.com/charliermarsh/ruff-pre-commit
+    rev: "v0.0.265"
+    hooks:
+      - id: ruff
+        args: [--config=pyproject.toml, --fix, --exit-non-zero-on-fix]
+
   # snakemake formatting
   - repo: https://github.com/snakemake/snakefmt
-    rev: v0.8.0
+    rev: v0.8.4
     hooks:
       - id: snakefmt
 
   # additional hooks found with in the pre-commit lib
   - repo: https://github.com/pre-commit/pre-commit-hooks
-    rev: v3.4.0
+    rev: v4.4.0
     hooks:
       - id: trailing-whitespace # removes trailing white spaces
       - id: mixed-line-ending # removes mixed end of line

diff --git a/cytosnake/cli/args.py b/cytosnake/cli/args.py
@@ -52,12 +52,12 @@ class WorkflowSearchPath(argparse.Action):
     """
 
     def __call__(self, parser, args, values, option_string=None):
-
         # checking if user provided workflow exists
         supported_wf = supported_workflows()
         if values not in supported_wf:
             raise InvalidWorkflowException(
-                f"Unable to find '{values}'. Please specify a supported workflow: {supported_wf}"
+                f"Unable to find '{values}'. "
+                f"Please specify a supported workflow: {supported_wf}"
             )
         # grabbing and setting the new value with the extracted path
         values = str(load_workflow_path(values))

diff --git a/cytosnake/cli/cmd.py b/cytosnake/cli/cmd.py
@@ -9,13 +9,12 @@
 import sys
 from pathlib import Path
 
+# cytosnake imports
 from cytosnake.cli.args import CliControlPanel
 from cytosnake.cli.cli_docs import cli_docs, init_doc, run_doc
 from cytosnake.cli.exec.workflow_exec import workflow_executor
 from cytosnake.cli.setup_init import init_cp_data, init_dp_data
 from cytosnake.common.errors import ProjectExistsError, WorkflowFailedException
-
-# cytosnake imports
 from cytosnake.guards.input_guards import check_init_parameter_inputs
 from cytosnake.utils import cyto_paths
 from cytosnake.utils.cytosnake_setup import setup_cytosnake_env
@@ -65,7 +64,7 @@ def run_cmd() -> None:
             logging.info(msg="Formatting input files")
             init_args = args_handler.parse_init_args()
 
-            # before setup up, check the logic of the input parameters
+            # before setup, check the logic of the input parameters
             check_init_parameter_inputs(user_params=init_args)
 
             # identifying which data type was added and how to set it up
@@ -92,7 +91,6 @@ def run_cmd() -> None:
         # Executed if the user is using the `run` mode. This will execute the
         # workflow that are found within the `workflows` folder
         case "run":
-
             # display run help documentation
             if args_handler.mode_help is True:
                 print(run_doc)
@@ -125,5 +123,4 @@ def run_cmd() -> None:
 
 
 if __name__ == "__main__":
-
     run_cmd()
diff --git a/cytosnake/guards/input_guards.py b/cytosnake/guards/input_guards.py
@@ -32,7 +32,7 @@ def is_barcode_required(user_params: NameSpace) -> bool:
     metadata_path = pathlib.Path(user_params.metadata).resolve(strict=True)
 
     # counting number of platemaps in metadata
-    plate_maps_path = metadata_path / "platemaps"
+    plate_maps_path = (metadata_path / "platemap").resolve(strict=True)
     n_platemaps = len(list(plate_maps_path.glob("*")))
 
     # if the metadata directory has more than 1 plate maps and no barcode file return
@@ -46,7 +46,7 @@ def check_init_parameter_inputs(user_params: NameSpace) -> bool:
 
     Parameters
     ----------
-    args : NameSpace
+    user_params : NameSpace
         Argparse.NameSpace object that contains all user provided parameters.
 
     Returns
@@ -57,9 +57,9 @@ def check_init_parameter_inputs(user_params: NameSpace) -> bool:
     Raises
     ------
     BarcodeRequiredError
-        Raised if a multiple platemaps are found but not barcode file was provided
+        Raised if a multiple platemaps are found but no barcode file was provided
     """
 
     # checking if barcode is required
-    if not is_barcode_required:
-        BarcodeRequiredError("Barcode is required, multiple platemaps found")
+    if is_barcode_required(user_params=user_params):
+        raise BarcodeRequiredError("Barcode is required, multiple platemaps found")
diff --git a/cytosnake/helpers/helper_funcs.py b/cytosnake/helpers/helper_funcs.py
@@ -9,8 +9,6 @@
 from pathlib import Path
 from typing import Optional
 
-from snakemake.io import expand
-
 from cytosnake.guards.path_guards import is_valid_path
 from cytosnake.utils.config_utils import load_general_configs, load_meta_path_configs
 

diff --git a/cytosnake/tests/functional/datasets/dummyfiles/barcode.txt b/cytosnake/tests/functional/datasets/dummyfiles/barcode.txt
diff --git a/cytosnake/tests/functional/datasets/dummyfiles/metadata/platemap/platemap1.csv b/cytosnake/tests/functional/datasets/dummyfiles/metadata/platemap/platemap1.csv
diff --git a/cytosnake/tests/functional/datasets/dummyfiles/metadata/platemap/platemap2.csv b/cytosnake/tests/functional/datasets/dummyfiles/metadata/platemap/platemap2.csv
diff --git a/cytosnake/tests/functional/datasets/dummyfiles/plate_data1.sqlite b/cytosnake/tests/functional/datasets/dummyfiles/plate_data1.sqlite
diff --git a/cytosnake/tests/functional/datasets/dummyfiles/plate_data2.sqlite b/cytosnake/tests/functional/datasets/dummyfiles/plate_data2.sqlite
diff --git a/cytosnake/tests/functional/test_cli.py b/cytosnake/tests/functional/test_cli.py
@@ -0,0 +1,216 @@
+"""
+module: test_cli.py
+
+This testing module is composed of functional tests that contain checks for both
+positive and negative cases when using CytoSnake's CLI.
+
+A positive case indicates that, given the user parameters, we expect it to run
+successfully.
+
+A negative case indicates that, given the user parameters, our tests are able to
+capture the errors.
+
+Ultimately, test_cli.py will contain functional tests for all modes that CytoSnake
+contains.
+"""
+
+import os
+import pathlib
+import shutil
+import subprocess
+from typing import Optional
+
+# import tempfile
+# import pytest
+# import subprocess
+# import test_functions # This will contain helper functions for testing
+from cytosnake.common import errors
+
+
+# -----------------
+# Helper functions
+# -----------------
+class CleanUpHandler:
+    """Callable that deletes a test directory, meant to be used as a finalizer.
+
+    Parameters
+    ----------
+    tmp_path : path-like
+        Directory that is deleted when the instance is called.
+    """
+
+    def __init__(self, tmp_path):
+        # directory removed by `__call__`
+        self.tmp_path = tmp_path
+
+    def __call__(self) -> None:
+        """Recursively deletes the directory stored in `self.tmp_path`."""
+        target_dir = self.tmp_path
+        shutil.rmtree(target_dir)
+
+
+def transfer_data(
+    test_dir: pathlib.Path,
+    n_plates: int,
+    n_platemaps: int,
+    metadata_dir_name: Optional[str] = "metadata",
+    testing_data_dir: str = "dummyfiles",
+) -> None:
+    """Copies dummy datasets from the test module into the directory under test.
+
+    Plate files (`*sqlite`), plate maps (`platemap*`) and `barcode.txt` are read
+    from `datasets/<testing_data_dir>`, located next to this module.
+
+    Parameters
+    ----------
+    test_dir : pathlib.Path
+        Path where the test is being conducted (e.g. pytest's `tmp_path`)
+    n_plates : int
+        Maximum number of plate files copied into `test_dir`
+    n_platemaps : int
+        Maximum number of plate map files copied into
+        `test_dir/<metadata_dir_name>/platemap`
+    metadata_dir_name : str, optional
+        Name of the metadata directory created inside `test_dir`. Must be a
+        string; any other value (including None) is rejected. By default
+        "metadata"
+    testing_data_dir : str, optional
+        Name of the dataset directory inside `datasets`, by default "dummyfiles"
+
+    Return
+    ------
+    None
+        Transfers datafiles from the PyTest module to the testing directory
+
+    Raises
+    ------
+    ValueError
+        Raised if `metadata_dir_name` is not a string
+    FileNotFoundError
+        Raised if the dataset directory does not exist
+    """
+    # fail fast, before anything is written into `test_dir`
+    if not isinstance(metadata_dir_name, str):
+        raise ValueError("metadata dir name must be a string")
+
+    # datasets are located relative to this module and not to the current working
+    # directory, so the helper works no matter where pytest is launched from
+    module_dir = pathlib.Path(__file__).resolve().parent
+    dataset_dir = (module_dir / "datasets" / testing_data_dir).resolve(strict=True)
+
+    # grabbing all input paths; glob order is arbitrary, so the paths are sorted
+    # before slicing to always select the same files
+    sqlite_file_paths = sorted(dataset_dir.glob("*sqlite"))[:n_plates]
+    platemaps_dir = dataset_dir / "metadata" / "platemap"
+    plate_map_files = sorted(platemaps_dir.glob("platemap*"))[:n_platemaps]
+    barcode = dataset_dir / "barcode.txt"
+
+    # create a metadata_dir in tmp_dir
+    tmpdir_metadata_path = test_dir / metadata_dir_name / "platemap"
+    tmpdir_metadata_path.mkdir(exist_ok=True, parents=True)
+
+    # transferring all files to tmp dir
+    for _path in plate_map_files:
+        shutil.copy(_path, tmpdir_metadata_path)
+    for _path in sqlite_file_paths:
+        shutil.copy(_path, test_dir)
+    shutil.copy(barcode, test_dir)
+
+
+def get_raised_error(traceback: str) -> str:
+    """Parses traceback and attempts to obtain raised exception error.
+
+    Traceback is parsed in this order:
+    1. split by new lines and drop blank lines
+    2. grab the last line as it contains the raised exception and message
+    3. split by ":" to separate exception name and exception message
+    4. grab the first element since it contains that path to exception
+    5. split by "." and grab last element, which is the exception name
+
+    Parameters
+    ----------
+    traceback : str
+        complete traceback generated by executing CLI
+
+    Returns
+    -------
+    str
+        return raised exception error. An empty string is returned if the
+        traceback has no content (e.g. nothing was written to stderr)
+    """
+    # blank lines are dropped so trailing new lines do not hide the exception line
+    lines = [line.strip() for line in traceback.splitlines() if line.strip()]
+
+    # nothing to parse: return an empty name instead of failing with an IndexError
+    if not lines:
+        return ""
+
+    # "path.to.ExceptionName: message" -> "path.to.ExceptionName" -> "ExceptionName"
+    exception_path = lines[-1].split(":", maxsplit=1)[0]
+    return exception_path.rsplit(".", maxsplit=1)[-1].strip()
+
+
+# --------------------------
+# init mode functional tests
+# --------------------------
+# The tests below focus only on executing the init mode.
+def test_barcode_logic_no_barcode_one_platemap(tmp_path, request) -> None:
+    """Positive case: This test expects a successful run where the user provides
+    multiple plate datasets, one plate map, and no barcode. Since there is only one
+    plate map, no barcode file is needed.
+
+    Checks:
+    -------
+        zero return code
+    """
+    # register the clean up first, so the directory is removed even if a later
+    # step raises
+    request.addfinalizer(CleanUpHandler(tmp_path))
+
+    # transfer dummy data to tmpdir
+    transfer_data(test_dir=tmp_path, n_plates=2, n_platemaps=1)
+
+    # no shell is involved, so the "*.sqlite" pattern is expanded here; otherwise
+    # the literal string "*.sqlite" would be passed to the CLI
+    plate_files = sorted(_path.name for _path in tmp_path.glob("*.sqlite"))
+    cmd = ["cytosnake", "init", "-d", *plate_files, "-m", "metadata"]
+
+    # execute CytoSnake inside tmpdir. `cwd` only applies to the child process, so
+    # the working directory of the test session is never changed
+    proc = subprocess.run(
+        cmd, cwd=tmp_path, capture_output=True, text=True, check=False
+    )
+
+    # checking for success return code
+    assert proc.returncode == 0, proc.stderr
+
+
+def test_barcode_logic_barcode_multi_platemaps(tmp_path, request) -> None:
+    """Positive case: This test expects a successful run where the user provides
+    multiple plate datasets, multiple plate maps, and a barcode. Multiple plate
+    maps require a barcode file, and since one is provided the run should succeed.
+
+    Checks:
+    -------
+        zero return code
+    """
+    # register the clean up first, so the directory is removed even if a later
+    # step raises
+    request.addfinalizer(CleanUpHandler(tmp_path))
+
+    # transfer dummy data to tmpdir
+    transfer_data(test_dir=tmp_path, n_plates=2, n_platemaps=2)
+
+    # no shell is involved, so the "*.sqlite" pattern is expanded here; otherwise
+    # the literal string "*.sqlite" would be passed to the CLI
+    plate_files = sorted(_path.name for _path in tmp_path.glob("*.sqlite"))
+    cmd = [
+        "cytosnake",
+        "init",
+        "-d",
+        *plate_files,
+        "-m",
+        "metadata",
+        "-b",
+        "barcode.txt",
+    ]
+
+    # execute CytoSnake inside tmpdir. `cwd` only applies to the child process, so
+    # the working directory of the test session is never changed
+    proc = subprocess.run(
+        cmd, cwd=tmp_path, capture_output=True, text=True, check=False
+    )
+
+    # checking for success return code
+    assert proc.returncode == 0, proc.stderr
+
+
+def test_barcode_logic_no_barcode_multi_platemaps(tmp_path, request) -> None:
+    """Negative case: This test expects a failed run where the user provides multiple
+    plate datasets, multiple plate maps (multi-experiments), and no barcode. Since
+    there are multiple plate maps, this indicates that the generated datasets came
+    from multiple experiments.
+
+    Checks:
+    -------
+        non-zero return code
+        BarcodeRequiredError raised
+    """
+    # register the clean up first, so the directory is removed even if a later
+    # step raises
+    request.addfinalizer(CleanUpHandler(tmp_path))
+
+    # transfer dummy data to tmpdir
+    transfer_data(test_dir=tmp_path, n_plates=2, n_platemaps=2)
+
+    # the "*.sqlite" pattern is expanded here, so no shell is needed to run the CLI
+    plate_files = sorted(_path.name for _path in tmp_path.glob("*.sqlite"))
+    cmd = ["cytosnake", "init", "-d", *plate_files, "-m", "metadata"]
+
+    # execute CytoSnake inside tmpdir. `cwd` only applies to the child process, so
+    # the working directory of the test session is never changed
+    proc = subprocess.run(
+        cmd, cwd=tmp_path, capture_output=True, text=True, check=False
+    )
+
+    # checking for failure return code first: if the run unexpectedly succeeded,
+    # stderr may hold no traceback to parse
+    assert proc.returncode == 1, proc.stderr
+
+    # checking that the expected exception was raised
+    raised_error = get_raised_error(proc.stderr)
+    assert raised_error == errors.BarcodeRequiredError.__name__
diff --git a/cytosnake/utils/config_utils.py b/cytosnake/utils/config_utils.py
@@ -114,7 +114,6 @@ def load_data_path_configs():
 
 
 def load_workflow_paths_config() -> dict:
-
+    """Loads the workflow paths stored in the meta path configurations.
+
+    Returns
+    -------
+    dict
+        Entry found under the "workflow_dir" -> "workflow" keys of the configs
+        returned by `load_meta_path_configs`
+    """
     # load in _path.yaml and select key where all workflow paths are
     loaded_meta_paths = load_meta_path_configs()
     return loaded_meta_paths["workflow_dir"]["workflow"]

diff --git a/cytosnake/utils/cytosnake_setup.py b/cytosnake/utils/cytosnake_setup.py
@@ -68,7 +68,6 @@ def transport_project_files() -> None:
     # - configs: contains yaml files providing workflow and cli configurations
     target_dirs = ["workflows", "configs"]
     for target_dir in target_dirs:
-
         # construct source directory path
         src_path = pkg_path / target_dir
         target_dst = proj_path / target_dir