1 files changed, 188 insertions, 97 deletions
diff --git a/anta/runner.py b/anta/runner.py
index 89fb7c3..75391da 100644
--- a/anta/runner.py
+++ b/anta/runner.py
@@ -1,7 +1,6 @@
 # Copyright (c) 2023-2024 Arista Networks, Inc.
 # Use of this source code is governed by the Apache License 2.0
 # that can be found in the LICENSE file.
-# pylint: disable=too-many-branches
 """ANTA runner function."""
 
 from __future__ import annotations
@@ -10,31 +9,51 @@ import asyncio
 import logging
 import os
 import resource
-from typing import TYPE_CHECKING
+from collections import defaultdict
+from typing import TYPE_CHECKING, Any
 
 from anta import GITHUB_SUGGESTION
-from anta.catalog import AntaCatalog, AntaTestDefinition
-from anta.device import AntaDevice
 from anta.logger import anta_log_exception, exc_to_str
 from anta.models import AntaTest
+from anta.tools import Catchtime, cprofile
 
 if TYPE_CHECKING:
+    from collections.abc import Coroutine
+
+    from anta.catalog import AntaCatalog, AntaTestDefinition
+    from anta.device import AntaDevice
     from anta.inventory import AntaInventory
     from anta.result_manager import ResultManager
+    from anta.result_manager.models import TestResult
 
 logger = logging.getLogger(__name__)
 
-AntaTestRunner = tuple[AntaTestDefinition, AntaDevice]
-
-# Environment variable to set ANTA's maximum number of open file descriptors.
-# Maximum number of file descriptor the ANTA process will be able to open.
-# This limit is independent from the system's hard limit, the lower will be used.
 DEFAULT_NOFILE = 16384
-try:
-    __NOFILE__ = int(os.environ.get("ANTA_NOFILE", DEFAULT_NOFILE))
-except ValueError as exception:
-    logger.warning("The ANTA_NOFILE environment variable value is invalid: %s\nDefault to %s.", exc_to_str(exception), DEFAULT_NOFILE)
-    __NOFILE__ = DEFAULT_NOFILE
+
+
+def adjust_rlimit_nofile() -> tuple[int, int]:
+    """Adjust the maximum number of open file descriptors for the ANTA process.
+
+    The soft limit is set to the lower of the hard limit and `ANTA_NOFILE`, which defaults to `DEFAULT_NOFILE` when unset or not a strictly positive integer.
+
+    Returns
+    -------
+        tuple[int, int]: The new soft and hard limits for open file descriptors.
+    """
+    try:
+        nofile = int(os.environ.get("ANTA_NOFILE", DEFAULT_NOFILE))
+        if nofile <= 0:  # Not usable as a soft limit: report it through the same path as a non-integer value
+            raise ValueError(f"{nofile} is not a strictly positive integer")
+    except ValueError as exception:
+        logger.warning("The ANTA_NOFILE environment variable value is invalid: %s\nDefault to %s.", exc_to_str(exception), DEFAULT_NOFILE)
+        nofile = DEFAULT_NOFILE
+
+    limits = resource.getrlimit(resource.RLIMIT_NOFILE)
+    logger.debug("Initial limit numbers for open file descriptors for the current ANTA process: Soft Limit: %s | Hard Limit: %s", limits[0], limits[1])
+    nofile = min(nofile, limits[1])  # The soft limit cannot exceed the hard limit
+    logger.debug("Setting soft limit for open file descriptors for the current ANTA process to %s", nofile)
+    resource.setrlimit(resource.RLIMIT_NOFILE, (nofile, limits[1]))
+    return resource.getrlimit(resource.RLIMIT_NOFILE)
 
 
 def log_cache_statistics(devices: list[AntaDevice]) -> None:
@@ -56,7 +75,120 @@ def log_cache_statistics(devices: list[AntaDevice]) -> None:
             logger.info("Caching is not enabled on %s", device.name)
 
 
-async def main(  # noqa: PLR0912 PLR0913 too-many-branches too-many-arguments - keep the main method readable
+async def setup_inventory(inventory: AntaInventory, tags: set[str] | None, devices: set[str] | None, *, established_only: bool) -> AntaInventory | None:
+    """Set up the inventory for the ANTA run: filter it, connect to the devices and filter it again.
+
+    Args:
+    ----
+        inventory: AntaInventory object that includes the device(s).
+        tags: Tags to filter devices from the inventory. None or empty means no filtering on tags.
+        devices: Devices on which to run tests. None or empty means all devices.
+        established_only: Passed to `get_inventory()` after the connection attempt. When True, only the established device(s) are kept.
+
+    Returns
+    -------
+        AntaInventory | None: The filtered inventory or None if the inventory is empty or no device is left after filtering.
+    """
+    if len(inventory) == 0:
+        logger.info("The inventory is empty, exiting")
+        return None
+
+    # Filter the inventory based on the CLI provided tags and devices if any, otherwise keep the inventory as is
+    selected_inventory = inventory.get_inventory(tags=tags, devices=devices) if tags or devices else inventory
+
+    with Catchtime(logger=logger, message="Connecting to devices"):
+        await selected_inventory.connect_inventory()
+
+    # Apply the `established_only` filter now that a connection to each selected device has been attempted
+    selected_inventory = selected_inventory.get_inventory(established_only=established_only)
+
+    # If there are no devices in the inventory after filtering, warn the user and exit
+    if not selected_inventory.devices:
+        msg = f'No reachable device {f"matching the tags {tags} " if tags else ""}was found.{f" Selected devices: {devices} " if devices is not None else ""}'
+        logger.warning(msg)
+        return None
+
+    return selected_inventory
+
+
+def prepare_tests(
+    inventory: AntaInventory, catalog: AntaCatalog, tests: set[str] | None, tags: set[str] | None
+) -> defaultdict[AntaDevice, set[AntaTestDefinition]] | None:
+    """Prepare the tests to run on each device of the inventory.
+
+    Args:
+    ----
+        inventory: AntaInventory object that includes the device(s).
+        catalog: AntaCatalog object that includes the list of tests. Its indexes are built and its `final_tests_count` is incremented here.
+        tests: Tests to run against devices. None means all tests.
+        tags: Tags used to select the tests from the catalog. When not set, the tests without tags and the tests matching each device's tags are selected.
+
+    Returns
+    -------
+        A mapping of devices to the tests to run or None if there are no tests to run.
+    """
+    # Build indexes for the catalog. If `tests` is set, filter the indexes based on these tests
+    catalog.build_indexes(filtered_tests=tests)
+
+    # Using a set to avoid inserting duplicate tests
+    device_to_tests: defaultdict[AntaDevice, set[AntaTestDefinition]] = defaultdict(set)
+
+    # Select the tests to run on each device, based on the CLI tags if any or on the device tags otherwise
+    for device in inventory.devices:
+        if tags:
+            # If there are CLI tags, only execute tests with matching tags
+            device_to_tests[device].update(catalog.get_tests_by_tags(tags))
+        else:
+            # If there are no CLI tags, execute all tests that do not have any tags
+            device_to_tests[device].update(catalog.tag_to_tests[None])
+
+            # Then add the tests with matching tags from device tags
+            device_to_tests[device].update(catalog.get_tests_by_tags(device.tags))
+
+        catalog.final_tests_count += len(device_to_tests[device])
+
+    if catalog.final_tests_count == 0:
+        msg = (
+            f"There are no tests{f' matching the tags {tags} ' if tags else ' '}to run in the current test catalog and device inventory, please verify your inputs."
+        )
+        logger.warning(msg)
+        return None
+
+    return device_to_tests
+
+
+def get_coroutines(selected_tests: defaultdict[AntaDevice, set[AntaTestDefinition]]) -> list[Coroutine[Any, Any, TestResult]]:
+    """Instantiate the selected tests and get their coroutines for the ANTA run.
+
+    Args:
+    ----
+        selected_tests: A mapping of devices to the tests to run. The selected tests are generated by the `prepare_tests` function.
+
+    Returns
+    -------
+        The list of coroutines to run. A test whose instantiation raises is logged and left out of the list.
+    """
+    coros = []
+    for device, test_definitions in selected_tests.items():
+        for test in test_definitions:
+            try:
+                test_instance = test.test(device=device, inputs=test.inputs)
+                coros.append(test_instance.test())
+            except Exception as e:  # noqa: PERF203, pylint: disable=broad-exception-caught
+                # An AntaTest instance is potentially user-defined code: catch everything, log it and carry on with the remaining tests.
+                # The message relies on `__module__` and `__name__` only, as both are defined on every Python class.
+                message = "\n".join(
+                    [
+                        f"There is an error when creating test {test.test.__module__}.{test.test.__name__}.",
+                        f"If this is not a custom test implementation: {GITHUB_SUGGESTION}",
+                    ],
+                )
+                anta_log_exception(e, message, logger)
+    return coros
+
+
+@cprofile()
+async def main(  # noqa: PLR0913
     manager: ResultManager,
     inventory: AntaInventory,
     catalog: AntaCatalog,
@@ -65,6 +197,7 @@ async def main(  # noqa: PLR0912 PLR0913 too-many-branches too-many-arguments -
     tags: set[str] | None = None,
     *,
     established_only: bool = True,
+    dry_run: bool = False,
 ) -> None:
     # pylint: disable=too-many-arguments
     """Run ANTA.
@@ -77,103 +210,61 @@ async def main(  # noqa: PLR0912 PLR0913 too-many-branches too-many-arguments -
         manager: ResultManager object to populate with the test results.
         inventory: AntaInventory object that includes the device(s).
         catalog: AntaCatalog object that includes the list of tests.
-        devices: devices on which to run tests. None means all devices.
-        tests: tests to run against devices. None means all tests.
-        tags: Tags to filter devices from the inventory.
+        devices: Devices on which to run tests. None means all devices. These may come from the `--device / -d` CLI option in NRFU.
+        tests: Tests to run against devices. None means all tests. These may come from the `--test / -t` CLI option in NRFU.
+        tags: Tags to filter devices from the inventory. These may come from the `--tags` CLI option in NRFU.
         established_only: Include only established device(s).
+        dry_run: Build the list of coroutines to run and stop before test execution.
     """
-    limits = resource.getrlimit(resource.RLIMIT_NOFILE)
-    logger.debug("Initial limit numbers for open file descriptors for the current ANTA process: Soft Limit: %s | Hard Limit: %s", limits[0], limits[1])
-    nofile = __NOFILE__ if limits[1] > __NOFILE__ else limits[1]
-    logger.debug("Setting soft limit for open file descriptors for the current ANTA process to %s", nofile)
-    resource.setrlimit(resource.RLIMIT_NOFILE, (nofile, limits[1]))
-    limits = resource.getrlimit(resource.RLIMIT_NOFILE)
+    # Adjust the maximum number of open file descriptors for the ANTA process
+    limits = adjust_rlimit_nofile()
 
     if not catalog.tests:
         logger.info("The list of tests is empty, exiting")
         return
-    if len(inventory) == 0:
-        logger.info("The inventory is empty, exiting")
-        return
 
-    # Filter the inventory based on tags and devices parameters
-    selected_inventory = inventory.get_inventory(
-        tags=tags,
-        devices=devices,
-    )
-    await selected_inventory.connect_inventory()
+    with Catchtime(logger=logger, message="Preparing ANTA NRFU Run"):
+        # Setup the inventory
+        selected_inventory = inventory if dry_run else await setup_inventory(inventory, tags, devices, established_only=established_only)
+        if selected_inventory is None:
+            return
 
-    # Remove devices that are unreachable
-    inventory = selected_inventory.get_inventory(established_only=established_only)
-
-    if not inventory.devices:
-        msg = f'No reachable device {f"matching the tags {tags} " if tags else ""}was found.{f" Selected devices: {devices} " if devices is not None else ""}'
-        logger.warning(msg)
-        return
-    coros = []
+        with Catchtime(logger=logger, message="Preparing the tests"):
+            selected_tests = prepare_tests(selected_inventory, catalog, tests, tags)
+            if selected_tests is None:
+                return
 
-    # Select the tests from the catalog
-    if tests:
-        catalog = AntaCatalog(catalog.get_tests_by_names(tests))
+        run_info = (
+            "--- ANTA NRFU Run Information ---\n"
+            f"Number of devices: {len(inventory)} ({len(selected_inventory)} established)\n"
+            f"Total number of selected tests: {catalog.final_tests_count}\n"
+            f"Maximum number of open file descriptors for the current ANTA process: {limits[0]}\n"
+            "---------------------------------"
+        )
 
-    # Using a set to avoid inserting duplicate tests
-    selected_tests: set[AntaTestRunner] = set()
+        logger.info(run_info)
 
-    # Create AntaTestRunner tuples from the tags
-    for device in inventory.devices:
-        if tags:
-            # If there are CLI tags, only execute tests with matching tags
-            selected_tests.update((test, device) for test in catalog.get_tests_by_tags(tags))
-        else:
-            # If there is no CLI tags, execute all tests that do not have any filters
-            selected_tests.update((t, device) for t in catalog.tests if t.inputs.filters is None or t.inputs.filters.tags is None)
+        if catalog.final_tests_count > limits[0]:
+            logger.warning(
+                "The number of concurrent tests is higher than the open file descriptors limit for this ANTA process.\n"
+                "Errors may occur while running the tests.\n"
+                "Please consult the ANTA FAQ."
+            )
 
-            # Then add the tests with matching tags from device tags
-            selected_tests.update((t, device) for t in catalog.get_tests_by_tags(device.tags))
+        coroutines = get_coroutines(selected_tests)
 
-    if not selected_tests:
-        msg = f"There is no tests{f' matching the tags {tags} ' if tags else ' '}to run in the current test catalog and device inventory, please verify your inputs."
-        logger.warning(msg)
+    if dry_run:
+        logger.info("Dry-run mode, exiting before running the tests.")
+        for coro in coroutines:
+            coro.close()
         return
 
-    run_info = (
-        "--- ANTA NRFU Run Information ---\n"
-        f"Number of devices: {len(selected_inventory)} ({len(inventory)} established)\n"
-        f"Total number of selected tests: {len(selected_tests)}\n"
-        f"Maximum number of open file descriptors for the current ANTA process: {limits[0]}\n"
-        "---------------------------------"
-    )
-    logger.info(run_info)
-    if len(selected_tests) > limits[0]:
-        logger.warning(
-            "The number of concurrent tests is higher than the open file descriptors limit for this ANTA process.\n"
-            "Errors may occur while running the tests.\n"
-            "Please consult the ANTA FAQ."
-        )
-
-    for test_definition, device in selected_tests:
-        try:
-            test_instance = test_definition.test(device=device, inputs=test_definition.inputs)
-
-            coros.append(test_instance.test())
-        except Exception as e:  # pylint: disable=broad-exception-caught
-            # An AntaTest instance is potentially user-defined code.
-            # We need to catch everything and exit gracefully with an
-            # error message
-            message = "\n".join(
-                [
-                    f"There is an error when creating test {test_definition.test.__module__}.{test_definition.test.__name__}.",
-                    f"If this is not a custom test implementation: {GITHUB_SUGGESTION}",
-                ],
-            )
-            anta_log_exception(e, message, logger)
-
     if AntaTest.progress is not None:
-        AntaTest.nrfu_task = AntaTest.progress.add_task("Running NRFU Tests...", total=len(coros))
+        AntaTest.nrfu_task = AntaTest.progress.add_task("Running NRFU Tests...", total=len(coroutines))
 
-    logger.info("Running ANTA tests...")
-    test_results = await asyncio.gather(*coros)
-    for r in test_results:
-        manager.add(r)
+    with Catchtime(logger=logger, message="Running ANTA tests"):
+        test_results = await asyncio.gather(*coroutines)
+        for r in test_results:
+            manager.add(r)
 
-    log_cache_statistics(inventory.devices)
+    log_cache_statistics(selected_inventory.devices)