From 17d6a993fc17d533460c5f40f3908c708e057c18 Mon Sep 17 00:00:00 2001
From: Daniel Baumann <daniel.baumann@progress-linux.org>
Date: Thu, 23 May 2024 18:45:17 +0200
Subject: Merging upstream version 18.2.3.

Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
---
 .../features/cluster-prometheus-monitoring.feature |  14 +++
 src/pybind/mgr/rook/ci/tests/features/rook.feature |  59 ++++++++++-
 .../rook/ci/tests/features/steps/implementation.py | 109 ++++++++++++++++++++-
 .../mgr/rook/ci/tests/features/steps/utils.py      |  23 +++++
 4 files changed, 198 insertions(+), 7 deletions(-)
 create mode 100644 src/pybind/mgr/rook/ci/tests/features/cluster-prometheus-monitoring.feature

(limited to 'src/pybind/mgr/rook/ci/tests')

diff --git a/src/pybind/mgr/rook/ci/tests/features/cluster-prometheus-monitoring.feature b/src/pybind/mgr/rook/ci/tests/features/cluster-prometheus-monitoring.feature
new file mode 100644
index 000000000..5180c7293
--- /dev/null
+++ b/src/pybind/mgr/rook/ci/tests/features/cluster-prometheus-monitoring.feature
@@ -0,0 +1,14 @@
+Feature: Testing Rook orchestrator commands
+    Ceph has been installed using the cluster CRD available in deploy/examples/cluster-test.yaml
+
+    Scenario: Verify Prometheus metrics endpoint is working properly
+      Given I can get prometheus server configuration
+      Given the prometheus server is serving metrics
+
+    Scenario: Verify some basic metrics are working properly
+      Given I can get prometheus server configuration
+      Given the prometheus server is serving metrics
+      Then the response contains the metric "ceph_osd_in" where "ceph_daemon" is "osd.0" and value equal to 1
+      Then the response contains the metric "ceph_osd_in" where "ceph_daemon" is "osd.1" and value equal to 1
+      Then the response contains the metric "ceph_osd_in" where "ceph_daemon" is "osd.2" and value equal to 1
+      Then the response contains the metric "ceph_mon_quorum_status" where "ceph_daemon" is "mon.a" and value equal to 1
diff --git a/src/pybind/mgr/rook/ci/tests/features/rook.feature b/src/pybind/mgr/rook/ci/tests/features/rook.feature
index ae0478f8b..acf733f55 100644
--- a/src/pybind/mgr/rook/ci/tests/features/rook.feature
+++ b/src/pybind/mgr/rook/ci/tests/features/rook.feature
@@ -1,8 +1,8 @@
 Feature: Testing Rook orchestrator commands
-    Ceph has been installed using the cluster CRD available in deploy/examples/cluster-test.yaml and
+    Ceph has been installed using the cluster CRD available in deploy/examples/cluster-test.yaml
 
     Scenario: Verify ceph cluster health
-      When I run
+      When I run ceph command
           """
           ceph health | grep HEALTH
           """
@@ -10,3 +10,58 @@ Feature: Testing Rook orchestrator commands
           """
           HEALTH_OK
           """
+
+    Scenario: Verify rook orchestrator has been enabled correctly
+      When I run ceph command
+          """
+          ceph mgr module ls | grep rook
+          """
+      Then I get something like
+          """
+          rook +on
+          """
+
+    Scenario: Verify rook orchestrator lists services correctly
+        When I run ceph command
+            """
+            ceph orch ls
+            """
+        Then I get something like
+            """
+            NAME +PORTS +RUNNING +REFRESHED +AGE +PLACEMENT
+            crash +1/1 .+
+            mgr +1/1 .+
+            mon +1/1 .+
+            osd +3 .+
+            """
+
+    Scenario: Verify rook orchestrator lists daemons correctly
+        When I run ceph command
+            """
+            ceph orch ps
+            """
+        Then I get something like
+            """
+            NAME +HOST +PORTS +STATUS +REFRESHED +AGE +MEM +USE +MEM +LIM +VERSION +IMAGE +ID
+            ceph-exporter.exporter +minikube +running .+
+            crashcollector.crash +minikube +running .+
+            mgr.a +minikube +running .+
+            mon.a +minikube +running .+
+            osd.0 +minikube +running .+
+            osd.1 +minikube +running .+
+            osd.2 +minikube +running .+
+            """
+
+    Scenario: Verify rook orchestrator lists devices correctly
+        When I run ceph command
+            """
+            ceph orch device ls
+            """
+        Then I get something like
+            """
+            HOST +PATH +TYPE +DEVICE +ID +SIZE +AVAILABLE +REFRESHED +REJECT +REASONS
+            minikube +/dev/vdb  +unknown +None +10.0G .+
+            minikube +/dev/vdc  +unknown +None +20.0G .+
+            minikube +/dev/vdd  +unknown +None +20.0G .+
+            minikube +/dev/vde  +unknown +None +20.0G .+
+            """
diff --git a/src/pybind/mgr/rook/ci/tests/features/steps/implementation.py b/src/pybind/mgr/rook/ci/tests/features/steps/implementation.py
index adde61afd..59cb117c8 100644
--- a/src/pybind/mgr/rook/ci/tests/features/steps/implementation.py
+++ b/src/pybind/mgr/rook/ci/tests/features/steps/implementation.py
@@ -1,15 +1,35 @@
+import requests
+from behave import given, when, then
 from behave import *
 from utils import *
+import subprocess
 import re
 
-@when("I run")
+PROMETHEUS_SERVER_URL = None
+
+def get_prometheus_pod_host_ip():
+    """Return the hostIP reported for pod prometheus-rook-prometheus-0, or None if the command fails."""
+    kubectl_query = "minikube --profile minikube kubectl -- -n rook-ceph -o jsonpath='{.status.hostIP}' get pod prometheus-rook-prometheus-0"
+    try:
+        completed = subprocess.run(kubectl_query, shell=True, capture_output=True, text=True, check=True)
+    except subprocess.CalledProcessError as e:
+        print(f"Error running command: {e}")
+        return None
+    return completed.stdout.strip()
+
+@when("I run ceph command")
+def run_step(context):  # the step's text block holds one command per line
+    context.output = run_ceph_commands(context.text)  # kept for the following "I get" steps
+
+@when("I run k8s command")
 def run_step(context):
-    context.output = run_commands(context.text)
+    context.output = run_k8s_commands(context.text)  # kept for the following "I get" steps
 
 @then("I get")
 def verify_result_step(context):
-    print(f"Output is:\n{context.output}\n--------------\n")
-    assert context.text == context.output
+    if context.text != context.output:
+        display_side_by_side(context.text, context.output)  # print the diff before failing
+    assert context.text == context.output, "Command output differs from the expected text"
 
 @then("I get something like")
 def verify_fuzzy_result_step(context):
@@ -18,4 +38,83 @@ def verify_fuzzy_result_step(context):
     num_lines = min(len(output_lines), len(expected_lines))
     for n in range(num_lines):
         if not re.match(expected_lines[n], output_lines[n]):
-            raise
+            display_side_by_side(expected_lines[n], output_lines[n])
+            assert False, ""
+
+@given('I can get prometheus server configuration')
+def step_get_prometheus_server_ip(context):
+    """Build PROMETHEUS_SERVER_URL from the pod host IP and port 30900; fail if the IP is unknown."""
+    global PROMETHEUS_SERVER_URL
+    host_ip = get_prometheus_pod_host_ip()
+    # The helper returns None (it does not raise) on failure, so check the value explicitly.
+    assert host_ip, "Unable to determine the Prometheus pod host IP"
+    PROMETHEUS_SERVER_URL = f"http://{host_ip}:30900"
+
+@given('the prometheus server is serving metrics')
+def step_given_server_running(context):
+    """Fetch all series from /federate and store the response on the context; fail on any request error."""
+    try:
+        params = {'match[]': '{__name__!=""}'}
+        # requests has no default timeout; bound the call so a hung server fails the step.
+        response = requests.get(f"{PROMETHEUS_SERVER_URL}/federate", params, timeout=30)
+        response.raise_for_status()
+        context.response = response
+        print(f"Prometheus server is running. Status code: {response.status_code}")
+    except requests.exceptions.RequestException as e:
+        print(f"Error connecting to Prometheus server: {e}")
+        assert False, f"Error connecting to Prometheus server: {e}"
+
+@when('I query the Prometheus metrics endpoint')
+def step_when_query_metrics_endpoint(context):
+    """Fetch all series from /federate (bounded by a timeout) into context.response; HTTP errors raise."""
+    context.response = requests.get(f"{PROMETHEUS_SERVER_URL}/federate", {'match[]': '{__name__!=""}'}, timeout=30)
+    context.response.raise_for_status()
+
+@then('the response contains the metric "{metric_name}"')
+def step_then_check_metric_value(context, metric_name):
+    # Presence check only: the metric's value is not compared.
+    assert parse_metric_value(context.response.text, metric_name) is not None, f"Metric '{metric_name}' not found in the response"
+
+@then('the response contains the metric "{metric_name}" with value equal to {expected_value}')
+def step_then_check_metric_value(context, metric_name, expected_value):
+    metric_value = parse_metric_value(context.response.text, metric_name)  # None when no sample matched
+    assert metric_value is not None, f"Metric '{metric_name}' not found in the response"
+    assert metric_value == float(expected_value), f"Metric '{metric_name}' value {metric_value} is not equal to {expected_value}"  # numeric comparison
+
+@then('the response contains the metric "{metric_name}" with value greater than {expected_value}')
+def step_then_check_metric_value(context, metric_name, expected_value):
+    metric_value = parse_metric_value(context.response.text, metric_name)  # None when no sample matched
+    assert metric_value is not None, f"Metric '{metric_name}' not found in the response"
+    assert metric_value > float(expected_value), f"Metric '{metric_name}' value {metric_value} is not greater than {expected_value}"  # strict bound
+
+@then('the response contains the metric "{metric_name}" with value less than {expected_value}')
+def step_then_check_metric_value(context, metric_name, expected_value):
+    metric_value = parse_metric_value(context.response.text, metric_name)  # None when no sample matched
+    assert metric_value is not None, f"Metric '{metric_name}' not found in the response"
+    assert metric_value < float(expected_value), f"Metric '{metric_name}' value {metric_value} is not less than {expected_value}"  # strict bound
+
+@then('the response contains the metric "{metric_name}" with value in the range {min_value}-{max_value}')
+def step_then_check_metric_value(context, metric_name, min_value, max_value):
+    metric_value = parse_metric_value(context.response.text, metric_name)  # None when no sample matched
+    assert metric_value is not None, f"Metric '{metric_name}' not found in the response"
+    assert float(min_value) <= metric_value <= float(max_value), f"Metric '{metric_name}' value {metric_value} is not in the range {min_value}-{max_value}"  # both bounds inclusive
+
+@then('the response contains the metric "{metric_name}" where "{filter_by_field}" is "{field_value}" and value equal to {expected_value}')
+def step_then_check_metric_value(context, metric_name, expected_value, filter_by_field, field_value):
+    metric_value = parse_metric_value(context.response.text, metric_name, filter_by_field, field_value)  # only samples carrying the label pair
+    assert metric_value is not None, f"Metric '{metric_name}' not found in the response"
+    assert metric_value == float(expected_value), f"Metric '{metric_name}' value {metric_value} is not equal to {expected_value}"  # numeric comparison
+
+
+def parse_metric_value(metrics_text, metric_name, filter_by_field=None, field_value=None):
+    """Return the first sample value of metric_name (optionally label-filtered) as a float, else None."""
+    # Escape caller-supplied text so e.g. the "." in "osd.0" only matches a literal dot.
+    filter_condition = re.escape(f'{filter_by_field}="{field_value}"') if filter_by_field and field_value else ''
+    # Sample values may be signed, fractional or in exponent form, not just bare digits.
+    number = r'[-+]?(?:\d+\.?\d*|\.\d+)(?:[eE][-+]?\d+)?'
+    pattern_str = rf'^{re.escape(metric_name)}\{{[^}}]*{filter_condition}[^}}]*\}} ({number}) (\d+)'
+    match = re.search(pattern_str, metrics_text, re.MULTILINE)
+    if match is None:
+        # Metric not found
+        return None
+    return float(match.group(1))  # group 2 is the sample timestamp, which callers do not need
diff --git a/src/pybind/mgr/rook/ci/tests/features/steps/utils.py b/src/pybind/mgr/rook/ci/tests/features/steps/utils.py
index 41a71d0fb..f711ec3fe 100644
--- a/src/pybind/mgr/rook/ci/tests/features/steps/utils.py
+++ b/src/pybind/mgr/rook/ci/tests/features/steps/utils.py
@@ -1,4 +1,5 @@
 import subprocess
+from difflib import unified_diff
 
 ROOK_CEPH_COMMAND = "minikube kubectl -- -n rook-ceph exec -it deploy/rook-ceph-tools -- "
 CLUSTER_COMMAND = "minikube kubectl -- "
@@ -27,3 +28,25 @@ def run_commands(commands: str) -> str:
         output = execute_command(command)
 
     return output.strip("\n")
+
+def run_k8s_commands(commands: str) -> str:
+    """Run each line of commands prefixed with CLUSTER_COMMAND and return the last output."""
+    last_output = ""
+    for line in commands.split("\n"):
+        # Only the final command's output is kept; earlier results are overwritten.
+        last_output = execute_command(CLUSTER_COMMAND + line)
+
+    return last_output.strip("\n")
+
+def run_ceph_commands(commands: str) -> str:
+    """Run each line of commands prefixed with ROOK_CEPH_COMMAND and return the last output."""
+    last_output = ""
+    for line in commands.split("\n"):
+        # Only the final command's output is kept; earlier results are overwritten.
+        last_output = execute_command(ROOK_CEPH_COMMAND + line)
+
+    return last_output.strip("\n")
+
+def display_side_by_side(expected, got):
+    # Despite the name, this prints a unified diff of expected vs. got.
+    print('\n'.join(unified_diff(expected.splitlines(), got.splitlines(), lineterm='')))
-- 
cgit v1.2.3