Switched from the LS_VERSION to the LS_BRANCH concept, and simplified the scenario YAML structure from a top-level list to a Dict.

mashhurs · mashhurs · commit 552088017974 · 2024-10-01T17:21:40.000-07:00
diff --git a/.buildkite/scripts/health-report-tests/README.md b/.buildkite/scripts/health-report-tests/README.md
@@ -1,6 +1,6 @@
 ## Description
 This package for integration tests of the Health Report API.
-Export `LS_VERSION` (major and minor version such as 8.x) to run on a specific branch. By default, it uses the main branch.
+Export `LS_BRANCH` to run on a specific branch. By default, it uses the main branch.
 
 ## How to run the Health Report Integration test?
 ### Prerequisites
@@ -12,4 +12,7 @@ python3 -mpip install -r .buildkite/scripts/health-report-tests/requirements.txt
 ### Run the integration tests
 ```shell
 python3 .buildkite/scripts/health-report-tests/main.py
-```
+```
+
+### Troubleshooting
+- If you get the `WARNING: pip is configured with locations that require TLS/SSL,...` warning message, make sure you have Python >= 3.12.4 installed.
diff --git a/.buildkite/scripts/health-report-tests/bootstrap.py b/.buildkite/scripts/health-report-tests/bootstrap.py
@@ -17,31 +17,31 @@ def __init__(self) -> None:
         f"""
         A constructor of the {Bootstrap}.
         Returns:
-            Resolves Logstash branch considering provided LS_VERSION
+            Resolves Logstash branch considering provided LS_BRANCH
             Checks out git branch
         """
-        logstash_version = os.environ.get("LS_VERSION")
-        if logstash_version is None:
+        logstash_branch = os.environ.get("LS_BRANCH")
+        if logstash_branch is None:
             # version is not specified, use the main branch, no need to git checkout
-            print(f"LS_VERSION is not specified, using main branch.")
+            print(f"LS_BRANCH is not specified, using main branch.")
         else:
-            # LS_VERSION accepts major latest as a major.x or specific version as X.Y
-            if logstash_version.find(".x") == -1:
-                print(f"Using specified branch: {logstash_version}")
-                util.git_check_out_branch(logstash_version)
+            # LS_BRANCH accepts either the latest of a major as major.x or a specific branch as X.Y
+            if logstash_branch.find(".x") == -1:
+                print(f"Using specified branch: {logstash_branch}")
+                util.git_check_out_branch(logstash_branch)
             else:
-                major_version = logstash_version.split(".")[0]
+                major_version = logstash_branch.split(".")[0]
                 if major_version and major_version.isnumeric():
                     resolved_version = self.__resolve_latest_stack_version_for(major_version)
                     minor_version = resolved_version.split(".")[1]
                     branch = major_version + "." + minor_version
                     print(f"Using resolved branch: {branch}")
                     util.git_check_out_branch(branch)
                 else:
-                    raise ValueError(f"Invalid value set to LS_VERSION. Please set it properly (ex: 8.x or 9.0) and "
+                    raise ValueError(f"Invalid value set to LS_BRANCH. Please set it properly (ex: 8.x or 9.0) and "
                                      f"rerun again")
 
-    def __resolve_latest_stack_version_for(self, major_version: str) -> None:
+    def __resolve_latest_stack_version_for(self, major_version: str) -> str:
         resolved_version = ""
         response = util.call_url_with_retry(self.ELASTIC_STACK_VERSIONS_URL)
         release_versions = response.json()["versions"]
diff --git a/.buildkite/scripts/health-report-tests/config_validator.py b/.buildkite/scripts/health-report-tests/config_validator.py
@@ -3,55 +3,45 @@
 
 
 class ConfigValidator:
-
-    REQUIRED_KEYS: Dict[str, List[str]] = {
+    REQUIRED_KEYS: Dict[str, List[Any]] = {
         "config": ["pipeline.id", "config.string"],
-        "expectation": ["status", "symptom", "diagnosis", "impacts", "details"],
-        "diagnosis": ["cause"],
-        "impacts": ["description", "impact_areas"],
-        "details": ["run_state"],
+        "expectation": ["status", "symptom", {"diagnosis": ["cause"]},
+                        {"impacts": ["description", "impact_areas"], "details": ["run_state"]}]
     }
 
     def __init__(self):
         self.yaml_content = None
 
-    def __validate_keys(self, actual_keys: List[str], expected_keys: List[str], section: str) -> bool:
-        """Validate the keys at the current level."""
-        missing_keys = set(expected_keys) - set(actual_keys)
-        if len(missing_keys) == len(expected_keys):
-            print(f"Missing keys in {section}: {missing_keys}")
-            return False
-        return True
-
-    def __validate_config(self, config_list: List[Dict[str, Any]]) -> bool:
-        """Validate the 'config' section."""
-        for config_item in config_list:
-            if not self.__validate_keys(list(config_item.keys()), self.REQUIRED_KEYS["config"], "config"):
+    def __validate_keys(self, data: Dict[str, Any], required_keys: Dict[str, List[Any]]) -> bool:
+        for key, required_list in required_keys.items():
+            if key not in data:
+                print(f"Missing top-level key: {key}")
                 return False
+            for item in required_list:
+                if isinstance(item, str):
+                    if not self.__check_nested_key(data[key], item):
+                        print(f"Missing nested key: {item} in {key}")
+                        return False
+                elif isinstance(item, dict):
+                    for sub_key, sub_value in item.items():
+                        if sub_key not in data[key]:
+                            print(f"Missing key: {sub_key} in {key}")
+                            return False
+                        # Recursively check the nested dictionary
+                        if not self.__validate_keys(data[key][sub_key], {sub_key: sub_value}):
+                            return False
         return True
 
-    def __validate_expectation(self, expectation_list: List[Dict[str, Any]]) -> bool:
-        """Validate the 'expectation' section."""
-        for expectation_item in expectation_list:
-            if not self.__validate_keys(list(expectation_item.keys()), self.REQUIRED_KEYS["expectation"], "expectation"):
+    def __check_nested_key(self, data: Dict[str, Any], nested_key: str) -> bool:
+        keys = nested_key.split('.')
+        for key in keys:
+            if key not in data:
                 return False
-            if "diagnosis" in expectation_item:
-                for diagnosis in expectation_item["diagnosis"]:
-                    if not self.__validate_keys(list(diagnosis.keys()), self.REQUIRED_KEYS["diagnosis"], "diagnosis"):
-                        return False
-            if "impacts" in expectation_item:
-                for impact in expectation_item["impacts"]:
-                    if not self.__validate_keys(list(impact.keys()), self.REQUIRED_KEYS["impacts"], "impacts"):
-                        return False
-            if "details" in expectation_item:
-                for detail in expectation_item["details"]:
-                    if not self.__validate_keys(list(detail.keys()), self.REQUIRED_KEYS["details"], "details"):
-                        return False
         return True
 
     def load(self, file_path: str) -> None:
         """Load the YAML file content into self.yaml_content."""
-        self.yaml_content: Union[List[Dict[str, Any]], None] = None
+        self.yaml_content: [Dict[str, Any]] = None
         try:
             with open(file_path, 'r') as file:
                 self.yaml_content = yaml.safe_load(file)
@@ -65,16 +55,19 @@ def is_valid(self) -> bool:
             print(f"YAML content is empty.")
             return False
 
-        if not isinstance(self.yaml_content, list):
-            print(f"YAML structure is not as expected, it should start with a list.")
+        if not isinstance(self.yaml_content, Dict):
+            print(f"YAML structure is not as expected, it should start with a Dict.")
             return False
 
+        required_config_keys = list(self.REQUIRED_KEYS.keys())
         for item in self.yaml_content:
-            if "config" in item and not self.__validate_config(item["config"]):
-                return False
-
-            if "expectation" in item and not self.__validate_expectation(item["expectation"]):
+            if item == "name":
+                continue
+            if item not in required_config_keys:
                 return False
 
-        print(f"YAML file validation successful!")
+        if self.__validate_keys(self.yaml_content, self.REQUIRED_KEYS):
+            print("Valid YAML content detected.")
+        else:
+            print("YAML validation failed.")
         return True
diff --git a/.buildkite/scripts/health-report-tests/main.py b/.buildkite/scripts/health-report-tests/main.py
@@ -7,7 +7,6 @@
 from scenario_executor import ScenarioExecutor
 from config_validator import ConfigValidator
 import yaml
-import util
 
 
 class BootstrapContextManager:
@@ -18,15 +17,15 @@ def __init__(self):
     def __enter__(self):
         print(f"Starting Logstash Health Report Integration test.")
         self.bootstrap = Bootstrap()
-        # self.bootstrap.build_logstash()
+        self.bootstrap.build_logstash()
 
         plugin_path = os.getcwd() + "/qa/support/logstash-integration-failure_injector/logstash-integration" \
                                     "-failure_injector-*.gem"
         matching_files = glob.glob(plugin_path)
         if len(matching_files) == 0:
             raise ValueError(f"Could not find logstash-integration-failure_injector plugin.")
 
-        # self.bootstrap.install_plugin(matching_files[0])
+        self.bootstrap.install_plugin(matching_files[0])
         print(f"logstash-integration-failure_injector successfully installed.")
         return self.bootstrap
 
@@ -56,13 +55,13 @@ def main():
 
         for scenario_file in scenario_files:
             with open(scenario_file, 'r') as file:
-                # scenario_content: Union[List[Dict[str, Any]], None] = None
+                # scenario_content: Dict[str, Any] = None
                 scenario_content = yaml.safe_load(file)
-                scenario_name = util.get_element_of_array(scenario_content, 'name')
-                config = util.get_element_of_array(scenario_content, 'config')
+                scenario_name = scenario_content['name']
+                config = scenario_content['config']
                 if config is not None:
                     bootstrap.apply_config(config)
-                    expectation = util.get_element_of_array(scenario_content, 'expectation')
+                    expectation = scenario_content['expectation']
                     process = bootstrap.run_logstash()
                     if process is not None:
                         scenario_executor.on(scenario_name, expectation)
diff --git a/.buildkite/scripts/health-report-tests/scenario_executor.py b/.buildkite/scripts/health-report-tests/scenario_executor.py
@@ -40,4 +40,4 @@ def __is_expected(self, scenario_content: list) -> None:
     def on(self, scenario_name: str, scenario_content: list) -> None:
         print(f"Testing the scenario: {scenario_content}")
         if self.__is_expected(scenario_content) is False:
-            raise Exception(f"{scenario_name} failed.")
+            raise Exception(f"{scenario_name} failed.")
diff --git a/.buildkite/scripts/health-report-tests/tests/slow-start.yaml b/.buildkite/scripts/health-report-tests/tests/slow-start.yaml
@@ -1,17 +1,17 @@
-- name: "Slow start pipeline"
-- config:
+name: "Slow start pipeline"
+config:
   - pipeline.id: slow-start-pp
     config.string: |
       input { heartbeat {} }
       filter { failure_injector { degrade_at => [register] } }
       output { stdout {} }
-- expectation:
-    - status: yellow
-    - symptom: "The pipeline is degraded or at risk of becoming unhealthy; 1 area is impacted and 1 diagnosis is available."
-    - diagnosis:
-        - cause: "pipeline is loading"
-    - impacts:
-      - description: "pipeline is loading"
-      - impact_areas: "pipeline_execution"
-    - details:
-      - run_state: "LOADING"
+expectation:
+  - status: yellow
+  - symptom: "The pipeline is degraded or at risk of becoming unhealthy; 1 area is impacted and 1 diagnosis is available."
+  - diagnosis:
+      - cause: "pipeline is loading"
+  - impacts:
+    - description: "pipeline is loading"
+    - impact_areas: "pipeline_execution"
+  - details:
+    - run_state: "LOADING"
diff --git a/.buildkite/scripts/health-report-tests/util.py b/.buildkite/scripts/health-report-tests/util.py
@@ -1,10 +1,12 @@
 import requests
 import subprocess
-from typing import Any, List, Dict, Union
 from requests.adapters import HTTPAdapter, Retry
 
 
 def call_url_with_retry(url: str, max_retries: int = 5, delay: int = 1) -> requests.Response:
+    f"""
+    Calls the given {url} with maximum of {max_retries} retries with {delay} delay.
+    """
     schema = "https://" if "https://" in url else "http://"
     session = requests.Session()
     # retry on most common failures such as connection timeout(408), etc...
@@ -13,21 +15,21 @@ def call_url_with_retry(url: str, max_retries: int = 5, delay: int = 1) -> reque
     return session.get(url)
 
 
-def git_check_out_branch(branch_name: str) -> bool:
+def git_check_out_branch(branch_name: str) -> None:
+    f"""
+    Checks out specified branch or fails with error if checkout operation fails.
+    """
     run_or_raise_error(["git", "checkout", branch_name],
                        "Error occurred while checking out the " + branch_name + " branch")
 
 
 def run_or_raise_error(commands: list, error_message):
+    f"""
+    Executes the {list} commands and raises an {Exception} if the operation fails.
+    """
     result = subprocess.run(commands, universal_newlines=True, stdout=subprocess.PIPE)
     if result.returncode != 0:
         full_error_message = (error_message + ", output: " + result.stdout.decode('utf-8')) \
             if result.stdout else error_message
         raise Exception(f"{full_error_message}")
 
-
-def get_element_of_array(data: Union[List[Dict[str, Any]], None], key: str) -> str:
-    for element in data:
-        if key in element:
-            return element[key]
-    return None