SigmaHQ/tests/test_rules.py

#!/usr/bin/env python3
"""
Checks for noncompliance or common errors on all rules

Run using the command
# python -m unittest test_rules.py
"""

import os
import unittest
import yaml
import re
from attackcti import attack_client
from colorama import init
from colorama import Fore

class TestRules(unittest.TestCase):
    # Static list of MITRE ATT&CK technique names, marked incomplete by its author.
    # NOTE(review): no method visible in this file reads it, and "process_injection"
    # appears twice - confirm whether the attribute is still needed.
    MITRE_TECHNIQUE_NAMES = ["process_injection", "signed_binary_proxy_execution", "process_injection"] # incomplete list
    # Static list of MITRE ATT&CK tactic names.
    # NOTE(review): also not read by any method visible in this file - confirm usage.
    MITRE_TACTICS = ["initial_access", "execution", "persistence", "privilege_escalation", "defense_evasion", "credential_access", "discovery", "lateral_movement", "collection", "exfiltration", "command_and_control", "impact", "launch"]

    # Directory that the tests walk to find rule files. It is a relative path, so it
    # is resolved against the working directory the tests are started from.
    path_to_rules = "rules"

    # Helper functions
    def yield_next_rule_file_path(self, path_to_rules:str) -> str:
        for root, _, files in os.walk(path_to_rules):
            for file in files:
                yield os.path.join(root, file)

    def get_rule_part(self, file_path:str, part_name:str):
        yaml_dicts = self.get_rule_yaml(file_path)
        for yaml_part in yaml_dicts:
            if part_name in yaml_part.keys():
                return yaml_part[part_name]

        return None

    def get_rule_yaml(self, file_path:str) -> list:
        """Parse every YAML document in ``file_path`` and return them as a list.

        Args:
            file_path: Path of the rule file to parse.

        Returns:
            One entry per YAML document, in file order. A single-document rule
            yields a one-element list.

        Raises:
            yaml.YAMLError: If the file is not valid YAML.
            OSError: If the file cannot be opened.
        """
        # Decode explicitly as UTF-8 so parsing does not depend on the locale
        # encoding of the machine running the tests.
        with open(file_path, encoding="utf-8") as f:
            # safe_load_all is lazy, so it must be consumed while the file is open.
            return list(yaml.safe_load_all(f))

    # Tests
    def test_confirm_extension_is_yml(self):
        """Fail when any file below ``path_to_rules`` has an extension other than ``.yml``."""
        # os.path.splitext always returns a (root, ext) pair, so the extension
        # can be read directly from index 1.
        files_with_incorrect_extensions = [
            rule_path
            for rule_path in self.yield_next_rule_file_path(self.path_to_rules)
            if os.path.splitext(rule_path)[1] != ".yml"
        ]

        self.assertEqual(files_with_incorrect_extensions, [], Fore.RED +
                        "There are rule files with extensions other than .yml")

    def test_confirm_correct_mitre_tags(self):
        """Fail when a rule carries an ``attack.*`` tag unknown to MITRE ATT&CK.

        Only tags starting with ``attack.`` are validated; every other tag is
        ignored. Each offending tag is printed and its file recorded.
        """
        # MITRE_ALL is only assigned when this file is executed as a script. When a
        # runner imports the module (python -m unittest, pytest) the name does not
        # exist, so fetch the data here instead of failing with a NameError.
        try:
            known_tags = set(MITRE_ALL)
        except NameError:
            known_tags = set(get_mitre_data())

        files_with_incorrect_mitre_tags = []

        for file in self.yield_next_rule_file_path(self.path_to_rules):
            tags = self.get_rule_part(file_path=file, part_name="tags")
            if not tags:
                continue
            for tag in tags:
                if tag.startswith("attack.") and tag not in known_tags:
                    print(Fore.RED + "Rule {} has the following incorrect tag {}".format(file, tag))
                    files_with_incorrect_mitre_tags.append(file)

        self.assertEqual(files_with_incorrect_mitre_tags, [], Fore.RED +
                         "There are rules with incorrect/unknown MITRE Tags. (please inform us about new tags that are not yet supported in our tests) and check the correct tags here: https://attack.mitre.org/ ")

    def test_duplicate_tags(self):
        """Fail when a rule lists the same tag more than once.

        Every repeated occurrence is printed, and the file is recorded once per
        repeated occurrence.
        """
        files_with_incorrect_mitre_tags = []

        for rule_path in self.yield_next_rule_file_path(self.path_to_rules):
            tags = self.get_rule_part(file_path=rule_path, part_name="tags")
            if not tags:
                continue

            seen = []
            for tag in tags:
                if tag not in seen:
                    seen.append(tag)
                    continue
                print(Fore.RED + "Rule {} has the duplicate tag {}".format(rule_path, tag))
                files_with_incorrect_mitre_tags.append(rule_path)

        self.assertEqual(files_with_incorrect_mitre_tags, [], Fore.RED +
                         "There are rules with duplicate tags")

    def test_look_for_duplicate_filters(self):
        """Fail when a list inside a rule's ``detection`` section repeats a value.

        The detection structure is walked recursively. Dictionaries are only
        descended into while the current depth does not exceed ``MAX_DEPTH``;
        lists are always checked once reached.
        """
        MAX_DEPTH = 3
        files_with_duplicate_filters = []

        def check_list_or_recurse_on_dict(item, depth:int, rule_file:str) -> None:
            """Check ``item`` if it is a list, or descend into it if it is a dict."""
            if isinstance(item, list):
                check_if_list_contain_duplicates(item, depth, rule_file)
            elif isinstance(item, dict) and depth <= MAX_DEPTH:
                for sub_item in item.values():
                    check_list_or_recurse_on_dict(sub_item, depth + 1, rule_file)

        def check_if_list_contain_duplicates(item:list, depth:int, rule_file:str) -> None:
            """Record ``rule_file`` when ``item`` holds the same hashable value twice."""
            try:
                has_duplicates = len(item) != len(set(item))
            except TypeError:
                # The list holds unhashable members (e.g. dicts), so it cannot be
                # turned into a set; inspect the nested dicts instead.
                for sub_item in item:
                    if isinstance(sub_item, dict) and depth <= MAX_DEPTH:
                        check_list_or_recurse_on_dict(sub_item, depth + 1, rule_file)
                return

            if has_duplicates:
                print(Fore.RED + "Rule {} has duplicate filters".format(rule_file))
                files_with_duplicate_filters.append(rule_file)

        for file in self.yield_next_rule_file_path(self.path_to_rules):
            detection = self.get_rule_part(file_path=file, part_name="detection")
            # The file is passed explicitly so the helpers do not depend on the
            # loop variable of this enclosing scope.
            check_list_or_recurse_on_dict(detection, 1, file)

        self.assertEqual(files_with_duplicate_filters, [], Fore.RED +
                         "There are rules with duplicate filters")

    def test_single_named_condition_with_x_of_them(self):
        """Fail when a rule uses a ``... of them`` condition with only one selection.

        A rule is reported when its condition contains ``them``, its detection
        section has exactly two entries, and the file holds a single YAML
        document.
        """
        faulty_detections = []

        for rule_path in self.yield_next_rule_file_path(self.path_to_rules):
            documents = self.get_rule_yaml(file_path = rule_path)
            detection = self.get_rule_part(file_path = rule_path, part_name = "detection")

            uses_them = "them" in detection["condition"]
            # Two entries: the "condition" key plus exactly one named selection
            single_selection = len(detection) == 2
            single_document = len(documents) == 1

            if not (uses_them and single_selection and single_document):
                continue
            faulty_detections.append(rule_path)

        self.assertEqual(faulty_detections, [], Fore.RED +
                         "There are rules using '1/all of them' style conditions but only have one condition")

    def test_duplicate_titles(self):
        """Fail when two single-document rule files have the same detection logic.

        Despite the method name, rule titles are not inspected: each rule's
        ``detection`` section is compared against the detection of every
        previously seen rule, and matching pairs are reported as
        ``(earlier_file, later_file)`` tuples. Multi-document YAML files are
        skipped.
        """
        def compare_detections(detection1:dict, detection2:dict) -> bool:
            """Return True when both detection mappings are considered identical.

            Identical means: same number of entries, equal ``condition`` values,
            and every named condition of ``detection1`` present in
            ``detection2`` with the same string keys mapping to equal values.
            """

            # detections not the same length can't be the same
            if len(detection1) != len(detection2):
                return False

            for named_condition in detection1:
                # condition clause must be the same too
                if named_condition == "condition":
                    if detection1["condition"] != detection2["condition"]:
                        return False
                    else:
                        continue

                # Named condition must exist in both rule files
                if named_condition not in detection2:
                    return False

                if len(detection1[named_condition]) != len(detection2[named_condition]):
                    return False

                for condition in detection1[named_condition]:
                    # Anything that is not a string key is treated as "not comparable",
                    # i.e. the detections are reported as different.
                    if type(condition) != str:
                        return False

                    if condition not in detection2[named_condition]:
                        return False

                    # NOTE(review): this indexes the named condition by a string key. If
                    # the named condition is a list of strings rather than a mapping, it
                    # looks like this lookup would raise TypeError - confirm.
                    condition_value1 = detection1[named_condition][condition]
                    condition_value2 = detection2[named_condition][condition]

                    if condition_value1 != condition_value2:
                        return False

            return True

        faulty_detections = []
        # Maps each already-processed rule file to its detection section
        files_and_their_detections = {}

        for file in self.yield_next_rule_file_path(self.path_to_rules):
            detection = self.get_rule_part(file_path = file, part_name = "detection")
            # Local name; inside this method it shadows the imported yaml module
            yaml = self.get_rule_yaml(file_path = file)

            is_multipart_yaml_file = len(yaml) != 1
            if is_multipart_yaml_file:
                continue

            # Compare against every rule seen so far (pairwise comparison)
            for key in files_and_their_detections:
                if compare_detections(detection, files_and_their_detections[key]):
                    faulty_detections.append((key, file))

            files_and_their_detections[file] = detection

        self.assertEqual(faulty_detections, [], Fore.YELLOW + 
                         "There are rule files with exactly the same detection logic.")

    def test_source_eventlog(self):
        """Fail when a rule's detection section contains ``Source: Eventlog``.

        The check is done on the lower-cased string representation of the parsed
        detection section, so it is case-insensitive.
        """
        needle = "'source': 'eventlog'"
        faulty_detections = [
            rule_path
            for rule_path in self.yield_next_rule_file_path(self.path_to_rules)
            if needle in str(self.get_rule_part(file_path = rule_path, part_name = "detection")).lower()
        ]

        self.assertEqual(faulty_detections, [], Fore.YELLOW +
                         "There are detections with 'Source: Eventlog'. This does not add value to the detection.")

    def test_event_id_instead_of_process_creation(self):
        """Fail when a rule file still selects on ``EventID: 1`` or ``EventID: 4688``.

        The raw file text is scanned line by line; a file is reported once, as
        soon as its first matching line is found.
        """
        # Compiled once instead of being looked up for every line of every file
        event_id_pattern = re.compile(r'.*EventID: (?:1|4688)\s*$')
        faulty_detections = []
        for file in self.yield_next_rule_file_path(self.path_to_rules):
            # Explicit UTF-8 so reading does not depend on the platform's locale encoding
            with open(file, encoding="utf-8") as f:
                # any() stops at the first hit, so each file is appended at most once
                if any(event_id_pattern.search(line) for line in f):
                    faulty_detections.append(file)

        self.assertEqual(faulty_detections, [], Fore.YELLOW +
                         "There are rules still using Sysmon 1 or Event ID 4688. Please migrate to the process_creation category.")

    def test_missing_id(self):
        """Fail when a rule has no ``id`` field or one that is not 36 characters long."""
        faulty_rules = []
        for rule_path in self.yield_next_rule_file_path(self.path_to_rules):
            rule_id = self.get_rule_part(file_path=rule_path, part_name="id")
            if rule_id and len(rule_id) == 36:
                continue

            if not rule_id:
                print(Fore.YELLOW + "Rule {} has no field 'id'.".format(rule_path))
            else:
                print(Fore.YELLOW + "Rule {} has a malformed 'id' (not 36 chars).".format(rule_path))
            faulty_rules.append(rule_path)

        self.assertEqual(faulty_rules, [], Fore.RED +
                         "There are rules with missing or malformed 'id' fields. Create an id (e.g. here: https://www.uuidgenerator.net/version4) and add it to the reported rule(s).")
    
    def test_sysmon_rule_without_eventid(self):
        """Fail when a rule with ``service: sysmon`` never mentions ``EventID:``.

        The service comparison is case-insensitive. The EventID check scans the
        raw file text, so the key may appear on any line of the file.
        """
        event_id_pattern = re.compile(r'.*EventID:.*$')
        faulty_rules = []
        for file in self.yield_next_rule_file_path(self.path_to_rules):
            logsource = self.get_rule_part(file_path=file, part_name="logsource")
            # Without a logsource mapping the rule cannot declare the sysmon service
            if not isinstance(logsource, dict):
                continue
            service = logsource.get('service', '')
            # An empty "service:" key loads as None; treat anything non-string as "not sysmon"
            if not isinstance(service, str) or service.lower() != 'sysmon':
                continue
            # Explicit UTF-8 so reading does not depend on the platform's locale encoding
            with open(file, encoding="utf-8") as f:
                if not any(event_id_pattern.search(line) for line in f):
                    faulty_rules.append(file)

        self.assertEqual(faulty_rules, [], Fore.RED +
                         "There are rules using sysmon events but with no EventID specified")


    def test_missing_date(self):
        """Fail when a rule has no ``date`` field or one that is not ``YYYY/MM/DD``.

        The value must be a 10-character string. PyYAML's safe loader converts
        unquoted ISO dates such as ``2019-01-14`` into ``datetime.date`` objects;
        those are reported as malformed instead of crashing on ``len()``.
        """
        faulty_rules = []
        for file in self.yield_next_rule_file_path(self.path_to_rules):
            datefield = self.get_rule_part(file_path=file, part_name="date")
            if not datefield:
                print(Fore.YELLOW + "Rule {} has no field 'date'.".format(file))
                faulty_rules.append(file)
            elif not isinstance(datefield, str):
                # e.g. a datetime.date produced by the YAML timestamp resolver
                print(Fore.YELLOW + "Rule {} has a malformed 'date' (should be YYYY/MM/DD).".format(file))
                faulty_rules.append(file)
            elif len(datefield) != 10:
                print(Fore.YELLOW + "Rule {} has a malformed 'date' (not 10 chars, should be YYYY/MM/DD).".format(file))
                faulty_rules.append(file)

        self.assertEqual(faulty_rules, [], Fore.RED +
                         "There are rules with missing or malformed 'date' fields. (create one, e.g. date: 2019/01/14)")

    def test_references(self):
        """Fail when a rule's ``references`` field is present but is not a list."""
        faulty_rules = []
        for rule_path in self.yield_next_rule_file_path(self.path_to_rules):
            references = self.get_rule_part(file_path=rule_path, part_name="references")
            # A missing or empty field is not reported; only the type of an
            # existing value is checked.
            if not references or isinstance(references, list):
                continue
            print(Fore.YELLOW + "Rule {} has a references field that isn't a list.".format(rule_path))
            faulty_rules.append(rule_path)

        self.assertEqual(faulty_rules, [], Fore.RED +
                         "There are rules with malformed 'references' fields. (has to be a list of values even if it contains only a single value)")

    def test_file_names(self):
        """Fail when a rule file name does not follow the naming standard.

        A valid name consists of 10 to 70 characters from ``[a-z0-9_]`` followed
        by ``.yml`` and must contain at least one underscore. A file is reported
        when it breaks either requirement.
        """
        faulty_rules = []
        # Raw string: "\." is a regex escape, not a Python string escape
        filename_pattern = re.compile(r'[a-z0-9_]{10,70}\.yml')
        for file in self.yield_next_rule_file_path(self.path_to_rules):
            filename = os.path.basename(file)
            # Both requirements must hold, so failing EITHER one is a violation.
            # fullmatch also rejects trailing characters after ".yml".
            if filename_pattern.fullmatch(filename) is None or '_' not in filename:
                print(Fore.YELLOW + "Rule {} has a file name that doesn't match our standard.".format(file))
                faulty_rules.append(file)

        self.assertEqual(faulty_rules, [], Fore.RED +
                         "There are rules with malformed file names (too short, too long, uppercase letters, a minus sign etc.). Please see the file names used in our repository and adjust your file names accordingly. The pattern for a valid file name is '[a-z0-9_]{10,70}\\.yml' and it has to contain at least an underline character.")

    def test_title(self):
        """Fail when a rule title is missing, too long, or badly phrased/capitalized.

        Checks, in order: the title exists; it is at most 70 characters long; it
        does not start with "Detects "; and every all-lowercase word is either an
        allowed filler word, contains "." or "/", or starts with a digit. A file
        is recorded once for each check it fails.
        """
        allowed_lowercase_words = [
            'the', 'for', 'in', 'with', 'via', 'on', 'to', 'without', 'of', 'through',
            'from', 'by', 'as', 'a', 'or', 'at', 'and', 'an', 'over', 'new',
        ]
        faulty_rules = []

        for rule_path in self.yield_next_rule_file_path(self.path_to_rules):
            title = self.get_rule_part(file_path=rule_path, part_name="title")

            # Nothing else can be checked without a title
            if not title:
                print(Fore.RED + "Rule {} has no field 'title'.".format(rule_path))
                faulty_rules.append(rule_path)
                continue

            if len(title) > 70:
                print(Fore.YELLOW + "Rule {} has a title field with too many characters (>70)".format(rule_path))
                faulty_rules.append(rule_path)

            if title.startswith("Detects "):
                print(Fore.RED + "Rule {} has a title that starts with 'Detects'".format(rule_path))
                faulty_rules.append(rule_path)

            wrong_casing = []
            for word in title.split(" "):
                if not word.islower():
                    continue
                # Exemptions: filler words, file names / paths, and words led by a digit
                if word.lower() in allowed_lowercase_words or "." in word or "/" in word or word[0].isdigit():
                    continue
                wrong_casing.append(word)

            if wrong_casing:
                print(Fore.RED + "Rule {} has a title that has not title capitalization. Words: '{}'".format(rule_path, ", ".join(wrong_casing)))
                faulty_rules.append(rule_path)

        self.assertEqual(faulty_rules, [], Fore.RED +
                         "There are rules with non-conform 'title' fields. Please check: https://github.com/Neo23x0/sigma/wiki/Rule-Creation-Guide#title")

    def test_invalid_logsource_attributes(self):
        """Fail when a rule's ``logsource`` section is missing or has unknown keys.

        Only ``category``, ``product``, ``service`` and ``definition`` are
        accepted (compared case-insensitively). Each violation is printed and the
        file recorded, and the test fails if any file was recorded.
        """
        allowed_keys = ('category', 'product', 'service', 'definition')
        faulty_rules = []
        for file in self.yield_next_rule_file_path(self.path_to_rules):
            logsource = self.get_rule_part(file_path=file, part_name="logsource")
            # A missing or non-mapping logsource cannot be iterated key by key;
            # report it instead of crashing the whole test run.
            if not isinstance(logsource, dict):
                print(Fore.RED + "Rule {} has no valid 'logsource' mapping".format(file))
                faulty_rules.append(file)
                continue
            for key in logsource:
                if str(key).lower() not in allowed_keys:
                    print(Fore.RED + "Rule {} has a logsource with an invalid field ({})".format(file, key))
                    faulty_rules.append(file)

        self.assertEqual(faulty_rules, [], Fore.RED +
                         "There are rules with non-conform 'logsource' fields. Please check: https://github.com/Neo23x0/sigma/wiki/Rule-Creation-Guide#log-source")
def get_mitre_data():
    """
    Build the list of known ``attack.*`` tags from live MITRE ATT&CK® data.

    Queries the ATT&CK client for enterprise techniques, tools, malware and
    groups, and returns every collected value prefixed with ``attack.``, in this
    order: technique IDs, technique names, kill-chain phase names, group IDs,
    tool/malware IDs. Names are lower-cased with spaces and dashes turned into
    underscores; IDs are lower-cased.
    """
    def external_ids(stix_objects):
        # Lower-cased external_id of every external reference that carries one
        return [
            reference['external_id'].lower()
            for stix_object in stix_objects
            for reference in stix_object.external_references
            if 'external_id' in reference
        ]

    client = attack_client()

    # Techniques: IDs, normalized names and kill-chain phase names in one pass
    technique_ids = []
    technique_names = []
    phase_names = set()
    for technique in client.get_enterprise_techniques():
        technique_names.append(technique['name'].lower().replace(' ', '_').replace('-', '_'))
        technique_ids.extend(external_ids([technique]))
        if 'kill_chain_phases' not in technique:
            continue
        for phase in technique['kill_chain_phases']:
            if 'phase_name' in phase:
                phase_names.add(phase['phase_name'].replace('-','_'))

    # Tools and malware share one ID list (tools first, then malware)
    software_ids = external_ids(client.get_enterprise_tools())
    software_ids += external_ids(client.get_enterprise_malware())

    # Groups
    group_ids = external_ids(client.get_enterprise_groups())

    # Combine all IDs to a big tag list
    combined = technique_ids + technique_names + list(phase_names) + group_ids + software_ids
    return ["attack." + item for item in combined]


if __name__ == "__main__":
    # Initialise colorama with autoreset so colour codes are reset after each print
    init(autoreset=True)
    # Get current data from MITRE ATT&CK®.
    # NOTE(review): MITRE_ALL is assigned only inside this guard, i.e. only when the
    # file is executed as a script; it is not defined when the module is imported.
    MITRE_ALL = get_mitre_data()
    # Run the tests
    unittest.main()
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00			`#!/usr/bin/env python3`
			`"""`
			`Checks for noncompliance or common errors on all rules`

Added a test for duplicate filters and a test for Source: Eventlog 2019-02-18 18:05:58 +00:00			`Run using the command`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00			`# python -m unittest test_rules.py`
			`"""`

			`import os`
			`import unittest`
			`import yaml`
Added checks for Sysmon 1 or EID 4688 instead of process_creation 2019-03-02 17:51:49 +00:00			`import re`
refactor: tests use live data from MITRE's TAXI service 2020-07-14 15:54:02 +00:00			`from attackcti import attack_client`
feat: colorized output in test 2020-01-30 07:37:47 +00:00			`from colorama import init`
			`from colorama import Fore`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00
			`class TestRules(unittest.TestCase):`
			`MITRE_TECHNIQUE_NAMES = ["process_injection", "signed_binary_proxy_execution", "process_injection"] # incomplete list`
fix: updated MITRE tags in test 2020-03-25 13:04:22 +00:00			`MITRE_TACTICS = ["initial_access", "execution", "persistence", "privilege_escalation", "defense_evasion", "credential_access", "discovery", "lateral_movement", "collection", "exfiltration", "command_and_control", "impact", "launch"]`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00
Corrected path to rules 2019-01-25 09:25:51 +00:00			`path_to_rules = "rules"`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00
			`# Helper functions`
			`def yield_next_rule_file_path(self, path_to_rules:str) -> str:`
			`for root, _, files in os.walk(path_to_rules):`
			`for file in files:`
			`yield os.path.join(root, file)`

			`def get_rule_part(self, file_path:str, part_name:str):`
			`yaml_dicts = self.get_rule_yaml(file_path)`
			`for yaml_part in yaml_dicts:`
			`if part_name in yaml_part.keys():`
			`return yaml_part[part_name]`

			`return None`

			`def get_rule_yaml(self, file_path:str) -> dict:`
			`data = []`

			`with open(file_path) as f:`
Removed deprecated PyYAML API from rule test 2019-04-22 21:21:08 +00:00			`yaml_parts = yaml.safe_load_all(f)`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00			`for part in yaml_parts:`
			`data.append(part)`

			`return data`

			`# Tests`
			`def test_confirm_extension_is_yml(self):`
			`files_with_incorrect_extensions = []`

			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`file_name_and_extension = os.path.splitext(file)`
			`if len(file_name_and_extension) == 2:`
			`extension = file_name_and_extension[1]`
			`if extension != ".yml":`
			`files_with_incorrect_extensions.append(file)`

feat: colorized error messages 2020-01-30 07:50:22 +00:00			`self.assertEqual(files_with_incorrect_extensions, [], Fore.RED +`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00			`"There are rule files with extensions other than .yml")`

			`def test_confirm_correct_mitre_tags(self):`
			`files_with_incorrect_mitre_tags = []`

			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`tags = self.get_rule_part(file_path=file, part_name="tags")`
			`if tags:`
			`for tag in tags:`
refactor: tests use live data from MITRE's TAXI service 2020-07-14 15:54:02 +00:00			`if tag not in MITRE_ALL and tag.startswith("attack."):`
feat: colorized error messages 2020-01-30 07:50:22 +00:00			`print(Fore.RED + "Rule {} has the following incorrect tag {}".format(file, tag))`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00			`files_with_incorrect_mitre_tags.append(file)`
Added a test for duplicate filters and a test for Source: Eventlog 2019-02-18 18:05:58 +00:00
feat: colorized error messages 2020-01-30 07:50:22 +00:00			`self.assertEqual(files_with_incorrect_mitre_tags, [], Fore.RED +`
refactor: ignore sub techniques as long as we do not have a complete list 2020-07-14 09:56:28 +00:00			`"There are rules with incorrect/unknown MITRE Tags. (please inform us about new tags that are not yet supported in our tests) and check the correct tags here: https://attack.mitre.org/ ")`
Added two tests. One for MITRE and another for file extension. 2019-01-22 18:25:13 +00:00
feat: detect duplicate tags 2020-07-27 09:37:58 +00:00			`def test_duplicate_tags(self):`
			`files_with_incorrect_mitre_tags = []`

			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`tags = self.get_rule_part(file_path=file, part_name="tags")`
			`if tags:`
			`known_tags = []`
			`for tag in tags:`
			`if tag in known_tags:`
			`print(Fore.RED + "Rule {} has the duplicate tag {}".format(file, tag))`
			`files_with_incorrect_mitre_tags.append(file)`
			`else:`
			`known_tags.append(tag)`

			`self.assertEqual(files_with_incorrect_mitre_tags, [], Fore.RED +`
			`"There are rules with duplicate tags")`

Added a test to check for duplicate filters in rules 2019-01-25 09:22:28 +00:00			`def test_look_for_duplicate_filters(self):`
			`def check_list_or_recurse_on_dict(item, depth:int) -> None:`
			`if type(item) == list:`
			`check_if_list_contain_duplicates(item, depth)`
			`elif type(item) == dict and depth <= MAX_DEPTH:`
			`for sub_item in item.values():`
			`check_list_or_recurse_on_dict(sub_item, depth + 1)`

			`def check_if_list_contain_duplicates(item:list, depth:int) -> None:`
			`try:`
			`if len(item) != len(set(item)):`
feat: colorized error messages 2020-01-30 07:50:22 +00:00			`print(Fore.RED + "Rule {} has duplicate filters".format(file))`
Added a test to check for duplicate filters in rules 2019-01-25 09:22:28 +00:00			`files_with_duplicate_filters.append(file)`
			`except:`
			`# unhashable types like dictionaries`
			`for sub_item in item:`
			`if type(sub_item) == dict and depth <= MAX_DEPTH:`
			`check_list_or_recurse_on_dict(sub_item, depth + 1)`

			`MAX_DEPTH = 3`
			`files_with_duplicate_filters = []`

			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`detection = self.get_rule_part(file_path=file, part_name="detection")`
			`check_list_or_recurse_on_dict(detection, 1)`

feat: colorized error messages 2020-01-30 07:50:22 +00:00			`self.assertEqual(files_with_duplicate_filters, [], Fore.RED +`
Added a test to check for duplicate filters in rules 2019-01-25 09:22:28 +00:00			`"There are rules with duplicate filters")`

Added a test for unnecessary use of '1 of them' in condition 2019-02-13 18:27:27 +00:00			`def test_single_named_condition_with_x_of_them(self):`
			`faulty_detections = []`

			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`yaml = self.get_rule_yaml(file_path = file)`
			`detection = self.get_rule_part(file_path = file, part_name = "detection")`
Added a test for duplicate filters and a test for Source: Eventlog 2019-02-18 18:05:58 +00:00
Added a test for unnecessary use of '1 of them' in condition 2019-02-13 18:27:27 +00:00			`has_them_in_condition = "them" in detection["condition"]`
			`has_only_one_named_condition = len(detection) == 2`
			`not_multipart_yaml_file = len(yaml) == 1`

			`if has_them_in_condition and \`
			`has_only_one_named_condition and \`
			`not_multipart_yaml_file:`
			`faulty_detections.append(file)`

feat: colorized error messages 2020-01-30 07:50:22 +00:00			`self.assertEqual(faulty_detections, [], Fore.RED +`
Added a test for unnecessary use of '1 of them' in condition 2019-02-13 18:27:27 +00:00			`"There are rules using '1/all of them' style conditions but only have one condition")`

Added a test for duplicate filters and a test for Source: Eventlog 2019-02-18 18:05:58 +00:00			`def test_duplicate_titles(self):`
			`def compare_detections(detection1:dict, detection2:dict) -> bool:`

			`# detections not the same length can't be the same`
			`if len(detection1) != len(detection2):`
			`return False`

			`for named_condition in detection1:`
			`# condition clause must be the same too`
			`if named_condition == "condition":`
			`if detection1["condition"] != detection2["condition"]:`
			`return False`
			`else:`
			`continue`

			`# Named condition must exist in both rule files`
			`if named_condition not in detection2:`
			`return False`

			`if len(detection1[named_condition]) != len(detection2[named_condition]):`
			`return False`

			`for condition in detection1[named_condition]:`
			`if type(condition) != str:`
			`return False`

			`if condition not in detection2[named_condition]:`
			`return False`

			`condition_value1 = detection1[named_condition][condition]`
			`condition_value2 = detection2[named_condition][condition]`

			`if condition_value1 != condition_value2:`
			`return False`

			`return True`

			`faulty_detections = []`
			`files_and_their_detections = {}`

			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`detection = self.get_rule_part(file_path = file, part_name = "detection")`
			`yaml = self.get_rule_yaml(file_path = file)`

			`is_multipart_yaml_file = len(yaml) != 1`
			`if is_multipart_yaml_file:`
			`continue`

			`for key in files_and_their_detections:`
			`if compare_detections(detection, files_and_their_detections[key]):`
			`faulty_detections.append((key, file))`

			`files_and_their_detections[file] = detection`

feat: colorized error messages 2020-01-30 07:50:22 +00:00			`self.assertEqual(faulty_detections, [], Fore.YELLOW +`
Added a test for duplicate filters and a test for Source: Eventlog 2019-02-18 18:05:58 +00:00			`"There are rule files with exactly the same detection logic.")`

			`def test_source_eventlog(self):`
			`faulty_detections = []`

			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`detection = self.get_rule_part(file_path = file, part_name = "detection")`
			`detection_str = str(detection).lower()`
			`if "'source': 'eventlog'" in detection_str:`
			`faulty_detections.append(file)`

feat: colorized error messages 2020-01-30 07:50:22 +00:00			`self.assertEqual(faulty_detections, [], Fore.YELLOW +`
Added a test for duplicate filters and a test for Source: Eventlog 2019-02-18 18:05:58 +00:00			`"There are detections with 'Source: Eventlog'. This does not add value to the detection.")`

Enabled check for process_creation 2019-03-09 18:00:11 +00:00			`def test_event_id_instead_of_process_creation(self):`
Added checks for Sysmon 1 or EID 4688 instead of process_creation 2019-03-02 17:51:49 +00:00			`faulty_detections = []`
			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`with open(file) as f:`
			`for line in f:`
Properly end anchored the regex 2019-03-09 16:23:50 +00:00			`if re.search(r'.*EventID: (?:1|4688)\s*$', line) and file not in faulty_detections:`
Added checks for Sysmon 1 or EID 4688 instead of process_creation 2019-03-02 17:51:49 +00:00			`faulty_detections.append(file)`

feat: colorized error messages 2020-01-30 07:50:22 +00:00			`self.assertEqual(faulty_detections, [], Fore.YELLOW +`
Enabled check for process_creation 2019-03-09 18:00:11 +00:00			`"There are rules still using Sysmon 1 or Event ID 4688. Please migrate to the process_creation category.")`
Added checks for Sysmon 1 or EID 4688 instead of process_creation 2019-03-02 17:51:49 +00:00
feat: detect missing id 2020-01-30 15:08:24 +00:00			`def test_missing_id(self):`
			`faulty_rules = []`
			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`id = self.get_rule_part(file_path=file, part_name="id")`
			`if not id:`
			`print(Fore.YELLOW + "Rule {} has no field 'id'.".format(file))`
			`faulty_rules.append(file)`
			`elif len(id) != 36:`
			`print(Fore.YELLOW + "Rule {} has a malformed 'id' (not 36 chars).".format(file))`
			`faulty_rules.append(file)`

			`self.assertEqual(faulty_rules, [], Fore.RED +`
			`"There are rules with missing or malformed 'id' fields. Create an id (e.g. here: https://www.uuidgenerator.net/version4) and add it to the reported rule(s).")`

add new test for sysmon rules without eventid 2020-05-23 14:25:37 +00:00			`def test_sysmon_rule_without_eventid(self):`
			`faulty_rules = []`
			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`logsource = self.get_rule_part(file_path=file, part_name="logsource")`
			`service = logsource.get('service', '')`
			`if service.lower() == 'sysmon':`
			`with open(file) as f:`
			`found = False`
			`for line in f:`
			`if re.search(r'.*EventID:.*$', line): # might be on a single line or in multiple lines`
			`found = True`
			`break`
			`if not found:`
			`faulty_rules.append(file)`

			`self.assertEqual(faulty_rules, [], Fore.RED +`
			`"There are rules using sysmon events but with no EventID specified")`


feat: detect missing date 2020-01-30 15:08:34 +00:00			`def test_missing_date(self):`
			`faulty_rules = []`
			`for file in self.yield_next_rule_file_path(self.path_to_rules):`
			`datefield = self.get_rule_part(file_path=file, part_name="date")`
			`if not datefield:`
			`print(Fore.YELLOW + "Rule {} has no field 'date'.".format(file))`
			`faulty_rules.append(file)`
			`elif len(datefield) != 10:`
			`print(Fore.YELLOW + "Rule {} has a malformed 'date' (not 10 chars, should be YYYY/MM/DD).".format(file))`
			`faulty_rules.append(file)`

			`self.assertEqual(faulty_rules, [], Fore.RED +`
			`"There are rules with missing or malformed 'date' fields. (create one, e.g. date: 2019/01/14)")`
Added checks for Sysmon 1 or EID 4688 instead of process_creation 2019-03-02 17:51:49 +00:00
def test_references(self):
    """Verify that a 'references' field, when present, is a list.

    Rules whose 'references' field is missing or empty are accepted
    without a warning; only a non-empty value that is not a list is
    reported. The test fails if at least one rule was reported.
    """
    offenders = []
    for rule_path in self.yield_next_rule_file_path(self.path_to_rules):
        refs = self.get_rule_part(file_path=rule_path, part_name="references")
        # Nothing to validate: the field is absent/empty or already a list.
        if not refs or isinstance(refs, list):
            continue
        print(Fore.YELLOW + "Rule {} has a references field that isn't a list.".format(rule_path))
        offenders.append(rule_path)

    self.assertEqual(
        offenders,
        [],
        Fore.RED + "There are rules with malformed 'references' fields. (has to be a list of values even if it contains only a single value)",
    )

def test_file_names(self):
    """Check that every rule file name follows the naming standard.

    A valid name consists of 10 to 70 characters from [a-z0-9_] followed
    by '.yml' and contains at least one underscore. Every file that
    violates either requirement is reported, and the test fails if at
    least one file was reported.
    """
    faulty_rules = []
    # Raw string so that '\.' is a regex escape, not an (invalid) string escape.
    filename_pattern = re.compile(r'[a-z0-9_]{10,70}\.yml')
    for file in self.yield_next_rule_file_path(self.path_to_rules):
        filename = os.path.basename(file)
        # fullmatch: the whole name must fit the pattern, so trailing junk
        # after '.yml' is rejected as well.
        # 'or': a name is faulty when it breaks EITHER rule. With 'and', any
        # name containing an underscore slipped through regardless of the
        # pattern.
        if filename_pattern.fullmatch(filename) is None or '_' not in filename:
            print(Fore.YELLOW + "Rule {} has a file name that doesn't match our standard.".format(file))
            faulty_rules.append(file)

    self.assertEqual(faulty_rules, [], Fore.RED +
                     "There are rules with malformed file names (too short, too long, uppercase letters, a minus sign etc.). Please see the file names used in our repository and adjust your file names accordingly. The pattern for a valid file name is '[a-z0-9_]{10,70}\\.yml' and it has to contain at least an underline character.")

def test_title(self):
    """Check the 'title' field of every rule against the title conventions.

    A rule is reported when its title
      * is missing or empty,
      * is longer than 70 characters,
      * starts with "Detects ", or
      * contains an all-lowercase word that is not in the allow-list
        below, contains neither '.' nor '/', and does not start with
        a digit.
    A rule violating several conventions is recorded once per violation.
    The test fails if at least one rule was reported.
    """
    # Words that may stay lowercase inside a title.
    lowercase_ok = {
        'the', 'for', 'in', 'with', 'via', 'on', 'to', 'without', 'of',
        'through', 'from', 'by', 'as', 'a', 'or', 'at', 'and', 'an',
        'over', 'new',
    }
    flagged = []
    for rule_path in self.yield_next_rule_file_path(self.path_to_rules):
        title = self.get_rule_part(file_path=rule_path, part_name="title")
        if not title:
            print(Fore.RED + "Rule {} has no field 'title'.".format(rule_path))
            flagged.append(rule_path)
            continue

        if len(title) > 70:
            print(Fore.YELLOW + "Rule {} has a title field with too many characters (>70)".format(rule_path))
            flagged.append(rule_path)

        if title.startswith("Detects "):
            print(Fore.RED + "Rule {} has a title that starts with 'Detects'".format(rule_path))
            flagged.append(rule_path)

        # islower() is checked first; it is False for an empty word, so
        # word[0] is never evaluated on the empty strings produced by
        # consecutive spaces.
        miscased = [
            word
            for word in title.split(" ")
            if word.islower()
            and word.lower() not in lowercase_ok
            and "." not in word
            and "/" not in word
            and not word[0].isdigit()
        ]
        if miscased:
            print(Fore.RED + "Rule {} has a title that has not title capitalization. Words: '{}'".format(rule_path, ", ".join(miscased)))
            flagged.append(rule_path)

    self.assertEqual(
        flagged,
        [],
        Fore.RED + "There are rules with non-conform 'title' fields. Please check: https://github.com/Neo23x0/sigma/wiki/Rule-Creation-Guide#title",
    )
Added checks for Sysmon 1 or EID 4688 instead of process_creation 2019-03-02 17:51:49 +00:00
def test_invalid_logsource_attributes(self):
    """Check that the 'logsource' of every rule only uses known attributes.

    The accepted attribute names (compared case-insensitively) are
    'category', 'product', 'service' and 'definition'. A rule is reported
    when it has no logsource at all or when its logsource contains any
    other key. The test fails if at least one rule was reported.
    """
    valid_attributes = ('category', 'product', 'service', 'definition')
    faulty_rules = []
    for file in self.yield_next_rule_file_path(self.path_to_rules):
        logsource = self.get_rule_part(file_path=file, part_name="logsource")
        # get_rule_part returns None when the section is absent; report the
        # rule instead of failing with a TypeError while iterating None.
        if not logsource:
            print(Fore.RED + "Rule {} has no 'logsource'.".format(file))
            faulty_rules.append(file)
            continue
        for key in logsource:
            # str() guards against non-string YAML keys (e.g. numbers).
            if str(key).lower() not in valid_attributes:
                print(Fore.RED + "Rule {} has a logsource with an invalid field ({})".format(file, key))
                # Record the rule so the assertion below can actually fail.
                faulty_rules.append(file)

    self.assertEqual(faulty_rules, [], Fore.RED +
                     "There are rules with non-conform 'logsource' fields. Please check: https://github.com/Neo23x0/sigma/wiki/Rule-Creation-Guide#log-source")
def get_mitre_data():
    """
    Generate tags from live MITRE ATT&CK® TAXI service to get up-to-date data

    Collects, for the enterprise matrix, the external IDs of techniques,
    tools, malware and groups, the normalised technique names and the
    kill-chain phase names, and returns them as one list of strings, each
    prefixed with "attack.".
    """
    def external_ids(stix_object):
        # Lower-cased 'external_id' of every external reference that has one.
        return [
            reference['external_id'].lower()
            for reference in stix_object.external_references
            if 'external_id' in reference
        ]

    # Get ATT&CK information
    client = attack_client()

    # Techniques: IDs, normalised names and kill-chain phase names
    technique_ids = []
    technique_names = []
    phase_names = set()
    for technique in client.get_enterprise_techniques():
        technique_names.append(technique['name'].lower().replace(' ', '_').replace('-', '_'))
        technique_ids.extend(external_ids(technique))
        if 'kill_chain_phases' in technique:
            for phase in technique['kill_chain_phases']:
                if 'phase_name' in phase:
                    phase_names.add(phase['phase_name'].replace('-', '_'))

    # Tools / Malware share a single ID list (tools first, then malware)
    software_ids = []
    for tool in client.get_enterprise_tools():
        software_ids.extend(external_ids(tool))
    for malware in client.get_enterprise_malware():
        software_ids.extend(external_ids(malware))

    # Groups
    group_ids = []
    for group in client.get_enterprise_groups():
        group_ids.extend(external_ids(group))

    # Combine all IDs to a big tag list
    combined = technique_ids + technique_names + list(phase_names) + group_ids + software_ids
    return ["attack." + item for item in combined]
Add logsource attribute rule test 2020-07-13 21:02:28 +00:00

# Script entry point: prepare coloured output and the MITRE tag list, then
# hand control to the unittest runner.
if __name__ == "__main__":
    # Initialise colorama with autoreset enabled.
    init(autoreset=True)
    # Get Current Data from MITRE ATT&CK®
    # NOTE(review): MITRE_ALL is only bound when this file is executed as a
    # script. The module docstring recommends `python -m unittest
    # test_rules.py`, which does not run this guard - confirm that any test
    # reading MITRE_ALL copes with that.
    MITRE_ALL = get_mitre_data()
    # Run the tests
    unittest.main()