2020-06-29 23:19:23 -06:00
|
|
|
# Copyright Elasticsearch B.V. and/or licensed to Elasticsearch B.V. under one
|
2021-03-03 22:12:11 -09:00
|
|
|
# or more contributor license agreements. Licensed under the Elastic License
|
|
|
|
|
# 2.0; you may not use this file except in compliance with the Elastic License
|
|
|
|
|
# 2.0.
|
2020-06-29 23:19:23 -06:00
|
|
|
|
|
|
|
|
"""Detection Rules tests."""
|
2025-07-01 15:20:55 +02:00
|
|
|
|
2020-06-29 23:19:23 -06:00
|
|
|
import json
|
|
|
|
|
import os
|
2025-07-01 15:20:55 +02:00
|
|
|
import pathlib
|
2020-06-29 23:19:23 -06:00
|
|
|
|
2025-07-01 15:20:55 +02:00
|
|
|
from detection_rules.eswrap import combine_sources
|
2020-06-29 23:19:23 -06:00
|
|
|
|
2025-07-01 15:20:55 +02:00
|
|
|
# Absolute directory that contains this file.
CURRENT_DIR = pathlib.Path(__file__).resolve().parents[0]

# "data" sub-directory next to this file, and its true/false positive folders.
DATA_DIR = CURRENT_DIR.joinpath("data")
TP_DIR = DATA_DIR.joinpath("true_positives")
FP_DIR = DATA_DIR.joinpath("false_positives")
|
2020-06-29 23:19:23 -06:00
|
|
|
|
|
|
|
|
|
|
|
|
|
def get_fp_dirs():
    """Iterate over the false-positive directories found directly under ``FP_DIR``.

    Returns:
        A lazy iterator of ``pathlib.Path`` objects, one per sub-directory.
    """
    # pathlib's "*" also matches regular files and dotfiles, so filter explicitly
    # to keep stray entries from being reported as FP directories.
    return (entry for entry in FP_DIR.glob("*") if entry.is_dir())
|
2020-06-29 23:19:23 -06:00
|
|
|
|
|
|
|
|
|
|
|
|
|
def get_fp_data_files():
    """Get FP data files by FP directory name.

    Returns:
        A dict mapping each FP directory name to the result of calling
        ``combine_sources`` with the data loaded from every file in that directory.
    """
    data = {}
    for fp_dir in get_fp_dirs():
        fp_dir_name = pathlib.Path(fp_dir).name
        # Hand the folder over as plain string components: a ``pathlib.Path`` item
        # is not safe for a loader that joins folder parts with ``str.join``
        # (that raises TypeError on non-str items).
        sources = get_data_files("false_positives", fp_dir_name)
        data[fp_dir_name] = combine_sources(*sources.values())

    return data
|
|
|
|
|
|
|
|
|
|
|
2025-07-01 15:20:55 +02:00
|
|
|
def get_data_files_list(*folder, ext="ndjson", recursive=False):
    """Get the TP or FP data file paths found under ``DATA_DIR``.

    Args:
        *folder: Path components (``str`` or path-like) below ``DATA_DIR``.
        ext: File extension to match; a leading dot is tolerated.
        recursive: When true, sub-directories are searched as well.

    Returns:
        A lazy iterator of ``pathlib.Path`` objects matching ``*.<ext>``.
    """
    # os.fspath lets callers pass pathlib.Path components; str.join alone would
    # raise TypeError on them.
    relative = os.path.sep.join(os.fspath(part) for part in folder)
    data_dir = pathlib.Path(DATA_DIR) / relative

    suffix = ext.lstrip(".")
    # "**" is only recursive when it is a whole path component, so it must be
    # separated from the file pattern ("***.ext" is invalid or non-recursive).
    pattern = f"**/*.{suffix}" if recursive else f"*.{suffix}"

    return data_dir.glob(pattern)
|
2020-06-29 23:19:23 -06:00
|
|
|
|
|
|
|
|
|
2025-07-01 15:20:55 +02:00
|
|
|
def get_data_files(*folder, ext="ndjson", recursive=False):
    """Get data from data files.

    Args:
        *folder: Path components below the data directory, forwarded to
            ``get_data_files_list``.
        ext: File extension to load. ``ndjson`` / ``jsonl`` (with or without a
            leading dot) are parsed one JSON document per line; anything else
            is parsed as a single JSON document.
        recursive: Forwarded to ``get_data_files_list``.

    Returns:
        A dict mapping each file's stem to its parsed content: a list of
        documents for line-delimited files, otherwise the parsed JSON value.
    """
    # The default ext carries no dot, so compare the dot-less form; comparing
    # against ".ndjson" would send line-delimited files to json.load and fail.
    line_delimited = ext.lstrip(".") in ("ndjson", "jsonl")

    data_files = {}
    for data_file in get_data_files_list(*folder, ext=ext, recursive=recursive):
        path = pathlib.Path(data_file)
        with path.open(encoding="utf-8") as f:
            if line_delimited:
                # Skip blank lines (e.g. trailing newlines) that are not JSON documents.
                data_files[path.stem] = [json.loads(line) for line in f if line.strip()]
            else:
                data_files[path.stem] = json.load(f)

    return data_files
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
def get_data_file(*folder):
    """Load a single JSON file located under ``DATA_DIR``.

    Args:
        *folder: Path components (``str`` or path-like) of the file, relative
            to ``DATA_DIR``.

    Returns:
        The parsed JSON content, or ``None`` when the path does not exist.
    """
    # os.fspath lets callers pass pathlib.Path components; str.join alone would
    # raise TypeError on them.
    relative = os.path.sep.join(os.fspath(part) for part in folder)
    path = pathlib.Path(DATA_DIR) / relative

    if not path.exists():
        return None

    with path.open(encoding="utf-8") as f:
        return json.load(f)
|