# Automatic Fs low values reduction calculator
This script automatically calculates the config parameter `min_value_for_not_reduce` for Fs low values reduction (for noisy Fs). It was written both for research (prior to writing production code) and for POCs (running versions of the product whose production code does not yet include the automatic Fs low values reduction calculation).

### Assumptions:
This script assumes that there is an accessible MongoDB instance in which the collections whose names start with `scored___aggr_event` are populated. These collections are used to find which Fs are noisy (i.e. Fs for which low values reduction can help reduce the noise).

### Configuration:
* `mongo_ip` should be configured with the right ip.
* `verbose` can be set to `True` in order to print additional output.
* `show_graphs` should be set to `True` only when you want to display graphs (typically in a research environment).
* `aggregated_feature_event_prevalance_stats_path` is the path to the version of the configuration installed for the customer. It is needed so that the reduction applied at runtime can be undone, which lets us see the real values and scores and decide on the right new reduction (which might differ from what was set during the installation process).

### Output:
The names of the Fs that should be reduced are printed, each followed by a number - this is the `min_value_for_not_reduce` parameter. All the other parameters (`max_value_for_fully_reduce` and `reducing_factor`) should be set manually.

In [None]:
import time
import datetime
import sys
sys.path.append('..')
from common.utils import print_verbose
from fs_reduction import main
from common import config
if config.show_graphs:
    import matplotlib.pyplot as plt
    import seaborn as sns
    %matplotlib inline

In [None]:
%load_ext autoreload
%autoreload 2

In [None]:
%%javascript
//IPython.load_extensions('usability\\execute_time\\ExecuteTime');

In [None]:
# Run the analysis by delegating to the project's `fs_reduction.main` module (imported above).
# NOTE(review): presumably this loads the scored aggregated-event data and prints the
# suggested `min_value_for_not_reduce` per F, as the notebook header describes - confirm
# against the `fs_reduction.main` source.
main.load_data_and_run_algo()

In [43]:
good = {"fs_reducers": {"number_of_failed_crmsf_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 4, "reducing_factor": 0.10000000}, "number_of_successful_ssh_daily": {"max_value_for_fully_reduce": 6, "min_value_for_not_reduce": 8, "reducing_factor": 0.30000000}, "number_of_successful_oracle_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_dst_machines_kerberos_logins_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_successful_kerberos_logins_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_successful_kerberos_logins_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 13, "reducing_factor": 0.10000000}, "number_of_failed_oracle_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 2, "reducing_factor": 0.10000000}, "number_of_failed_ssh_daily": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 10, "reducing_factor": 0.10000000}, "distinct_number_of_destination_machines_oracle_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_kerberos_tgt_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "number_of_failed_ntlm_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 10, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_ssh_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_countries_vpn_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.30000000}, "number_of_failed_kerberos_logins_daily": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 2, "reducing_factor": 0.10000000}, 
"number_of_failed_ssh_events_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_dst_machines_ssh_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_successful_ssh_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_dst_machines_kerberos_logins_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_db_objects_oracle_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_vpn_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_ntlm_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.30000000}, "distinct_number_of_src_machines_kerberos_logins_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_src_machines_ssh_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 5, "reducing_factor": 0.10000000}, "distinct_number_of_countries_vpn_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_countries_crmsf_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 4, "reducing_factor": 0.20000000}, "distinct_number_of_countries_crmsf_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 8, "reducing_factor": 0.20000000}, "number_of_successful_crmsf_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 8, "reducing_factor": 0.30000000}, "distinct_number_of_db_objects_oracle_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 
0.10000000}, "distinct_number_of_source_machines_oracle_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_source_machines_oracle_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_vpn_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 5, "reducing_factor": 0.20000000}, "distinct_number_of_dst_machines_ssh_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_src_machines_kerberos_logins_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "number_of_successful_kerberos_tgt_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_failed_kerberos_logins_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 2, "reducing_factor": 0.10000000}}, "hourly_reducer": {"max_value_for_fully_reduce": 0.00067089, "min_value_for_not_reduce": 0.00142790, "reducing_factor": 0.10000000}, "w": {"normalized_username_hourly": {"P": {"highest_score_gwame_hourly": 0.00083203, "sum_of_highest_scores_over_action_type_oracle_hourly": 0.00094790, "sum_of_highest_scores_over_dst_machines_ssh_hourly": 0.00088182, "highest_score_over_date_time_events_vpn_hourly": 0.00074589, "sum_of_highest_scores_per_action_type_wame_hourly": 0.00096257, "sum_of_highest_scores_over_country_vpn_hourly": 0.00075748, "sum_of_highest_scores_over_src_machines_oracle_hourly": 0.00093656, "sum_of_highest_scores_over_failure_code_kerberos_logins_hourly": 0.00065670, "sum_of_highest_scores_over_src_machines_vpn_hourly": 0.00100000, "sum_of_highest_scores_over_db_username_oracle_hourly": 0.00083152, "sum_of_highest_scores_over_src_machines_kerberos_logins_hourly": 0.00077374, "highest_scores_over_failure_code_ntlm_hourly": 0.00082098, 
"sum_of_highest_scores_over_country_crmsf_hourly": 0.00077542, "sum_of_highest_scores_over_src_machines_kerberos_tgt_hourly": 0.00093250, "sum_of_scores_rate_vpn_session_hourly": 0.00070066, "sum_of_highest_scores_over_dest_machines_oracle_hourly": 0.00094435, "highest_date_time_score_wame_hourly": 0.00095568, "highest_score_over_date_time_events_kerberos_logins_hourly": 0.00071770, "highest_score_over_auth_method_events_ssh_hourly": 0.00093031, "highest_score_over_date_time_events_ssh_hourly": 0.00074460, "highest_score_over_date_time_events_oracle_hourly": 0.00085281, "highest_score_over_date_time_events_crmsf_hourly": 0.00085460, "highest_event_time_score_ntlm_hourly": 0.00100000, "sum_of_highest_scores_over_src_machines_prnlog_hourly": 0.00100000, "sum_of_highest_scores_over_dst_machines_prnlog_hourly": 0.00099676, "sum_of_highest_scores_over_dst_machines_kerberos_logins_hourly": 0.00083237, "highest_score_over_date_time_events_prnlog_hourly": 0.00093060, "sum_of_highest_scores_over_status_crmsf_hourly": 0.00081523, "sum_of_highest_scores_over_src_machines_ssh_hourly": 0.00089802, "sum_of_highest_scores_over_src_machines_ntlm_hourly": 0.00093698, "highest_event_time_score_kerberos_tgt_hourly": 0.00080482, "sum_of_file_size_prnlog_hourly": 0.00000001, "sum_of_pages_prnlog_hourly": 0.00100000, "sum_of_highest_scores_over_db_object_oracle_hourly": 0.00083295, "highest_scores_over_failure_code_kerberos_tgt_hourly": 0.00082076, "sum_of_highest_scores_over_return_code_oracle_hourly": 0.00082179}, "F": {"number_of_failed_kerberos_tgt_hourly": 0.07999280, "number_of_failed_crmsf_hourly": 0.08813594, "distinct_number_of_src_machines_prnlog_hourly": 0.09753915, "distinct_number_of_db_usernames_oracle_hourly": 0.07797539, "number_of_successful_oracle_events_hourly": 0.08127811, "distinct_number_of_dst_machines_kerberos_logins_hourly": 0.07918063, "distinct_number_of_events_prnlog_hourly": 0.09508973, "number_of_successful_kerberos_logins_hourly": 0.07877742, 
"number_of_failed_oracle_hourly": 0.07648063, "number_of_events_wame_hourly": 0.09508973, "distinct_number_of_total_pages_prnlog_hourly": 0.09508973, "distinct_number_of_destination_machines_oracle_hourly": 0.07615755, "distinct_number_of_src_machines_ntlm_hourly": 0.09899275, "number_of_events_gwame_hourly": 0.08130556, "number_of_failed_ntlm_hourly": 0.08130556, "distinct_number_of_db_objects_oracle_hourly": 0.07757040, "distinct_number_of_src_machines_vpn_hourly": 0.08719627, "number_of_failed_ssh_events_hourly": 0.08510221, "distinct_number_of_file_size_bytes_prnlog_hourly": 0.09508814, "number_of_successful_ssh_events_hourly": 0.07019710, "distinct_number_of_src_machines_ssh_hourly": 0.07673035, "distinct_number_of_src_machines_kerberos_logins_hourly": 0.09122561, "distinct_number_of_src_machines_kerberos_tgt_hourly": 0.08296688, "distinct_number_of_countries_vpn_hourly": 0.07757014, "distinct_number_of_countries_crmsf_hourly": 0.08296688, "number_of_successful_crmsf_events_hourly": 0.08509111, "number_of_successful_ntlm_events_hourly": 0.09953457, "distinct_number_of_source_machines_oracle_hourly": 0.07714851, "distinct_number_of_dst_machines_ssh_hourly": 0.07907357, "number_of_successful_kerberos_tgt_events_hourly": 0.07742631, "number_of_failed_vpn_events_hourly": 0.09181731, "number_of_failed_kerberos_logins_hourly": 0.07294040}}, "normalized_username_daily": {"P": {"highest_score_over_date_time_events_vpn_daily": 0.00074481, "sum_of_highest_scores_over_src_machines_prnlog_daily": 0.00100000, "sum_of_pages_prnlog_daily": 0.00100000, "sum_of_highest_scores_over_src_machines_ntlm_daily": 0.00086605, "sum_of_highest_scores_over_src_machines_oracle_daily": 0.00100000, "highest_date_time_score_wame_daily": 0.00092310, "highest_score_over_date_time_events_oracle_daily": 0.00086641, "sum_of_highest_scores_over_src_machines_kerberos_logins_daily": 0.00077519, "sum_of_highest_scores_over_failure_code_kerberos_logins_daily": 0.00069869, 
"highest_event_time_score_kerberos_tgt_daily": 0.00080860, "sum_of_highest_scores_over_dst_machines_ssh_daily": 0.00086262, "sum_of_highest_scores_over_src_machines_kerberos_tgt_daily": 0.00100000, "sum_of_highest_scores_over_db_object_oracle_daily": 0.00087661, "sum_of_highest_scores_over_dst_machines_kerberos_logins_daily": 0.00083591, "sum_of_highest_scores_over_dst_machines_prnlog_daily": 0.00100000, "highest_score_gwame_daily": 0.00088167, "sum_of_highest_scores_over_src_machines_vpn_daily": 0.00100000, "sum_of_highest_scores_over_dest_machines_oracle_daily": 0.00097996, "sum_of_highest_scores_over_return_code_oracle_daily": 0.00076399, "sum_of_highest_scores_over_status_crmsf_daily": 0.00081943, "highest_score_over_auth_method_events_ssh_daily": 0.00094275, "sum_of_file_size_prnlog_daily": 0.00000001, "sum_of_highest_scores_per_action_type_wame_daily": 0.00093144, "highest_score_over_date_time_events_kerberos_logins_daily": 0.00071715, "sum_of_highest_scores_over_src_machines_ssh_daily": 0.00089959, "sum_of_highest_scores_over_db_username_oracle_daily": 0.00086641, "highest_score_over_date_time_events_crmsf_daily": 0.00084202, "sum_of_highest_scores_over_country_vpn_daily": 0.00076841, "sum_of_highest_scores_over_action_type_oracle_daily": 0.00099293, "sum_of_scores_rate_vpn_session_daily": 0.00070124, "highest_scores_over_failure_code_ntlm_daily": 0.00080982, "highest_score_over_date_time_events_ssh_daily": 0.00074728, "sum_of_highest_scores_over_country_crmsf_daily": 0.00078751, "highest_scores_over_failure_code_kerberos_tgt_daily": 0.00081207, "highest_event_time_score_ntlm_daily": 0.00099293, "highest_score_over_date_time_events_prnlog_daily": 0.00093251}, "F": {"distinct_number_of_total_pages_prnlog_daily": 0.09194930, "distinct_number_of_countries_vpn_daily": 0.07395026, "number_of_successful_ssh_daily": 0.08094480, "number_of_successful_kerberos_logins_daily": 0.10000000, "distinct_number_of_file_size_bytes_prnlog_daily": 0.09191167, 
"number_of_failed_crmsf_daily": 0.09194930, "number_of_failed_kerberos_tgt_daily": 0.09487406, "distinct_number_of_events_prnlog_daily": 0.09194930, "number_of_failed_ssh_daily": 0.08937909, "distinct_number_of_src_machines_prnlog_daily": 0.09487406, "number_of_successful_kerberos_tgt_events_daily": 0.08949090, "distinct_number_of_src_machines_kerberos_tgt_daily": 0.08772228, "number_of_successful_ntlm_events_daily": 0.09858740, "number_of_failed_ntlm_daily": 0.09194930, "number_of_failed_vpn_daily": 0.10000000, "distinct_number_of_src_machines_ssh_daily": 0.07831642, "number_of_events_wame_daily": 0.09487406, "number_of_failed_kerberos_logins_daily": 0.07529806, "number_of_events_gwame_daily": 0.08782008, "number_of_failed_oracle_daily": 0.08630328, "distinct_number_of_dst_machines_ssh_daily": 0.07551451, "distinct_number_of_dst_machines_kerberos_logins_daily": 0.07684845, "distinct_number_of_db_objects_oracle_daily": 0.08630328, "distinct_number_of_src_machines_vpn_daily": 0.07487054, "distinct_number_of_src_machines_ntlm_daily": 0.08938249, "distinct_number_of_countries_crmsf_daily": 0.08388250, "distinct_number_of_source_machines_oracle_daily": 0.08962071, "distinct_number_of_destination_machines_oracle_daily": 0.08782008, "number_of_successful_crmsf_events_daily": 0.08782008, "distinct_number_of_src_machines_kerberos_logins_daily": 0.08110962, "number_of_successful_oracle_events_daily": 0.08630328, "distinct_number_of_db_usernames_oracle_daily": 0.08630328}}}, "daily_reducer": {"max_value_for_fully_reduce": 0.00067089, "min_value_for_not_reduce": 0.00142790, "reducing_factor": 0.10000000}}
new = {"fs_reducers": {"number_of_failed_crmsf_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 4, "reducing_factor": 0.10000000}, "number_of_successful_ssh_daily": {"max_value_for_fully_reduce": 6, "min_value_for_not_reduce": 8, "reducing_factor": 0.30000000}, "number_of_successful_oracle_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_dst_machines_kerberos_logins_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_successful_kerberos_logins_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_successful_kerberos_logins_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 13, "reducing_factor": 0.10000000}, "number_of_failed_oracle_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 2, "reducing_factor": 0.10000000}, "number_of_failed_ssh_daily": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 10, "reducing_factor": 0.10000000}, "distinct_number_of_destination_machines_oracle_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_kerberos_tgt_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "number_of_failed_ntlm_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 10, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_ssh_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_countries_vpn_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.30000000}, "number_of_failed_kerberos_logins_daily": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 2, "reducing_factor": 0.10000000}, 
"number_of_failed_ssh_events_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_dst_machines_ssh_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_successful_ssh_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_dst_machines_kerberos_logins_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_db_objects_oracle_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_vpn_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_ntlm_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.30000000}, "distinct_number_of_src_machines_kerberos_logins_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_src_machines_ssh_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 5, "reducing_factor": 0.10000000}, "distinct_number_of_countries_vpn_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_countries_crmsf_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 4, "reducing_factor": 0.20000000}, "distinct_number_of_countries_crmsf_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 8, "reducing_factor": 0.20000000}, "number_of_successful_crmsf_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 8, "reducing_factor": 0.30000000}, "distinct_number_of_db_objects_oracle_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 
0.10000000}, "distinct_number_of_source_machines_oracle_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_source_machines_oracle_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "distinct_number_of_src_machines_vpn_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 5, "reducing_factor": 0.20000000}, "distinct_number_of_dst_machines_ssh_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "distinct_number_of_src_machines_kerberos_logins_daily": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.20000000}, "number_of_successful_kerberos_tgt_events_hourly": {"max_value_for_fully_reduce": 2, "min_value_for_not_reduce": 3, "reducing_factor": 0.10000000}, "number_of_failed_kerberos_logins_hourly": {"max_value_for_fully_reduce": 1, "min_value_for_not_reduce": 2, "reducing_factor": 0.10000000}}, "hourly_reducer": {"max_value_for_fully_reduce": 0.00067089, "min_value_for_not_reduce": 0.00142790, "reducing_factor": 0.10000000}, "w": {"normalized_username_hourly": {"P": {"highest_score_gwame_hourly": 0.00083203, "sum_of_highest_scores_over_action_type_oracle_hourly": 0.00094790, "sum_of_highest_scores_over_dst_machines_ssh_hourly": 0.00088182, "highest_score_over_date_time_events_vpn_hourly": 0.00074589, "sum_of_highest_scores_per_action_type_wame_hourly": 0.00096257, "sum_of_highest_scores_over_country_vpn_hourly": 0.00075748, "sum_of_highest_scores_over_src_machines_oracle_hourly": 0.00093656, "sum_of_highest_scores_over_country_crmsf_hourly": 0.00077542, "sum_of_highest_scores_over_src_machines_vpn_hourly": 0.00100000, "sum_of_highest_scores_over_db_username_oracle_hourly": 0.00083152, "highest_event_time_score_kerberos_tgt_hourly": 0.00080482, "highest_scores_over_failure_code_ntlm_hourly": 0.00082098, 
"sum_of_highest_scores_over_failure_code_kerberos_logins_hourly": 0.00065670, "sum_of_highest_scores_over_src_machines_kerberos_tgt_hourly": 0.00093250, "sum_of_highest_scores_over_db_object_oracle_hourly": 0.00083295, "sum_of_highest_scores_over_dest_machines_oracle_hourly": 0.00094435, "highest_date_time_score_wame_hourly": 0.00095568, "highest_score_over_date_time_events_kerberos_logins_hourly": 0.00071770, "highest_score_over_auth_method_events_ssh_hourly": 0.00093031, "highest_score_over_date_time_events_ssh_hourly": 0.00074460, "highest_score_over_date_time_events_oracle_hourly": 0.00085281, "highest_score_over_date_time_events_crmsf_hourly": 0.00085460, "highest_event_time_score_ntlm_hourly": 0.00100000, "sum_of_highest_scores_over_src_machines_prnlog_hourly": 0.00100000, "sum_of_highest_scores_over_dst_machines_prnlog_hourly": 0.00099676, "sum_of_highest_scores_over_dst_machines_kerberos_logins_hourly": 0.00083237, "highest_score_over_date_time_events_prnlog_hourly": 0.00093060, "sum_of_highest_scores_over_src_machines_ssh_hourly": 0.00089802, "sum_of_highest_scores_over_status_crmsf_hourly": 0.00081523, "sum_of_highest_scores_over_src_machines_ntlm_hourly": 0.00093698, "sum_of_highest_scores_over_src_machines_kerberos_logins_hourly": 0.00077374, "sum_of_file_size_prnlog_hourly": 0.00000001, "sum_of_pages_prnlog_hourly": 0.00100000, "sum_of_scores_rate_vpn_session_hourly": 0.00070066, "highest_scores_over_failure_code_kerberos_tgt_hourly": 0.00082076, "sum_of_highest_scores_over_return_code_oracle_hourly": 0.00082179}, "F": {"number_of_failed_kerberos_tgt_hourly": 0.07999280, "number_of_failed_crmsf_hourly": 0.08813594, "distinct_number_of_src_machines_prnlog_hourly": 0.09753915, "distinct_number_of_db_usernames_oracle_hourly": 0.07797539, "number_of_successful_oracle_events_hourly": 0.08127811, "distinct_number_of_dst_machines_kerberos_logins_hourly": 0.07918063, "distinct_number_of_events_prnlog_hourly": 0.09508973, 
"number_of_successful_kerberos_logins_hourly": 0.07877742, "number_of_failed_oracle_hourly": 0.07648063, "number_of_events_wame_hourly": 0.09508973, "distinct_number_of_total_pages_prnlog_hourly": 0.09508973, "distinct_number_of_destination_machines_oracle_hourly": 0.07615755, "distinct_number_of_src_machines_ntlm_hourly": 0.09899275, "number_of_events_gwame_hourly": 0.08130556, "number_of_failed_ntlm_hourly": 0.08130556, "distinct_number_of_db_objects_oracle_hourly": 0.07757040, "distinct_number_of_src_machines_vpn_hourly": 0.08719627, "number_of_failed_ssh_events_hourly": 0.08510221, "distinct_number_of_file_size_bytes_prnlog_hourly": 0.09508814, "number_of_successful_ssh_events_hourly": 0.07019710, "distinct_number_of_src_machines_ssh_hourly": 0.07673035, "distinct_number_of_src_machines_kerberos_logins_hourly": 0.09122561, "distinct_number_of_src_machines_kerberos_tgt_hourly": 0.08296688, "distinct_number_of_countries_vpn_hourly": 0.07757014, "distinct_number_of_countries_crmsf_hourly": 0.08296688, "number_of_successful_crmsf_events_hourly": 0.08509111, "number_of_successful_ntlm_events_hourly": 0.09953457, "distinct_number_of_source_machines_oracle_hourly": 0.07714851, "distinct_number_of_dst_machines_ssh_hourly": 0.07907357, "number_of_successful_kerberos_tgt_events_hourly": 0.07742631, "number_of_failed_vpn_events_hourly": 0.09181731, "number_of_failed_kerberos_logins_hourly": 0.07294040}}, "normalized_username_daily": {"P": {"highest_score_over_date_time_events_vpn_daily": 0.00074481, "sum_of_highest_scores_over_src_machines_prnlog_daily": 0.00100000, "sum_of_pages_prnlog_daily": 0.00100000, "sum_of_highest_scores_over_src_machines_ntlm_daily": 0.00086605, "sum_of_highest_scores_over_src_machines_oracle_daily": 0.00100000, "highest_date_time_score_wame_daily": 0.00092310, "highest_score_over_date_time_events_oracle_daily": 0.00086641, "sum_of_highest_scores_over_src_machines_kerberos_logins_daily": 0.00077519, 
"sum_of_highest_scores_over_failure_code_kerberos_logins_daily": 0.00069869, "highest_score_over_date_time_events_kerberos_logins_daily": 0.00071715, "sum_of_highest_scores_over_dst_machines_ssh_daily": 0.00086262, "sum_of_highest_scores_over_src_machines_kerberos_tgt_daily": 0.00100000, "sum_of_highest_scores_over_db_object_oracle_daily": 0.00087661, "sum_of_highest_scores_over_dst_machines_kerberos_logins_daily": 0.00083591, "sum_of_highest_scores_over_dst_machines_prnlog_daily": 0.00100000, "highest_score_gwame_daily": 0.00088167, "sum_of_highest_scores_over_src_machines_vpn_daily": 0.00100000, "sum_of_highest_scores_over_dest_machines_oracle_daily": 0.00097996, "sum_of_file_size_prnlog_daily": 0.00000001, "sum_of_highest_scores_over_status_crmsf_daily": 0.00081943, "highest_score_over_auth_method_events_ssh_daily": 0.00094275, "sum_of_highest_scores_over_return_code_oracle_daily": 0.00076399, "sum_of_highest_scores_per_action_type_wame_daily": 0.00093144, "highest_event_time_score_kerberos_tgt_daily": 0.00080860, "sum_of_highest_scores_over_src_machines_ssh_daily": 0.00089959, "sum_of_highest_scores_over_db_username_oracle_daily": 0.00086641, "highest_score_over_date_time_events_crmsf_daily": 0.00084202, "sum_of_highest_scores_over_country_vpn_daily": 0.00076841, "sum_of_highest_scores_over_action_type_oracle_daily": 0.00099293, "sum_of_scores_rate_vpn_session_daily": 0.00070124, "highest_scores_over_failure_code_ntlm_daily": 0.00080982, "highest_score_over_date_time_events_ssh_daily": 0.00074728, "sum_of_highest_scores_over_country_crmsf_daily": 0.00078751, "highest_scores_over_failure_code_kerberos_tgt_daily": 0.00081207, "highest_event_time_score_ntlm_daily": 0.00099293, "highest_score_over_date_time_events_prnlog_daily": 0.00093251}, "F": {"distinct_number_of_total_pages_prnlog_daily": 0.09194930, "distinct_number_of_source_machines_oracle_daily": 0.08962071, "distinct_number_of_countries_vpn_daily": 0.07395026, "number_of_successful_ssh_daily": 0.08094480, 
"distinct_number_of_destination_machines_oracle_daily": 0.08782008, "number_of_successful_kerberos_logins_daily": 0.10000000, "distinct_number_of_file_size_bytes_prnlog_daily": 0.09191167, "number_of_failed_kerberos_tgt_daily": 0.09487406, "distinct_number_of_events_prnlog_daily": 0.09194930, "number_of_failed_ssh_daily": 0.08937909, "distinct_number_of_src_machines_prnlog_daily": 0.09487406, "distinct_number_of_src_machines_kerberos_logins_daily": 0.08110962, "distinct_number_of_src_machines_kerberos_tgt_daily": 0.08772228, "number_of_successful_ntlm_events_daily": 0.09858740, "number_of_failed_ntlm_daily": 0.09194930, "distinct_number_of_src_machines_ssh_daily": 0.07831642, "number_of_events_wame_daily": 0.09487406, "number_of_failed_kerberos_logins_daily": 0.07529806, "number_of_events_gwame_daily": 0.08782008, "number_of_failed_oracle_daily": 0.08630328, "distinct_number_of_dst_machines_ssh_daily": 0.07551451, "distinct_number_of_dst_machines_kerberos_logins_daily": 0.07684845, "distinct_number_of_db_objects_oracle_daily": 0.08630328, "distinct_number_of_src_machines_vpn_daily": 0.07487054, "distinct_number_of_src_machines_ntlm_daily": 0.08938249, "distinct_number_of_countries_crmsf_daily": 0.08388250, "number_of_failed_crmsf_daily": 0.09194930, "number_of_failed_vpn_daily": 0.10000000, "number_of_successful_crmsf_events_daily": 0.08782008, "number_of_successful_kerberos_tgt_events_daily": 0.08949090, "number_of_successful_oracle_events_daily": 0.08630328, "distinct_number_of_db_usernames_oracle_daily": 0.08630328}}}, "daily_reducer": {"max_value_for_fully_reduce": 0.00067089, "min_value_for_not_reduce": 0.00142790, "reducing_factor": 0.10000000}}

In [44]:
# Sanity check: names of the Fs that have a reducer in exactly one of the two
# configurations (`new` vs `good`). An empty set means both configurations
# define reducers for the same Fs.
# Iterating a dict yields its keys on both Python 2 and Python 3, so this avoids
# `dict.iterkeys()` (removed in Python 3); `^` is the set symmetric difference,
# equivalent to (new - good) | (good - new).
set(new['fs_reducers']) ^ set(good['fs_reducers'])

set()