ampel/contrib/hu/t2/T2BayesianBlocks.py

#!/usr/bin/env python
# -*- coding: utf-8 -*-
# File              : ampel/contrib/hu/t2/T2BayesianBlocks.py
# License           : BSD-3-Clause
# Author            : Eleni
# Date              : 28.04.2021
# Last Modified Date: 10.01.2023
# Last Modified By  : Eleni

import itertools
import math
import os
from collections.abc import Sequence
from typing import Any

import matplotlib.pyplot as plt  # type: ignore
import more_itertools as mit
import numpy as np
import pandas as pd  # type: ignore
from astropy.stats import bayesian_blocks  # type: ignore
from numpy.typing import ArrayLike
from scipy.signal import find_peaks  # type: ignore
from sklearn.metrics import mean_squared_error  # type: ignore
from uncertainties import unumpy  # type: ignore

from ampel.abstract.AbsLightCurveT2Unit import AbsLightCurveT2Unit
from ampel.contrib.hu.utils import flatten
from ampel.model.PlotProperties import PlotProperties
from ampel.plot.create import create_plot_record
from ampel.struct.UnitResult import UnitResult
from ampel.types import StockId, UBson
from ampel.view.LightCurve import LightCurve
from ampel.ztf.util.ZTFIdMapper import ZTFIdMapper
from ampel.ztf.util.ZTFNoisifiedIdMapper import ZTFNoisifiedIdMapper

# ruff: noqa: E712


class T2BayesianBlocks(AbsLightCurveT2Unit):
    """
    T2 unit for running a bayesian block search algorithm to highlight excess regions.
    Currently implemented for WISE infrared and ZTF optical lightcurves.
    """

    min_det_per_block: float = 1  # Minimum detections per block
    # blocks with lower number of detections will be removed

    # Rejection sigma
    rej_sigma: float = 3  # A lower number will more aggressively reject data

    # Plot
    plot: bool = True

    # Use Npoints per observed datapoint
    Npoints: bool = False

    # Type of data we will process, valid ztf_alert, ztf_fp, wise
    data_type: str = "wise"

    debug: bool = False

    debug_dir: None | str

    # in case of ZTF: Must be called 'ZTF_g', 'ZTF_r', 'ZTF_i'
    filters: Sequence[str]

    # Work with fluxes instead of magnitude
    flux: bool = False
    #
    plot_props: None | PlotProperties
    # Color of filters for the plots

    PlotColor: Sequence[str] = ["red", "blue"]

    def get_baseline(self, df, baye_block):
        if self.flux:
            if self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
                baseline_df = baye_block.copy()
                baseline_df.sort_values(by="mag", inplace=True)
                for index, row in baseline_df.iterrows():
                    if row["measurements_nu"] < 5:
                        baseline_df.drop(index, inplace=True)

                if len(baseline_df) == 0:
                    baseline_df = baye_block.copy()

                baseline = baseline_df["mag"][baseline_df["mag"].idxmin()]
                baseline_sigma = baseline_df["mag.err"][baseline_df["mag"].idxmin()]
                baye_block.loc[baye_block["mag"].idxmin(), "level"] = "baseline"

            elif self.data_type == "wise":
                # baseline = baye_block["mag"][baye_block["mag"].idxmin()]
                # baseline_sigma = baye_block["mag.err"][baye_block["mag"].idxmin()]
                baye_block.loc[baye_block["mag"].idxmin(), "level"] = "baseline"
                (baseline, baseline_sigma, baseline_rms) = self.calculate_baseline(
                    df, baye_block
                )

                if baye_block["measurements_nu"][baye_block["mag"].idxmin()] == 1:
                    #   baye_block.loc[baye_block["mag"].idxmin(), "level"] = "baseline"
                    baye_block.loc[
                        baye_block.index[
                            baye_block["mag"]
                            == baye_block.sort_values(by=["mag"]).iloc[1]["mag"]
                        ].tolist()[0],
                        "level",
                    ] = "baseline"
                    (baseline, baseline_sigma, baseline_rms) = self.calculate_baseline(
                        df, baye_block
                    )
            #       value = unumpy.uarray(
            #           np.array(baye_block[baye_block["level"] == "baseline"]["mag"]),
            #           np.array(
            #               baye_block[baye_block["level"] == "baseline"]["mag.err"]
            #           ),
            #       )
            #       baseline = np.mean(value).nominal_value
            #       baseline_sigma = np.mean(value).std_dev
        else:
            baseline = baye_block["mag"][baye_block["mag"].idxmax()]
            baseline_sigma = baye_block["mag.err"][baye_block["mag"].idxmax()]
            baye_block["level"][baye_block["mag"].idxmax()] = "baseline"

            if baye_block["measurements_nu"][baye_block["mag"].idxmax()] == 1:
                #       baye_block["level"][baye_block["mag"].idxmax()] = "baseline"
                baye_block["level"][
                    baye_block.index[
                        baye_block["mag"]
                        == baye_block.sort_values(by=["mag"]).iloc[-2]["mag"]
                    ].tolist()[0]
                ] = "baseline"
                value = unumpy.uarray(
                    np.array(baye_block[baye_block["level"] == "baseline"]["mag"]),
                    np.array(baye_block[baye_block["level"] == "baseline"]["mag.err"]),
                )
                baseline = np.mean(value).nominal_value
                baseline_sigma = np.mean(value).std_dev

        if np.isnan(baseline_sigma):
            baseline_sigma = baye_block.sort_values(by="mag.err", ascending=False)[
                "mag.err"
            ].iloc[0]
        return (baseline, baseline_sigma)

    def calculate_baseline(self, df, baye_block):
        baseline_region = baye_block[baye_block["level"] == "baseline"]
        baseline_values = []
        baseline_error_values = []
        for i in baseline_region.index:
            baseline_values.append(
                df[
                    df["jd"].between(
                        baseline_region["jd_measurement_start"][i],
                        baseline_region["jd_measurement_end"][i],
                        inclusive="both",
                    )
                ]["mag"].values
            )
            baseline_error_values.append(
                df[
                    df["jd"].between(
                        baseline_region["jd_measurement_start"][i],
                        baseline_region["jd_measurement_end"][i],
                        inclusive="both",
                    )
                ]["mag.err"].values
            )

        value = unumpy.uarray(
            list(itertools.chain(*baseline_values)),
            list(itertools.chain(*baseline_error_values)),
        )
        baseline = np.mean(value).nominal_value
        baseline_sigma = np.mean(value).std_dev
        baseline_rms = mean_squared_error(
            list(itertools.chain(*baseline_values)),
            [baseline] * len(list(itertools.chain(*baseline_values))),
            squared=False,
        )
        return (baseline, baseline_sigma, baseline_rms)

    def baye_block_levels(self, df, baye_block, baseline, baseline_sigma):
        for nu, mag in enumerate(baye_block["mag"]):
            idx = baye_block.index.tolist()[nu]
            if np.isnan(baye_block["mag.err"][idx]):
                if abs((baseline - mag) / baseline_sigma) < self.rej_sigma:
                    baye_block.loc[idx, "level"] = "baseline"
                else:
                    baye_block.loc[idx, "level"] = "excess"
            elif baye_block["level"][idx] != "baseline":
                if (
                    baseline + (self.rej_sigma * baseline_sigma)
                    >= mag
                    >= baseline - (self.rej_sigma * baseline_sigma)
                ) and (
                    baseline + (self.rej_sigma * baseline_sigma)
                    >= mag - baye_block["mag.err"][idx]
                ):
                    baye_block.loc[idx, "level"] = "baseline"
                else:
                    baye_block.loc[idx, "level"] = "excess"
        (baseline, baseline_sigma, baseline_rms) = self.calculate_baseline(
            df, baye_block
        )
        return (baye_block, baseline, baseline_sigma, baseline_rms)

    def baye_block_levels_with_changing_baseline(
        self, df, baye_block, baseline, baseline_sigma
    ):
        for mag in baye_block.sort_values(by="mag")["mag"]:
            #  idx = baye_block.index.tolist()[nu]
            idx = baye_block.index[baye_block["mag"] == mag].tolist()[0]
            if np.isnan(baye_block["mag.err"][idx]):
                if abs((baseline - mag) / baseline_sigma) < self.rej_sigma:
                    baye_block.loc[idx, "level"] = "baseline"
                else:
                    baye_block.loc[idx, "level"] = "excess"
            elif baye_block["level"][idx] != "baseline":
                diff = abs(baseline - mag)
                diff_e = np.sqrt(baseline_sigma**2 + baye_block["mag.err"][idx] ** 2)
                diff_significance = diff / diff_e

                if diff_significance <= self.rej_sigma:
                    baye_block.loc[idx, "level"] = "baseline"

                else:
                    baye_block.loc[idx, "level"] = "excess"

            if "baseline" in baye_block["level"].values:
                (baseline, baseline_sigma, baseline_rms) = self.calculate_baseline(
                    df, baye_block
                )
        return (baye_block, baseline, baseline_sigma, baseline_rms)

    def idx_of_excess_regions(self, excess_region) -> list[ArrayLike]:
        length = 1
        excess_regions: list[ArrayLike] = []
        for nu in range(1, len(excess_region) + 1):
            if (
                nu == len(excess_region)
                or excess_region.index[nu] - excess_region.index[nu - 1] != 1
            ):
                if length == 1:
                    excess_regions.append([excess_region.index[nu - length]])
                elif length == len(excess_region):
                    excess_regions.append(
                        np.arange(
                            excess_region.index[0], excess_region.index[nu - 1] + 1
                        )
                    )
                else:
                    excess_regions.append(
                        np.arange(
                            excess_region.index[nu - length],
                            excess_region.index[nu - 1] + 1,
                        )
                    )
                length = 1
            else:
                length += 1
        return excess_regions

    def outliers(self, excess_regions, df, baye_block, measurements_nu):
        for value in excess_regions:
            if (
                len(value) == 1
                and measurements_nu[value[0]] == 1.0
                and (
                    baye_block["Npoints"][value[0]] == 1
                    and baye_block["sigma_from_baseline"][value[0]] > 5.0
                )
            ):
                df.loc[
                    df.index[
                        df["jd"].between(
                            baye_block["jd_measurement_start"][value[0]],
                            baye_block["jd_measurement_end"][value[0]],
                            inclusive="both",
                        )
                    ].tolist()[0],
                    "Outlier",
                ] = True
                baye_block.loc[value[0], "level"] = "outlier"
        return baye_block

    def description(self, excess_regions: list, measurements_nu: dict) -> list:
        # 0: The excess region has one baye block with one measurement, 1: The excess region has one baye block with multiple measurements, 2: The excess region has multiple baye blocks
        description = []
        for value in excess_regions:
            if len(value) == 1:
                if measurements_nu[value[0]] == 1.0:
                    description.append(0)
                else:
                    description.append(1)
            else:
                description.append(2)

        return description

    def coincide_peak_block(self, output_per_filter: dict) -> int:
        # It returns 1 if the PEAK mag bayesian regions of different filters coincide; -1 otherwise

        coincide_region = 0
        # we select the first filter to later compare it to the others
        if len(self.filters_lc) < 2:
            return coincide_region

        if self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
            base_filter = "ZTF_g"
            # as the i-band is spotty in the case of ZTF, we skip it
            compare_filters = [
                i for i in self.filters_lc if i not in [base_filter, "ZTF_i"]
            ]
        elif self.data_type == "wise":
            base_filter = "Wise_W1"
            compare_filters = [i for i in self.filters_lc if i != base_filter]

        if output_per_filter[base_filter].get("nu_of_excess_regions") in [0, None]:
            return coincide_region

        if self.flux:
            idx = np.argmax(output_per_filter[base_filter]["max_mag_excess_region"])
        else:
            idx = np.argmin(output_per_filter[base_filter]["max_mag_excess_region"])
        start_region = output_per_filter[base_filter]["jd_excess_regions"][idx][0]
        end_region = output_per_filter[base_filter]["jd_excess_regions"][idx][-1]

        # now we select the other filters
        for compare_filter in compare_filters:
            if output_per_filter[compare_filter].get("nu_of_excess_regions") in [
                0,
                None,
            ]:
                return coincide_region

            if int(output_per_filter[compare_filter].get("nu_of_excess_regions")) > 0:
                if self.flux:
                    idx = np.argmax(
                        output_per_filter[compare_filter]["max_mag_excess_region"]
                    )
                else:
                    idx = np.argmin(
                        output_per_filter[compare_filter]["max_mag_excess_region"]
                    )
                if (
                    (
                        output_per_filter[compare_filter]["jd_excess_regions"][idx][-1]
                        >= start_region
                        >= output_per_filter[compare_filter]["jd_excess_regions"][idx][
                            0
                        ]
                    )
                    or (
                        output_per_filter[compare_filter]["jd_excess_regions"][idx][-1]
                        >= end_region
                        >= output_per_filter[compare_filter]["jd_excess_regions"][idx][
                            0
                        ]
                    )
                    or (
                        start_region
                        <= output_per_filter[compare_filter]["jd_excess_regions"][idx][
                            0
                        ]
                        <= end_region
                    )
                ):
                    coincide_region += 1
        return coincide_region

    @staticmethod
    def fill_with_empty(output: dict) -> dict:
        """
        If unit fails, return empty output dict (with all the keys)
        """
        output["nu_of_excess_regions"] = None
        output["nu_of_excess_blocks"] = None
        output["nu_of_baseline_regions"] = None
        output["jd_excess_regions"] = []
        output["mag_edge_excess"] = None
        output["max_mag_excess_region"] = None
        output["max_jd_excess_region"] = None
        output["max_sigma_excess_region"] = None
        output["max_baye_block_timescale"] = None
        output["baseline"] = None
        output["baseline_sigma"] = None
        output["baseline_rms"] = None
        output["jd_baseline_regions"] = None
        output["jd_outlier"] = None
        output["mag_edge_baseline"] = None
        output["sigma_from_baseline"] = None
        output["sigma_from_baseline_excess"] = None
        output["significance_of_variability_excess"] = [None, None]
        output["significance_of_fluctuation"] = None
        output["max_mag"] = None
        output["significance"] = None
        output["strength_sjoert"] = None
        output["description"] = None

        return output

    def count_overlapping_regions(self, output_per_filter: dict) -> int:
        """
        Returns the number of overlapping regions. Note: In case of ZTF data, we only consider the g- and r-band (i-band coverage is spotty)
        """
        coincidences = 0

        if self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
            basefilter = "ZTF_g"
            comparefilter = "ZTF_r"

        elif self.data_type == "wise":
            if len(self.filters_lc) < 2:
                return coincidences
            basefilter = self.filters_lc[0]
            comparefilter = self.filters_lc[1]

        baseoutput = output_per_filter[basefilter]
        compareoutput = output_per_filter[comparefilter]

        if (
            baseoutput.get("nu_of_excess_regions") == 0
            or compareoutput["nu_of_excess_regions"] == 0
        ):
            return coincidences

        remaining_regions = compareoutput["jd_excess_regions"]
        comp_regions_checked = []

        for region_base in baseoutput["jd_excess_regions"]:
            for region_comp in remaining_regions:
                if region_comp not in comp_regions_checked:
                    latest_start = max(region_base[0], region_comp[0])
                    earliest_end = min(region_base[1], region_comp[1])
                    delta = earliest_end - latest_start

                    if delta > 0:
                        coincidences += 1
                        comp_regions_checked.append(region_comp)

        return coincidences

    def process(self, light_curve: LightCurve) -> UBson | UnitResult:
        """ """
        assert self.data_type in ["ztf_alert", "ztf_fp", "wise", "ztf_fp_noisy"]

        if self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
            if isinstance(light_curve.stock_id, int):
                if self.data_type in [
                    "ztf_alert",
                    "ztf_fp",
                ]:
                    self.ztfid = ZTFIdMapper.to_ext_id(light_curve.stock_id)
                else:
                    self.ztfid = ZTFNoisifiedIdMapper.to_ext_id(light_curve.stock_id)

            if self.debug:
                print("---------------------------")
                print(f"Processing {self.ztfid}")
                print("---------------------------")
            self.PlotColor = ["green", "red", "orange"]

            for entry in self.filters:
                assert entry in ["ZTF_g", "ZTF_r", "ZTF_i"]

        ################################
        ######## Bayesian blocks #######
        output_per_filter: dict[str, Any] = {}

        self.filters_lc = self.filters

        if self.plot:
            fig = plt.figure()
            ax = fig.add_subplot(len(self.filters_lc) + 1, 1, 1)

        for fid, passband in enumerate(self.filters_lc, 1):
            baye_block = pd.DataFrame(
                columns=[
                    "jd_start",
                    "jd_end",
                    "jd_measurement_start",
                    "jd_measurement_end",
                    "mag",
                    "mag.err",
                    "measurements_nu",
                    "sigma_from_old_baseline",
                    "sigma_from_baseline",
                    "mag_edge",
                ]
            )
            output: dict[str, Any] = {
                "mag_edge_excess": [],
                "max_mag_excess_region": [],
                "max_jd_excess_region": [],
                "max_sigma_excess_region": [],
                "nu_of_excess_blocks": [],
                "significance_after_peak": [],
                "strength_after_peak": [],
                "jd_baseline_regions": [],
                "mag_edge_baseline": [],
                "significance_of_variability_excess": [[], []],
            }

            if self.data_type in ["ztf_fp", "ztf_fp_noisy"]:
                if self.flux:
                    phot_tuple = light_curve.get_ntuples(
                        ["jd", "flux_Jy", "flux_err_Jy"],
                        {"attribute": "fid", "operator": "==", "value": fid},
                    )

                else:
                    phot_tuple = light_curve.get_ntuples(
                        ["jd", "magpsf", "sigmapsf"],
                        {"attribute": "fid", "operator": "==", "value": fid},
                    )
            elif self.data_type == "ztf_alert":
                if self.flux:
                    raise ValueError("Not implemented yet")
                phot_tuple = light_curve.get_ntuples(
                    ["jd", "magpsf", "sigmapsf"],
                    {"attribute": "fid", "operator": "==", "value": fid},
                )
            elif self.data_type == "wise":
                if self.flux:
                    if self.Npoints:
                        phot_tuple = light_curve.get_ntuples(
                            ["jd", "mean_flux", "flux_rms", "flux_density_Npoints"],
                            [
                                {
                                    "attribute": "filter",
                                    "operator": "==",
                                    "value": passband,
                                },
                                {
                                    "attribute": "flux_ul",
                                    "operator": "==",
                                    "value": "False",
                                },
                            ],
                        )
                    else:
                        phot_tuple = light_curve.get_ntuples(
                            ["jd", "mean_flux", "flux_rms"],
                            [
                                {
                                    "attribute": "filter",
                                    "operator": "==",
                                    "value": passband,
                                },
                                {
                                    "attribute": "flux_ul",
                                    "operator": "==",
                                    "value": "False",
                                },
                            ],
                        )
                elif self.Npoints:
                    phot_tuple = light_curve.get_ntuples(
                        ["jd", "magpsf", "sigmapsf", "mag_Npoints"],
                        [
                            {
                                "attribute": "filter",
                                "operator": "==",
                                "value": passband,
                            },
                            {
                                "attribute": "mag_ul",
                                "operator": "==",
                                "value": "False",
                            },
                        ],
                    )
                else:
                    phot_tuple = light_curve.get_ntuples(
                        ["jd", "magpsf", "sigmapsf"],
                        [
                            {
                                "attribute": "filter",
                                "operator": "==",
                                "value": passband,
                            },
                            {
                                "attribute": "mag_ul",
                                "operator": "==",
                                "value": "False",
                            },
                        ],
                    )

            output_per_filter[passband] = []

            if phot_tuple is None or len(phot_tuple) <= 1:
                output = self.fill_with_empty(output)
                output_per_filter[str(passband)] = output
                continue

            if self.Npoints:
                df = pd.DataFrame(
                    phot_tuple, columns=["jd", "mag", "mag.err", "Npoints"]
                )
            else:
                df = pd.DataFrame(phot_tuple, columns=["jd", "mag", "mag.err"])

            # Now we use a rolling window as extreme outlier rejection for ZTF data
            if self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
                df["median"] = df["mag"].rolling(10).median()
                df["std"] = df["mag"].rolling(10).std()
                df = df[
                    (df.mag <= df["median"] + 3 * df["std"])
                    & (df.mag >= df["median"] - 3 * df["std"])
                ]

            df = df.sort_values(by=["jd"], ignore_index=True)
            df["Outlier"] = False

            if len(df) == 0:
                output = self.fill_with_empty(output)
                output_per_filter[str(passband)] = output
                continue

            if self.data_type == "wise":
                ncp_prior = 1.32 + 0.577 * math.log10(len(df))
            elif self.data_type in ["ztf_fp", "ztf_fp_noisy"]:
                ncp_prior = 10 * math.log10(len(df))

            """
            in case multiple measurements have the same
            jd (there are cases where df['jd'].unique() contains no
            unique values, but np.unique(df['jd'].values) does, for
            whichever reason). We simply use the first of the measurements
            with the same jd
            """
            unique_jd, unique_jd_idx = np.unique(df["jd"].values, return_index=True)

            edges = bayesian_blocks(
                unique_jd,
                df["mag"].values[unique_jd_idx],
                sigma=df["mag.err"].values[unique_jd_idx],
                ncp_prior=ncp_prior,
                fitness="measures",
            )

            for i in range(1, len(edges)):
                baye_block_all = df.loc[
                    df["jd"].between(edges[i - 1], edges[i], inclusive="both")
                ]

                all_value_per_block = unumpy.uarray(
                    np.array(baye_block_all["mag"]), np.array(baye_block_all["mag.err"])
                )

                if self.data_type == "wise":
                    mag_err = np.mean(all_value_per_block).std_dev

                elif self.data_type in ["ztf_fp", "ztf_fp_noisy"]:
                    mag_err = mean_squared_error(
                        unumpy.nominal_values(all_value_per_block),
                        [np.mean(all_value_per_block).nominal_value]
                        * len(all_value_per_block),
                        squared=False,
                    )

                to_append = pd.DataFrame(
                    {
                        "jd_start": edges[i - 1],
                        "jd_end": edges[i],
                        "jd_measurement_start": min(baye_block_all["jd"]),
                        "jd_measurement_end": max(baye_block_all["jd"]),
                        "mag": np.mean(all_value_per_block).nominal_value,
                        "mag.err": mag_err,
                        "measurements_nu": len(baye_block_all),
                        "mag_edge": baye_block_all["mag"][
                            baye_block_all["jd"].idxmax()
                        ],
                    },
                    index=[0],
                )

                if self.Npoints:
                    to_append["Npoints"] = [np.array(baye_block_all["Npoints"])]

                baye_block = pd.concat([baye_block, to_append], ignore_index=True)

            baye_block["level"] = None

            """
            Now we remove bayesian blocks with less detections
            than min_det_per_block
            """
            for index, row in baye_block.iterrows():
                if row["measurements_nu"] < self.min_det_per_block:
                    baye_block.drop(index, inplace=True)
            baye_block.reset_index(drop=True, inplace=True)

            if len(baye_block) == 0:
                output = self.fill_with_empty(output)
                output_per_filter[str(passband)] = output
                continue

            baye_block = baye_block.astype(
                {
                    "jd_start": "float",
                    "jd_end": "float",
                    "jd_measurement_start": "float",
                    "jd_measurement_end": "float",
                    "mag": "float",
                    "mag.err": "float",
                    "measurements_nu": "float",
                    "sigma_from_old_baseline": "float",
                    "sigma_from_baseline": "float",
                    "mag_edge": "float",
                }
            )
            #######################################
            ######### Find the baseline ###########
            for sigma_discr in ["sigma_from_old_baseline", "sigma_from_baseline"]:
                (baseline_init, baseline_init_sigma) = self.get_baseline(df, baye_block)

                if sigma_discr == "sigma_from_old_baseline":
                    (baseline, baseline_sigma) = self.get_baseline(df, baye_block)
                    baseline = baseline_init
                    baseline_sigma = baseline_init_sigma
                elif self.data_type == "wise":
                    (
                        baye_block,
                        baseline,
                        baseline_sigma,
                        baseline_rms,
                    ) = self.baye_block_levels_with_changing_baseline(
                        df,
                        baye_block,
                        baseline_init,
                        baseline_init_sigma,
                    )
                elif self.data_type in ["ztf_fp", "ztf_fp_noisy"]:
                    (
                        baye_block,
                        baseline,
                        baseline_sigma,
                        baseline_rms,
                    ) = self.baye_block_levels(
                        df,
                        baye_block,
                        baseline_init,
                        baseline_init_sigma,
                    )

                baye_block[str(sigma_discr)] = (baye_block["mag"] - baseline) / np.sqrt(
                    baseline_sigma**2 + baye_block["mag.err"] ** 2
                )

            #######################################
            ########## Excess region  #############
            excess_region = baye_block[baye_block["level"] == "excess"]
            if not excess_region.empty:
                # Find the excess regions (baye block that are accumulated to a region)
                excess_regions_idx = [
                    list(group)
                    for group in mit.consecutive_groups(excess_region.index.tolist())
                ]
                # Assign levels as outlier
                if self.Npoints == True:
                    baye_block = self.outliers(
                        excess_regions_idx,
                        df,
                        baye_block,
                        excess_region["measurements_nu"],
                    )
                    # Calculate again the excess regions
                    excess_regions_idx = [
                        list(group)
                        for group in mit.consecutive_groups(
                            baye_block[baye_block["level"] == "excess"].index.tolist()
                        )
                    ]
                    if not baye_block[baye_block["level"] == "outlier"].empty:
                        outlier = [
                            baye_block[baye_block["level"] == "outlier"][
                                "jd_measurement_start"
                            ].values,
                            baye_block[baye_block["level"] == "outlier"][
                                "jd_measurement_end"
                            ].values,
                        ]
                        output["jd_outlier"] = np.array(outlier).T.tolist()
                    else:
                        output["jd_outlier"] = None
                else:
                    output["jd_outlier"] = None
                output["description"] = self.description(
                    excess_regions_idx, excess_region["measurements_nu"]
                )

            excess_region = baye_block[baye_block["level"] == "excess"]
            baseline_region = baye_block[baye_block["level"] != "excess"]
            ##########################
            everything_except_excess_values = []
            if not excess_region.empty:
                if self.flux:
                    global_peak_idx = (
                        baye_block["mag"].loc[flatten(excess_regions_idx)].idxmax()
                    )
                else:
                    global_peak_idx = (
                        baye_block["mag"].loc[flatten(excess_regions_idx)].idxmin()
                    )
                for idx in excess_regions_idx:
                    if global_peak_idx in idx:
                        everything_except_excess_values.append(
                            df[
                                (
                                    (
                                        df["jd"]
                                        < baye_block["jd_measurement_start"].loc[idx[0]]
                                    )
                                    & (df["Outlier"] == False)
                                )
                                | (
                                    (
                                        df["jd"]
                                        > baye_block["jd_measurement_end"].loc[idx[-1]]
                                    )
                                    & (df["Outlier"] == False)
                                )
                            ]["mag"].values
                        )

                        first = next(iter(everything_except_excess_values))
                        everything_except_excess_rms = mean_squared_error(
                            first,
                            np.ones(len(first)) * np.mean(first),
                            squared=False,
                        )
            else:
                everything_except_excess_rms = baseline_rms

            baseline_regions_idx = [
                list(group)
                for group in mit.consecutive_groups(baseline_region.index.tolist())
            ]
            output["sigma_from_baseline"] = baye_block[
                "sigma_from_baseline"
            ].values.tolist()

            output["baseline"] = baseline
            output["baseline_sigma"] = baseline_sigma
            # Add baseline_rms, calculate max magnitude, flux from df['mag']
            # strength: Delta flux/rms, significance: rms/baseline_sigma
            output["baseline_rms"] = baseline_rms
            output["significance"] = everything_except_excess_rms / baseline_sigma

            if self.flux == True:
                output["max_mag"] = max(df[df["Outlier"] == False]["mag"].values)

                output["strength_sjoert"] = (
                    max(df[df["Outlier"] == False]["mag"].values) - baseline
                ) / everything_except_excess_rms

            else:
                output["max_mag"] = min(df[df["Outlier"] == False]["mag"].values)
                output["strength_sjoert"] = (
                    min(df[df["Outlier"] == False]["mag"].values) - baseline
                ) / everything_except_excess_rms

            for idx in baseline_regions_idx:
                if baye_block["level"][idx[-1]] == "outlier":
                    if len(idx) != 1:
                        output["nu_of_baseline_regions"] = len(baseline_regions_idx) - 1
                        output["jd_baseline_regions"].append(
                            [
                                baye_block["jd_measurement_start"][idx[0]],
                                baye_block["jd_measurement_end"][idx[-1] - 1],
                            ]
                        )
                        output["mag_edge_baseline"].append(
                            baye_block["mag_edge"][idx[-1] - 1]
                        )

                elif baye_block["level"][idx[0]] == "outlier":
                    if len(idx) != 1:
                        output["nu_of_baseline_regions"] = len(baseline_regions_idx) - 1
                        output["jd_baseline_regions"].append(
                            [
                                baye_block["jd_measurement_start"][idx[0] + 1],
                                baye_block["jd_measurement_end"][idx[-1]],
                            ]
                        )
                        output["mag_edge_baseline"].append(
                            baye_block["mag_edge"][idx[-1]]
                        )

                else:
                    output["nu_of_baseline_regions"] = len(baseline_regions_idx)
                    output["jd_baseline_regions"].append(
                        [
                            baye_block["jd_measurement_start"][idx[0]],
                            baye_block["jd_measurement_end"][idx[-1]],
                        ]
                    )

                    output["mag_edge_baseline"].append(baye_block["mag_edge"][idx[-1]])

            if not excess_region.empty:
                output["nu_of_excess_regions"] = len(excess_regions_idx)
                output["jd_excess_regions"] = []
                significance_of_fluctuation_before_peak = []
                significance_of_fluctuation_after_peak = []
                for idx in excess_regions_idx:
                    output["nu_of_excess_blocks"].append(len(idx))
                    #  output["nu_of_excess_blocks"] = len(idx)

                    output["jd_excess_regions"].append(
                        [
                            baye_block["jd_measurement_start"][idx[0]],
                            baye_block["jd_measurement_end"][idx[-1]],
                        ]
                    )

                    output["mag_edge_excess"].append(baye_block["mag_edge"][idx[-1]])
                    output["max_sigma_excess_region"].append(
                        max(baye_block["sigma_from_baseline"][idx[0] : idx[-1] + 1])
                    )

                    output["sigma_from_baseline_excess"] = baye_block[
                        "sigma_from_baseline"
                    ][idx[0] : idx[-1] + 1].values.tolist()

                    each_excess_max_idx = baye_block["mag"].loc[idx].idxmax()
                    if global_peak_idx == each_excess_max_idx:
                        # Inside the excess region with the highest intensity
                        # Calculate the local peaks inside the excess region of the highest intensity
                        local_peaks, _ = np.array(
                            find_peaks(
                                np.concatenate(
                                    (
                                        [min(baye_block["mag"].loc[idx].values)],
                                        baye_block["mag"].loc[idx].values,
                                        [min(baye_block["mag"].loc[idx].values)],
                                    )
                                )
                            ),
                            dtype=object,
                        )
                        local_peaks = local_peaks - 1
                        for peak in local_peaks:
                            if idx[peak] != global_peak_idx:
                                if idx[peak] < global_peak_idx:
                                    significance_of_fluctuation_before_peak.append(
                                        (
                                            baye_block["mag"].loc[global_peak_idx]
                                            - baye_block["mag"].loc[idx[peak]]
                                        )
                                        / math.sqrt(
                                            sum(
                                                np.array(baye_block["mag.err"].values)
                                                ** 2
                                            )
                                        )
                                    )
                                else:
                                    significance_of_fluctuation_after_peak.append(
                                        (
                                            baye_block["mag"].loc[global_peak_idx]
                                            - baye_block["mag"].loc[idx[peak]]
                                        )
                                        / math.sqrt(
                                            sum(
                                                np.array(baye_block["mag.err"].values)
                                                ** 2
                                            )
                                        )
                                    )
                        output[
                            "significance_of_fluctuation"
                        ] = significance_of_fluctuation_before_peak

                        output[
                            "significance_of_fluctuation"
                        ] = significance_of_fluctuation_after_peak

                        # Calculate the significance of each bayesian block, inside the excess region of the highest intensity
                        if (
                            len(post_peak := [i for i in idx if (i > global_peak_idx)])
                            >= 2
                        ):
                            after_peak_excess_values = df[
                                (
                                    (
                                        df["jd"]
                                        >= baye_block["jd_measurement_start"].loc[
                                            post_peak[0]
                                        ]
                                    )
                                    & (df["Outlier"] == False)
                                )
                                & (
                                    (
                                        df["jd"]
                                        <= baye_block["jd_measurement_end"].loc[
                                            post_peak[-1]
                                        ]
                                    )
                                    & (df["Outlier"] == False)
                                )
                            ]["mag"].values
                            after_peak_excess_error = df[
                                (
                                    (
                                        df["jd"]
                                        >= baye_block["jd_measurement_start"].loc[
                                            post_peak[0]
                                        ]
                                    )
                                    & (df["Outlier"] == False)
                                )
                                & (
                                    (
                                        df["jd"]
                                        <= baye_block["jd_measurement_end"].loc[
                                            post_peak[-1]
                                        ]
                                    )
                                    & (df["Outlier"] == False)
                                )
                            ]["mag.err"].values
                            after_peak_excess_rms = mean_squared_error(
                                list(after_peak_excess_values),
                                [np.mean(after_peak_excess_values)]
                                * len(after_peak_excess_values),
                                squared=False,
                            )
                            after_peak_excess_sigma = mean_squared_error(
                                list(after_peak_excess_values),
                                [np.mean(after_peak_excess_values)]
                                * len(after_peak_excess_values),
                                squared=True,
                            )

                            output["significance_after_peak"].append(
                                after_peak_excess_rms / after_peak_excess_sigma
                            )

                            output["strength_after_peak"].append(
                                (
                                    baye_block["mag"].loc[global_peak_idx]
                                    - baye_block["mag"].loc[post_peak[0]]
                                )
                                / after_peak_excess_rms
                            )

                        for baye_excess_idx in [i for i in idx if i != global_peak_idx]:
                            sig = (
                                baye_block["mag"].loc[global_peak_idx]
                                - baye_block["mag"].loc[baye_excess_idx]
                            ) / math.sqrt(
                                sum(np.array(baye_block["mag.err"].values) ** 2)
                            )

                            if baye_excess_idx < global_peak_idx:
                                output["significance_of_variability_excess"][0].append(
                                    sig
                                )

                            elif baye_excess_idx > global_peak_idx:
                                output["significance_of_variability_excess"][1].append(
                                    sig
                                )

                    if self.flux == True:
                        max_idx = df["mag"][
                            df["jd"].between(
                                baye_block["jd_measurement_start"][idx[0]],
                                baye_block["jd_measurement_end"][idx[-1]],
                            )
                        ].idxmax()
                    else:
                        max_idx = df["mag"][
                            df["jd"].between(
                                baye_block["jd_measurement_start"][idx[0]],
                                baye_block["jd_measurement_end"][idx[-1]],
                            )
                        ].idxmin()
                    output["max_mag_excess_region"].append(df["mag"][max_idx])
                    output["max_jd_excess_region"].append(df["jd"][max_idx])

                if self.flux == True:
                    output["max_baye_block_timescale"] = float(
                        (
                            excess_region["jd_measurement_end"]
                            - excess_region["jd_measurement_start"]
                        )[
                            flatten(
                                excess_region[
                                    excess_region["mag"] == max(excess_region["mag"])
                                ].index.tolist()
                            )
                        ].to_string(index=False)
                    )

                else:
                    output["max_baye_block_timescale"] = float(
                        (
                            excess_region["jd_measurement_end"]
                            - excess_region["jd_measurement_start"]
                        )[
                            flatten(
                                excess_region[
                                    excess_region["mag"] == min(excess_region["mag"])
                                ].index.tolist()
                            )
                        ].to_string(index=False)
                    )

            else:
                output["nu_of_excess_regions"] = 0
                output["nu_of_excess_blocks"] = None
                output["jd_excess_regions"] = []
                output["mag_edge_excess"] = None
                output["max_mag_excess_region"] = None
                output["max_jd_excess_region"] = None
                output["max_sigma_excess_region"] = None
                output["sigma_from_baseline_excess"] = None
                output["significance_of_variability_excess"] = [None, None]
                output["significance_of_fluctuation"] = None
                output["max_baye_block_timescale"] = None
                output["description"] = None

            output_per_filter[str(passband)] = dict(output)

            ##############################################
            ################## Plots #####################
            if self.plot:
                df["mjd"] = df["jd"] - 2400000.5
                ax.errorbar(
                    df[df["Outlier"] == False]["mjd"],
                    df[df["Outlier"] == False]["mag"],
                    yerr=df[df["Outlier"] == False]["mag.err"],
                    label=passband,
                    fmt="s",
                    color=self.PlotColor[fid - 1],
                    ecolor="lightgray",
                    markeredgecolor="black",
                    elinewidth=3,
                    capsize=0,
                )
                ax.errorbar(
                    df[df["Outlier"] == True]["mjd"],
                    df[df["Outlier"] == True]["mag"],
                    yerr=df[df["Outlier"] == True]["mag.err"],
                    label="Outlier",
                    fmt="o",
                    color="lightgray",
                    ecolor="lightgray",
                    markeredgecolor="black",
                    elinewidth=3,
                    capsize=0,
                )

                for block in output["jd_excess_regions"]:
                    if block:
                        ax.axvline(
                            x=(block[0] - 40) - 2400000.5,
                            label="T2 guess",
                            color=self.PlotColor[fid - 1],
                        )
                        ax.axvline(
                            x=(block[-1] + 40) - 2400000.5,
                            color=self.PlotColor[fid - 1],
                        )
                        ax.axvspan(
                            (block[0] - 40) - 2400000.5,
                            (block[-1] + 40) - 2400000.5,
                            alpha=0.05,
                            color=self.PlotColor[fid - 1],
                        )
                    else:
                        ax.axhline(
                            y=output["baseline"],
                            label="Baseline",
                            color=self.PlotColor[fid - 1],
                        )

                for sp in ["left", "bottom", "top", "right"]:
                    ax.spines[sp].set_linewidth(3)

                ax.set_title(str(light_curve.stock_id), fontsize=25)
                ax.legend(
                    bbox_to_anchor=(1.05, 1),
                    loc=2,
                    borderaxespad=0.0,
                    prop={"size": 20},
                )
                plt.tick_params(axis="both", which="major", pad=12, length=10, width=3)
                plt.xticks(fontsize=20)
                plt.yticks(fontsize=20)

                locals()["ax" + str(passband)] = fig.add_subplot(
                    len(self.filters_lc) + 1, 1, fid + 1, sharex=ax
                )

                if self.debug and self.data_type in [
                    "ztf_alert",
                    "ztf_fp",
                    "ztf_fp_noisy",
                ]:
                    alpha = 0.07
                else:
                    alpha = 1

                locals()["ax" + str(passband)] = plt.errorbar(
                    df[df["Outlier"] == False]["mjd"],
                    df[df["Outlier"] == False]["mag"],
                    yerr=df[df["Outlier"] == False]["mag.err"],
                    label=passband,
                    fmt="s",
                    color=self.PlotColor[fid - 1],
                    alpha=alpha,
                    ecolor="lightgray",
                    markeredgecolor="black",
                    elinewidth=3,
                    capsize=0,
                )
                locals()["ax" + str(passband)] = plt.errorbar(
                    df[df["Outlier"] == True]["mjd"],
                    df[df["Outlier"] == True]["mag"],
                    yerr=df[df["Outlier"] == True]["mag.err"],
                    label="Outlier",
                    fmt="o",
                    color="lightgray",
                    ecolor="lightgray",
                    markeredgecolor="black",
                    elinewidth=3,
                    capsize=0,
                )
                baye_block["mjd_start"] = baye_block["jd_start"] - 2400000.5
                baye_block["mjd_end"] = baye_block["jd_end"] - 2400000.5

                for nu, value in enumerate(baye_block["mag"]):
                    linestyle = "solid"
                    linewidth = 1.5
                    if baye_block["level"][nu] == "excess":
                        color_block = self.PlotColor[fid - 1]
                        if self.data_type in ["ztf_fp", "ztf_fp_noisy"]:
                            linestyle = "dashdot"
                    elif baye_block["level"][nu] == "baseline":
                        color_block = self.PlotColor[fid - 1]
                        if self.data_type in ["ztf_fp", "ztf_fp_noisy"]:
                            linewidth = 3
                    else:
                        color_block = "lightgray"
                        if self.data_type in ["ztf_fp", "ztf_fp_noisy"]:
                            linestyle = "dashdot"

                    locals()["ax" + str(passband)] = plt.hlines(
                        value,
                        baye_block["mjd_start"][nu],
                        baye_block["mjd_end"][nu],
                        color=color_block,
                        linestyles=linestyle,
                        linewidth=linewidth,
                    )
                    locals()["ax" + str(passband)] = plt.hlines(
                        value + baye_block["mag.err"][nu],
                        baye_block["mjd_start"][nu],
                        baye_block["mjd_end"][nu],
                        color=color_block,
                        linestyles="dashed",
                    )
                    locals()["ax" + str(passband)] = plt.hlines(
                        value - baye_block["mag.err"][nu],
                        baye_block["mjd_start"][nu],
                        baye_block["mjd_end"][nu],
                        color=color_block,
                        linestyles="dashed",
                    )

                if self.flux == False:
                    plt.gca().invert_yaxis()

                locals()["ax" + str(passband)] = plt.gca()
                for sp in ["left", "bottom", "top", "right"]:
                    locals()["ax" + str(passband)].spines[sp].set_linewidth(3)

                plt.tick_params(axis="both", which="major", pad=22, length=10, width=3)
                plt.xticks(fontsize=20)
                plt.yticks(fontsize=20)

        if self.plot:
            if self.flux == False and "ax" in locals():
                ax.invert_yaxis()

            if self.flux == True:
                fig.supylabel("Flux Density", fontsize=30)
            else:
                fig.supylabel("Difference magnitude", fontsize=30)

            fig.supxlabel("MJD", fontsize=30)

            if self.plot or self.debug:
                if isinstance(self.plot_props, PlotProperties):
                    output_per_filter["Plots"] = [
                        create_plot_record(
                            fig,
                            self.plot_props,
                            extra={"band": "All", "stock": light_curve.stock_id},  # type: ignore
                        )
                    ]

                if self.debug and isinstance(self.debug_dir, str):
                    if self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
                        object_id: StockId | Sequence[StockId] = self.ztfid
                    else:
                        object_id = light_curve.stock_id

                    if not os.path.exists(self.debug_dir):
                        os.makedirs(self.debug_dir)

                    title = str(object_id)

                    overlapping_regions_count = self.count_overlapping_regions(
                        output_per_filter
                    )

                    if self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
                        title += (
                            f"\n{overlapping_regions_count} overlapping regions (g+r)"
                        )

                    fig.suptitle(
                        title,
                        fontsize=30,
                    )

                    outfile = os.path.join(self.debug_dir, str(object_id) + ".pdf")

                    fig.savefig(outfile)
                    output_per_filter.pop("Plots")

                plt.close()

            fig.tight_layout()
        """
        Further check if the PEAK bayesian excess regions of different filter coincide. Works only for two filter
        """
        coincide_peak_block = self.coincide_peak_block(output_per_filter)

        if coincide_peak_block >= 1:
            output_per_filter["coincide_peak_block"] = 1
        else:
            output_per_filter["coincide_peak_block"] = -1

        # # Now we get the number of overlapping regions (regardless whether they contain the peak flux or not)
        output_per_filter["overlapping_regions_count"] = self.count_overlapping_regions(
            output_per_filter
        )

        output_per_filter["start_excess"] = None
        output_per_filter["size_excess"] = 0

        for keys in [key for key in output_per_filter if key in self.filters]:
            if output_per_filter[keys].get("nu_of_excess_regions") not in [0, None]:
                idxmax = np.argmax(output_per_filter[keys]["max_sigma_excess_region"])
                output_per_filter["start_excess"] = output_per_filter[keys][
                    "jd_excess_regions"
                ][idxmax][0]
                output_per_filter["size_excess"] = (
                    output_per_filter[keys]["jd_excess_regions"][idxmax][-1]
                    - output_per_filter[keys]["jd_excess_regions"][idxmax][0]
                )

        t2_output: dict[str, UBson] = output_per_filter

        if self.debug and self.data_type in ["ztf_alert", "ztf_fp", "ztf_fp_noisy"]:
            for fil in self.filters_lc:
                print(f"{fil}\n")
                print(
                    f"# excess regions: {output_per_filter[fil]['nu_of_excess_regions']}"
                )
                print(
                    f"# excess blocks: {output_per_filter[fil]['nu_of_excess_blocks']}"
                )
                print("--------")
            print(
                f"coincident regions between g and r: {output_per_filter['coincide_peak_block']!s}"
            )

        return t2_output