In [1]:
# Auto-reload imported modules before each cell is executed, so edits to the
# project's source files are picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

In [2]:
import os
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

from zwad.ad.postprocess import *

from IPython.display import display, HTML
# Let pandas render up to 2000 rows before truncating a displayed table.
pd.set_option('display.max_rows', 2000)
# Raise the threshold of matplotlib's "too many open figures" warning to 100.
plt.rcParams['figure.max_open_warning'] = 100

# Table of contents
* [M31](#M31)
* [Deep](#Deep)
* [Disk](#Disk)

In [3]:
# Directory that holds the CSV inputs used below; a relative path, so it is
# resolved against the notebook's working directory.
data_dir = '../data/'


def load_ad_results(filenames):
    """Load anomaly-detection tables and order rows by completeness.

    Parameters
    ----------
    filenames : iterable of str
        File names (or patterns) of the AD result files. Each one is joined
        onto ``data_dir`` before being handed to
        ``load_ad_tables_by_patterns``.

    Returns
    -------
    The loaded table with rows ordered by ascending number of missing values
    per row and a fresh 0..n-1 index. The sort is stable, so rows with the
    same number of missing values keep the order in which they were loaded.
    """
    patterns = [os.path.join(data_dir, fname) for fname in filenames]
    scores = load_ad_tables_by_patterns(patterns)

    # Rows with the fewest NaNs come first; mergesort keeps ties in their
    # original relative order.
    missing_per_row = scores.isna().sum(axis=1)
    row_order = missing_per_row.sort_values(kind='mergesort').index
    return scores.loc[row_order].reset_index(drop=True)


def result_comparison(ad_filenames, expert_filename):
    """Join the anomaly-detection results with the expert's table.

    Parameters
    ----------
    ad_filenames : iterable of str
        Passed to ``load_ad_results``, which joins each entry onto
        ``data_dir``.
    expert_filename : str
        Passed unchanged to ``load_expert_table``; unlike ``ad_filenames`` it
        is not prefixed with ``data_dir`` here.

    Returns
    -------
    The AD table left-merged with the expert table on the ``'oid'`` column,
    so every AD row is kept even when the expert table has no match for it.
    """
    ad_scores = load_ad_results(ad_filenames)
    expert_labels = load_expert_table(expert_filename)
    return pd.merge(ad_scores, expert_labels, on='oid', how='left')

# M31

In [4]:
# M31 field: anomaly-detection results joined with the expert table.
# AD file names are given relative to data_dir because load_ad_results
# prepends data_dir itself; joining it here as well produced
# '../data/../data/...' paths that only resolve while data_dir is a one-level
# relative path. The expert table path is not prefixed by result_comparison,
# so it is joined here.
subtable = result_comparison(
    ['m31_iso.csv', 'm31_gmm.csv', 'm31_lof.csv', 'm31_svm.csv'],
    os.path.join(data_dir, 'm31_maria.csv'))

display(subtable)

Unnamed: 0,oid,m31_iso,m31_gmm,m31_lof,m31_svm,tag,tag_detailed,comments,alerts
0,695211400034403,-0.742695,-447.694306,-3.629885,1.003855,artefact,bright star,bright star,
1,695211400124577,-0.735534,-355.171565,-3.084022,1.007907,artefact,bright star,bright star,
2,695211400102351,-0.728004,-309.761947,-2.832976,1.003213,artefact,bright star,bright star,
3,695211400053697,-0.727037,-289.921585,-2.668397,1.014733,artefact,bright star,bright star,
4,695211200075348,-0.723084,-229.932966,-3.008947,1.000484,transient,red star,"MASTER transient, red star; has spectra but st...",
5,695211400000352,-0.714944,-337.016507,-2.966133,1.023181,artefact,bright star,bright star,
6,695211400088968,-0.723894,-217.579138,,1.347984,artefact,,empty field fits,
7,695211400117334,-0.722743,-192.799983,,1.146374,artefact,bright star,bright star,
8,695211400028274,-0.72169,-247.925193,,1.012351,artefact,bright star,bright star,
9,695211400133827,-0.716548,-218.952155,,1.363846,artefact,,empty field fits,


# Deep

## Scale Std

In [5]:
# Deep field ("Scale Std" result files): AD results joined with the expert
# table. AD file names are given relative to data_dir because load_ad_results
# prepends data_dir itself; joining it here as well produced
# '../data/../data/...' paths that only resolve while data_dir is a one-level
# relative path. The expert table path is not prefixed by result_comparison,
# so it is joined here.
result_comparison(
    ['deep_iso.csv', 'deep_gmm.csv', 'deep_lof.csv', 'deep_svm.csv'],
    os.path.join(data_dir, 'deep_maria.csv'))

Unnamed: 0,oid,deep_iso,deep_gmm,deep_lof,deep_svm,tag,tag_detailed,comments,alerts
0,795203200009604,-0.793451,-515.679608,-3.015798,1.0,AM Herculis,,cataclysmic; polars,
1,795205400022890,-0.783779,-4514.610588,-9.895412,1.0,Mira,,pulsating,
2,795215300016556,-0.744711,-674.992993,-3.212606,1.0,atrefact,bright star,,
3,795212100007964,-0.75806,,-2.660216,1.0,uncat,,SN???,
4,795206400033919,-0.756697,-472.180551,,1.000002,artefact,spaceship,high disperstion LC,
5,795205100007271,-0.749604,,-2.582768,1.002898,uncat,,SN???,
6,795204200006882,-0.74846,,-2.826101,1.000548,EB,EA,eclipsing,
7,795209300012791,-0.744955,-406.75934,,1.000073,RRLyr,RRAB,pulsating; RR Lyrae variables with asymmetric ...,
8,795206400000500,,-604.742722,-4.536239,1.005467,artefact,plane/flying body,plane/flying body; 1-point transient,
9,795216300023263,,-474.470484,-2.532907,1.000042,artefact,plane/flying body,plane/flying body; 1-point transient,


## Scale Norm

In [6]:
# Deep field ("Scale Norm" result files): AD results joined with the expert
# table. AD file names are given relative to data_dir because load_ad_results
# prepends data_dir itself; joining it here as well produced
# '../data/../data/...' paths that only resolve while data_dir is a one-level
# relative path. The expert table path is not prefixed by result_comparison,
# so it is joined here.
result_comparison(
    [
        'deep_iso_norm.csv', 'deep_gmm_norm.csv',
        'deep_lof_norm.csv', 'deep_svm_norm.csv',
    ],
    os.path.join(data_dir, 'deep_maria.csv'))

Unnamed: 0,oid,deep_iso_norm,deep_gmm_norm,deep_lof_norm,deep_svm_norm,tag,tag_detailed,comments,alerts
0,795205400022890,-0.705834,,-1.885991,68.051405,Mira,,pulsating,
1,795203200009604,-0.705658,,-1.915205,57.669751,AM Herculis,,cataclysmic; polars,
2,795204200006882,-0.685122,,-2.050948,87.086276,EB,EA,eclipsing,
3,795211200035931,-0.699831,,,87.416585,SN,SN Ia,SN 2018coi,
4,795209200003484,-0.697626,,,111.043347,uncat,,SN???,
5,795212100007964,-0.689524,,,69.481313,uncat,,SN???,
6,795205400027537,-0.688804,,,154.972395,Mira_projected,Mira_projected,Automatic photometry artefact; due to pulsatio...,
7,795206400001319,-0.687589,,,123.478434,artefact,plane/flying body,plane/flying body; 1-point transient,
8,795205100007271,-0.682054,,,128.153432,uncat,,SN???,
9,795206400012603,-0.679513,,,109.156964,artefact,plane/flying body,plane/flying body; 1-point transient,


# Disk

In [7]:
# Disk field: AD results joined with the expert table.
# AD file names are given relative to data_dir because load_ad_results
# prepends data_dir itself; joining it here as well produced
# '../data/../data/...' paths that only resolve while data_dir is a one-level
# relative path. The expert table path is not prefixed by result_comparison,
# so it is joined here.
# NOTE(review): the recorded output of this cell has no disk_lof column even
# though disk_lof.csv is requested -- confirm the file exists and that the
# loader does not silently skip patterns that match nothing.
result_comparison(
    ['disk_iso.csv', 'disk_gmm.csv', 'disk_lof.csv', 'disk_svm.csv'],
    os.path.join(data_dir, 'disk_maria.csv'))

Unnamed: 0,oid,disk_iso,disk_gmm,disk_svm,tag,tag_detailed,comments,alerts
0,807208200059506,-0.820094,-4822.542267,1.0,Eruptive,INS,,
1,807206200014645,-0.818799,-2538.01759,1.0,Var,YSO,Young stellar Object of unspecified variable t...,
2,807209400037670,-0.817158,-5182.12164,1.0,Pulsating,Mira,,
3,807206400014916,-0.814964,-9986.607794,1.0,Pulsating,Mira:,"Not 100% confirmed, bumps on LC?",
4,807211300006190,-0.812376,-3335.349534,1.0,Pulsating,Mira:,"Not 100% confirmed, bumps on LC?",
5,807202300038681,-0.812179,-2955.133379,1.0,Cataclysmic,UG,,
6,807216100038423,-0.811749,-1498.252326,1.0,Pulsating,AGB,,
7,807208300016714,-0.811539,-3433.445451,1.0,Pulsating,Mira,,
8,807206300013468,-0.81111,-1023.723297,1.0,Pulsating,Mira,,
9,807214300010833,-0.808035,-1093.025005,1.0,Pulsating,Mira:,,
