In [None]:
import os
from os import path
from astropy.time import Time
from astropy.io import fits, ascii
import astropy.units as u
from astropy.table import Table
from astropy.constants import G

import numpy as np
import matplotlib.pyplot as plt
from matplotlib.colors import LogNorm
%matplotlib inline
import h5py
import pandas as pd
from sqlalchemy import func
from scipy.optimize import root
from scipy.stats import scoreatpercentile
import tqdm

from thejoker import JokerSamples
from thejoker.sampler import JokerParams, TheJoker
from thejoker.plot import plot_rv_curves

from twoface.config import TWOFACE_CACHE_PATH
from twoface.db import (db_connect, AllStar, AllVisit, AllVisitToAllStar, 
                        StarResult, Status, JokerRun, initialize_db)
from twoface.data import APOGEERVData
from twoface.plot import plot_data_orbits

In [None]:
# NOTE: this shadows the TWOFACE_CACHE_PATH imported from twoface.config with
# '../cache/' resolved against the current working directory.
TWOFACE_CACHE_PATH = path.abspath('../cache/')
# HDF5 file opened further down; it is indexed by APOGEE ID and read for the
# 'K', 'P' and 'e' datasets of each star.
samples_file = path.join(TWOFACE_CACHE_PATH, 'apogee-jitter.hdf5')

In [None]:
# Connect to 'apogee.sqlite' inside the cache directory. db_connect returns
# two values; only the session factory is kept, the second is discarded.
Session, _ = db_connect(path.join(TWOFACE_CACHE_PATH, 'apogee.sqlite'))
session = Session()

In [None]:
# Stars that have a StarResult whose Status id is 1 or 2.
# The joins are chained one target per call: passing several targets to a
# single Query.join() call is deprecated in SQLAlchemy 1.4 and removed in 2.0.
stars = (
    session.query(AllStar)
    .join(StarResult)
    .join(Status)
    .filter(Status.id.in_([1, 2]))
    .all()
)
len(stars)

In [None]:
%%time

rows = None
with h5py.File(samples_file, 'r') as f:
    for star in tqdm.tqdm(stars):
        # samples = JokerSamples.from_hdf5(f[star.apogee_id])
        K = f[star.apogee_id]['K'][:]
        P = f[star.apogee_id]['P'][:]
        ecc = f[star.apogee_id]['e'][:]
        vsini = [star.vsini] * len(P)
        loggs = [star.logg] * len(P)
        status = [star.results[0].status_id] * len(P)
        apogee_ids = [star.apogee_id] * len(P)
        
        this_rows = list(zip(apogee_ids, loggs, vsini, P, ecc, K, status))
        
        if rows is None:
            rows = this_rows
        else:
            rows = rows + this_rows
            
tbl_ = np.array(rows, dtype=[('apogee_id', 'U25'), ('logg', float), ('vsini', float),
                             ('P', float), ('e', float), ('K', float), 
                             ('status', int)])
df = pd.DataFrame(tbl_)
print(len(df))

In [None]:
# Group the sample rows by star, then keep every row of those stars whose
# 15th-percentile K is above 1 (i.e. at least ~85% of their samples have K > 1).
huh = df.groupby('apogee_id')
tbl = huh.filter(
    lambda star_rows: np.percentile(star_rows['K'], 15) > 1.
)
len(tbl)

In [None]:
def get_P(m1, m2, logg):
    """Period, in days, evaluated from two masses and a log surface gravity.

    Parameters
    ----------
    m1, m2 : astropy Quantity
        Masses; they need mass units for the conversion to days to succeed.
    logg : float or array-like
        Base-10 logarithm of the surface gravity, taken to be in cm / s^2.

    Returns
    -------
    astropy Quantity
        ``2 pi G^(1/4) (m1 + m2) / m1^(3/4) * g^(-3/4)`` converted to days,
        with the same shape as ``logg``.
    """
    # NOTE(review): the mass factor used here is (m1+m2) / m1**(3/4). Kepler's
    # third law with the separation set to the radius implied by logg would
    # give m1**(3/4) / (m1+m2)**(1/2) instead -- confirm which is intended.
    surface_gravity = 10**np.asarray(logg) * u.cm / u.s**2
    mass_prefactor = 2*np.pi * G**0.25 * (m1 + m2) / m1**0.75
    period = mass_prefactor * surface_gravity**(-0.75)
    return period.to(u.day)

In [None]:
# All retained samples in the period / logg plane
fig, ax = plt.subplots(1, 1, figsize=(6, 6))
ax.plot(tbl['P'], tbl['logg'], marker='.',
        linestyle='none', alpha=0.2, ms=2, color='k')

# -- P curves --
# For each primary mass, shade the region between the get_P curves for a
# negligible-mass companion (1e-5 Msun) and an equal-mass companion.
logg = np.linspace(0, 4, 1024)

for M1 in [0.5, 1., 2] * u.Msun:
    P1 = get_P(M1, 1E-5*u.Msun, logg).value
    P2 = get_P(M1, M1, logg).value

    ax.fill_betweenx(logg, P1, P2, alpha=0.5, linewidth=0,
                     label='{0:.1f} {1:latex_inline}'.format(M1.value, M1.unit))

ax.legend(loc='upper right')

ax.set_xscale('log')
ax.set_xlim(1, 32768)
ax.set_ylim(3.55, 0)  # inverted: logg decreases upwards
ax.set_xlabel('$P$ [day]')
# Raw string: '\l' is not a valid escape sequence in a normal string literal
ax.set_ylabel(r'$\log g$')

fig.tight_layout()

In [None]:
# Keep only the sample rows whose 'status' column (filled from
# star.results[0].status_id when the table was built) equals 2.
# NOTE(review): what status 2 means is defined by the Status table -- confirm.
sub_tbl = tbl[tbl['status'] == 2]

In [None]:
def make_plot(tbl, c=None, clabel='', **kw):
    """Plot logg against period for the rows of ``tbl``.

    Parameters
    ----------
    tbl : table-like
        Must support ``tbl['P']`` and ``tbl['logg']``.
    c : array-like, optional
        Per-point values used to color the markers. When ``None`` (the
        default) plain markers are drawn with ``ax.plot`` and no colorbar
        is added.
    clabel : str, optional
        Colorbar label; only used when ``c`` is given.
    **kw
        Forwarded to ``ax.scatter``; only used when ``c`` is given.

    Returns
    -------
    fig : matplotlib.figure.Figure
        The figure that was created, so callers can display or save it.
    """

    if c is None:
        fig, ax = plt.subplots(1, 1, figsize=(6, 6))
        ax.plot(tbl['P'], tbl['logg'], linestyle='none',
                marker='.', ms=4, alpha=0.3)

    else:
        # Slightly wider figure to leave room for the colorbar
        fig, ax = plt.subplots(1, 1, figsize=(7.2, 6))
        cs = ax.scatter(tbl['P'], tbl['logg'], c=c,
                        marker='o', alpha=0.65, s=15, linewidth=0,
                        cmap='magma_r', **kw)
        cb = fig.colorbar(cs)
        cb.set_label(clabel)

    # -- P curves --
    # Shade the region between the get_P curves for a negligible-mass
    # companion (1e-5 Msun) and an equal-mass companion.
    logg = np.linspace(0, 4, 1024)

    for M1 in [1.] * u.Msun:
        P1 = get_P(M1, 1E-5*u.Msun, logg).value
        P2 = get_P(M1, M1, logg).value

        ax.fill_betweenx(logg, P1, P2, alpha=0.5, linewidth=0, color='#aaaaaa', zorder=-100,
                         label='$M_1 = ${0:.1f} {1:latex_inline}'.format(M1.value, M1.unit))

    ax.legend(loc='upper right')

    ax.set_xscale('log')
    ax.set_xlim(1, 32768)
    ax.set_ylim(3.55, 0)  # inverted: logg decreases upwards
    ax.set_xlabel('$P$ [day]')
    # Raw string: '\l' is not a valid escape sequence in a normal string literal
    ax.set_ylabel(r'$\log g$')

    fig.tight_layout()

    # Callers assign the result (`fig = make_plot(...)`), so hand the figure back
    return fig

In [None]:
# Samples in sub_tbl, colored by K on a logarithmic scale from 1 to 50
fig = make_plot(
    sub_tbl,
    c=sub_tbl['K'],
    clabel='$K$ [{0:latex_inline}]'.format(u.km/u.s),
    norm=LogNorm(1., 50.),
)
fig

In [None]:
# Samples in sub_tbl, colored by e on a linear scale from 0 to 1
fig = make_plot(
    sub_tbl,
    c=sub_tbl['e'],
    clabel='$e$',
    vmin=0,
    vmax=1,
)
fig

In [None]:
# Only rows with vsini > 0 are plotted; the color scale is logarithmic
has_vsini = sub_tbl['vsini'] > 0
with_vsini = sub_tbl[has_vsini]
fig = make_plot(
    with_vsini,
    c=with_vsini['vsini'],
    clabel=r'$v \sin i$',
    norm=LogNorm(0.1, 100.),
)
fig

### Now select stars in the upper corner to look at:

In [None]:
# Sample rows with 0 < logg < 2, grouped per star
in_logg_range = (tbl['logg'] > 0.) & (tbl['logg'] < 2.)
corner_tmp = tbl[in_logg_range].groupby('apogee_id')

# Keep the stars whose 85th-percentile P lies below the get_P value for
# masses (1.5, 0.01) Msun, evaluated at the logg of the star's first row.
corner = corner_tmp.filter(
    lambda star_rows: (
        np.percentile(star_rows['P'], 85)
        < get_P(1.5*u.Msun, 0.01*u.Msun, star_rows['logg']).value[0]
    )
)

In [None]:
cmap = plt.get_cmap('magma_r')
norm = LogNorm(1, 10)

# One RGBA color per sample row, mapped from K through the log normalization
colors = cmap(norm(corner['K']))

# Set the alpha channel per star to 1/sqrt(number of rows), capped at 1, so
# stars contributing many samples are drawn more transparently.
for apid in np.unique(corner['apogee_id']):
    mask = corner['apogee_id'] == apid
    n_rows = mask.sum()
    colors[mask, 3] = min(1, np.sqrt(1/n_rows))

In [None]:
fig, ax = plt.subplots(1, 1, figsize=(7.2, 6))

# Per-point RGBA colors are supplied explicitly, so cmap/norm are not passed:
# without `c` data matplotlib ignores them (and recent versions warn).
ax.scatter(corner['P'], corner['logg'], color=colors,
           marker='o', s=7, linewidth=0)

# Build the colorbar from a standalone mappable that shares the cmap/norm used
# to compute `colors`, rather than plotting dummy off-screen points.
cs = plt.cm.ScalarMappable(norm=norm, cmap=cmap)
cs.set_array([])  # older matplotlib needs an array set before colorbar()
cb = fig.colorbar(cs, ax=ax)
cb.set_label('$K$ [{0:latex_inline}]'.format(u.km/u.s))

# -- P curves --
# Shade the region between the get_P curves for a negligible-mass companion
# (1e-5 Msun) and an equal-mass companion of a 1.5 Msun primary.
logg = np.linspace(0, 4, 1024)
M1 = 1.5*u.Msun
P1 = get_P(M1, 1E-5*u.Msun, logg).value
P2 = get_P(M1, M1, logg).value
ax.fill_betweenx(logg, P1, P2, alpha=0.5, linewidth=0, color='#aaaaaa', zorder=-100,
                 label='$M_1 = ${0:.1f} {1:latex_inline}'.format(M1.value, M1.unit))

ax.legend(loc='lower right')

ax.set_xscale('log')
ax.set_xlim(1, 1000)
ax.set_ylim(2., -0.02)  # inverted: logg decreases upwards
ax.set_xlabel('$P$ [day]')
# Raw string: '\l' is not a valid escape sequence in a normal string literal
ax.set_ylabel(r'$\log g$')

fig.tight_layout()