# Imports

---

In [1]:
import numpy as np 
import pandas as pd

from sklearn.model_selection import train_test_split

from sklearn.metrics import confusion_matrix, accuracy_score

# Cargar Data

---

In [2]:
# index_col=[0] tells pandas that the first CSV column holds the row index, not a feature.
df_data = pd.read_csv(
    './dataset_clean.csv',
    index_col=[0],
)

# Split entre target y patrón
---

- Split

In [3]:
# Target: the 'StarType' column. Features: every remaining column of df_data.
y = df_data['StarType']
x = df_data.drop(columns='StarType')

- Validación

In [4]:
# Sanity check: features and target should report the same number of rows.
print(x.shape, y.shape, sep='\n')

(240, 6)
(240,)


# Split entre train y test

---

- Split

In [5]:
# Hold out 20% of the rows for testing; the fixed random_state keeps the shuffled split reproducible.
x_train, x_test, y_train, y_test = train_test_split(
    x,
    y,
    test_size=0.2,
    shuffle=True,
    random_state=42,
)

- Validación

In [6]:
# Sanity check: row counts of the train and test feature frames after the split.
print(x_train.shape, x_test.shape, sep='\n')

(192, 6)
(48, 6)


# Análisis exploratorio - Entrenamiento

---

> Formo DF con la data a entrenar

In [7]:
# Build the exploration frame as a NEW DataFrame holding the training features plus the target.
# Plain assignment (`data = x_train`) would only alias x_train, so adding the 'StarType'
# column through `data` would also add it to x_train and leak the label into any later fit.
# DataFrame.assign returns a new object and aligns y_train on the index; x_train stays untouched.
data = x_train.assign(StarType=y_train)

> Gráficas 2D, feature vs target

- Target vs variables categóricas (Gráfica de repetición)

In [8]:
# Bar-mark count chart: StarType (x, nominal) vs StarColor (y, nominal); colour encodes the row count per combination.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"bar","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"nominal","field":"StarType","scale":{"type":"linear"}},"y":{"sort":null,"type":"nominal","field":"StarColor","scale":{"type":"linear"}},"color":{"sort":null,"type":"quantitative","scale":{"scheme":"redpurple"},"aggregate":"count"}}}""")

<__main__.DeepnoteChart at 0x7f95b5dd2fa0>

In [9]:
# Bar-mark count chart: StarType (x, nominal) vs SpectralClass (y, nominal); colour encodes the row count per combination.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"bar","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"nominal","field":"StarType","scale":{"type":"linear"}},"y":{"sort":null,"type":"nominal","field":"SpectralClass","scale":{"type":"linear"}},"color":{"sort":null,"type":"quantitative","scale":{"scheme":"redpurple"},"aggregate":"count"}}}""")

<__main__.DeepnoteChart at 0x7f95b5e046d0>

- Target vs variables numéricas (Gráficas de dispersión)

In [10]:
# Scatter plot: StarType (x) vs Temperature (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"StarType","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"Temperature","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95c12f1ca0>

In [11]:
# Scatter plot: StarType (x) vs Luminosity (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"StarType","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"Luminosity","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b5e041f0>

In [12]:
# Scatter plot: StarType (x) vs Radius (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"StarType","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"Radius","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b5dd2cd0>

In [13]:
# Scatter plot: StarType (x) vs AbsoluteMagnitude (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"StarType","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"AbsoluteMagnitude","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95c1225d90>

> Gráficas 3D, 2_features vs target

In [14]:
# Scatter plot of two features: Temperature (x) vs AbsoluteMagnitude (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Temperature","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"AbsoluteMagnitude","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b542f730>

In [15]:
# Scatter plot of two features: Luminosity (x) vs AbsoluteMagnitude (y), points coloured by StarType.
# The x scale sets "domainMax": 0.1 and the mark has "clip": true, so the view is limited to Luminosity <= 0.1.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Luminosity","scale":{"type":"linear","zero":false,"domainMax":0.1}},"y":{"sort":null,"type":"quantitative","field":"AbsoluteMagnitude","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b54179a0>

In [16]:
# Scatter plot of two features: Radius (x) vs AbsoluteMagnitude (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Radius","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"AbsoluteMagnitude","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b5e040a0>

In [17]:
# Scatter plot of two features: Temperature (x) vs Luminosity (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Temperature","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"Luminosity","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b539eb80>

In [18]:
# Scatter plot of two features: Radius (x) vs Luminosity (y), points coloured by StarType.
# The x scale sets "domainMax": 17 and the mark has "clip": true, so the view is limited to Radius <= 17.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Radius","scale":{"type":"linear","zero":false,"domainMax":17}},"y":{"sort":null,"type":"quantitative","field":"Luminosity","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b539e310>

In [19]:
# Scatter plot of two features: Radius (x) vs Temperature (y), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Radius","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"quantitative","field":"Temperature","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b539e880>

In [20]:
# Point chart: Radius (x, quantitative) vs StarColor (y, nominal), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Radius","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"nominal","field":"StarColor","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b539ee20>

In [21]:
# Point chart: AbsoluteMagnitude (x, quantitative) vs StarColor (y, nominal), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"AbsoluteMagnitude","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"nominal","field":"StarColor","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b52c4700>

In [22]:
# Point chart: Radius (x, quantitative) vs SpectralClass (y, nominal), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"Radius","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"nominal","field":"SpectralClass","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b52c49a0>

In [23]:
# Point chart: AbsoluteMagnitude (x, quantitative) vs SpectralClass (y, nominal), points coloured by StarType.
DeepnoteChart(data, """{"mark":{"clip":true,"type":"point","tooltip":true},"config":{"legend":{}},"$schema":"https://vega.github.io/schema/vega-lite/v5.json","encoding":{"x":{"sort":null,"type":"quantitative","field":"AbsoluteMagnitude","scale":{"type":"linear","zero":false}},"y":{"sort":null,"type":"nominal","field":"SpectralClass","scale":{"type":"linear","zero":false}},"color":{"sort":null,"type":"nominal","field":"StarType","scale":{"scheme":"tableau10"}}}}""")

<__main__.DeepnoteChart at 0x7f95b52c4e80>

<a style='text-decoration:none;line-height:16px;display:flex;color:#5B5B62;padding:10px;justify-content:end;' href='https://deepnote.com?utm_source=created-in-deepnote-cell&projectId=dbb742f7-e9e6-418d-9e02-197ef81a0ca5' target="_blank">
Created in <span style='font-weight:600;margin-left:4px;'>Deepnote</span></a>