# Semantic Similarity - Experiment 01
The objective of this trial is to expand the SCA_index (i.e., Semantic Content Analysis Index) to a full word embedding, setting a subjective or objective load for each word.

## Introduction

### Libraries

In [239]:
## Data analysis packages:
import pandas as pd
import numpy as np
from math import isnan  #Verifies if a given value is numerical.
import re  # Regular Expression

In [240]:
## Visualization packages:
# import seaborn as sns
import matplotlib.pyplot as plt
%matplotlib inline

### Definitions

In [241]:
## Forcing Pandas to display any number of elements
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', 50)
pd.set_option('display.max_seq_items', None)
pd.set_option('display.width', 2000)
pd.set_option('display.max_colwidth', None)

## SpaCy Word Embeddings: 
Also using Spacy library: https://spacy.io/
> !pip install -U spacy  
> !python -m spacy download en_core_web_sm  
> !python -m spacy download en_core_web_lg

Some instructions on how to use it:  
https://spacy.io/usage/spacy-101

In [242]:
## Importing SpaCy library:
import spacy

# Load English tokenizer, tagger, parser and NER
nlp = spacy.load("en_core_web_lg")

In [243]:
## We check below that this model has 514.157 keys and vectors, respectively.
nlp.meta['vectors']

{'width': 300,
 'vectors': 514157,
 'keys': 514157,
 'name': 'en_vectors',
 'mode': 'default'}

In [244]:
## Again, checking the number of keys.
nlp.vocab.vectors.n_keys

514157

In [245]:
## Finding the SpaCy index for a given word:
nlp.vocab.strings['case']

8110129090154140942

In [246]:
## Getting the text and vector for a given index:
tmp_Idx = 8110129090154140942

tmp_vector = nlp.vocab[tmp_Idx].vector
tmp_text = nlp.vocab[tmp_Idx].text

In [247]:
print(f'{tmp_Idx}: {tmp_text}:\n{tmp_vector[0:3]}...')

8110129090154140942: case:
[-0.3132   0.13839 -5.2377 ]...


In [249]:
## Defining a method to get vector and text information for a word:
def nlp_getVector(word, verbose=False):
    '''
    Obtains the vector representation of a given word from SpaCy word embedding.
    Usage:  nlp_getVector(word)[0] to get the text; nlp_getVector(word)[1] to get the vector.
            var_text, var_vector = nlp_getVector(word)
    '''
    ## Generates the word hash:
    hash = nlp.vocab.strings[word]
    try:
        word_vector = nlp.vocab[hash].vector
        word_text = nlp.vocab[hash].text
    except:
        if verbose:
            print('Error: word vector not available.')
        return None
    return (word_text, word_vector)

In [259]:
## Testing the method:
print(f'Word: {nlp_getVector("study")[0]} <-> Vector 3rd elements: {nlp_getVector("study")[1][:3]}')

Word: study <-> Vector 3rd elements: [-0.64776 -1.3091   2.0104 ]


---
## SCA - Glasgow Norms
* Read the SCA from Glasgow Norms;  
* Import F_s and F_o from the previous study;  
* Train the MLP classifier.

In [11]:
df_factors = pd.read_csv('../data/df_factors.csv', sep=';')
df_factors.head()

Unnamed: 0,words,F_Objectivity,F_Subjectivity,F_Context
0,abattoir,0.512527,0.380603,0.960466
1,abbey,0.714765,0.240456,0.696198
2,abbreviate,0.286952,0.171052,0.767043
3,abdicate,0.144736,0.3843,0.863127
4,abdication,0.167654,0.334086,0.896733


### DataPrep: De-Duplicating words  
There are words in the Glasgow Norms that were differentiated from their homonymous, such as 'case'. In this section, we first select those words and then input a mean value for them.

In [266]:
## Exemplifying the need for de-duplication:
df_factors[df_factors['words'].str.contains('case')]

Unnamed: 0,words,F_Objectivity,F_Subjectivity,F_Context
533,bookcase,0.926393,0.374441,0.335542
756,case,0.715863,0.1641,0.409611
757,case (container),0.821136,0.079956,0.400335
758,case (instance),0.23382,0.213528,0.651273
759,case (legal),0.45626,0.369828,0.733642
4808,suitcase,0.961068,0.256584,0.356338


In [13]:
## Creating a new dataframe by splitting the 'words' column into two columns:
df_homonym = df_factors.copy()
df_homonym[['word','distinction']] = df_homonym['words'].str.split('(', expand=True)
## Renaming the columns of the new dataframe:
# df_homonym.columns = ['word','distinction']

# Stripping whitespace from the new columns
df_homonym['word'] = df_homonym['word'].str.strip()
df_homonym['distinction'] = df_homonym['distinction'].str.strip().str.rstrip(')')

## Showing dataframe:
df_homonym.head(5)

Unnamed: 0,words,F_Objectivity,F_Subjectivity,F_Context,word,distinction
0,abattoir,0.512527,0.380603,0.960466,abattoir,
1,abbey,0.714765,0.240456,0.696198,abbey,
2,abbreviate,0.286952,0.171052,0.767043,abbreviate,
3,abdicate,0.144736,0.3843,0.863127,abdicate,
4,abdication,0.167654,0.334086,0.896733,abdication,


In [15]:
# Calculating the number of distinct elements in the 'distinction' column for each word in the 'word' column
distinct_count = df_homonym.groupby('word')['distinction'].nunique().reset_index()

# Counting the frequency of different numbers of distinct elements
pivot_table = distinct_count.groupby('distinction')['word'].count().reset_index()

# Renaming the columns
pivot_table.columns = ['n_distinction', 'n_words']
pivot_table

Unnamed: 0,n_distinction,n_words
0,0,4303
1,1,2
2,2,288
3,3,69
4,4,19
5,5,2


#### Analyzing the words with 5 distinct meaning:

In [18]:
## Getting the word with the highest number of distinct meanings: 
distinct_count[distinct_count['distinction'] == 5]

Unnamed: 0,word,distinction
721,charge,5
822,club,5


In [22]:
df_homonym[(df_homonym['word']=='club') | (df_homonym['word']=='charge')]

Unnamed: 0,words,F_Objectivity,F_Subjectivity,F_Context,word,distinction
819,charge,0.340881,0.330534,0.438418,charge,
820,charge (card),0.477083,0.293352,0.671798,charge,card
821,charge (dependent),0.256759,0.164572,0.791042,charge,dependent
822,charge (electric),0.391504,0.41308,0.697287,charge,electric
823,charge (price),0.428509,0.353942,0.49877,charge,price
824,charge (rush),0.551191,0.557549,0.591914,charge,rush
942,club,0.774815,0.476734,0.467275,club,
943,club (card suit),0.773094,0.187918,0.492067,club,card suit
944,club (disco),0.863845,0.547812,0.658553,club,disco
945,club (hit),0.725571,0.435103,0.60793,club,hit


#### Replacing the distinct values for the average (column 'word'):

In [24]:
# Calculating the mean of F_Objectivity and F_Subjectivity for each group of "word"
mean_values = df_homonym.groupby('word')[['F_Objectivity', 'F_Subjectivity']].mean().reset_index()

In [25]:
mean_values

Unnamed: 0,word,F_Objectivity,F_Subjectivity
0,Apple,0.940620,0.524376
1,Christmas,0.850793,0.833898
2,Dad,0.856533,0.493834
3,Dame,0.626968,0.300580
4,FALSE,0.156905,0.473624
...,...,...,...
4678,zeppelin,0.864760,0.396531
4679,zero,0.379392,0.315118
4680,zest,0.402894,0.476800
4681,zoo,0.867152,0.507390


In [111]:
## Merging the mean values back into the original DataFrame
df = pd.merge(df_homonym, mean_values, on='word', suffixes=('', '_mean'))

## Checking an example (is the "_mean" values equal for all instances?): 
df[df['word'] == 'charge']

Unnamed: 0,words,F_Objectivity,F_Subjectivity,F_Context,word,distinction,F_Objectivity_mean,F_Subjectivity_mean
819,charge,0.340881,0.330534,0.438418,charge,,0.407655,0.352172
820,charge (card),0.477083,0.293352,0.671798,charge,card,0.407655,0.352172
821,charge (dependent),0.256759,0.164572,0.791042,charge,dependent,0.407655,0.352172
822,charge (electric),0.391504,0.41308,0.697287,charge,electric,0.407655,0.352172
823,charge (price),0.428509,0.353942,0.49877,charge,price,0.407655,0.352172
824,charge (rush),0.551191,0.557549,0.591914,charge,rush,0.407655,0.352172


In [112]:
## Dropping duplicated words (by column)
df.drop_duplicates(subset=['word'], inplace=True)

## Selecting only the columns of interest:
df = df[['word', 'F_Objectivity_mean', 'F_Subjectivity_mean']]

## Renaming the columns to remove the "_mean" suffix
df.rename(columns={'F_Objectivity_mean': 'F_Objectivity', 'F_Subjectivity_mean': 'F_Subjectivity'}, inplace=True)

In [113]:
## Showing dataframe:
print(df.info())
df.head(5)

<class 'pandas.core.frame.DataFrame'>
Int64Index: 4683 entries, 0 to 5552
Data columns (total 3 columns):
 #   Column          Non-Null Count  Dtype  
---  ------          --------------  -----  
 0   word            4683 non-null   object 
 1   F_Objectivity   4683 non-null   float64
 2   F_Subjectivity  4683 non-null   float64
dtypes: float64(2), object(1)
memory usage: 146.3+ KB
None


Unnamed: 0,word,F_Objectivity,F_Subjectivity
0,abattoir,0.512527,0.380603
1,abbey,0.714765,0.240456
2,abbreviate,0.286952,0.171052
3,abdicate,0.144736,0.3843
4,abdication,0.167654,0.334086


In [114]:
## Saving the prepared data:
df.to_csv('../data/df_factors_prepared.csv')

In [115]:
# ### Selecionando apenas as palavras no df_factors que atendam aos critérios:
# df_selected = df.loc[((df['F_Subjectivity'] > 0.75) | (df['F_Subjectivity'] < 0.3)) & ((df['F_Objectivity'] > 0.75) | (df['F_Objectivity'] < 0.3))]
# df_factors = df_selected.copy()

In [116]:
## Generating a list of words from SCA for training.
SCA_words = [word for word in df.word]
len(SCA_words)

4683

In [117]:
## Preparing dataframe for training:
# df.set_index('word', inplace=True)

In [118]:
df

Unnamed: 0,word,F_Objectivity,F_Subjectivity
0,abattoir,0.512527,0.380603
1,abbey,0.714765,0.240456
2,abbreviate,0.286952,0.171052
3,abdicate,0.144736,0.384300
4,abdication,0.167654,0.334086
...,...,...,...
5548,zeppelin,0.864760,0.396531
5549,zero,0.379392,0.315118
5550,zest,0.402894,0.476800
5551,zoo,0.867152,0.507390


### Splitting SCA-Glasgow Norms data into train and test:

In [119]:
from sklearn.model_selection import train_test_split

# Splitting data in train (75%) and test (25%)
train_df, test_df = train_test_split(df, test_size=0.25, random_state=42)

In [120]:
train_df.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 3512 entries, 213 to 1012
Data columns (total 3 columns):
 #   Column          Non-Null Count  Dtype  
---  ------          --------------  -----  
 0   word            3512 non-null   object 
 1   F_Objectivity   3512 non-null   float64
 2   F_Subjectivity  3512 non-null   float64
dtypes: float64(2), object(1)
memory usage: 109.8+ KB


In [272]:
def generateData(df_sca:pd.DataFrame):
    '''Creates a dataset with explanatory variables from word embedding and dependent variables based on the SCA target data.
    Usage example: "X_train, Y_train = generateData(df)"
    Input: Pandas.DataFrame with SCA words.
    Output: X: dataframe with explanatory variables; Y: dataframe with dependent variables.
    '''
    X = {}
    Y = {}
    
    for i, row in df_sca.iterrows():
        word = row['word']
        f_objectivity = row['F_Objectivity']
        f_subjectivity = row['F_Subjectivity']

        try:
            X[word] = nlp_getVector(word)[1]  # Stores the word vector
            Y[word] = {'F_Objectivity': f_objectivity, 'F_Subjectivity': f_subjectivity}
            # print(f'Debug: {word} <=> {nlp_getVector(word)[0]}')
        except:
            pass

    return pd.DataFrame.from_dict(X, orient='index'), pd.DataFrame.from_dict(Y, orient='index')

In [273]:
## Generating data:
X_train, Y_train = generateData(train_df)
X_test, Y_test = generateData(test_df)

In [274]:
## Checking the generated data dimension:
print("Train data dimension:")
print("X_train:", X_train.shape)
print("Y_train:", Y_train.shape)

print("\nTest data dimension:")
print("X_test:", X_test.shape)
print("Y_test:", Y_test.shape)

Train data dimension:
X_train: (3511, 300)
Y_train: (3511, 2)

Test data dimension:
X_test: (1170, 300)
Y_test: (1170, 2)


In [275]:
Y_train

Unnamed: 0,F_Objectivity,F_Subjectivity
argument,0.365722,0.647198
awful,0.201122,0.507171
decorator,0.774472,0.291107
misconception,0.013464,0.474901
crab,0.816438,0.227631
...,...,...
vaccinate,0.678125,0.443751
boastful,0.437815,0.575248
phrase,0.265757,0.144886
ski,0.900524,0.370531


---
### Training a MLP Classifier for word semantic content

In [134]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from sklearn.preprocessing import LabelEncoder
from sklearn.preprocessing import OneHotEncoder
from sklearn.preprocessing import MultiLabelBinarizer

In [276]:
### Model 01: MLP architecture for continuous output:
model = Sequential([
    Dense(256, activation='relu', input_shape=(300,)),
    Dense(128, activation='relu'),
    Dense(64, activation='relu'),
    Dense(32, activation='relu'),
    Dense(2, activation='linear')  # 2 neurons for continuous output between 0 and 1
])

# Compile the model
model.compile(optimizer='adam',
              loss='mean_squared_error',
              metrics=['accuracy'])

In [279]:
# Print model summary
model.summary()

Model: "sequential_3"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_15 (Dense)            (None, 256)               77056     
                                                                 
 dense_16 (Dense)            (None, 128)               32896     
                                                                 
 dense_17 (Dense)            (None, 64)                8256      
                                                                 
 dense_18 (Dense)            (None, 32)                2080      
                                                                 
 dense_19 (Dense)            (None, 2)                 66        
                                                                 
Total params: 120354 (470.13 KB)
Trainable params: 120354 (470.13 KB)
Non-trainable params: 0 (0.00 Byte)
_________________________________________________________________


In [280]:
## Transforming data into numpy array:
Y_train_array = Y_train.to_numpy()
Y_test_array = Y_test.to_numpy()

X_train_array = X_train.to_numpy()
X_test_array = X_test.to_numpy()

# Print the first few elements to verify
print(Y_train_array[:5])  # Print the first 5 elements


[[0.36572243 0.64719766]
 [0.20112169 0.50717064]
 [0.77447234 0.29110657]
 [0.01346386 0.47490132]
 [0.81643835 0.2276313 ]]


In [284]:
# Train the model
history = model.fit(X_train_array, Y_train_array, epochs=50, batch_size=16, validation_split=0.2)

Epoch 1/50
Epoch 2/50
Epoch 3/50
Epoch 4/50
Epoch 5/50
Epoch 6/50
Epoch 7/50
Epoch 8/50
Epoch 9/50
Epoch 10/50
Epoch 11/50
Epoch 12/50
Epoch 13/50
Epoch 14/50
Epoch 15/50
Epoch 16/50
Epoch 17/50
Epoch 18/50
Epoch 19/50
Epoch 20/50
Epoch 21/50
Epoch 22/50
Epoch 23/50
Epoch 24/50
Epoch 25/50
Epoch 26/50
Epoch 27/50
Epoch 28/50
Epoch 29/50
Epoch 30/50
Epoch 31/50
Epoch 32/50
Epoch 33/50
Epoch 34/50
Epoch 35/50
Epoch 36/50
Epoch 37/50
Epoch 38/50
Epoch 39/50
Epoch 40/50
Epoch 41/50
Epoch 42/50
Epoch 43/50
Epoch 44/50
Epoch 45/50
Epoch 46/50
Epoch 47/50
Epoch 48/50
Epoch 49/50
Epoch 50/50


In [285]:
# Evaluate the model
loss, accuracy = model.evaluate(X_test_array, Y_test_array)
print(f"Test Accuracy: {accuracy * 100:.2f}%")

Test Accuracy: 86.32%


### Applying the trained model to predict SCA for a distinct word:

In [316]:
# X_test_array[0]

In [287]:
entry = 'monster'

new_entry = nlp_getVector(entry)[1]
new_entry = np.expand_dims(new_entry, axis=0)

In [289]:
result = model.predict(new_entry)
result



array([[0.73337203, 0.6955369 ]], dtype=float32)

In [290]:
def wordClassifier(word):
    '''Given a word vector, shows the probability for objective and subjective semantic content, respectively.'''
    new_entry = nlp_getVector(word)
    if new_entry:
        vector = nlp_getVector(word)[1]
        vector = np.expand_dims(vector, axis=0)
        result = model.predict(vector)
    else:
        print('Word not existent in database.')
        return
    print(f'--- {word}:\n{result[0][0]*100:.2f} of objectivity\n{result[0][1]*100:.2f} of subjectivity')
    return


In [319]:
trial_word = 'hippopotamus'

In [320]:
wordClassifier(trial_word)



--- hippopotamus:
98.58 of objectivity
33.37 of subjectivity


In [321]:
df_factors[df_factors['words']==trial_word]

Unnamed: 0,words,F_Objectivity,F_Subjectivity,F_Context
2387,hippopotamus,0.973593,0.377959,0.309328


----
### Training a model for multilabel classification:

In [None]:
# Define a new MLP architecture
model = Sequential([
    Dense(256, activation='relu', input_shape=(300,)),
    Dense(128, activation='relu'),
    Dense(64, activation='relu'),
    Dense(32, activation='relu'),
    Dense(2, activation='softmax')  # 2 neurons for binary classification with softmax activation
])

# Compile the model
model.compile(optimizer='adam',
              loss='binary_crossentropy',  # Use categorical_crossentropy for categorical data
              metrics=['accuracy'])





In [None]:
# Como converti a saída em dados categóricos, é preciso antes utilizar OneHotEncoder:
# Use categorical_crossentropy for categorical data

#### Binarizing Y_train and Y_test
Once we run the first MLP model, the performance wasn't over 54%. 
In this Section, we will binarize the semantic factor values following the median values.

In [None]:
# Binarizing through list comprehension
Y_train['F_Objectivity'] = ['high' if f_objectivity >= 0.565 else 'low' for f_objectivity in Y_train['F_Objectivity']]
Y_train['F_Subjectivity'] = ['high' if f_subjectivity >= 0.392 else 'low' for f_subjectivity in Y_train['F_Subjectivity']]

Y_test['F_Objectivity'] = ['high' if f_objectivity >= 0.565 else 'low' for f_objectivity in Y_test['F_Objectivity']]
Y_test['F_Subjectivity'] = ['high' if f_subjectivity >= 0.392 else 'low' for f_subjectivity in Y_test['F_Subjectivity']]

In [None]:
# Binarizing through list comprehension
Y_train['F_Objectivity'] = [1 if f_objectivity >= 0.565 else 0 for f_objectivity in Y_train['F_Objectivity']]
Y_train['F_Subjectivity'] = [1 if f_subjectivity >= 0.392 else 0 for f_subjectivity in Y_train['F_Subjectivity']]

Y_test['F_Objectivity'] = [1 if f_objectivity >= 0.565 else 0 for f_objectivity in Y_test['F_Objectivity']]
Y_test['F_Subjectivity'] = [1 if f_subjectivity >= 0.392 else 0 for f_subjectivity in Y_test['F_Subjectivity']]

In [None]:
# Convert multilabel categorical labels to binary vectors
multi_label_binarizer = MultiLabelBinarizer()
Y_train_encoded = multi_label_binarizer.fit_transform(Y_train)
Y_test_encoded = multi_label_binarizer.transform(Y_test)

In [None]:
len(Y_train_encoded)

2

In [None]:
Y_train_encoded

array([[1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1],
       [1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]])

---
### Choosing outperformed model through PyCaret:

In [322]:
import pycaret.classification
import pycaret.regression

> Adjustin Y_train for use with PyCaret:

In [148]:
df = X_train.copy()

In [149]:
# Definir uma função para mapear os valores das colunas para os rótulos desejados
def map_labels(row):
    if row['F_Objectivity'] == 0 and row['F_Subjectivity'] == 1:
        return 'Latent'
    elif row['F_Objectivity'] == 0 and row['F_Subjectivity'] == 0:
        return 'Contextual'
    elif row['F_Objectivity'] == 1 and row['F_Subjectivity'] == 0:
        return 'Manifest'
    elif row['F_Objectivity'] == 1 and row['F_Subjectivity'] == 1:
        return 'Perceptual'

In [154]:
# Aplicar a função de mapeamento para criar a nova coluna "Target"
df['target'] = Y_train.apply(map_labels, axis=1)

In [151]:
## Adding F_Subjectivity and F_Objectivity to df:
df['F_Subjectivity'] = Y_train['F_Subjectivity']
df['F_Objectivity'] = Y_train['F_Objectivity']

In [152]:
df['target'] = Y_train['F_Subjectivity']

In [155]:
# Exibir as primeiras linhas do DataFrame resultante para verificar
df.head(10)

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,133,134,135,136,137,138,139,140,141,142,143,144,145,146,147,148,149,150,151,152,153,154,155,156,157,158,159,160,161,162,163,164,165,166,167,168,169,170,171,172,173,174,175,176,177,178,179,180,181,182,183,184,185,186,187,188,189,190,191,192,193,194,195,196,197,198,199,200,201,202,203,204,205,206,207,208,209,210,211,212,213,214,215,216,217,218,219,220,221,222,223,224,225,226,227,228,229,230,231,232,233,234,235,236,237,238,239,240,241,242,243,244,245,246,247,248,249,250,251,252,253,254,255,256,257,258,259,260,261,262,263,264,265,266,267,268,269,270,271,272,273,274,275,276,277,278,279,280,281,282,283,284,285,286,287,288,289,290,291,292,293,294,295,296,297,298,299,target,F_Subjectivity,F_Objectivity
argument,-2.3992,-0.31061,0.16248,1.1939,4.553,2.608,2.3816,4.3793,-6.4059,-2.8989,6.9065,3.6357,-3.4818,-3.072,-1.5625,4.4574,2.4062,0.61288,-2.0203,1.854,-1.2827,-0.86692,-2.2344,-0.20293,-0.98764,-2.5703,-0.42565,-0.67371,-2.9512,2.5231,3.6174,2.046,0.93659,0.80884,-1.8359,-4.1538,-0.77178,-0.91474,0.3574,2.4311,-2.8427,-4.3941,0.18871,1.0475,-0.79925,-1.5843,3.4804,-2.8958,-1.4625,0.56112,-2.8675,2.7701,2.3915,-1.9063,-2.2535,-0.62433,3.1455,1.222,2.2854,0.36479,3.0918,1.6108,-1.6584,-1.6451,0.65175,2.8537,-3.2931,-4.5797,1.7337,3.352,1.7681,1.599,-5.0516,1.6644,-4.3692,1.1405,-3.9987,5.0947,-0.79874,-0.6081,-3.2158,-0.42495,1.4047,2.5423,0.58327,2.5293,-3.5585,-2.1892,4.4176,1.6439,3.4725,2.232,5.6429,-2.5572,3.2299,-2.3217,0.044789,3.1062,2.8293,-2.2333,3.6981,3.2175,4.477,3.1264,-0.69679,3.0372,3.2599,-4.1551,1.0466,-2.3053,0.066955,-0.96005,-0.48711,1.0598,1.9121,2.154,-4.6148,-0.60629,0.35795,-0.86739,-0.40956,-5.4357,0.59216,-1.7533,-3.3679,0.39749,3.545,-3.5528,0.71102,-4.57,-4.5825,-1.8462,3.9507,0.42573,0.61037,0.72052,0.78121,2.5482,0.79837,-1.8534,-1.4698,-0.71325,-0.21927,1.6808,1.2657,-0.95549,-4.6534,-0.4225,-0.65577,3.7836,0.58572,4.7582,-1.2812,1.6873,-1.4343,5.1048,1.8411,-0.33209,-2.8453,-4.3376,2.2446,0.060355,-0.28312,2.1109,-0.21476,-2.0898,-2.9909,1.6846,1.2215,-1.663,-0.2914,-0.15043,-0.089668,-1.3618,4.2523,1.0499,-0.83556,3.3452,-2.7199,-3.494,2.8196,3.0722,-0.12998,1.6373,-1.9782,2.9238,-2.1324,-1.1832,3.4495,2.6386,-2.6228,-3.0572,0.77354,1.6173,2.1261,-3.067,-0.84982,3.683,1.6198,6.2091,-2.4882,0.70562,0.36068,-0.85727,2.0703,-0.057408,-0.63836,0.62888,-0.26941,-1.8637,-2.4216,-1.4942,-2.671,4.4052,-0.89783,1.8478,1.4274,1.1662,4.0038,2.2062,-3.7706,-0.94775,0.081936,-0.052859,-1.1466,0.97386,1.6578,5.1659,1.9735,-0.10786,1.4671,-4.1792,1.5281,0.1311,1.1956,0.49311,2.8842,1.0306,2.3504,-2.6875,-1.0097,1.2478,1.2949,4.5648,0.51724,0.52477,-2.0162,2.0893,0.60699,1.5926,1.0539,-4.595,-3.701,-0.75894,-0.64485,-4.1829,-1.9371,-0.26863,0.26782,-0.63142,-2.1099,1.1534,1.6628,4.7483,0.86838,0.88791,4.31,4.3719,-3.0734,-1.1162,-0.31119,-1.4985,-1.2099,0.359,3.4704,-0.40592,0.012269,-1.6215,-1.3837,4.2299,1.4631,0.48673,1.7178,3.7604,4.8459,1.2913,4.031,-0.37738,-3.634,0.84509,3.235,-1.7311,1.3996,2.051,-4.2522,1.0911,3.7819,-0.92356,-1.8916,3.3504,Latent,1,0
awful,-0.33203,-0.3522,-0.011708,-0.88964,-0.75291,1.8457,0.62379,1.0119,2.1302,1.7795,1.2335,-1.2077,-1.6876,0.33506,0.37671,0.83856,0.031083,-4.4312,-0.83196,-1.0364,-1.2641,1.848,-0.28883,-1.5275,0.73359,-1.5575,0.28682,-0.65072,-0.7927,1.7292,0.32438,-0.93549,2.1866,-0.79948,-1.1394,-3.9373,-0.99964,-1.9653,1.9457,4.2572,-0.8012,-0.56891,-1.0241,-4.0848,-5.5438,0.4382,-0.082399,-4.6469,-2.4376,2.1422,-0.80818,-2.2621,3.8545,-2.4708,-1.7014,1.7238,1.5033,0.32218,-1.2073,0.41837,0.11265,0.39928,1.0922,-1.8873,-5.8734,-1.3336,-2.49,-1.3867,-1.2559,-1.1797,2.5552,1.7587,-1.9658,0.065817,1.1824,0.97211,-0.6205,0.44542,0.92654,1.3347,0.74309,1.5598,1.817,-1.1325,-2.7145,1.5573,-0.29974,-0.84252,2.1585,-1.295,-1.2291,-2.2871,-0.085077,-3.6376,-1.6964,-0.69068,0.93347,0.28267,-0.34476,-2.1725,-1.4491,1.3936,0.1783,1.5847,-3.98,0.54971,-0.37694,1.6987,-1.978,2.3775,-1.3384,-3.1121,1.7957,-1.1368,-0.49529,1.629,-2.4188,2.5688,2.2806,0.1688,-0.40327,0.6983,-4.5009,4.1832,-0.55077,0.054487,-0.59604,0.87615,-1.5814,-1.5783,1.6821,4.7371,-1.1554,-2.0906,0.3265,2.5854,1.3447,0.16899,1.9046,-3.2121,-3.2308,-1.037,0.58301,2.3261,-5.8928,0.38668,0.40396,0.6546,1.1612,-1.4183,0.32217,0.82264,-2.0215,1.3695,-2.7139,2.8976,2.1415,2.3856,-0.9723,0.96908,1.2456,-0.26443,-1.9519,0.051155,-1.987,0.65262,3.9224,-0.29806,-1.2094,3.4512,1.473,0.21217,2.3084,-4.0059,-2.395,-2.8058,-1.6577,2.8943,3.2329,-0.91901,-0.37853,1.1244,2.9871,1.3323,-0.92495,0.23867,-2.9782,0.13664,2.3691,-1.6737,-2.3126,0.50444,-0.86522,-1.8385,-1.9724,-4.2468,-1.9862,-0.92723,-0.16031,0.90947,-0.82526,1.7251,0.051674,-2.0646,-2.9562,1.9119,2.2549,-0.18586,-0.42561,0.40343,-1.3311,0.57066,-0.44766,-1.3727,-1.8881,-1.8829,-2.9078,1.7616,1.5483,-2.2205,-0.28344,-1.3311,-0.059834,3.8593,1.2231,-0.0147,-3.2513,0.46675,-1.0193,0.27312,-2.5954,-1.9974,3.3218,0.074786,-0.7847,0.012676,-0.83699,3.1354,-0.92994,0.1729,0.37295,-1.1619,1.3987,0.62199,-2.9019,-1.4288,-0.070483,-1.0229,-1.2622,1.1389,-1.6718,3.0847,-3.7988,1.9069,0.7855,-3.1037,-1.1206,1.8812,-0.89774,1.7879,3.1563,-0.67044,0.604,-0.74343,-0.13245,1.9818,1.4718,0.23751,-1.756,-0.94157,1.3824,-0.013683,-1.5881,1.7418,-2.3436,1.6381,2.5274,-1.5634,2.2981,-1.798,-1.6546,-2.3959,0.46843,0.99801,1.7397,-1.9655,3.3896,-0.55801,-0.75166,-0.4585,-0.33523,-0.37922,4.5423,-2.3235,-1.3455,-2.0702,0.20349,3.63,1.0342,1.6829,Latent,1,0
decorator,-4.1386,-3.1015,-2.3938,-1.231,-0.20878,-3.9616,0.000133,1.2154,-0.7785,4.8967,4.6354,0.25068,-3.1679,1.7419,3.6225,0.49026,0.04773,3.9378,-0.35841,-2.4302,-1.5988,-0.020996,1.0556,3.4888,-1.6606,0.7027,-4.4183,-0.22423,-1.404,-3.2849,0.30462,-1.9961,2.2648,-0.64048,-1.9628,2.4705,1.264,0.27926,1.726,-0.9893,-1.4099,-2.0769,3.544,-0.39312,-2.4564,0.75642,-1.4308,-1.3723,0.48491,-0.73407,-1.7195,2.1652,1.165,-1.0638,-2.987,1.4789,-0.13572,-0.41703,0.25105,-1.4597,-0.014275,-2.8683,-0.30213,-2.4969,-0.70024,-2.5352,-0.99733,-2.2389,-1.1097,0.57388,-2.2268,-0.81113,-2.3714,1.4812,3.1252,-0.3127,0.97177,-0.68518,-0.18344,-1.3845,-0.98578,-1.6648,-0.58721,-1.8918,-0.90744,-0.50375,1.9869,3.0689,-1.6181,-1.1639,-2.7764,1.0395,1.7028,-2.0478,3.119,-2.6577,4.217,-0.88798,0.50361,0.24387,-2.4982,-1.1432,0.86359,0.58194,1.0584,1.3055,-0.97641,0.24125,3.9932,-0.97158,1.3091,0.77322,0.42159,0.75759,-2.7845,-2.2285,1.3547,0.15916,1.37,-2.327,-1.4164,2.1623,0.47771,1.7667,4.5932,-0.92376,-1.7562,-0.83212,5.2864,-0.7798,-1.9111,1.7821,-0.20666,-4.1798,0.37562,-2.3209,0.69554,-2.982,2.3817,1.5393,0.42728,2.9439,-1.1859,0.38971,3.1219,-0.89303,-2.5645,-0.035272,1.3756,-1.8025,0.86336,-0.94475,-0.53347,-0.32559,0.94793,-2.7279,0.87363,0.27429,0.68351,-2.7655,2.0413,-1.9574,2.7513,-0.91174,1.2906,1.8918,-4.4985,-2.9007,-1.0319,0.038302,0.6212,-1.6631,0.20181,1.2056,1.642,0.30736,1.3917,-1.7526,-1.3786,-1.4609,-1.4873,0.95038,-3.1008,-2.8572,1.4541,-0.70981,3.7476,-1.2609,-2.7944,3.4474,0.94558,-0.54897,-1.9714,1.9329,-0.28302,2.7275,1.3642,2.6148,5.4589,-1.3626,3.5898,-2.922,0.5044,-0.21339,-0.45199,-2.4134,-1.1713,1.0255,1.1701,-1.5612,1.5171,-0.048064,2.6453,3.546,-0.010302,0.45441,3.3834,-1.7095,-1.4317,1.0584,3.4095,1.3125,-2.1436,2.8298,-0.96006,-1.7471,2.0353,2.6907,1.5716,1.2965,-1.5845,1.2718,-1.0468,1.0376,-4.0034,-1.697,-2.6232,-1.3854,1.9864,0.70325,-1.2446,2.1575,0.95457,1.7929,2.8269,-3.7791,0.25697,0.070994,-4.4222,2.7658,0.2541,0.13624,-2.5759,-2.7518,-1.2851,1.6678,0.51108,1.2275,-2.1805,-3.1717,-0.35066,2.2748,-2.3825,-1.2273,-0.024748,0.44043,1.3198,1.6581,-3.0111,0.53332,-0.081214,1.185,-3.5595,-0.49396,-1.608,-1.6824,-1.6511,2.8946,-1.3568,2.4459,-0.19233,0.1483,-0.14696,2.2328,5.9329,-0.84719,-1.3155,3.2719,-2.6182,1.6468,-0.68108,1.7715,0.45993,1.2345,-2.6731,-0.080917,-0.17837,0.10582,-2.1597,-0.78127,Manifest,0,1
misconception,-1.4402,-0.65446,1.4217,-0.39426,2.4413,1.2243,3.4867,3.9112,-1.8492,-0.8338,5.1676,0.86987,-1.9083,-0.31838,0.43387,3.0635,2.5631,1.4277,-2.3653,0.17331,0.11683,2.0736,-3.4689,1.2091,-1.9544,-2.7962,-1.2776,-0.51866,-2.1115,1.3227,1.4151,-0.012075,-1.1209,-1.7492,-2.2638,-0.74907,0.69087,0.06555,0.039321,-0.48229,0.36317,-0.8468,-1.3201,0.32879,-3.1619,0.33472,2.2814,-2.2169,0.88499,1.0909,-1.7011,1.191,-0.39597,-2.0544,-1.559,1.1961,0.93411,1.8918,0.77402,1.4895,0.063936,0.77872,-0.73827,-0.33916,0.36916,0.17412,-1.8379,-5.0217,1.6003,3.2665,-0.16008,1.0169,-2.3414,1.0779,-3.2839,1.1322,-2.1571,1.1552,-1.6779,-0.063517,-1.9009,1.266,1.6506,0.56655,1.6223,0.6485,-4.2968,-2.347,1.7901,1.047,1.3449,0.47285,2.6631,-3.5844,0.1274,-0.72851,-0.5126,0.8937,2.0055,-0.12694,1.384,2.2943,2.5281,1.6349,-0.17525,4.5608,0.28487,-1.1896,0.98215,-2.406,0.5531,-0.084463,-0.16912,0.65434,0.27161,2.6443,-4.8506,-1.3368,0.15755,-0.63597,-1.2589,-2.0001,-0.17487,0.20887,-1.9063,-2.197,0.34965,-3.1823,2.2248,-2.9995,-3.9624,0.38309,3.677,0.93066,-1.8817,-0.28573,-0.2224,-0.4528,1.749,-1.1686,-0.61897,-1.2477,0.51393,1.5266,1.5007,-0.78604,-5.0657,-1.3547,0.014334,2.572,1.7036,1.3756,-0.83479,0.49078,-0.94801,1.0211,2.2587,0.4133,0.33318,-2.2485,0.8179,-0.44951,2.3934,1.4027,-0.92554,-2.6183,-2.7874,0.46414,1.5608,-0.99683,-1.9825,-1.4086,1.5608,-0.20157,2.2863,2.3746,0.2102,1.6613,-1.8168,-1.8884,-2.3221,0.338,3.5442,0.17021,-2.1183,1.2442,-4.5057,-2.297,2.7645,-0.59,-2.9532,-0.53757,1.1516,0.22778,1.8715,-0.58833,-3.2131,1.7799,0.2306,1.7487,0.30053,-0.91628,-1.5132,-0.56853,3.4144,0.67373,-2.3471,-0.4056,-0.77719,-2.7197,-0.55854,-0.44305,-2.018,1.6621,0.31626,2.2798,-0.019118,-3.1911,2.6161,-0.22491,-2.0511,0.1054,0.15916,-0.21171,-3.1359,0.24266,0.63316,3.1142,3.0083,1.0304,3.2249,-2.129,0.88666,1.3206,1.4633,0.52763,-0.14561,1.048,1.5947,2.4876,-1.0903,2.0532,2.1596,1.6949,1.0212,-0.024739,-1.2934,0.79863,-2.2456,1.8509,-0.57083,-2.7462,-3.6962,-1.1295,1.5435,-1.164,0.57704,-0.16744,-1.0351,-0.98163,-0.7997,1.0689,4.2378,3.0994,0.34475,0.84469,-0.054672,3.0686,-2.4895,2.0819,-0.60857,0.26739,2.0732,-1.3259,1.8659,-0.41704,0.65279,-2.4071,-1.3299,2.6432,1.0332,-0.08317,1.5587,-1.6429,1.7027,0.51001,2.03,0.98399,-0.32521,-0.73525,2.6954,-1.2421,2.6301,-0.89313,-0.80961,0.53661,2.653,-2.677,-2.5539,3.2993,Latent,1,0
crab,-0.29427,-3.7722,-0.70715,0.25983,1.1896,-4.6194,-3.1746,3.5919,-2.7857,2.0993,5.1909,-2.9512,4.8228,2.4383,2.7648,-6.8133,1.2498,1.5006,2.3022,-3.0483,0.36441,1.4081,0.2072,-1.0621,3.856,-1.655,-2.6829,1.2367,1.147,-0.44072,-1.8968,-3.5897,2.8847,-1.0354,4.1177,-2.9036,2.1296,-1.4676,1.7176,0.3518,0.94584,-1.8373,1.6568,2.3472,1.336,0.36764,-0.066217,0.026254,-1.3419,-0.54964,-2.2419,4.5371,1.8795,-1.1457,-0.97683,-3.3804,-2.9459,1.4787,3.6315,-1.4301,2.2153,-2.654,4.4665,4.6551,-1.0925,-3.4833,-3.3094,1.8197,1.0144,-0.83145,-1.4881,-2.9439,2.0533,2.0508,-0.33346,-1.1789,-3.0011,-5.8109,2.9063,-1.8477,1.8378,2.5305,2.2667,0.56153,-0.744,-0.9307,6.2968,0.41122,-4.4369,-1.893,7.9089,-0.12312,1.2284,-2.9929,-0.86969,1.3083,3.6287,-2.3695,-0.57882,-3.6461,-1.0322,-2.6258,0.012072,-4.2169,-2.1101,-0.88852,-5.93,5.0993,-1.0264,-1.1267,2.0179,2.9652,-0.76725,0.52211,-1.5886,1.9468,3.9383,1.2072,-2.6141,-1.2892,-0.85353,5.0776,-7.4852,-0.99613,-4.8849,-0.11981,-0.43466,-5.6086,2.0115,2.623,1.0902,-0.068215,3.4199,-1.1515,4.626,-2.5621,-3.0781,-2.581,-7.8281,-4.7115,-5.977,-2.6534,-3.8619,-1.5465,1.2815,-1.4557,-0.57384,2.7916,-4.704,-5.4503,-0.46227,5.7129,1.221,-3.0806,3.5463,-3.199,1.6612,-0.46012,-2.2152,-0.22702,-0.86561,-2.1312,-0.17625,-3.0669,-2.314,-2.9181,-0.54938,1.9334,2.5295,1.8297,2.2901,0.73415,0.081001,-1.2242,-4.2767,0.76178,-0.061992,-4.3725,2.7237,-0.17234,0.30793,-0.28302,1.2182,2.7848,-0.65654,0.28948,1.6417,-2.6799,-1.3383,0.13474,-2.311,0.55091,0.29671,-1.239,0.37136,-1.3171,-1.0493,0.99578,0.63019,-2.4233,-0.031176,0.99886,1.9838,3.1585,0.64745,-2.3745,0.064163,-1.466,1.1143,-0.34595,3.8584,5.0711,-0.055536,-2.4047,1.3484,-0.22253,4.4948,1.0491,-1.1675,-3.1552,5.7374,-3.4235,1.7186,2.8864,-0.40758,-6.4238,-2.595,-2.3009,1.6254,3.1015,2.7358,-1.5354,3.0235,-0.8343,-3.4694,-0.31298,-1.1528,0.83032,-2.0859,-1.8289,-1.7176,-4.3441,1.5275,5.9588,-3.1113,0.42588,2.7929,-1.1499,-1.5478,-1.7938,-1.8773,-0.66235,0.52911,-0.1756,-1.5163,-2.8854,4.7417,9.2722,-1.8559,2.9054,1.9735,-0.069534,0.75262,0.87348,-5.2076,-0.63884,-1.3027,-3.7327,-4.3943,4.9316,3.5591,-0.11526,1.0412,4.1393,0.55631,-4.3276,3.124,3.0651,1.5307,0.5209,0.91262,-0.33345,-3.4183,-0.089182,0.59738,1.8521,-1.3994,-2.9822,-2.7877,1.508,3.998,-2.5987,7.186,-0.18771,-1.6689,1.5884,0.81274,1.517,-2.0713,2.9804,Manifest,0,1
slack,-0.8903,2.5954,-1.4784,2.9799,-0.22046,1.2561,-2.2329,1.5948,-2.6639,-2.4245,0.41425,3.808,0.66122,-1.3428,2.3146,-0.11182,2.5034,1.8001,0.18106,0.94973,2.5664,1.5234,1.5861,-5.8773,2.2164,-2.4085,-1.5474,-1.7697,-0.47438,0.91776,-1.9555,-3.2811,1.4936,1.1842,0.28826,0.3609,0.50114,1.3362,1.8242,3.8384,4.1685,-1.8755,-1.844,-0.73599,0.26254,0.93965,1.7538,0.3011,-1.8249,2.1807,-0.9006,0.10381,0.82836,-0.17692,0.49856,0.46803,0.28309,-1.4599,1.0971,-0.13214,1.3233,-1.9648,-0.023416,-2.6204,-1.4012,-0.71628,0.5118,-1.8845,1.0451,1.7601,0.54192,-2.0165,0.59448,0.22698,-0.44282,0.95428,-0.36659,-0.86948,2.3956,-1.0599,-3.4164,-0.52142,-2.6785,0.29957,3.1993,-0.039422,-2.0735,0.44614,4.1061,1.4386,0.42342,-0.49562,0.42647,-1.0925,0.89019,-0.83806,0.63935,-1.102,1.1813,-2.5209,2.5081,2.4966,-0.4641,1.1914,0.11763,-0.29394,-2.0839,-0.41003,-0.070168,-2.8342,2.5002,-4.1873,0.88369,0.81094,0.66169,1.6059,-1.834,-2.3441,2.964,0.002939,-0.2914,0.43373,-1.51,-2.2681,-1.5034,-0.67508,-1.7825,3.6395,1.6102,0.24247,-2.2217,2.2085,3.8143,3.3068,-0.99312,3.1788,-0.8643,-3.4111,1.5183,0.62223,1.9671,-0.95848,2.1614,-0.21469,0.89678,-0.024023,0.40798,-0.41839,0.58291,-1.385,-6.2618,0.45302,0.33743,1.5306,0.78857,1.3755,0.095243,1.153,0.74797,-1.1455,-0.2259,-1.9771,2.1955,1.1756,-2.1415,-0.3243,-4.086,0.28695,-2.6816,1.8983,0.077645,0.67917,1.8373,3.138,-2.6342,-2.4456,-0.775,-2.5607,1.0454,0.64258,-2.5356,1.0291,1.8934,0.22673,-0.45322,0.28502,1.0087,-0.51799,0.30775,-0.15162,0.72072,-0.47759,2.8986,-1.1608,0.66712,-3.6739,-3.3189,0.66693,-0.2114,0.67098,0.089591,0.31114,-1.4788,-0.93713,-0.52022,1.6745,-1.6608,0.61151,1.0716,-0.92285,-2.2407,1.9831,1.4997,-3.2467,-2.0687,-0.74996,1.0539,-4.1746,0.0134,0.25335,0.015917,-1.9932,1.4343,2.6578,-0.51555,-2.5133,2.0605,1.4505,1.0183,1.7249,1.301,-0.14663,1.6317,-4.0557,0.695,-2.1324,0.63212,-0.26903,1.4962,-2.3066,0.092501,2.1119,-1.3166,-1.1616,-0.4525,-0.6486,0.67535,-0.34923,1.3296,-0.72564,0.59667,-0.92969,0.21703,0.35521,1.8624,-2.9266,-0.33166,2.3685,2.3753,1.8406,3.5168,0.096914,2.0623,2.035,0.72157,-3.3915,-0.71025,-4.1361,0.14886,1.4299,0.082345,1.759,2.0764,-0.98032,-3.1572,0.33557,-1.1114,-0.91674,-1.6428,0.96515,-2.5633,1.1287,1.0855,1.3941,1.7328,-2.037,1.0043,-1.3566,-0.72758,0.99147,-2.9325,0.9988,5.3997,-1.544,-0.46333,2.8462,-0.49473,-0.52168,-3.7121,-1.3846,Contextual,0,0
disco,2.392,1.2872,0.26181,-2.5414,2.6851,-1.0966,0.33368,1.836,-4.1653,-2.3493,5.1199,-2.9307,-1.3718,1.8979,0.12346,-0.81259,-1.6832,2.8336,-0.70751,1.5079,0.57596,3.1794,-3.0267,-4.0731,-0.68806,-1.5667,-3.4247,-0.64155,1.6498,1.0278,-0.082309,3.4059,-2.108,-0.46739,1.2023,2.4861,-1.7816,0.61137,1.6514,-2.8592,-0.65683,2.1383,-0.70105,1.7965,1.3895,-0.067563,-6.6849,3.2178,2.2218,4.8262,0.0115,0.97408,-2.2196,-1.3517,-1.5365,0.14408,2.1851,1.24,1.6643,1.9936,4.2995,-1.2598,-0.82626,-3.5864,0.077077,-1.0027,-2.6029,-0.068453,-2.2732,5.4021,-2.8346,-2.4617,-2.2899,-0.50964,-0.47589,3.1139,0.25853,1.8126,0.023456,1.9935,0.15922,1.7447,3.581,-0.7445,2.1538,-1.7238,2.4671,-3.5263,0.7862,-1.421,-0.68775,2.3205,1.9238,-3.3133,1.5032,2.3692,6.1574,-5.11,0.78186,-3.4755,-2.7255,1.438,0.57636,3.3933,-1.0392,3.6632,-0.038298,1.4944,-2.8476,-0.35035,0.32608,-1.6733,-1.5284,-0.3039,0.34898,1.1292,-6.4067,-3.1597,-0.4512,0.9755,0.15026,-0.31235,2.0106,4.0536,-2.514,-2.237,0.053691,-7.8374,-1.1089,3.203,-4.7866,3.594,4.856,0.57031,-0.49048,-0.79287,-1.6776,-6.0111,3.6505,-1.3245,2.0943,-0.024907,-1.66,-2.1225,1.0841,-4.0856,-1.9516,0.50204,3.2221,3.2578,-2.1051,-2.753,0.36353,4.1758,0.17913,4.1322,3.5979,3.2368,-0.75075,-3.4694,-1.1615,0.20023,-1.0547,-1.4875,0.37853,-1.8034,-4.8843,-1.8492,1.3195,-1.2784,0.12384,-0.26376,3.4097,-0.19853,0.5242,0.3811,3.3499,3.0442,-2.9601,-3.1561,-0.49786,-1.8495,4.2477,-5.67,-0.63822,0.83123,1.2017,-3.4364,0.81451,-0.17023,-4.4082,-1.4109,-0.65497,-2.7259,3.9794,-3.723,-3.3726,-0.45039,-3.5694,-1.0233,1.2494,0.81303,1.5016,-1.2414,0.97507,0.52745,-3.0035,0.20906,-1.1532,-5.4726,2.4839,-1.4425,2.3797,1.1145,1.9978,0.69081,2.953,-0.27592,-0.32147,0.67161,-4.7206,-1.2597,-4.106,2.4742,-4.1514,0.79341,1.6187,2.5484,0.46811,1.5177,2.5344,-2.1564,-1.3625,2.6035,2.2756,-0.28145,1.5235,5.4766,0.21824,0.055679,-4.5548,-1.2157,-2.1333,3.187,-1.6437,2.8823,-2.4073,-0.096027,-4.5948,0.12474,0.55114,0.097157,-5.3848,0.34617,-2.6227,0.38416,1.4138,3.0809,1.8772,2.3589,-0.4215,3.722,-0.75095,0.36352,0.54589,1.4899,-0.55099,-0.53149,-0.1427,-0.82555,0.793,-0.21669,-0.94276,-1.146,-0.15985,0.39349,4.8305,0.16846,-1.9319,-1.419,-2.3323,-1.0841,-0.95217,1.9655,3.0157,-1.9716,-2.4958,-3.4154,-2.7819,-0.77876,3.8638,-1.9264,-0.31104,0.1151,-4.0921,-0.84042,-1.099,2.5453,-4.1871,2.9975,Perceptual,1,1
battery,-1.7446,4.4681,-3.2095,1.1895,3.0722,-0.81434,2.0602,4.3548,-3.8731,-0.15324,4.8957,1.4782,-7.8442,3.3315,-1.4291,1.3699,5.2786,3.9345,-1.3713,-0.027716,1.7224,3.5122,-2.441,-0.55226,0.14303,-2.9811,-4.9281,-7.2853,-0.39962,3.4887,0.61495,-1.8036,-1.6782,0.75166,-1.5183,-0.14718,1.9124,3.331,2.7737,2.9954,2.754,-4.0085,3.1187,5.9124,-1.6791,0.008456,-0.14439,-0.061056,1.1743,-3.3582,3.1204,1.4875,-0.3623,-1.0858,0.39747,-0.57418,0.82755,0.23305,1.0163,-0.64763,-0.83047,3.671,-5.1769,-8.3713,0.88403,-0.61946,-4.662,-0.59814,-0.63216,2.3605,1.0159,0.51678,-1.0843,1.4965,-2.7525,1.4828,-1.1879,-0.37949,-1.8958,-1.675,-0.9198,-0.69312,-1.1844,-1.9014,-1.1055,-2.8573,1.7177,-1.1353,-0.25151,2.8281,-5.3294,2.541,4.1808,-1.7198,2.2068,0.35714,3.7836,4.4826,-2.3571,1.163,-1.5634,-2.3403,1.2256,1.5629,-0.59648,3.7569,-4.693,-4.5817,4.0695,0.62165,-1.0169,-1.4923,0.081439,-2.2022,-0.45925,2.8678,0.13359,1.3665,3.3675,3.0503,-0.29398,-4.3389,-2.084,0.10162,-2.2879,-3.0491,2.0271,-3.0822,4.7464,-2.8623,-2.89,-0.25572,3.2507,7.0021,-0.46029,-0.082138,1.2979,0.25265,1.993,3.5598,4.0458,-4.0581,-2.5271,-0.33137,1.741,-1.9426,0.42614,-0.19772,-0.92785,4.5063,-2.2368,-1.311,3.9707,-1.0485,1.4044,-3.791,2.4133,-0.53487,-0.88329,0.016593,-2.9697,-1.1288,3.1805,-1.4169,-2.2311,-0.069124,-2.1741,3.2901,3.7142,1.7446,-2.0838,3.0192,-3.4482,0.991,-0.14516,0.17282,-2.5933,-1.1562,1.3318,-1.8616,1.1135,2.9308,2.1158,-0.76174,-2.0171,-1.586,-3.9565,-1.7537,-2.4417,-0.48298,1.7529,0.42727,0.76746,-0.46785,-1.3524,-1.5915,3.4221,-0.69862,1.0942,-2.9,-2.4363,-6.029,3.7453,-0.57933,-3.2859,2.6528,-3.0118,0.11188,-0.8651,-1.1028,2.3109,1.7844,-3.3536,4.2815,-4.0696,-0.031581,3.8806,-3.0563,-1.6979,0.8524,-3.142,1.038,-0.53821,-2.8271,0.81732,-4.6438,-6.3701,-1.4559,-0.15776,-3.2349,0.43719,-2.4026,1.9699,1.7802,0.086858,2.1576,-5.6018,-1.6964,1.6517,-1.0947,-2.5703,-1.824,1.0211,0.95648,-0.44163,-1.5313,-1.4751,4.86,3.1683,5.0971,4.221,-0.23262,-2.4343,-0.41505,-0.76286,-1.8082,0.71051,-0.89785,-3.5709,1.1067,-0.93633,7.8361,0.10651,-0.37391,0.72862,2.839,-1.608,2.3615,0.052349,2.235,-1.5802,-4.096,-2.5441,0.63631,-3.4063,-1.7697,2.4638,-2.6599,1.7518,0.43995,3.1064,-1.0953,1.4623,-1.417,7.3607,-0.89796,-4.2763,2.4707,-2.7437,3.313,0.75275,-0.47947,0.36715,-1.762,-2.4975,4.3208,1.5464,-1.6617,-0.6762,2.4541,Manifest,0,1
tsunami,1.056,-1.7829,-0.78786,-2.3121,-1.7645,-0.75033,0.27454,1.1699,-0.79019,-1.4246,-0.64655,-3.433,-0.87662,2.4594,1.8321,0.11747,0.74306,-0.55652,-0.88385,-0.054145,2.285,4.2267,0.46698,-0.9867,0.19035,0.017541,-0.58131,-4.5742,0.50023,-0.51335,0.377,-1.4814,-0.58551,-1.2259,1.3063,-3.5637,-4.4114,-0.53042,3.8432,1.791,-3.6484,-2.5059,-1.435,1.7601,-0.82274,0.80344,-2.5871,-2.9217,0.083976,1.9096,1.0125,1.6624,3.7825,-2.2997,0.35166,0.65544,-0.3718,-1.6329,2.029,3.9725,-1.0586,2.6982,-1.8641,2.2067,1.5841,2.7721,-1.4962,1.2729,2.3829,0.64442,-0.66518,1.6778,-3.5215,1.2681,-4.4363,1.8096,4.5358,-2.496,-1.0822,2.0668,-0.29369,-1.435,1.0777,-1.014,2.7926,-1.2829,-0.52001,-2.5739,-1.5314,-2.1729,2.5385,0.11051,1.2988,0.040865,-1.8819,2.5003,2.3288,-0.1608,0.37775,-0.023312,2.9085,-0.036929,1.6416,-2.0546,-2.5297,-0.875,0.9025,-1.8161,0.94333,-1.4064,-0.97368,3.0087,1.621,1.1157,-2.1188,0.99672,-1.2427,-0.9413,-0.68275,2.6315,-1.7646,0.38338,2.4362,4.2164,0.40089,1.2682,0.7112,6.6467,-3.6251,3.378,1.2875,1.2895,1.8698,-0.31841,1.4889,-3.1073,-0.24315,-1.092,-0.30781,0.59306,-0.96914,0.19868,-0.089811,0.70388,-0.66346,0.3686,-2.2955,1.6758,-2.2923,-0.029467,0.01455,3.4905,2.129,0.59318,2.4456,-0.31414,2.7054,0.86683,2.407,-0.28495,1.7451,0.80075,0.30098,0.60878,1.1348,-0.99984,0.91584,1.6335,-1.0692,3.4726,-0.55204,2.5266,0.59733,-2.0851,-1.9037,-2.1293,-2.1822,0.89029,-0.11388,0.33812,1.008,-1.3879,-0.47167,1.195,-0.91429,0.25106,-0.75769,0.20126,0.014398,-2.7834,-1.6111,-0.7774,-2.503,-4.1863,-1.9774,1.2322,0.34337,1.3536,-1.1562,2.8644,-0.46018,-1.1924,2.4592,-2.4997,4.0565,1.8376,-0.53675,1.0315,-4.0721,-1.8389,0.55005,3.4307,-3.9789,-1.1871,-0.53211,1.1172,2.0336,-0.22482,0.6803,-3.7565,1.1132,1.2793,-0.22078,1.3404,-2.994,-2.8916,-2.317,1.211,-0.60215,2.2188,1.5764,2.2257,-0.80374,4.2017,-0.85806,-0.058575,0.16069,1.1253,-1.8047,-1.0705,-1.3396,1.2445,0.90311,0.19101,-2.0006,2.3227,-0.81608,0.55839,-2.7406,0.79603,-0.13176,-1.2491,-4.3797,-0.33274,2.344,-1.5467,2.5863,-1.8878,0.67795,0.44499,-2.2004,1.9368,4.9402,0.53738,-0.24282,-1.8767,0.051886,2.8548,-1.4288,-0.16662,3.5606,-1.7179,0.60132,-2.7645,-1.1551,-0.64273,1.4753,-3.9604,-2.1148,-4.0346,-0.97461,-0.28952,0.21912,1.5296,0.60485,-0.64384,-2.4283,-2.025,-1.1905,-1.5838,3.4075,-0.94756,2.2333,1.7924,-0.68678,2.1833,2.3015,-1.4344,-1.0784,2.7339,Perceptual,1,1
mother,1.4643,-1.3328,-4.519,-1.814,2.2399,1.2033,0.90458,5.163,-0.25482,4.4821,6.802,-0.24648,-3.0857,3.5672,3.4167,0.61645,-1.978,-2.8676,-2.2306,1.0382,-5.9201,-0.1304,2.6683,0.71046,0.33743,-5.6531,-1.5503,3.7883,0.27711,-5.1051,3.1329,0.56239,-1.16,0.92542,-2.9151,-2.7113,-0.63987,2.0122,-3.3556,-2.6268,-2.1942,-4.7417,0.96389,2.4219,5.2138,1.2845,-0.7825,2.0482,-1.7571,3.3425,-1.7641,3.4754,2.0818,-1.5787,-0.89939,-2.0108,-0.34208,-5.1683,3.9969,-1.608,-3.0466,-3.1419,-0.08504,2.0502,2.6915,0.65306,-0.75046,-4.805,4.797,1.3323,3.4012,0.91096,-0.64516,1.3469,-1.3509,2.0603,-6.7006,3.4606,0.081272,0.85685,-2.9857,-0.87417,0.82994,-0.76378,1.5849,-0.96828,-1.476,0.046581,-4.4146,-7.2689,2.0656,1.3671,1.9073,-3.9928,-3.267,2.134,1.374,2.5597,5.2804,0.64349,5.1885,1.5911,1.664,0.49418,-1.2484,2.0863,-0.72064,1.221,2.6734,-5.9388,2.0962,2.8054,0.63608,-0.2721,8.1392,3.4135,-1.8817,-2.7961,1.0427,-4.9728,-1.4273,-3.9646,-1.9971,-0.11384,-1.8679,-2.377,3.1556,0.055094,3.0325,1.4853,-3.2317,-1.04,2.3737,-1.898,-0.61924,0.37485,-1.4619,0.75559,5.305,-2.8045,-3.9333,1.4176,2.1894,2.7123,2.585,-2.2332,-6.8792,0.45227,4.978,0.40413,2.7745,1.5401,3.4021,4.3969,-2.4849,0.90064,2.3435,0.1574,-2.1943,-8.2654,-2.1654,-8.7999,-3.7229,1.7917,-3.0174,-4.412,-1.2453,2.1328,-1.415,1.4697,3.7426,-0.58897,0.079984,1.0556,4.5864,-3.1688,0.77339,-0.030732,-0.7443,-3.6211,2.9674,-2.7326,5.9004,0.28226,0.38392,2.0818,-1.5185,1.0594,2.7715,3.2249,1.7201,-1.583,-2.9139,-0.32307,2.736,-2.4643,-2.4658,3.8696,3.4452,0.7964,3.2573,-2.5084,-1.6517,-2.2814,-1.5952,-2.0107,0.81573,0.7263,-6.4151,-5.2575,-1.494,-2.033,1.6191,3.7027,0.10216,-0.4439,-1.6315,-1.645,-2.9812,1.6774,-0.64852,-2.5135,1.7424,6.2187,-1.5381,4.3916,-1.5479,-2.6406,2.6128,0.28993,-0.26954,-4.0006,-5.1241,-0.20829,0.86908,2.0919,-5.3781,4.0317,-1.0861,-2.8226,-3.1569,7.6989,4.9138,0.85393,3.8212,0.087089,-2.1578,3.7445,2.8334,2.6013,-0.85963,-2.0128,-3.5931,1.9111,-0.19832,-3.8453,0.5539,1.5081,-1.7597,0.40334,1.9251,2.0039,0.90338,-1.6602,-0.1875,-2.2625,1.9125,2.134,-4.886,3.1515,1.1943,-0.82898,-3.8514,-1.2394,-2.0052,1.9839,-0.66585,-5.6369,1.2406,2.5902,-0.99776,-0.79997,4.3022,2.803,5.517,-2.3531,-4.1298,3.9135,-4.8855,-1.7582,2.402,-1.582,-4.0844,-4.8611,-3.4569,-3.8682,1.6765,2.7701,-5.8157,1.2973,Perceptual,1,1


In [156]:
## Descartando a última coluna:
df_last = df.iloc[:,:-2]
df_last.head(1)

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,133,134,135,136,137,138,139,140,141,142,143,144,145,146,147,148,149,150,151,152,153,154,155,156,157,158,159,160,161,162,163,164,165,166,167,168,169,170,171,172,173,174,175,176,177,178,179,180,181,182,183,184,185,186,187,188,189,190,191,192,193,194,195,196,197,198,199,200,201,202,203,204,205,206,207,208,209,210,211,212,213,214,215,216,217,218,219,220,221,222,223,224,225,226,227,228,229,230,231,232,233,234,235,236,237,238,239,240,241,242,243,244,245,246,247,248,249,250,251,252,253,254,255,256,257,258,259,260,261,262,263,264,265,266,267,268,269,270,271,272,273,274,275,276,277,278,279,280,281,282,283,284,285,286,287,288,289,290,291,292,293,294,295,296,297,298,299,target
argument,-2.3992,-0.31061,0.16248,1.1939,4.553,2.608,2.3816,4.3793,-6.4059,-2.8989,6.9065,3.6357,-3.4818,-3.072,-1.5625,4.4574,2.4062,0.61288,-2.0203,1.854,-1.2827,-0.86692,-2.2344,-0.20293,-0.98764,-2.5703,-0.42565,-0.67371,-2.9512,2.5231,3.6174,2.046,0.93659,0.80884,-1.8359,-4.1538,-0.77178,-0.91474,0.3574,2.4311,-2.8427,-4.3941,0.18871,1.0475,-0.79925,-1.5843,3.4804,-2.8958,-1.4625,0.56112,-2.8675,2.7701,2.3915,-1.9063,-2.2535,-0.62433,3.1455,1.222,2.2854,0.36479,3.0918,1.6108,-1.6584,-1.6451,0.65175,2.8537,-3.2931,-4.5797,1.7337,3.352,1.7681,1.599,-5.0516,1.6644,-4.3692,1.1405,-3.9987,5.0947,-0.79874,-0.6081,-3.2158,-0.42495,1.4047,2.5423,0.58327,2.5293,-3.5585,-2.1892,4.4176,1.6439,3.4725,2.232,5.6429,-2.5572,3.2299,-2.3217,0.044789,3.1062,2.8293,-2.2333,3.6981,3.2175,4.477,3.1264,-0.69679,3.0372,3.2599,-4.1551,1.0466,-2.3053,0.066955,-0.96005,-0.48711,1.0598,1.9121,2.154,-4.6148,-0.60629,0.35795,-0.86739,-0.40956,-5.4357,0.59216,-1.7533,-3.3679,0.39749,3.545,-3.5528,0.71102,-4.57,-4.5825,-1.8462,3.9507,0.42573,0.61037,0.72052,0.78121,2.5482,0.79837,-1.8534,-1.4698,-0.71325,-0.21927,1.6808,1.2657,-0.95549,-4.6534,-0.4225,-0.65577,3.7836,0.58572,4.7582,-1.2812,1.6873,-1.4343,5.1048,1.8411,-0.33209,-2.8453,-4.3376,2.2446,0.060355,-0.28312,2.1109,-0.21476,-2.0898,-2.9909,1.6846,1.2215,-1.663,-0.2914,-0.15043,-0.089668,-1.3618,4.2523,1.0499,-0.83556,3.3452,-2.7199,-3.494,2.8196,3.0722,-0.12998,1.6373,-1.9782,2.9238,-2.1324,-1.1832,3.4495,2.6386,-2.6228,-3.0572,0.77354,1.6173,2.1261,-3.067,-0.84982,3.683,1.6198,6.2091,-2.4882,0.70562,0.36068,-0.85727,2.0703,-0.057408,-0.63836,0.62888,-0.26941,-1.8637,-2.4216,-1.4942,-2.671,4.4052,-0.89783,1.8478,1.4274,1.1662,4.0038,2.2062,-3.7706,-0.94775,0.081936,-0.052859,-1.1466,0.97386,1.6578,5.1659,1.9735,-0.10786,1.4671,-4.1792,1.5281,0.1311,1.1956,0.49311,2.8842,1.0306,2.3504,-2.6875,-1.0097,1.2478,1.2949,4.5648,0.51724,0.52477,-2.0162,2.0893,0.60699,1.5926,1.0539,-4.595,-3.701,-0.75894,-0.64485,-4.1829,-1.9371,-0.26863,0.26782,-0.63142,-2.1099,1.1534,1.6628,4.7483,0.86838,0.88791,4.31,4.3719,-3.0734,-1.1162,-0.31119,-1.4985,-1.2099,0.359,3.4704,-0.40592,0.012269,-1.6215,-1.3837,4.2299,1.4631,0.48673,1.7178,3.7604,4.8459,1.2913,4.031,-0.37738,-3.634,0.84509,3.235,-1.7311,1.3996,2.051,-4.2522,1.0911,3.7819,-0.92356,-1.8916,3.3504,Latent


In [75]:
df_scnd_last = df.iloc[:, :-2].join(df.iloc[:, -1])
df_scnd_last.head(1)

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,133,134,135,136,137,138,139,140,141,142,143,144,145,146,147,148,149,150,151,152,153,154,155,156,157,158,159,160,161,162,163,164,165,166,167,168,169,170,171,172,173,174,175,176,177,178,179,180,181,182,183,184,185,186,187,188,189,190,191,192,193,194,195,196,197,198,199,200,201,202,203,204,205,206,207,208,209,210,211,212,213,214,215,216,217,218,219,220,221,222,223,224,225,226,227,228,229,230,231,232,233,234,235,236,237,238,239,240,241,242,243,244,245,246,247,248,249,250,251,252,253,254,255,256,257,258,259,260,261,262,263,264,265,266,267,268,269,270,271,272,273,274,275,276,277,278,279,280,281,282,283,284,285,286,287,288,289,290,291,292,293,294,295,296,297,298,299,target,F_Objectivity
periodical,-1.6272,-0.78238,1.6661,0.64415,5.8025,-3.8606,2.1145,2.2464,0.11389,-0.57345,5.7366,2.6897,-2.9695,2.0592,1.1753,2.1266,4.7035,2.7336,-3.5872,1.1187,-0.33484,-1.4071,-4.7561,2.2302,-2.059,-0.14411,-1.9042,-3.213,-0.34878,1.1597,-1.3406,0.47455,0.76463,0.62292,-2.3959,-0.086495,1.1585,-0.68091,1.1494,1.3205,1.8991,-0.035937,-0.36217,2.4583,1.1064,2.3078,-0.64062,0.28873,-1.6005,-2.3947,-2.2164,3.735,-0.78451,-0.50572,-2.4039,1.9877,-2.2064,2.1254,2.0112,-3.4274,0.38636,-0.99008,-2.2497,1.6211,3.0944,0.64471,1.4321,-0.62388,0.8677,1.1196,-1.9251,-2.9001,-2.8303,-2.8833,-0.33352,3.1787,-1.475,1.1811,-1.86,0.12378,-1.6496,-0.14419,-0.56384,1.1399,2.2299,3.6695,-1.0809,-2.7011,2.3617,-2.0884,-0.71105,1.6108,3.7237,-1.2607,2.374,-1.998,1.72,1.4512,-0.39968,4.1796,2.6991,2.5275,2.0868,1.2196,-1.0239,3.438,3.123,-3.8607,1.4855,-4.1848,3.7903,0.88335,-2.853,-0.98828,1.9463,1.1769,-1.8306,2.754,-1.7812,-1.4768,0.84724,-4.4108,1.7444,1.4066,1.8559,-4.2074,-0.42883,-2.2853,2.6108,-2.4452,-1.5658,0.6037,2.0717,2.7407,0.50984,0.82838,-1.9149,-1.2288,0.70129,-3.165,-0.40373,-1.5314,-0.56426,1.6354,3.8474,-0.94437,-0.99321,-0.052637,0.75979,3.275,2.3954,0.05155,0.77701,1.3314,-1.7912,0.54084,-0.39345,-0.94512,-1.1933,-1.5246,-1.9794,1.4443,1.1399,3.4458,-2.8027,-1.2135,-6.3629,1.6438,-0.24045,0.16754,1.4184,0.92152,2.7786,0.41264,2.3382,3.1647,1.2647,1.1072,-3.2381,-1.2591,-0.83185,-1.6059,0.57993,-2.118,-0.54878,0.76078,-0.074174,0.30904,-0.28318,1.7597,-0.83301,-2.5778,-3.7242,0.58209,3.8249,1.4794,-2.242,-2.0715,0.82211,3.4849,-1.6172,-4.0141,-0.16727,-2.0282,7.0865,0.84765,-3.4945,1.2765,2.2956,0.47523,2.3143,-0.93912,0.030626,-1.4647,-0.42383,1.7943,-0.78176,-3.8079,0.45426,0.58407,-0.15175,2.4248,-3.8759,-0.19335,-3.5155,-1.3907,-1.2319,0.48635,1.6602,0.84975,4.6175,-0.81367,0.47439,1.6774,1.7393,4.3165,0.14046,1.4182,-1.8713,-1.4948,-1.0273,-1.264,2.5117,2.1463,-1.052,2.5754,-2.8909,2.0706,-0.56698,2.6587,2.5999,-4.9548,-2.0778,-0.67968,-0.62967,-2.5925,-1.5708,-2.252,-0.10327,1.2572,-2.7904,2.8963,3.1598,2.2888,3.2515,-0.4181,2.1012,2.7386,-0.1432,-0.35501,-1.7387,1.5427,1.7338,-2.4797,1.0412,1.8452,-0.01234,-1.6399,-1.29,-0.055819,3.7824,0.87042,3.8564,0.43643,0.13927,-2.9037,0.46992,0.76273,0.52487,-2.5186,2.5555,-1.1517,-1.5503,-2.034,-2.3307,-0.35606,0.2412,-5.179,-3.2397,-1.4073,0,0


### Pycaret Regression: 300 inputs and 1 numerical outputs

In [159]:
exp_regr = pycaret.regression.setup(df_last, target='target', session_id=123)

Unnamed: 0,Description,Value
0,Session id,123
1,Target,target
2,Target type,Regression
3,Original data shape,"(3511, 301)"
4,Transformed data shape,"(3511, 301)"
5,Transformed train set shape,"(2457, 301)"
6,Transformed test set shape,"(1054, 301)"
7,Numeric features,300
8,Preprocess,True
9,Imputation type,simple


In [160]:
exp_regr.compare_models()

[]

In [100]:
exp_regr.compare_models()

Unnamed: 0,Model,MAE,MSE,RMSE,R2,RMSLE,MAPE,TT (Sec)
lasso,Lasso Regression,0.1549,0.035,0.1869,-0.003,0.1311,0.5698,0.033
en,Elastic Net,0.1549,0.035,0.1869,-0.003,0.1311,0.5698,0.03
dummy,Dummy Regressor,0.1549,0.035,0.1869,-0.003,0.1311,0.5698,0.03
llar,Lasso Least Angle Regression,0.1549,0.035,0.1869,-0.003,0.1311,0.5698,0.028
br,Bayesian Ridge,0.1552,0.0351,0.1873,-0.0076,0.1314,0.5705,0.032
omp,Orthogonal Matching Pursuit,0.1552,0.0352,0.1875,-0.0094,0.1315,0.57,0.029
lr,Linear Regression,0.1562,0.0357,0.1887,-0.0228,0.1324,0.5732,0.031
lar,Least Angle Regression,0.156,0.0357,0.1887,-0.0233,0.1324,0.5724,0.029
ridge,Ridge Regression,0.1562,0.0357,0.1888,-0.0239,0.1325,0.5725,0.03
ada,AdaBoost Regressor,0.1579,0.036,0.1895,-0.0318,0.1339,0.6074,0.146


### Pycaret Classification

In [90]:
df

Unnamed: 0,0,1,2,3,4,5,6,7,8,9,...,291,292,293,294,295,296,297,298,299,target
periodical,-1.627200,-0.782380,1.666100,0.64415,5.802500,-3.86060,2.11450,2.246400,0.11389,-0.57345,...,-1.15170,-1.55030,-2.03400,-2.33070,-0.35606,0.241200,-5.179000,-3.23970,-1.40730,Contextual
intellect,-0.154690,1.676800,-0.351630,-0.57609,2.088700,2.61040,0.66495,2.229900,-4.99240,-1.65200,...,-1.79910,-1.50010,-3.83950,1.14140,0.38565,1.783600,-0.127660,-5.47600,5.23490,Latent
culture,-0.025891,-2.009300,0.494080,-0.33639,5.294000,-0.38846,3.17880,2.941100,-2.58270,-1.90800,...,-0.75585,-0.47891,-2.78880,-0.65771,-4.51980,1.242700,-1.250500,-7.25270,5.32900,Latent
emancipation,-3.593900,-0.710900,2.035000,2.18820,2.327500,0.66056,2.73950,0.424270,1.17990,-0.65433,...,-0.22063,-1.37600,2.01930,1.47420,-0.93661,0.339360,-4.583200,-1.69060,-0.82634,Contextual
chasm,2.750600,2.573200,1.016900,-2.14450,-1.060800,1.80230,3.07630,3.057700,-1.46700,1.42200,...,0.71314,3.44560,-1.67040,2.73970,1.79250,-1.171300,0.825910,1.09540,-0.33145,Latent
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
prawn,-1.104300,-2.707300,-0.040561,0.26686,-0.001637,-2.23060,-0.22431,0.000931,-3.39360,0.79063,...,-2.56200,1.02140,-2.52040,-1.98950,1.48670,1.859700,-0.720330,-1.17220,4.63340,Manifest
tweezers,-1.051400,2.791100,1.661000,2.09520,-0.197260,-1.18820,-2.49820,0.762750,-3.10200,0.28440,...,-0.44270,1.51110,0.88290,-2.94660,0.53499,0.968740,-0.909550,-0.77088,-1.42830,Manifest
university,-1.409000,0.093909,0.172970,-0.25512,2.648800,2.68320,3.31220,3.572100,-0.04109,0.20994,...,-1.17040,-1.25060,-0.83331,0.25252,0.19663,1.934500,-0.546330,0.59882,0.67005,Perceptual
wasteful,-1.105000,-0.335100,-1.827500,-3.49660,1.209300,1.20280,0.13930,-1.561000,-0.51685,-0.91023,...,-0.92690,2.68170,-0.71914,-1.27960,0.42766,-1.082500,0.035378,-3.72800,1.17320,Latent


In [161]:
## Fazendo um experimento:
exp_class = pycaret.classification.setup(df_last, target='target', session_id=9088)

Unnamed: 0,Description,Value
0,Session id,9088
1,Target,target
2,Target type,Multiclass
3,Target mapping,"Contextual: 0, Latent: 1, Manifest: 2, Perceptual: 3"
4,Original data shape,"(3511, 301)"
5,Transformed data shape,"(3511, 301)"
6,Transformed train set shape,"(2457, 301)"
7,Transformed test set shape,"(1054, 301)"
8,Numeric features,300
9,Preprocess,True


In [162]:
exp_class.compare_models()

Unnamed: 0,Model,Accuracy,AUC,Recall,Prec.,F1,Kappa,MCC,TT (Sec)
ridge,Ridge Classifier,0.6789,0.0,0.6789,0.6689,0.6675,0.5516,0.5552,0.03
lda,Linear Discriminant Analysis,0.6777,0.8846,0.6777,0.677,0.6758,0.5564,0.5573,0.052
lightgbm,Light Gradient Boosting Machine,0.6712,0.8857,0.6712,0.6594,0.6541,0.5381,0.5441,2.139
gbc,Gradient Boosting Classifier,0.659,0.883,0.659,0.6475,0.6451,0.5227,0.527,14.341
lr,Logistic Regression,0.6443,0.8568,0.6443,0.6458,0.644,0.5121,0.5128,0.555
svm,SVM - Linear Kernel,0.6325,0.0,0.6325,0.6294,0.6254,0.4924,0.4956,0.069
rf,Random Forest Classifier,0.6305,0.8571,0.6305,0.6097,0.581,0.4691,0.4888,0.419
et,Extra Trees Classifier,0.626,0.8647,0.626,0.6127,0.5636,0.4588,0.4857,0.1
knn,K Neighbors Classifier,0.6215,0.8314,0.6215,0.6134,0.6043,0.4684,0.4747,0.036
qda,Quadratic Discriminant Analysis,0.6125,0.7806,0.6125,0.5969,0.4932,0.4298,0.479,0.046
