In [1]:
!pip install gensim --user
!pip install textblob



In [2]:
import pandas as pd
import numpy as np
import re

#Timing
from tqdm import tqdm

#Word Embeddings
import nltk
from textblob import TextBlob
from gensim.models import Word2Vec
from nltk.tokenize import word_tokenize
from nltk.corpus import stopwords

#Models
from sklearn.svm import SVC
from sklearn.metrics import accuracy_score

nltk.download('punkt')
nltk.download('stopwords')

[nltk_data] Downloading package punkt to C:\Users\Cameron
[nltk_data]     Milne\AppData\Roaming\nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package stopwords to C:\Users\Cameron
[nltk_data]     Milne\AppData\Roaming\nltk_data...
[nltk_data]   Package stopwords is already up-to-date!


True

## EDA

In [3]:
scored_tweets = pd.read_csv('scored_tweets.csv')

In [4]:
scored_tweets.columns

Index(['created_at', 'text', 'username', 'screen_name', 'verified',
       'followers_count', 'TOXICITY', 'INSULT', 'PROFANITY', 'THREAT',
       'SEXUALLY_EXPLICIT'],
      dtype='object')

In [5]:
scored_tweets.corr()

Unnamed: 0,TOXICITY,INSULT,PROFANITY,THREAT,SEXUALLY_EXPLICIT
TOXICITY,1.0,0.945739,0.921274,0.572428,0.70061
INSULT,0.945739,1.0,0.827742,0.464412,0.542923
PROFANITY,0.921274,0.827742,1.0,0.442225,0.758937
THREAT,0.572428,0.464412,0.442225,1.0,0.425812
SEXUALLY_EXPLICIT,0.70061,0.542923,0.758937,0.425812,1.0


In [6]:
scored_tweets.head(3)

Unnamed: 0,created_at,text,username,screen_name,verified,followers_count,TOXICITY,INSULT,PROFANITY,THREAT,SEXUALLY_EXPLICIT
0,created_at,text,username,screen_name,verified,followers_count,0.042518,0.01574,0.037332,0.043029,0.040426
1,Thu Dec 02 15:39:21 +0000 2021,This needs to become a real thing. I wanna see...,GhostFedoraTWEET,GhostyRBLX,False,28,0.552407,0.666591,0.313011,0.431656,0.10075
2,Thu Dec 02 15:39:21 +0000 2021,@ENHYPEN_members love u more jake,aii.laa,jayenaii,False,85,0.084299,0.061555,0.109649,0.069504,0.119767


## New Preprocessing

In [7]:
scored_tweets.dropna(subset=['text'], inplace=True)

In [8]:
from nltk.tokenize import sent_tokenize, word_tokenize

#tokenizes every tweet
tokenizer = nltk.RegexpTokenizer(r"\w+")
scored_tweets['processed'] = scored_tweets['text'].apply(tokenizer.tokenize)
scored_tweets['processed']

0                                                  [text]
1       [This, needs, to, become, a, real, thing, I, w...
2                  [ENHYPEN_members, love, u, more, jake]
3       [ENHYPEN_members, i, hope, you, ll, get, a, go...
4       [Mal_DuBois, It, was, dragged, across, on, a, ...
                              ...                        
1957    [Nurseries, in, Glasgow, Come, along, to, a, t...
1958    [jimin, is, a, real, life, angel, https, t, co...
1959    [8Ball, Who, Want, it, 600, 00, If, You, WIN, ...
1960               [I, no, longer, have, time, to, waste]
1961    [BugCatNoms, Awwwwww, Puppet, Bugalo, Cat, Tha...
Name: processed, Length: 1962, dtype: object

In [9]:
from nltk.corpus import stopwords 

#Widely used stopword library
stop_words = set(stopwords.words('english'))

#gets rid of numbers
stop_words.update([str(x) for x in np.arange(10)])

#apply to tokens
scored_tweets['processed'] = scored_tweets.processed.apply(lambda x: [i for i in x if not i in stop_words])
scored_tweets['processed']

0                                                  [text]
1       [This, needs, become, real, thing, I, wanna, s...
2                        [ENHYPEN_members, love, u, jake]
3       [ENHYPEN_members, hope, get, good, rest, fight...
4               [Mal_DuBois, It, dragged, across, dinghy]
                              ...                        
1957    [Nurseries, Glasgow, Come, along, taster, sess...
1958    [jimin, real, life, angel, https, co, 1LsoCrsG1I]
1959    [8Ball, Who, Want, 600, 00, If, You, WIN, If, ...
1960                             [I, longer, time, waste]
1961    [BugCatNoms, Awwwwww, Puppet, Bugalo, Cat, Tha...
Name: processed, Length: 1962, dtype: object

In [10]:
scored_tweets['processed'] = [' '.join(l) for l in scored_tweets['processed']]
scored_tweets['processed']

0                                                    text
1       This needs become real thing I wanna see full ...
2                             ENHYPEN_members love u jake
3       ENHYPEN_members hope get good rest fighting to...
4                     Mal_DuBois It dragged across dinghy
                              ...                        
1957    Nurseries Glasgow Come along taster session fi...
1958            jimin real life angel https co 1LsoCrsG1I
1959    8Ball Who Want 600 00 If You WIN If I Win TRYI...
1960                                  I longer time waste
1961    BugCatNoms Awwwwww Puppet Bugalo Cat Thank u n...
Name: processed, Length: 1962, dtype: object

## Models

In [11]:
!pip install lightgbm
!pip install hyperopt



In [12]:
def split_data(df=scored_tweets, feature='processed', label='TOXICITY'):
    from sklearn.model_selection import train_test_split
    
    train_data, test_data = train_test_split(df, test_size=0.25, random_state=7)
    X_train, X_test = np.asarray(train_data['processed']), np.asarray(test_data['processed'])
    y_train, y_test = np.asarray(train_data[label]), np.asarray(test_data[label])
    
    return X_train, X_test, y_train, y_test

In [13]:
def TFIDF(X_train, X_test):
    from sklearn.feature_extraction.text import TfidfVectorizer

    vectorizer = TfidfVectorizer()
    train_tfidf = vectorizer.fit_transform(X_train)
    test_tfidf = vectorizer.transform(X_test)
    
    return train_tfidf, test_tfidf    

In [14]:
def LinearRegression(feature_category):
    from sklearn.linear_model import LinearRegression
    from sklearn.metrics import mean_absolute_error
    from sklearn.metrics import r2_score
    from sklearn.metrics import accuracy_score
    
    X_train, X_test, y_train, y_test = split_data(label=feature_category)
    train_tfidf, test_tfidf = TFIDF(X_train, X_test)

    model = LinearRegression().fit(train_tfidf, y_train)
    y_pred = model.predict(test_tfidf)
    
    mae = round(mean_absolute_error(y_pred, y_test), 4)
    r2 = round(r2_score(y_pred, y_test), 4)
    
    return (r2, mae, model)

In [15]:
def LightGBM(feature_category):
    import lightgbm as lgb
    from sklearn.metrics import mean_absolute_error
    from sklearn.metrics import r2_score
    
    X_train, X_test, y_train, y_test = split_data(label=feature_category)
    train_tfidf, test_tfidf = TFIDF(X_train, X_test)
    
    hyper_params = {
    'task': 'train',
    'boosting_type': 'gbdt',
    'objective': 'regression',
    'metric': ['l1','l2'],
    'learning_rate': 0.005,
    'feature_fraction': 0.9,
    'bagging_fraction': 0.7,
    'bagging_freq': 10,
    'verbose': 0,
    "max_depth": 8,
    "num_leaves": 128,  
    "max_bin": 512,
    "num_iterations": 100000
    }
    
    gbm = lgb.LGBMRegressor(**hyper_params)
    gbm.fit(train_tfidf, y_train, eval_set=[(test_tfidf, y_test)], eval_metric='l1', early_stopping_rounds=1000)
    y_pred = gbm.predict(test_tfidf, num_iteration=gbm.best_iteration_)
    
    mae = round(mean_absolute_error(y_pred, y_test), 4)
    r2 = round(r2_score(y_pred, y_test), 4)
    
    return (r2, mae, gbm)

In [16]:
def SVR(feature_category):
    from sklearn.svm import SVR
    from sklearn.metrics import mean_absolute_error
    from sklearn.metrics import r2_score
    
    X_train, X_test, y_train, y_test = split_data(label=feature_category)
    train_tfidf, test_tfidf = TFIDF(X_train, X_test)
    
    svr = SVR(kernel='linear').fit(train_tfidf, y_train)
    y_pred = svr.predict(test_tfidf)
    
    mae = round(mean_absolute_error(y_pred, y_test), 4)
    r2 = round(r2_score(y_pred, y_test), 4) 
    
    return (r2, mae, svr)

In [17]:
def ElasticNet(feature_category):
    from sklearn.linear_model import ElasticNet
    from sklearn.metrics import mean_absolute_error
    from sklearn.metrics import r2_score
    
    X_train, X_test, y_train, y_test = split_data(label=feature_category)
    train_tfidf, test_tfidf = TFIDF(X_train, X_test)
    
    model = ElasticNet(random_state=0).fit(train_tfidf, y_train)
    y_pred = model.predict(test_tfidf)
    
    mae = round(mean_absolute_error(y_pred, y_test), 4)
    r2 = round(r2_score(y_pred, y_test), 4) 
    
    return (r2, mae, model)

### Toxicity

In [18]:
category = 'TOXICITY'

lr_results = LinearRegression(category)
gbm_results = LightGBM(category)
svr_results = SVR(category)
en_results = ElasticNet(category)



You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	valid_0's l1: 0.15316	valid_0's l2: 0.0433886
[2]	valid_0's l1: 0.153127	valid_0's l2: 0.043372
[3]	valid_0's l1: 0.153094	valid_0's l2: 0.0433543
[4]	valid_0's l1: 0.153057	valid_0's l2: 0.0433353
[5]	valid_0's l1: 0.153022	valid_0's l2: 0.0433156
[6]	valid_0's l1: 0.152997	valid_0's l2: 0.0433011
[7]	valid_0's l1: 0.152961	valid_0's l2: 0.0432828
[8]	valid_0's l1: 0.152921	valid_0's l2: 0.0432641
[9]	valid_0's l1: 0.152885	valid_0's l2: 0.0432463
[10]	valid_0's l1: 0.152844	valid_0's l2: 0.0432278
[11]	valid_0's l1: 0.152808	valid_0's l2: 0.0432071
[12]	valid_0's l1: 0.15277	valid_0's l2: 0.0431848
[13]	valid_0's l1: 0.152732	valid_0's l2: 0.0431628
[14]	valid_0's l1: 0.152693	valid_0's l2: 0.0431415
[15]	valid_0's l1: 0.152659	valid_0's l2: 0.0431199
[16]	valid_0's l1: 0.152625	valid_0's l2: 0.0430986
[17]	valid_0's l1: 0.152588	valid_0's l2: 0.0430776
[18]	v

[56]	valid_0's l1: 0.15128	valid_0's l2: 0.0422617
[57]	valid_0's l1: 0.15122	valid_0's l2: 0.0422299
[58]	valid_0's l1: 0.151149	valid_0's l2: 0.0421945
[59]	valid_0's l1: 0.15108	valid_0's l2: 0.0421588
[60]	valid_0's l1: 0.151016	valid_0's l2: 0.042122
[61]	valid_0's l1: 0.150965	valid_0's l2: 0.0421012
[62]	valid_0's l1: 0.150917	valid_0's l2: 0.0420823
[63]	valid_0's l1: 0.150856	valid_0's l2: 0.0420547
[64]	valid_0's l1: 0.150796	valid_0's l2: 0.0420274
[65]	valid_0's l1: 0.150749	valid_0's l2: 0.0420091
[66]	valid_0's l1: 0.150704	valid_0's l2: 0.0419922
[67]	valid_0's l1: 0.150657	valid_0's l2: 0.0419742
[68]	valid_0's l1: 0.150615	valid_0's l2: 0.0419569
[69]	valid_0's l1: 0.150569	valid_0's l2: 0.0419392
[70]	valid_0's l1: 0.150531	valid_0's l2: 0.0419223
[71]	valid_0's l1: 0.15051	valid_0's l2: 0.0419097
[72]	valid_0's l1: 0.15049	valid_0's l2: 0.0418966
[73]	valid_0's l1: 0.150472	valid_0's l2: 0.0418836
[74]	valid_0's l1: 0.150451	valid_0's l2: 0.0418705
[75]	valid_0's l1:

[161]	valid_0's l1: 0.148512	valid_0's l2: 0.0407365
[162]	valid_0's l1: 0.148485	valid_0's l2: 0.0407185
[163]	valid_0's l1: 0.14846	valid_0's l2: 0.0407046
[164]	valid_0's l1: 0.148435	valid_0's l2: 0.0406909
[165]	valid_0's l1: 0.148421	valid_0's l2: 0.0406799
[166]	valid_0's l1: 0.148395	valid_0's l2: 0.0406621
[167]	valid_0's l1: 0.148368	valid_0's l2: 0.0406431
[168]	valid_0's l1: 0.148347	valid_0's l2: 0.0406303
[169]	valid_0's l1: 0.148326	valid_0's l2: 0.0406176
[170]	valid_0's l1: 0.14831	valid_0's l2: 0.040605
[171]	valid_0's l1: 0.148322	valid_0's l2: 0.0406005
[172]	valid_0's l1: 0.148335	valid_0's l2: 0.0405963
[173]	valid_0's l1: 0.148348	valid_0's l2: 0.0405938
[174]	valid_0's l1: 0.148358	valid_0's l2: 0.0405892
[175]	valid_0's l1: 0.148365	valid_0's l2: 0.0405853
[176]	valid_0's l1: 0.148383	valid_0's l2: 0.0405827
[177]	valid_0's l1: 0.148395	valid_0's l2: 0.0405792
[178]	valid_0's l1: 0.148414	valid_0's l2: 0.0405772
[179]	valid_0's l1: 0.148425	valid_0's l2: 0.0405

[273]	valid_0's l1: 0.147308	valid_0's l2: 0.0398025
[274]	valid_0's l1: 0.147301	valid_0's l2: 0.0397972
[275]	valid_0's l1: 0.147274	valid_0's l2: 0.0397887
[276]	valid_0's l1: 0.147256	valid_0's l2: 0.039785
[277]	valid_0's l1: 0.147243	valid_0's l2: 0.0397818
[278]	valid_0's l1: 0.147239	valid_0's l2: 0.0397742
[279]	valid_0's l1: 0.14723	valid_0's l2: 0.0397709
[280]	valid_0's l1: 0.147209	valid_0's l2: 0.0397648
[281]	valid_0's l1: 0.147184	valid_0's l2: 0.0397544
[282]	valid_0's l1: 0.147159	valid_0's l2: 0.0397441
[283]	valid_0's l1: 0.147134	valid_0's l2: 0.0397339
[284]	valid_0's l1: 0.147109	valid_0's l2: 0.0397239
[285]	valid_0's l1: 0.147085	valid_0's l2: 0.0397139
[286]	valid_0's l1: 0.14706	valid_0's l2: 0.0397041
[287]	valid_0's l1: 0.147036	valid_0's l2: 0.0396944
[288]	valid_0's l1: 0.14703	valid_0's l2: 0.0396878
[289]	valid_0's l1: 0.147006	valid_0's l2: 0.0396782
[290]	valid_0's l1: 0.146994	valid_0's l2: 0.0396705
[291]	valid_0's l1: 0.146958	valid_0's l2: 0.03966

[392]	valid_0's l1: 0.146251	valid_0's l2: 0.0394814
[393]	valid_0's l1: 0.146243	valid_0's l2: 0.0394815
[394]	valid_0's l1: 0.14622	valid_0's l2: 0.0394727
[395]	valid_0's l1: 0.1462	valid_0's l2: 0.03947
[396]	valid_0's l1: 0.146178	valid_0's l2: 0.0394634
[397]	valid_0's l1: 0.146154	valid_0's l2: 0.0394563
[398]	valid_0's l1: 0.146135	valid_0's l2: 0.0394538
[399]	valid_0's l1: 0.146113	valid_0's l2: 0.0394469
[400]	valid_0's l1: 0.146104	valid_0's l2: 0.0394484
[401]	valid_0's l1: 0.146099	valid_0's l2: 0.0394443
[402]	valid_0's l1: 0.146096	valid_0's l2: 0.039443
[403]	valid_0's l1: 0.1461	valid_0's l2: 0.0394423
[404]	valid_0's l1: 0.146092	valid_0's l2: 0.0394397
[405]	valid_0's l1: 0.146081	valid_0's l2: 0.0394342
[406]	valid_0's l1: 0.146086	valid_0's l2: 0.0394337
[407]	valid_0's l1: 0.146082	valid_0's l2: 0.0394322
[408]	valid_0's l1: 0.146077	valid_0's l2: 0.0394285
[409]	valid_0's l1: 0.146071	valid_0's l2: 0.039427
[410]	valid_0's l1: 0.14607	valid_0's l2: 0.0394247
[41

[520]	valid_0's l1: 0.145754	valid_0's l2: 0.0393234
[521]	valid_0's l1: 0.145758	valid_0's l2: 0.0393215
[522]	valid_0's l1: 0.14576	valid_0's l2: 0.0393188
[523]	valid_0's l1: 0.145764	valid_0's l2: 0.039317
[524]	valid_0's l1: 0.145767	valid_0's l2: 0.0393153
[525]	valid_0's l1: 0.145768	valid_0's l2: 0.039314
[526]	valid_0's l1: 0.145769	valid_0's l2: 0.0393127
[527]	valid_0's l1: 0.145772	valid_0's l2: 0.0393111
[528]	valid_0's l1: 0.145768	valid_0's l2: 0.0393072
[529]	valid_0's l1: 0.145764	valid_0's l2: 0.0393033
[530]	valid_0's l1: 0.14576	valid_0's l2: 0.0393011
[531]	valid_0's l1: 0.145748	valid_0's l2: 0.0392937
[532]	valid_0's l1: 0.145743	valid_0's l2: 0.0392864
[533]	valid_0's l1: 0.145731	valid_0's l2: 0.0392791
[534]	valid_0's l1: 0.145727	valid_0's l2: 0.0392735
[535]	valid_0's l1: 0.145715	valid_0's l2: 0.0392664
[536]	valid_0's l1: 0.145698	valid_0's l2: 0.0392584
[537]	valid_0's l1: 0.145683	valid_0's l2: 0.039251
[538]	valid_0's l1: 0.145675	valid_0's l2: 0.039245

[648]	valid_0's l1: 0.145751	valid_0's l2: 0.0393144
[649]	valid_0's l1: 0.145747	valid_0's l2: 0.0393155
[650]	valid_0's l1: 0.145743	valid_0's l2: 0.0393167
[651]	valid_0's l1: 0.145745	valid_0's l2: 0.0393187
[652]	valid_0's l1: 0.145746	valid_0's l2: 0.0393209
[653]	valid_0's l1: 0.14574	valid_0's l2: 0.0393199
[654]	valid_0's l1: 0.145743	valid_0's l2: 0.039323
[655]	valid_0's l1: 0.145744	valid_0's l2: 0.0393251
[656]	valid_0's l1: 0.145745	valid_0's l2: 0.0393272
[657]	valid_0's l1: 0.145748	valid_0's l2: 0.0393294
[658]	valid_0's l1: 0.145752	valid_0's l2: 0.0393316
[659]	valid_0's l1: 0.145755	valid_0's l2: 0.0393338
[660]	valid_0's l1: 0.145755	valid_0's l2: 0.0393349
[661]	valid_0's l1: 0.14577	valid_0's l2: 0.0393384
[662]	valid_0's l1: 0.145774	valid_0's l2: 0.0393396
[663]	valid_0's l1: 0.145781	valid_0's l2: 0.03934
[664]	valid_0's l1: 0.145777	valid_0's l2: 0.0393387
[665]	valid_0's l1: 0.145784	valid_0's l2: 0.0393411
[666]	valid_0's l1: 0.145789	valid_0's l2: 0.039344

[775]	valid_0's l1: 0.145552	valid_0's l2: 0.0391755
[776]	valid_0's l1: 0.145564	valid_0's l2: 0.0391771
[777]	valid_0's l1: 0.145571	valid_0's l2: 0.0391779
[778]	valid_0's l1: 0.145578	valid_0's l2: 0.0391787
[779]	valid_0's l1: 0.14559	valid_0's l2: 0.0391806
[780]	valid_0's l1: 0.145601	valid_0's l2: 0.0391817
[781]	valid_0's l1: 0.145601	valid_0's l2: 0.0391832
[782]	valid_0's l1: 0.145606	valid_0's l2: 0.0391879
[783]	valid_0's l1: 0.145599	valid_0's l2: 0.0391867
[784]	valid_0's l1: 0.145591	valid_0's l2: 0.0391856
[785]	valid_0's l1: 0.145587	valid_0's l2: 0.0391892
[786]	valid_0's l1: 0.145591	valid_0's l2: 0.0391938
[787]	valid_0's l1: 0.145587	valid_0's l2: 0.0391963
[788]	valid_0's l1: 0.145586	valid_0's l2: 0.0391976
[789]	valid_0's l1: 0.145589	valid_0's l2: 0.0392023
[790]	valid_0's l1: 0.145595	valid_0's l2: 0.0392065
[791]	valid_0's l1: 0.145619	valid_0's l2: 0.0392127
[792]	valid_0's l1: 0.145632	valid_0's l2: 0.0392188
[793]	valid_0's l1: 0.145645	valid_0's l2: 0.03

[839]	valid_0's l1: 0.145635	valid_0's l2: 0.039243
[840]	valid_0's l1: 0.145626	valid_0's l2: 0.039244
[841]	valid_0's l1: 0.145618	valid_0's l2: 0.0392407
[842]	valid_0's l1: 0.145616	valid_0's l2: 0.0392373
[843]	valid_0's l1: 0.145606	valid_0's l2: 0.039236
[844]	valid_0's l1: 0.145597	valid_0's l2: 0.0392347
[845]	valid_0's l1: 0.145603	valid_0's l2: 0.0392339
[846]	valid_0's l1: 0.145595	valid_0's l2: 0.0392308
[847]	valid_0's l1: 0.145588	valid_0's l2: 0.0392278
[848]	valid_0's l1: 0.145581	valid_0's l2: 0.0392249
[849]	valid_0's l1: 0.14557	valid_0's l2: 0.0392216
[850]	valid_0's l1: 0.145565	valid_0's l2: 0.0392209
[851]	valid_0's l1: 0.145557	valid_0's l2: 0.0392212
[852]	valid_0's l1: 0.145552	valid_0's l2: 0.039222
[853]	valid_0's l1: 0.145547	valid_0's l2: 0.0392228
[854]	valid_0's l1: 0.145541	valid_0's l2: 0.0392236
[855]	valid_0's l1: 0.145533	valid_0's l2: 0.0392239
[856]	valid_0's l1: 0.145528	valid_0's l2: 0.0392248
[857]	valid_0's l1: 0.145523	valid_0's l2: 0.039225

[906]	valid_0's l1: 0.145424	valid_0's l2: 0.0392742
[907]	valid_0's l1: 0.145424	valid_0's l2: 0.0392745
[908]	valid_0's l1: 0.145423	valid_0's l2: 0.039275
[909]	valid_0's l1: 0.145425	valid_0's l2: 0.0392742
[910]	valid_0's l1: 0.145428	valid_0's l2: 0.0392764
[911]	valid_0's l1: 0.145421	valid_0's l2: 0.0392707
[912]	valid_0's l1: 0.145423	valid_0's l2: 0.039266
[913]	valid_0's l1: 0.145416	valid_0's l2: 0.0392618
[914]	valid_0's l1: 0.145422	valid_0's l2: 0.0392617
[915]	valid_0's l1: 0.145419	valid_0's l2: 0.0392553
[916]	valid_0's l1: 0.145413	valid_0's l2: 0.0392535
[917]	valid_0's l1: 0.14541	valid_0's l2: 0.0392471
[918]	valid_0's l1: 0.145415	valid_0's l2: 0.0392426
[919]	valid_0's l1: 0.145421	valid_0's l2: 0.0392389
[920]	valid_0's l1: 0.145424	valid_0's l2: 0.0392344
[921]	valid_0's l1: 0.145407	valid_0's l2: 0.0392305
[922]	valid_0's l1: 0.145396	valid_0's l2: 0.0392296
[923]	valid_0's l1: 0.145385	valid_0's l2: 0.0392284
[924]	valid_0's l1: 0.145363	valid_0's l2: 0.0392

[971]	valid_0's l1: 0.145378	valid_0's l2: 0.0391941
[972]	valid_0's l1: 0.145381	valid_0's l2: 0.0391934
[973]	valid_0's l1: 0.145376	valid_0's l2: 0.0391933
[974]	valid_0's l1: 0.145372	valid_0's l2: 0.039193
[975]	valid_0's l1: 0.145372	valid_0's l2: 0.0391943
[976]	valid_0's l1: 0.145367	valid_0's l2: 0.0391944
[977]	valid_0's l1: 0.145359	valid_0's l2: 0.0391933
[978]	valid_0's l1: 0.14536	valid_0's l2: 0.0391939
[979]	valid_0's l1: 0.145355	valid_0's l2: 0.0391941
[980]	valid_0's l1: 0.145358	valid_0's l2: 0.0391965
[981]	valid_0's l1: 0.145378	valid_0's l2: 0.0391957
[982]	valid_0's l1: 0.145393	valid_0's l2: 0.0391943
[983]	valid_0's l1: 0.145408	valid_0's l2: 0.0391952
[984]	valid_0's l1: 0.145422	valid_0's l2: 0.0391932
[985]	valid_0's l1: 0.145437	valid_0's l2: 0.0391921
[986]	valid_0's l1: 0.145454	valid_0's l2: 0.0391909
[987]	valid_0's l1: 0.145471	valid_0's l2: 0.0391897
[988]	valid_0's l1: 0.145488	valid_0's l2: 0.0391888
[989]	valid_0's l1: 0.145503	valid_0's l2: 0.039

[1037]	valid_0's l1: 0.145893	valid_0's l2: 0.0392952
[1038]	valid_0's l1: 0.145895	valid_0's l2: 0.0392959
[1039]	valid_0's l1: 0.1459	valid_0's l2: 0.0392972
[1040]	valid_0's l1: 0.145899	valid_0's l2: 0.0392991
[1041]	valid_0's l1: 0.145902	valid_0's l2: 0.039304
[1042]	valid_0's l1: 0.145892	valid_0's l2: 0.039303
[1043]	valid_0's l1: 0.145897	valid_0's l2: 0.0393084
[1044]	valid_0's l1: 0.145903	valid_0's l2: 0.0393138
[1045]	valid_0's l1: 0.145909	valid_0's l2: 0.0393192
[1046]	valid_0's l1: 0.145915	valid_0's l2: 0.0393246
[1047]	valid_0's l1: 0.145919	valid_0's l2: 0.0393285
[1048]	valid_0's l1: 0.14592	valid_0's l2: 0.0393319
[1049]	valid_0's l1: 0.145926	valid_0's l2: 0.0393374
[1050]	valid_0's l1: 0.145933	valid_0's l2: 0.0393429
[1051]	valid_0's l1: 0.145922	valid_0's l2: 0.0393407
[1052]	valid_0's l1: 0.145911	valid_0's l2: 0.0393378
[1053]	valid_0's l1: 0.145895	valid_0's l2: 0.0393364
[1054]	valid_0's l1: 0.14589	valid_0's l2: 0.0393323
[1055]	valid_0's l1: 0.145879	vali

[1103]	valid_0's l1: 0.146028	valid_0's l2: 0.0394338
[1104]	valid_0's l1: 0.146031	valid_0's l2: 0.0394363
[1105]	valid_0's l1: 0.146024	valid_0's l2: 0.039437
[1106]	valid_0's l1: 0.146017	valid_0's l2: 0.0394377
[1107]	valid_0's l1: 0.146011	valid_0's l2: 0.0394384
[1108]	valid_0's l1: 0.146013	valid_0's l2: 0.0394394
[1109]	valid_0's l1: 0.146004	valid_0's l2: 0.0394392
[1110]	valid_0's l1: 0.145998	valid_0's l2: 0.03944
[1111]	valid_0's l1: 0.146015	valid_0's l2: 0.0394453
[1112]	valid_0's l1: 0.146038	valid_0's l2: 0.03945
[1113]	valid_0's l1: 0.146056	valid_0's l2: 0.0394526
[1114]	valid_0's l1: 0.146075	valid_0's l2: 0.0394583
[1115]	valid_0's l1: 0.146096	valid_0's l2: 0.0394637
[1116]	valid_0's l1: 0.146115	valid_0's l2: 0.0394694
[1117]	valid_0's l1: 0.146134	valid_0's l2: 0.0394752
[1118]	valid_0's l1: 0.146155	valid_0's l2: 0.0394811
[1119]	valid_0's l1: 0.146169	valid_0's l2: 0.0394844
[1120]	valid_0's l1: 0.146178	valid_0's l2: 0.0394852
[1121]	valid_0's l1: 0.146176	val

[1231]	valid_0's l1: 0.145795	valid_0's l2: 0.0395241
[1232]	valid_0's l1: 0.145766	valid_0's l2: 0.0395187
[1233]	valid_0's l1: 0.145739	valid_0's l2: 0.0395123
[1234]	valid_0's l1: 0.14571	valid_0's l2: 0.0395073
[1235]	valid_0's l1: 0.145681	valid_0's l2: 0.039502
[1236]	valid_0's l1: 0.145652	valid_0's l2: 0.0394957
[1237]	valid_0's l1: 0.145622	valid_0's l2: 0.0394894
[1238]	valid_0's l1: 0.145592	valid_0's l2: 0.0394832
[1239]	valid_0's l1: 0.145563	valid_0's l2: 0.0394771
[1240]	valid_0's l1: 0.145546	valid_0's l2: 0.0394742
[1241]	valid_0's l1: 0.145534	valid_0's l2: 0.0394757
[1242]	valid_0's l1: 0.145522	valid_0's l2: 0.0394772
[1243]	valid_0's l1: 0.145506	valid_0's l2: 0.0394761
[1244]	valid_0's l1: 0.145496	valid_0's l2: 0.0394775
[1245]	valid_0's l1: 0.145488	valid_0's l2: 0.0394807
[1246]	valid_0's l1: 0.145482	valid_0's l2: 0.0394839
[1247]	valid_0's l1: 0.145471	valid_0's l2: 0.0394841
[1248]	valid_0's l1: 0.145465	valid_0's l2: 0.0394874
[1249]	valid_0's l1: 0.145452	

[1295]	valid_0's l1: 0.145451	valid_0's l2: 0.039538
[1296]	valid_0's l1: 0.145453	valid_0's l2: 0.0395421
[1297]	valid_0's l1: 0.145456	valid_0's l2: 0.0395463
[1298]	valid_0's l1: 0.145454	valid_0's l2: 0.0395469
[1299]	valid_0's l1: 0.145456	valid_0's l2: 0.0395511
[1300]	valid_0's l1: 0.145459	valid_0's l2: 0.0395554
[1301]	valid_0's l1: 0.145444	valid_0's l2: 0.0395508
[1302]	valid_0's l1: 0.145429	valid_0's l2: 0.0395463
[1303]	valid_0's l1: 0.145414	valid_0's l2: 0.0395419
[1304]	valid_0's l1: 0.14541	valid_0's l2: 0.0395434
[1305]	valid_0's l1: 0.145398	valid_0's l2: 0.0395395
[1306]	valid_0's l1: 0.145376	valid_0's l2: 0.0395347
[1307]	valid_0's l1: 0.145366	valid_0's l2: 0.0395324
[1308]	valid_0's l1: 0.145349	valid_0's l2: 0.0395284
[1309]	valid_0's l1: 0.145345	valid_0's l2: 0.039531
[1310]	valid_0's l1: 0.145333	valid_0's l2: 0.0395273
[1311]	valid_0's l1: 0.145345	valid_0's l2: 0.0395287
[1312]	valid_0's l1: 0.145358	valid_0's l2: 0.0395301
[1313]	valid_0's l1: 0.145373	v

[1364]	valid_0's l1: 0.145612	valid_0's l2: 0.0396396
[1365]	valid_0's l1: 0.145631	valid_0's l2: 0.0396454
[1366]	valid_0's l1: 0.145636	valid_0's l2: 0.0396497
[1367]	valid_0's l1: 0.145649	valid_0's l2: 0.0396544
[1368]	valid_0's l1: 0.145663	valid_0's l2: 0.0396592
[1369]	valid_0's l1: 0.145679	valid_0's l2: 0.0396637
[1370]	valid_0's l1: 0.14569	valid_0's l2: 0.0396677
[1371]	valid_0's l1: 0.145697	valid_0's l2: 0.0396664
[1372]	valid_0's l1: 0.145713	valid_0's l2: 0.0396666
[1373]	valid_0's l1: 0.145719	valid_0's l2: 0.0396647
[1374]	valid_0's l1: 0.145734	valid_0's l2: 0.0396672
[1375]	valid_0's l1: 0.145745	valid_0's l2: 0.0396667
[1376]	valid_0's l1: 0.145765	valid_0's l2: 0.0396691
[1377]	valid_0's l1: 0.145777	valid_0's l2: 0.0396688
[1378]	valid_0's l1: 0.145793	valid_0's l2: 0.0396718
[1379]	valid_0's l1: 0.145804	valid_0's l2: 0.039674
[1380]	valid_0's l1: 0.145817	valid_0's l2: 0.0396753
[1381]	valid_0's l1: 0.145807	valid_0's l2: 0.039671
[1382]	valid_0's l1: 0.145794	v

[1484]	valid_0's l1: 0.145952	valid_0's l2: 0.0396993
[1485]	valid_0's l1: 0.145947	valid_0's l2: 0.0396984
[1486]	valid_0's l1: 0.145942	valid_0's l2: 0.0396975
[1487]	valid_0's l1: 0.145935	valid_0's l2: 0.0396958
[1488]	valid_0's l1: 0.14593	valid_0's l2: 0.039695
[1489]	valid_0's l1: 0.145923	valid_0's l2: 0.0396933
[1490]	valid_0's l1: 0.145922	valid_0's l2: 0.0396926
[1491]	valid_0's l1: 0.145922	valid_0's l2: 0.0396923
[1492]	valid_0's l1: 0.145926	valid_0's l2: 0.0396924
[1493]	valid_0's l1: 0.145926	valid_0's l2: 0.0396911
[1494]	valid_0's l1: 0.14593	valid_0's l2: 0.0396918
[1495]	valid_0's l1: 0.14593	valid_0's l2: 0.0396906
[1496]	valid_0's l1: 0.145935	valid_0's l2: 0.0396917
[1497]	valid_0's l1: 0.145932	valid_0's l2: 0.0396893
[1498]	valid_0's l1: 0.14593	valid_0's l2: 0.0396899
[1499]	valid_0's l1: 0.14594	valid_0's l2: 0.0396939
[1500]	valid_0's l1: 0.145939	valid_0's l2: 0.0396932
[1501]	valid_0's l1: 0.145937	valid_0's l2: 0.0396895
[1502]	valid_0's l1: 0.145929	vali

[1614]	valid_0's l1: 0.145911	valid_0's l2: 0.0396631
[1615]	valid_0's l1: 0.145919	valid_0's l2: 0.0396673
[1616]	valid_0's l1: 0.145927	valid_0's l2: 0.0396715
[1617]	valid_0's l1: 0.145926	valid_0's l2: 0.0396693
[1618]	valid_0's l1: 0.145934	valid_0's l2: 0.0396735
[1619]	valid_0's l1: 0.145943	valid_0's l2: 0.0396771
[1620]	valid_0's l1: 0.14595	valid_0's l2: 0.0396811
[1621]	valid_0's l1: 0.145942	valid_0's l2: 0.0396765
[1622]	valid_0's l1: 0.145933	valid_0's l2: 0.0396718
[1623]	valid_0's l1: 0.145929	valid_0's l2: 0.0396691
[1624]	valid_0's l1: 0.145912	valid_0's l2: 0.0396628
[1625]	valid_0's l1: 0.145899	valid_0's l2: 0.0396566
[1626]	valid_0's l1: 0.145895	valid_0's l2: 0.039654
[1627]	valid_0's l1: 0.14588	valid_0's l2: 0.0396478
[1628]	valid_0's l1: 0.145873	valid_0's l2: 0.0396442
[1629]	valid_0's l1: 0.14586	valid_0's l2: 0.0396382
[1630]	valid_0's l1: 0.145845	valid_0's l2: 0.0396322
[1631]	valid_0's l1: 0.145851	valid_0's l2: 0.0396294
[1632]	valid_0's l1: 0.145856	va

[1735]	valid_0's l1: 0.146013	valid_0's l2: 0.0397718
[1736]	valid_0's l1: 0.146011	valid_0's l2: 0.0397696
[1737]	valid_0's l1: 0.146012	valid_0's l2: 0.0397695
[1738]	valid_0's l1: 0.14602	valid_0's l2: 0.0397707
[1739]	valid_0's l1: 0.14602	valid_0's l2: 0.0397706
[1740]	valid_0's l1: 0.14602	valid_0's l2: 0.0397704
[1741]	valid_0's l1: 0.146016	valid_0's l2: 0.0397666
[1742]	valid_0's l1: 0.14601	valid_0's l2: 0.0397609
[1743]	valid_0's l1: 0.146005	valid_0's l2: 0.0397553
[1744]	valid_0's l1: 0.146006	valid_0's l2: 0.0397548
[1745]	valid_0's l1: 0.146001	valid_0's l2: 0.0397492
[1746]	valid_0's l1: 0.146009	valid_0's l2: 0.0397524
[1747]	valid_0's l1: 0.146008	valid_0's l2: 0.0397504
[1748]	valid_0's l1: 0.146003	valid_0's l2: 0.039745
[1749]	valid_0's l1: 0.146002	valid_0's l2: 0.0397431
[1750]	valid_0's l1: 0.146002	valid_0's l2: 0.0397419


In [19]:
print("Toxicity Results")
print("================")
print("[r2_score, mean_absolute_error, model]")
print("================")
for model in [lr_results, gbm_results, svr_results, en_results]:
    print(model)

Toxicity Results
[r2_score, mean_absolute_error, model]
(-0.4175, 0.1149, LinearRegression())
(-11.9107, 0.1451, LGBMRegressor(bagging_fraction=0.7, bagging_freq=10, feature_fraction=0.9,
              learning_rate=0.005, max_bin=512, max_depth=8,
              metric=['l1', 'l2'], num_iterations=100000, num_leaves=128,
              objective='regression', task='train', verbose=0))
(-1.597, 0.1341, SVR(kernel='linear'))
(-1.408699114373207e+31, 0.1532, ElasticNet(random_state=0))


### Profanity

In [20]:
category = 'PROFANITY'

lr_results = LinearRegression(category)
gbm_results = LightGBM(category)
svr_results = SVR(category)
en_results = ElasticNet(category)



You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[1]	valid_0's l1: 0.131234	valid_0's l2: 0.0398203
[2]	valid_0's l1: 0.131209	valid_0's l2: 0.0398067
[3]	valid_0's l1: 0.131179	valid_0's l2: 0.0397944
[4]	valid_0's l1: 0.131155	valid_0's l2: 0.0397848
[5]	valid_0's l1: 0.131125	valid_0's l2: 0.0397722
[6]	valid_0's l1: 0.1311	valid_0's l2: 0.0397625
[7]	valid_0's l1: 0.131073	valid_0's l2: 0.0397525
[8]	valid_0's l1: 0.131045	valid_0's l2: 0.0397426
[9]	valid_0's l1: 0.131035	valid_0's l2: 0.0397336
[10]	valid_0's l1: 0.131009	valid_0's l2: 0.0397198
[11]	valid_0's l1: 0.131007	valid_0's l2: 0.039706
[12]	valid_0's l1: 0.131005	valid_0's l2: 0.0396913
[13]	valid_0's l1: 0.131002	valid_0's l2: 0.0396766
[14]	valid_0's l1: 0.130988	valid_0's l2: 0.0396618
[15]	valid_0's l1: 0.130986	valid_0's l2: 0.0396476
[16]	valid_0's l1: 0.130984	valid_0's l2: 0.0396337
[17]	valid_0's l1: 0.130981	valid_0's l2: 0.0396199
[18]	v

[86]	valid_0's l1: 0.12951	valid_0's l2: 0.0387032
[87]	valid_0's l1: 0.129492	valid_0's l2: 0.0386895
[88]	valid_0's l1: 0.129463	valid_0's l2: 0.0386763
[89]	valid_0's l1: 0.129439	valid_0's l2: 0.0386634
[90]	valid_0's l1: 0.129415	valid_0's l2: 0.0386506
[91]	valid_0's l1: 0.129384	valid_0's l2: 0.0386374
[92]	valid_0's l1: 0.129354	valid_0's l2: 0.0386236
[93]	valid_0's l1: 0.129339	valid_0's l2: 0.0386151
[94]	valid_0's l1: 0.129308	valid_0's l2: 0.0385999
[95]	valid_0's l1: 0.129293	valid_0's l2: 0.0385915
[96]	valid_0's l1: 0.129263	valid_0's l2: 0.038578
[97]	valid_0's l1: 0.129234	valid_0's l2: 0.0385647
[98]	valid_0's l1: 0.129218	valid_0's l2: 0.0385565
[99]	valid_0's l1: 0.129189	valid_0's l2: 0.0385433
[100]	valid_0's l1: 0.129158	valid_0's l2: 0.0385302
[101]	valid_0's l1: 0.129149	valid_0's l2: 0.0385193
[102]	valid_0's l1: 0.129123	valid_0's l2: 0.0385083
[103]	valid_0's l1: 0.129091	valid_0's l2: 0.0384942
[104]	valid_0's l1: 0.129064	valid_0's l2: 0.0384803
[105]	val

[190]	valid_0's l1: 0.128322	valid_0's l2: 0.037822
[191]	valid_0's l1: 0.128324	valid_0's l2: 0.0378147
[192]	valid_0's l1: 0.128325	valid_0's l2: 0.0378098
[193]	valid_0's l1: 0.128325	valid_0's l2: 0.0378029
[194]	valid_0's l1: 0.128329	valid_0's l2: 0.0377965
[195]	valid_0's l1: 0.128317	valid_0's l2: 0.0377897
[196]	valid_0's l1: 0.128321	valid_0's l2: 0.0377835
[197]	valid_0's l1: 0.128334	valid_0's l2: 0.0377834
[198]	valid_0's l1: 0.128338	valid_0's l2: 0.0377774
[199]	valid_0's l1: 0.128342	valid_0's l2: 0.0377714
[200]	valid_0's l1: 0.128346	valid_0's l2: 0.0377656
[201]	valid_0's l1: 0.128365	valid_0's l2: 0.0377671
[202]	valid_0's l1: 0.128368	valid_0's l2: 0.0377626
[203]	valid_0's l1: 0.128373	valid_0's l2: 0.0377581
[204]	valid_0's l1: 0.128384	valid_0's l2: 0.0377557
[205]	valid_0's l1: 0.128389	valid_0's l2: 0.0377514
[206]	valid_0's l1: 0.128393	valid_0's l2: 0.0377473
[207]	valid_0's l1: 0.1284	valid_0's l2: 0.0377407
[208]	valid_0's l1: 0.128404	valid_0's l2: 0.0377

[277]	valid_0's l1: 0.12839	valid_0's l2: 0.0375456
[278]	valid_0's l1: 0.128399	valid_0's l2: 0.0375452
[279]	valid_0's l1: 0.128382	valid_0's l2: 0.0375417
[280]	valid_0's l1: 0.128364	valid_0's l2: 0.0375383
[281]	valid_0's l1: 0.128355	valid_0's l2: 0.0375346
[282]	valid_0's l1: 0.128355	valid_0's l2: 0.0375322
[283]	valid_0's l1: 0.128343	valid_0's l2: 0.0375264
[284]	valid_0's l1: 0.128343	valid_0's l2: 0.0375241
[285]	valid_0's l1: 0.128343	valid_0's l2: 0.0375219
[286]	valid_0's l1: 0.12833	valid_0's l2: 0.0375164
[287]	valid_0's l1: 0.12833	valid_0's l2: 0.0375143
[288]	valid_0's l1: 0.128331	valid_0's l2: 0.0375101
[289]	valid_0's l1: 0.12832	valid_0's l2: 0.0375057
[290]	valid_0's l1: 0.128318	valid_0's l2: 0.0375025
[291]	valid_0's l1: 0.128291	valid_0's l2: 0.037498
[292]	valid_0's l1: 0.128271	valid_0's l2: 0.0374935
[293]	valid_0's l1: 0.128243	valid_0's l2: 0.0374868
[294]	valid_0's l1: 0.128214	valid_0's l2: 0.0374797
[295]	valid_0's l1: 0.128185	valid_0's l2: 0.037472

[366]	valid_0's l1: 0.127956	valid_0's l2: 0.0374786
[367]	valid_0's l1: 0.127954	valid_0's l2: 0.0374757
[368]	valid_0's l1: 0.127953	valid_0's l2: 0.0374729
[369]	valid_0's l1: 0.127952	valid_0's l2: 0.0374703
[370]	valid_0's l1: 0.127951	valid_0's l2: 0.0374687
[371]	valid_0's l1: 0.127948	valid_0's l2: 0.0374692
[372]	valid_0's l1: 0.127945	valid_0's l2: 0.0374719
[373]	valid_0's l1: 0.127938	valid_0's l2: 0.0374701
[374]	valid_0's l1: 0.127931	valid_0's l2: 0.0374686
[375]	valid_0's l1: 0.127924	valid_0's l2: 0.03747
[376]	valid_0's l1: 0.127916	valid_0's l2: 0.0374695
[377]	valid_0's l1: 0.127911	valid_0's l2: 0.0374719
[378]	valid_0's l1: 0.127898	valid_0's l2: 0.0374716
[379]	valid_0's l1: 0.127899	valid_0's l2: 0.0374749
[380]	valid_0's l1: 0.127892	valid_0's l2: 0.0374765
[381]	valid_0's l1: 0.127895	valid_0's l2: 0.037477
[382]	valid_0's l1: 0.127903	valid_0's l2: 0.0374814
[383]	valid_0's l1: 0.12793	valid_0's l2: 0.0374843
[384]	valid_0's l1: 0.127933	valid_0's l2: 0.03748

[454]	valid_0's l1: 0.127872	valid_0's l2: 0.0375101
[455]	valid_0's l1: 0.12786	valid_0's l2: 0.0375064
[456]	valid_0's l1: 0.12786	valid_0's l2: 0.0375097
[457]	valid_0's l1: 0.127859	valid_0's l2: 0.0375123
[458]	valid_0's l1: 0.127856	valid_0's l2: 0.0375129
[459]	valid_0's l1: 0.127853	valid_0's l2: 0.0375135
[460]	valid_0's l1: 0.127849	valid_0's l2: 0.0375142
[461]	valid_0's l1: 0.127848	valid_0's l2: 0.0375172
[462]	valid_0's l1: 0.127829	valid_0's l2: 0.0375162
[463]	valid_0's l1: 0.127817	valid_0's l2: 0.0375169
[464]	valid_0's l1: 0.127803	valid_0's l2: 0.0375153
[465]	valid_0's l1: 0.127785	valid_0's l2: 0.0375166
[466]	valid_0's l1: 0.127771	valid_0's l2: 0.0375151
[467]	valid_0's l1: 0.127769	valid_0's l2: 0.0375147
[468]	valid_0's l1: 0.127759	valid_0's l2: 0.0375146
[469]	valid_0's l1: 0.127753	valid_0's l2: 0.0375143
[470]	valid_0's l1: 0.127739	valid_0's l2: 0.0375131
[471]	valid_0's l1: 0.127738	valid_0's l2: 0.037512
[472]	valid_0's l1: 0.127737	valid_0's l2: 0.0375

[538]	valid_0's l1: 0.127845	valid_0's l2: 0.0375746
[539]	valid_0's l1: 0.12783	valid_0's l2: 0.0375687
[540]	valid_0's l1: 0.127826	valid_0's l2: 0.0375627
[541]	valid_0's l1: 0.127816	valid_0's l2: 0.0375587
[542]	valid_0's l1: 0.127802	valid_0's l2: 0.0375528
[543]	valid_0's l1: 0.127796	valid_0's l2: 0.0375485
[544]	valid_0's l1: 0.127789	valid_0's l2: 0.0375444
[545]	valid_0's l1: 0.127779	valid_0's l2: 0.0375407
[546]	valid_0's l1: 0.127773	valid_0's l2: 0.0375366
[547]	valid_0's l1: 0.127767	valid_0's l2: 0.0375326
[548]	valid_0's l1: 0.12776	valid_0's l2: 0.0375287
[549]	valid_0's l1: 0.127754	valid_0's l2: 0.0375249
[550]	valid_0's l1: 0.127741	valid_0's l2: 0.0375196
[551]	valid_0's l1: 0.127764	valid_0's l2: 0.0375221
[552]	valid_0's l1: 0.127791	valid_0's l2: 0.0375253
[553]	valid_0's l1: 0.127814	valid_0's l2: 0.0375279
[554]	valid_0's l1: 0.127831	valid_0's l2: 0.0375277
[555]	valid_0's l1: 0.127854	valid_0's l2: 0.0375304
[556]	valid_0's l1: 0.127874	valid_0's l2: 0.037

[602]	valid_0's l1: 0.12808	valid_0's l2: 0.03766
[603]	valid_0's l1: 0.128075	valid_0's l2: 0.0376589
[604]	valid_0's l1: 0.128076	valid_0's l2: 0.0376588
[605]	valid_0's l1: 0.128071	valid_0's l2: 0.0376577
[606]	valid_0's l1: 0.128065	valid_0's l2: 0.0376567
[607]	valid_0's l1: 0.12806	valid_0's l2: 0.0376563
[608]	valid_0's l1: 0.128055	valid_0's l2: 0.0376553
[609]	valid_0's l1: 0.128045	valid_0's l2: 0.037655
[610]	valid_0's l1: 0.12804	valid_0's l2: 0.0376541
[611]	valid_0's l1: 0.128054	valid_0's l2: 0.0376552
[612]	valid_0's l1: 0.12807	valid_0's l2: 0.0376574
[613]	valid_0's l1: 0.128078	valid_0's l2: 0.0376574
[614]	valid_0's l1: 0.128094	valid_0's l2: 0.0376596
[615]	valid_0's l1: 0.128103	valid_0's l2: 0.0376597
[616]	valid_0's l1: 0.128119	valid_0's l2: 0.037662
[617]	valid_0's l1: 0.128129	valid_0's l2: 0.0376622
[618]	valid_0's l1: 0.128136	valid_0's l2: 0.0376621
[619]	valid_0's l1: 0.128149	valid_0's l2: 0.0376632
[620]	valid_0's l1: 0.128156	valid_0's l2: 0.0376627
[

[668]	valid_0's l1: 0.128233	valid_0's l2: 0.0377607
[669]	valid_0's l1: 0.128237	valid_0's l2: 0.0377627
[670]	valid_0's l1: 0.128241	valid_0's l2: 0.0377629
[671]	valid_0's l1: 0.128243	valid_0's l2: 0.0377631
[672]	valid_0's l1: 0.128244	valid_0's l2: 0.0377614
[673]	valid_0's l1: 0.128246	valid_0's l2: 0.0377598
[674]	valid_0's l1: 0.128251	valid_0's l2: 0.0377623
[675]	valid_0's l1: 0.128252	valid_0's l2: 0.0377607
[676]	valid_0's l1: 0.128258	valid_0's l2: 0.0377643
[677]	valid_0's l1: 0.128264	valid_0's l2: 0.0377679
[678]	valid_0's l1: 0.12827	valid_0's l2: 0.0377715
[679]	valid_0's l1: 0.128272	valid_0's l2: 0.0377704
[680]	valid_0's l1: 0.12828	valid_0's l2: 0.0377728
[681]	valid_0's l1: 0.128275	valid_0's l2: 0.03777
[682]	valid_0's l1: 0.128269	valid_0's l2: 0.037768
[683]	valid_0's l1: 0.12827	valid_0's l2: 0.0377666
[684]	valid_0's l1: 0.128264	valid_0's l2: 0.0377646
[685]	valid_0's l1: 0.128258	valid_0's l2: 0.0377626
[686]	valid_0's l1: 0.128262	valid_0's l2: 0.0377606

[737]	valid_0's l1: 0.128139	valid_0's l2: 0.0377064
[738]	valid_0's l1: 0.12814	valid_0's l2: 0.0377061
[739]	valid_0's l1: 0.128143	valid_0's l2: 0.0377099
[740]	valid_0's l1: 0.128144	valid_0's l2: 0.0377097
[741]	valid_0's l1: 0.128125	valid_0's l2: 0.0377071
[742]	valid_0's l1: 0.128108	valid_0's l2: 0.0377049
[743]	valid_0's l1: 0.128089	valid_0's l2: 0.0377027
[744]	valid_0's l1: 0.128073	valid_0's l2: 0.037701
[745]	valid_0's l1: 0.128052	valid_0's l2: 0.0376988
[746]	valid_0's l1: 0.128035	valid_0's l2: 0.0376967
[747]	valid_0's l1: 0.128019	valid_0's l2: 0.0376947
[748]	valid_0's l1: 0.128	valid_0's l2: 0.0376865
[749]	valid_0's l1: 0.127983	valid_0's l2: 0.0376846
[750]	valid_0's l1: 0.127966	valid_0's l2: 0.0376828
[751]	valid_0's l1: 0.127981	valid_0's l2: 0.0376873
[752]	valid_0's l1: 0.127996	valid_0's l2: 0.0376919
[753]	valid_0's l1: 0.128013	valid_0's l2: 0.0376999
[754]	valid_0's l1: 0.128028	valid_0's l2: 0.0377067
[755]	valid_0's l1: 0.128048	valid_0's l2: 0.037714

[807]	valid_0's l1: 0.128495	valid_0's l2: 0.0378694
[808]	valid_0's l1: 0.128485	valid_0's l2: 0.0378701
[809]	valid_0's l1: 0.128476	valid_0's l2: 0.0378707
[810]	valid_0's l1: 0.128475	valid_0's l2: 0.0378734
[811]	valid_0's l1: 0.128462	valid_0's l2: 0.0378678
[812]	valid_0's l1: 0.128456	valid_0's l2: 0.0378642
[813]	valid_0's l1: 0.128441	valid_0's l2: 0.0378584
[814]	valid_0's l1: 0.128429	valid_0's l2: 0.0378529
[815]	valid_0's l1: 0.128424	valid_0's l2: 0.0378488
[816]	valid_0's l1: 0.128418	valid_0's l2: 0.0378478
[817]	valid_0's l1: 0.128415	valid_0's l2: 0.0378461
[818]	valid_0's l1: 0.12841	valid_0's l2: 0.0378421
[819]	valid_0's l1: 0.128402	valid_0's l2: 0.0378384
[820]	valid_0's l1: 0.128406	valid_0's l2: 0.0378383
[821]	valid_0's l1: 0.128418	valid_0's l2: 0.0378377
[822]	valid_0's l1: 0.128436	valid_0's l2: 0.037839
[823]	valid_0's l1: 0.128443	valid_0's l2: 0.0378404
[824]	valid_0's l1: 0.128463	valid_0's l2: 0.0378448
[825]	valid_0's l1: 0.12848	valid_0's l2: 0.0378

[930]	valid_0's l1: 0.128196	valid_0's l2: 0.0378951
[931]	valid_0's l1: 0.1282	valid_0's l2: 0.0378917
[932]	valid_0's l1: 0.128204	valid_0's l2: 0.0378905
[933]	valid_0's l1: 0.128206	valid_0's l2: 0.0378864
[934]	valid_0's l1: 0.128208	valid_0's l2: 0.0378824
[935]	valid_0's l1: 0.128215	valid_0's l2: 0.0378802
[936]	valid_0's l1: 0.128218	valid_0's l2: 0.0378766
[937]	valid_0's l1: 0.128227	valid_0's l2: 0.037874
[938]	valid_0's l1: 0.128226	valid_0's l2: 0.0378729
[939]	valid_0's l1: 0.12823	valid_0's l2: 0.0378697
[940]	valid_0's l1: 0.12823	valid_0's l2: 0.0378687
[941]	valid_0's l1: 0.128261	valid_0's l2: 0.0378767
[942]	valid_0's l1: 0.128291	valid_0's l2: 0.0378839
[943]	valid_0's l1: 0.128317	valid_0's l2: 0.0378854
[944]	valid_0's l1: 0.128342	valid_0's l2: 0.0378869
[945]	valid_0's l1: 0.128358	valid_0's l2: 0.0378875
[946]	valid_0's l1: 0.128388	valid_0's l2: 0.0378947
[947]	valid_0's l1: 0.128415	valid_0's l2: 0.0379016
[948]	valid_0's l1: 0.128439	valid_0's l2: 0.037904

[1062]	valid_0's l1: 0.128941	valid_0's l2: 0.0380919
[1063]	valid_0's l1: 0.128958	valid_0's l2: 0.0380969
[1064]	valid_0's l1: 0.128974	valid_0's l2: 0.038102
[1065]	valid_0's l1: 0.128993	valid_0's l2: 0.0381066
[1066]	valid_0's l1: 0.129011	valid_0's l2: 0.0381117
[1067]	valid_0's l1: 0.129026	valid_0's l2: 0.0381152
[1068]	valid_0's l1: 0.129043	valid_0's l2: 0.0381203
[1069]	valid_0's l1: 0.129061	valid_0's l2: 0.0381255
[1070]	valid_0's l1: 0.129079	valid_0's l2: 0.0381306
[1071]	valid_0's l1: 0.129081	valid_0's l2: 0.0381333
[1072]	valid_0's l1: 0.129101	valid_0's l2: 0.0381385
[1073]	valid_0's l1: 0.129094	valid_0's l2: 0.0381392
[1074]	valid_0's l1: 0.129085	valid_0's l2: 0.0381402
[1075]	valid_0's l1: 0.129087	valid_0's l2: 0.0381429
[1076]	valid_0's l1: 0.129077	valid_0's l2: 0.038144
[1077]	valid_0's l1: 0.129072	valid_0's l2: 0.038145
[1078]	valid_0's l1: 0.129107	valid_0's l2: 0.0381517
[1079]	valid_0's l1: 0.129113	valid_0's l2: 0.0381548
[1080]	valid_0's l1: 0.129116	v

[1128]	valid_0's l1: 0.129616	valid_0's l2: 0.0383374
[1129]	valid_0's l1: 0.129623	valid_0's l2: 0.0383413
[1130]	valid_0's l1: 0.129633	valid_0's l2: 0.0383469
[1131]	valid_0's l1: 0.12963	valid_0's l2: 0.0383496
[1132]	valid_0's l1: 0.12963	valid_0's l2: 0.0383522
[1133]	valid_0's l1: 0.129632	valid_0's l2: 0.0383561
[1134]	valid_0's l1: 0.129636	valid_0's l2: 0.0383619
[1135]	valid_0's l1: 0.129638	valid_0's l2: 0.0383659
[1136]	valid_0's l1: 0.12963	valid_0's l2: 0.0383668
[1137]	valid_0's l1: 0.129622	valid_0's l2: 0.0383671
[1138]	valid_0's l1: 0.129604	valid_0's l2: 0.0383684
[1139]	valid_0's l1: 0.129606	valid_0's l2: 0.0383724
[1140]	valid_0's l1: 0.129609	valid_0's l2: 0.0383764
[1141]	valid_0's l1: 0.129587	valid_0's l2: 0.0383712
[1142]	valid_0's l1: 0.129565	valid_0's l2: 0.0383663
[1143]	valid_0's l1: 0.129539	valid_0's l2: 0.0383604
[1144]	valid_0's l1: 0.129528	valid_0's l2: 0.0383572
[1145]	valid_0's l1: 0.12952	valid_0's l2: 0.0383579
[1146]	valid_0's l1: 0.1295	vali

[1193]	valid_0's l1: 0.129577	valid_0's l2: 0.0383645
[1194]	valid_0's l1: 0.129579	valid_0's l2: 0.0383619
[1195]	valid_0's l1: 0.129574	valid_0's l2: 0.0383564
[1196]	valid_0's l1: 0.129573	valid_0's l2: 0.038352
[1197]	valid_0's l1: 0.129568	valid_0's l2: 0.0383467
[1198]	valid_0's l1: 0.129569	valid_0's l2: 0.0383442
[1199]	valid_0's l1: 0.129576	valid_0's l2: 0.0383423
[1200]	valid_0's l1: 0.129578	valid_0's l2: 0.0383394
[1201]	valid_0's l1: 0.129555	valid_0's l2: 0.0383409
[1202]	valid_0's l1: 0.129534	valid_0's l2: 0.0383417
[1203]	valid_0's l1: 0.129511	valid_0's l2: 0.0383432
[1204]	valid_0's l1: 0.129487	valid_0's l2: 0.0383398
[1205]	valid_0's l1: 0.129464	valid_0's l2: 0.0383385
[1206]	valid_0's l1: 0.129441	valid_0's l2: 0.0383401
[1207]	valid_0's l1: 0.129419	valid_0's l2: 0.0383418
[1208]	valid_0's l1: 0.129398	valid_0's l2: 0.038343
[1209]	valid_0's l1: 0.129376	valid_0's l2: 0.0383448
[1210]	valid_0's l1: 0.129359	valid_0's l2: 0.0383473
[1211]	valid_0's l1: 0.129372	

[1257]	valid_0's l1: 0.12922	valid_0's l2: 0.0383253
[1258]	valid_0's l1: 0.129218	valid_0's l2: 0.038323
[1259]	valid_0's l1: 0.129215	valid_0's l2: 0.038322
[1260]	valid_0's l1: 0.129214	valid_0's l2: 0.0383198
[1261]	valid_0's l1: 0.129209	valid_0's l2: 0.0383194
[1262]	valid_0's l1: 0.129206	valid_0's l2: 0.0383181
[1263]	valid_0's l1: 0.129199	valid_0's l2: 0.0383153
[1264]	valid_0's l1: 0.12919	valid_0's l2: 0.0383122
[1265]	valid_0's l1: 0.129187	valid_0's l2: 0.038311
[1266]	valid_0's l1: 0.129184	valid_0's l2: 0.0383099
[1267]	valid_0's l1: 0.129175	valid_0's l2: 0.038307
[1268]	valid_0's l1: 0.129172	valid_0's l2: 0.0383059
[1269]	valid_0's l1: 0.12917	valid_0's l2: 0.0383049
[1270]	valid_0's l1: 0.129167	valid_0's l2: 0.0383037
[1271]	valid_0's l1: 0.129144	valid_0's l2: 0.0383015
[1272]	valid_0's l1: 0.129132	valid_0's l2: 0.0383007
[1273]	valid_0's l1: 0.129109	valid_0's l2: 0.0382986
[1274]	valid_0's l1: 0.129092	valid_0's l2: 0.0382976
[1275]	valid_0's l1: 0.129075	valid

In [21]:
print("Profanity Results")
print("================")
print("[r2_score, mean_absolute_error, model]")
print("================")
for model in [lr_results, gbm_results, svr_results, en_results]:
    print(model)

Profanity Results
[r2_score, mean_absolute_error, model]
(-0.5004, 0.1062, LinearRegression())
(-39.1523, 0.1281, LGBMRegressor(bagging_fraction=0.7, bagging_freq=10, feature_fraction=0.9,
              learning_rate=0.005, max_bin=512, max_depth=8,
              metric=['l1', 'l2'], num_iterations=100000, num_leaves=128,
              objective='regression', task='train', verbose=0))
(-1.8409, 0.1287, SVR(kernel='linear'))
(-5.170404951616488e+31, 0.1313, ElasticNet(random_state=0))


### Sexually Explicit

In [22]:
category = 'SEXUALLY_EXPLICIT'

lr_results = LinearRegression(category)
gbm_results = LightGBM(category)
svr_results = SVR(category)
en_results = ElasticNet(category)



You can set `force_col_wise=true` to remove the overhead.
[1]	valid_0's l1: 0.106153	valid_0's l2: 0.0288719
[2]	valid_0's l1: 0.106149	valid_0's l2: 0.0288639
[3]	valid_0's l1: 0.106151	valid_0's l2: 0.0288569
[4]	valid_0's l1: 0.10616	valid_0's l2: 0.0288494
[5]	valid_0's l1: 0.106159	valid_0's l2: 0.0288407
[6]	valid_0's l1: 0.106165	valid_0's l2: 0.0288342
[7]	valid_0's l1: 0.106165	valid_0's l2: 0.0288269
[8]	valid_0's l1: 0.106171	valid_0's l2: 0.02882
[9]	valid_0's l1: 0.106177	valid_0's l2: 0.0288132
[10]	valid_0's l1: 0.106185	valid_0's l2: 0.0288098
[11]	valid_0's l1: 0.106213	valid_0's l2: 0.0288026
[12]	valid_0's l1: 0.106242	valid_0's l2: 0.0287952
[13]	valid_0's l1: 0.10627	valid_0's l2: 0.028788
[14]	valid_0's l1: 0.106276	valid_0's l2: 0.0287849
[15]	valid_0's l1: 0.106303	valid_0's l2: 0.0287778
[16]	valid_0's l1: 0.106333	valid_0's l2: 0.028772
[17]	valid_0's l1: 0.106362	valid_0's l2: 0.0287654
[18]	valid_0's l1: 0.106394	valid_0's l2: 0.0287623
[19]	valid_0's l1: 0.

[85]	valid_0's l1: 0.106574	valid_0's l2: 0.0285565
[86]	valid_0's l1: 0.106574	valid_0's l2: 0.0285494
[87]	valid_0's l1: 0.10657	valid_0's l2: 0.0285433
[88]	valid_0's l1: 0.106575	valid_0's l2: 0.0285375
[89]	valid_0's l1: 0.106574	valid_0's l2: 0.0285302
[90]	valid_0's l1: 0.106572	valid_0's l2: 0.0285228
[91]	valid_0's l1: 0.106582	valid_0's l2: 0.0285219
[92]	valid_0's l1: 0.106592	valid_0's l2: 0.0285253
[93]	valid_0's l1: 0.106605	valid_0's l2: 0.0285262
[94]	valid_0's l1: 0.106619	valid_0's l2: 0.0285266
[95]	valid_0's l1: 0.106629	valid_0's l2: 0.0285286
[96]	valid_0's l1: 0.106638	valid_0's l2: 0.0285321
[97]	valid_0's l1: 0.106651	valid_0's l2: 0.0285331
[98]	valid_0's l1: 0.10666	valid_0's l2: 0.0285367
[99]	valid_0's l1: 0.106672	valid_0's l2: 0.0285379
[100]	valid_0's l1: 0.106681	valid_0's l2: 0.0285416
[101]	valid_0's l1: 0.106667	valid_0's l2: 0.028538
[102]	valid_0's l1: 0.10665	valid_0's l2: 0.0285351
[103]	valid_0's l1: 0.106632	valid_0's l2: 0.0285299
[104]	valid_

[211]	valid_0's l1: 0.106768	valid_0's l2: 0.0285237
[212]	valid_0's l1: 0.106765	valid_0's l2: 0.028521
[213]	valid_0's l1: 0.106761	valid_0's l2: 0.0285183
[214]	valid_0's l1: 0.106758	valid_0's l2: 0.0285157
[215]	valid_0's l1: 0.106748	valid_0's l2: 0.0285129
[216]	valid_0's l1: 0.106738	valid_0's l2: 0.0285101
[217]	valid_0's l1: 0.106755	valid_0's l2: 0.0285146
[218]	valid_0's l1: 0.106745	valid_0's l2: 0.0285119
[219]	valid_0's l1: 0.106735	valid_0's l2: 0.0285093
[220]	valid_0's l1: 0.106744	valid_0's l2: 0.028512
[221]	valid_0's l1: 0.106762	valid_0's l2: 0.0285156
[222]	valid_0's l1: 0.106772	valid_0's l2: 0.0285181
[223]	valid_0's l1: 0.106788	valid_0's l2: 0.0285233
[224]	valid_0's l1: 0.1068	valid_0's l2: 0.0285251
[225]	valid_0's l1: 0.106811	valid_0's l2: 0.0285269
[226]	valid_0's l1: 0.106832	valid_0's l2: 0.0285304
[227]	valid_0's l1: 0.106844	valid_0's l2: 0.0285331
[228]	valid_0's l1: 0.106856	valid_0's l2: 0.0285359
[229]	valid_0's l1: 0.106866	valid_0's l2: 0.02853

[335]	valid_0's l1: 0.106635	valid_0's l2: 0.0285785
[336]	valid_0's l1: 0.106626	valid_0's l2: 0.0285795
[337]	valid_0's l1: 0.106606	valid_0's l2: 0.028578
[338]	valid_0's l1: 0.106605	valid_0's l2: 0.0285815
[339]	valid_0's l1: 0.106595	valid_0's l2: 0.0285824
[340]	valid_0's l1: 0.106586	valid_0's l2: 0.0285835
[341]	valid_0's l1: 0.106583	valid_0's l2: 0.0285826
[342]	valid_0's l1: 0.106588	valid_0's l2: 0.0285832
[343]	valid_0's l1: 0.106585	valid_0's l2: 0.0285826
[344]	valid_0's l1: 0.106582	valid_0's l2: 0.0285818
[345]	valid_0's l1: 0.106587	valid_0's l2: 0.0285825
[346]	valid_0's l1: 0.106591	valid_0's l2: 0.0285828
[347]	valid_0's l1: 0.106598	valid_0's l2: 0.0285834
[348]	valid_0's l1: 0.106599	valid_0's l2: 0.0285837
[349]	valid_0's l1: 0.1066	valid_0's l2: 0.0285821
[350]	valid_0's l1: 0.106598	valid_0's l2: 0.0285815
[351]	valid_0's l1: 0.106615	valid_0's l2: 0.0285869
[352]	valid_0's l1: 0.106633	valid_0's l2: 0.0285898
[353]	valid_0's l1: 0.106651	valid_0's l2: 0.0285

[468]	valid_0's l1: 0.106665	valid_0's l2: 0.0287473
[469]	valid_0's l1: 0.106653	valid_0's l2: 0.0287476
[470]	valid_0's l1: 0.106633	valid_0's l2: 0.0287466
[471]	valid_0's l1: 0.106624	valid_0's l2: 0.0287471
[472]	valid_0's l1: 0.106615	valid_0's l2: 0.0287477
[473]	valid_0's l1: 0.106603	valid_0's l2: 0.0287479
[474]	valid_0's l1: 0.106595	valid_0's l2: 0.0287478
[475]	valid_0's l1: 0.10659	valid_0's l2: 0.0287481
[476]	valid_0's l1: 0.106583	valid_0's l2: 0.0287488
[477]	valid_0's l1: 0.106575	valid_0's l2: 0.0287496
[478]	valid_0's l1: 0.106571	valid_0's l2: 0.02875
[479]	valid_0's l1: 0.106566	valid_0's l2: 0.0287511
[480]	valid_0's l1: 0.106555	valid_0's l2: 0.0287509
[481]	valid_0's l1: 0.106575	valid_0's l2: 0.0287513
[482]	valid_0's l1: 0.106601	valid_0's l2: 0.0287538
[483]	valid_0's l1: 0.106628	valid_0's l2: 0.0287564
[484]	valid_0's l1: 0.106647	valid_0's l2: 0.0287574
[485]	valid_0's l1: 0.106661	valid_0's l2: 0.028757
[486]	valid_0's l1: 0.106681	valid_0's l2: 0.02875

[533]	valid_0's l1: 0.106667	valid_0's l2: 0.0288
[534]	valid_0's l1: 0.106667	valid_0's l2: 0.0287991
[535]	valid_0's l1: 0.106672	valid_0's l2: 0.0287962
[536]	valid_0's l1: 0.106683	valid_0's l2: 0.0287945
[537]	valid_0's l1: 0.106694	valid_0's l2: 0.0287928
[538]	valid_0's l1: 0.10669	valid_0's l2: 0.0287913
[539]	valid_0's l1: 0.106696	valid_0's l2: 0.0287903
[540]	valid_0's l1: 0.106707	valid_0's l2: 0.0287888
[541]	valid_0's l1: 0.106707	valid_0's l2: 0.0287833
[542]	valid_0's l1: 0.10671	valid_0's l2: 0.0287844
[543]	valid_0's l1: 0.106717	valid_0's l2: 0.0287856
[544]	valid_0's l1: 0.106724	valid_0's l2: 0.0287865
[545]	valid_0's l1: 0.10673	valid_0's l2: 0.0287879
[546]	valid_0's l1: 0.106735	valid_0's l2: 0.028789
[547]	valid_0's l1: 0.106743	valid_0's l2: 0.0287883
[548]	valid_0's l1: 0.106749	valid_0's l2: 0.0287895
[549]	valid_0's l1: 0.106752	valid_0's l2: 0.0287844
[550]	valid_0's l1: 0.106758	valid_0's l2: 0.0287857
[551]	valid_0's l1: 0.106778	valid_0's l2: 0.0287913


[598]	valid_0's l1: 0.106986	valid_0's l2: 0.0288934
[599]	valid_0's l1: 0.106992	valid_0's l2: 0.0288976
[600]	valid_0's l1: 0.106987	valid_0's l2: 0.0288995
[601]	valid_0's l1: 0.106985	valid_0's l2: 0.0288994
[602]	valid_0's l1: 0.106984	valid_0's l2: 0.0288988
[603]	valid_0's l1: 0.106976	valid_0's l2: 0.0288963
[604]	valid_0's l1: 0.106982	valid_0's l2: 0.0288967
[605]	valid_0's l1: 0.106976	valid_0's l2: 0.0288936
[606]	valid_0's l1: 0.10697	valid_0's l2: 0.0288906
[607]	valid_0's l1: 0.106965	valid_0's l2: 0.0288888
[608]	valid_0's l1: 0.106959	valid_0's l2: 0.0288875
[609]	valid_0's l1: 0.106953	valid_0's l2: 0.0288861
[610]	valid_0's l1: 0.106946	valid_0's l2: 0.0288834
[611]	valid_0's l1: 0.106958	valid_0's l2: 0.0288848
[612]	valid_0's l1: 0.106972	valid_0's l2: 0.0288871
[613]	valid_0's l1: 0.106987	valid_0's l2: 0.0288895
[614]	valid_0's l1: 0.106998	valid_0's l2: 0.0288913
[615]	valid_0's l1: 0.107008	valid_0's l2: 0.0288926
[616]	valid_0's l1: 0.107024	valid_0's l2: 0.02

[722]	valid_0's l1: 0.10775	valid_0's l2: 0.029017
[723]	valid_0's l1: 0.107753	valid_0's l2: 0.0290178
[724]	valid_0's l1: 0.107759	valid_0's l2: 0.0290187
[725]	valid_0's l1: 0.107767	valid_0's l2: 0.0290211
[726]	valid_0's l1: 0.107772	valid_0's l2: 0.029021
[727]	valid_0's l1: 0.107775	valid_0's l2: 0.029022
[728]	valid_0's l1: 0.107778	valid_0's l2: 0.029023
[729]	valid_0's l1: 0.107781	valid_0's l2: 0.0290237
[730]	valid_0's l1: 0.107782	valid_0's l2: 0.0290217
[731]	valid_0's l1: 0.107769	valid_0's l2: 0.029022
[732]	valid_0's l1: 0.107761	valid_0's l2: 0.0290226
[733]	valid_0's l1: 0.107751	valid_0's l2: 0.0290245
[734]	valid_0's l1: 0.107741	valid_0's l2: 0.0290264
[735]	valid_0's l1: 0.107728	valid_0's l2: 0.0290278
[736]	valid_0's l1: 0.107718	valid_0's l2: 0.0290289
[737]	valid_0's l1: 0.107714	valid_0's l2: 0.0290301
[738]	valid_0's l1: 0.107701	valid_0's l2: 0.0290316
[739]	valid_0's l1: 0.107697	valid_0's l2: 0.0290348
[740]	valid_0's l1: 0.107686	valid_0's l2: 0.0290363

[847]	valid_0's l1: 0.108261	valid_0's l2: 0.0292552
[848]	valid_0's l1: 0.108256	valid_0's l2: 0.0292542
[849]	valid_0's l1: 0.108252	valid_0's l2: 0.0292527
[850]	valid_0's l1: 0.10825	valid_0's l2: 0.0292524
[851]	valid_0's l1: 0.108248	valid_0's l2: 0.0292534
[852]	valid_0's l1: 0.108246	valid_0's l2: 0.0292541
[853]	valid_0's l1: 0.108244	valid_0's l2: 0.0292551
[854]	valid_0's l1: 0.108242	valid_0's l2: 0.0292561
[855]	valid_0's l1: 0.108242	valid_0's l2: 0.0292573
[856]	valid_0's l1: 0.10824	valid_0's l2: 0.0292583
[857]	valid_0's l1: 0.10824	valid_0's l2: 0.0292592
[858]	valid_0's l1: 0.108235	valid_0's l2: 0.0292596
[859]	valid_0's l1: 0.108235	valid_0's l2: 0.0292608
[860]	valid_0's l1: 0.108235	valid_0's l2: 0.0292614
[861]	valid_0's l1: 0.10822	valid_0's l2: 0.0292585
[862]	valid_0's l1: 0.108193	valid_0's l2: 0.0292543
[863]	valid_0's l1: 0.108172	valid_0's l2: 0.029253
[864]	valid_0's l1: 0.108151	valid_0's l2: 0.0292496
[865]	valid_0's l1: 0.10814	valid_0's l2: 0.0292481

[966]	valid_0's l1: 0.108353	valid_0's l2: 0.0294186
[967]	valid_0's l1: 0.108359	valid_0's l2: 0.029419
[968]	valid_0's l1: 0.108372	valid_0's l2: 0.0294221
[969]	valid_0's l1: 0.10838	valid_0's l2: 0.0294231
[970]	valid_0's l1: 0.10839	valid_0's l2: 0.0294249
[971]	valid_0's l1: 0.108407	valid_0's l2: 0.029426
[972]	valid_0's l1: 0.108413	valid_0's l2: 0.0294248
[973]	valid_0's l1: 0.108432	valid_0's l2: 0.0294263
[974]	valid_0's l1: 0.108437	valid_0's l2: 0.0294251
[975]	valid_0's l1: 0.108451	valid_0's l2: 0.0294254
[976]	valid_0's l1: 0.108459	valid_0's l2: 0.0294247
[977]	valid_0's l1: 0.108473	valid_0's l2: 0.0294254
[978]	valid_0's l1: 0.108485	valid_0's l2: 0.0294258
[979]	valid_0's l1: 0.108496	valid_0's l2: 0.0294272
[980]	valid_0's l1: 0.108509	valid_0's l2: 0.0294276
[981]	valid_0's l1: 0.108504	valid_0's l2: 0.029423
[982]	valid_0's l1: 0.108496	valid_0's l2: 0.0294202
[983]	valid_0's l1: 0.108489	valid_0's l2: 0.0294175
[984]	valid_0's l1: 0.108482	valid_0's l2: 0.029414

In [23]:
print("Sexually Explicit Results")
print("================")
print("[r2_score, mean_absolute_error, model]")
print("================")
for model in [lr_results, gbm_results, svr_results, en_results]:
    print(model)

Sexually Explicit Results
[r2_score, mean_absolute_error, model]
(-0.3737, 0.0969, LinearRegression())
(-118063.8676, 0.1061, LGBMRegressor(bagging_fraction=0.7, bagging_freq=10, feature_fraction=0.9,
              learning_rate=0.005, max_bin=512, max_depth=8,
              metric=['l1', 'l2'], num_iterations=100000, num_leaves=128,
              objective='regression', task='train', verbose=0))
(-1.8407, 0.119, SVR(kernel='linear'))
(-3.7488045902794363e+31, 0.1062, ElasticNet(random_state=0))
