In [1]:
from texture.datasets import Doc2DocDataset, DocClassifierDataset
from texture.tasks import MultiTaskModel
import torch

# To-Do List
* Deduplicate near-identical entries: "tv" vs. "television", "language" vs. "languages"
* Add sports, animals, nature, country, tourism

In [2]:
m = MultiTaskModel()


def _doc2doc_pair(train_tsv, test_tsv):
    """Return the (train, test) Doc2DocDataset pair, both built with ``m.doc_vocab``."""
    return (
        Doc2DocDataset(train_tsv, m.doc_vocab),
        Doc2DocDataset(test_tsv, m.doc_vocab),
    )


def _classifier_pair(labels_tsv, train_tsv, test_tsv):
    """Return the (train, test) DocClassifierDataset pair.

    Both datasets are given the same labels file and ``m.doc_vocab``;
    only the examples file differs between the two.
    """
    return (
        DocClassifierDataset(labels_tsv, train_tsv, m.doc_vocab),
        DocClassifierDataset(labels_tsv, test_tsv, m.doc_vocab),
    )


# --- document-to-document tasks ---------------------------------------------
m.add_doc2doc_task(
    "title_embedding",
    *_doc2doc_pair(
        "./data/wikipedia/title_content_train.tsv",
        "./data/wikipedia/title_content_test.tsv"))

m.add_doc2doc_task(
    "answer_embedding",
    *_doc2doc_pair(
        "./data/jeopardy/jeopardy_train.tsv",
        "./data/jeopardy/jeopardy_test.tsv"))

# --- document classification tasks ------------------------------------------
# Each call stays a top-level expression statement (not a loop body) so the
# notebook still treats the final call as the cell's last expression.
m.add_doc_classification_task(
    "offensive_classification",
    *_classifier_pair(
        "./data/offensive/labels.tsv",
        "./data/offensive/queries_train.tsv",
        "./data/offensive/queries_test.tsv"))

m.add_doc_classification_task(
    "topic_tagging",
    *_classifier_pair(
        "./data/delicious/labels.tsv",
        "./data/delicious/title_labels_train.tsv",
        "./data/delicious/title_labels_test.tsv"))

m.add_doc_classification_task(
    "hate_speech",
    *_classifier_pair(
        "./data/hate/labels.tsv",
        "./data/hate/hate_train.tsv",
        "./data/hate/hate_test.tsv"))

Doc2DocModule(
  (input_encoder): DocEmbedding(
    (lang_embed): Embedding(50, 64, max_norm=1.0, sparse=True)
    (break_embed): Embedding(4, 8, max_norm=1.0, sparse=True)
    (caps_embed): Embedding(4, 8, max_norm=1.0, sparse=True)
    (text_embed): Embedding(1000000, 512, padding_idx=0, max_norm=1.0, sparse=True)
    (toks_layer): Linear(in_features=528, out_features=512)
    (phrase_dropout): Dropout(p=0.5)
    (phrase_PReLU): PReLU(num_parameters=1)
    (docs_layer): Linear(in_features=576, out_features=512)
  )
  (input_transformer): Linear(in_features=512, out_features=512)
  (output_encoder): DocEmbedding(
    (lang_embed): Embedding(50, 64, max_norm=1.0, sparse=True)
    (break_embed): Embedding(4, 8, max_norm=1.0, sparse=True)
    (caps_embed): Embedding(4, 8, max_norm=1.0, sparse=True)
    (text_embed): Embedding(1000000, 512, padding_idx=0, max_norm=1.0, sparse=True)
    (toks_layer): Linear(in_features=528, out_features=512)
    (phrase_dropout): Dropout(p=0.5)
    (phrase

In [3]:
# Load saved model data from the relative directory `model_data/latest_512/`.
# The call logs one "Loading <task>" line per registered task (see the output
# below), so the path is resolved against the notebook's working directory.
# NOTE(review): presumably every task registered on `m` needs matching saved
# data under this directory — confirm against MultiTaskModel.load_model.
m.load_model("model_data/latest_512/")

Loading title_embedding
Loading answer_embedding
Loading offensive_classification
Loading topic_tagging
Loading hate_speech


In [4]:
# Kick off training for the tasks registered on `m`; the output below shows
# interleaved progress lines for all five of them.
# NOTE(review): `wait=False` presumably makes this call return without
# blocking on training — confirm against MultiTaskModel.train.
# Log lines have the form `<task> (<step>, <float>, <float>)`; the two floats
# look like train/test losses, but that is an assumption to verify.
m.train(wait=False)

offensive_classification (100, 0.2752335978671908, 0.35778034318238494)
topic_tagging (100, 2.200085091590881, 2.1599194550514222)
hate_speech (100, 0.13582995053380728, 0.4977792777121067)
offensive_classification (200, 0.28521821377798917, 0.36916599474847317)
topic_tagging (200, 2.1976747769117355, 2.1608505558967592)
hate_speech (200, 0.1463711972720921, 0.4709086456894875)
offensive_classification (300, 0.3006052066323658, 0.3694709554190437)
answer_embedding (100, 0.0, 0.00010641160909472092)
topic_tagging (300, 2.173438890973727, 2.155319709777832)
hate_speech (300, 0.16026853440639874, 0.47276348709439237)
offensive_classification (400, 0.29435760222841056, 0.36278827757574617)
topic_tagging (400, 2.1701993606984615, 2.1601135578751562)
hate_speech (400, 0.16049970496213065, 0.4726781690539792)
title_embedding (100, 0.00015726206824183463, 3.515650983189289e-05)
offensive_classification (500, 0.29291106079518797, 0.3705348996892571)
topic_tagging (500, 2.1633632897138595, 2.160

topic_tagging (3600, 2.149901713848114, 2.1562069003582)
offensive_classification (3900, 0.3038358562961221, 0.37062725687026976)
answer_embedding (1300, 0.008116892485633277, 0.0001322900739451498)
hate_speech (3600, 0.16201601014565675, 0.47572497494798155)
title_embedding (800, 0.006617607064521829, 0.0020599957994268765)
topic_tagging (3700, 2.155380511522293, 2.1540406597852706)
offensive_classification (4000, 0.3096102091036737, 0.37105487218871713)
hate_speech (3700, 0.1630569616127759, 0.4795358222331852)
topic_tagging (3800, 2.1628898859024046, 2.154575447320938)
offensive_classification (4100, 0.30970837876945734, 0.37085193011537193)
hate_speech (3800, 0.16405074606463313, 0.477798917863518)
topic_tagging (3900, 2.1548233711719513, 2.1562673637866974)
offensive_classification (4200, 0.2982312764208764, 0.37335560920462013)
answer_embedding (1400, 0.00402766832029925, 0.00012789162741505322)
topic_tagging (4000, 2.163664755821228, 2.1584962186813352)
hate_speech (3900, 0.1630

hate_speech (6900, 0.1598182831266895, 0.4708953531207517)
offensive_classification (7500, 0.3156533311791718, 0.3685567750129849)
topic_tagging (7200, 2.1800651724338533, 2.1538913789987566)
hate_speech (7000, 0.1641987740304321, 0.4703619961515069)
offensive_classification (7600, 0.3125797169171274, 0.37062214003503324)
topic_tagging (7300, 2.182811352491379, 2.1566269619464875)
answer_embedding (2600, 0.003616326703069647, 9.393442016772102e-05)
hate_speech (7100, 0.16474975075758994, 0.4747729689851403)
offensive_classification (7700, 0.3097819184996188, 0.36841290004178884)
title_embedding (1600, 0.014411804676664374, 0.004110202491407456)
topic_tagging (7400, 2.169152160406113, 2.1551764291524886)
offensive_classification (7800, 0.3054330850802362, 0.36995546332374213)
hate_speech (7200, 0.1618371416144073, 0.46976622274983676)
topic_tagging (7500, 2.1703873488903045, 2.156182577729225)
offensive_classification (7900, 0.29831476728990675, 0.3684125363752246)
hate_speech (7300, 0.

title_embedding (2300, 0.011884969906846798, 0.004941535931902459)
offensive_classification (11200, 0.3094622120708227, 0.36962425147742034)
topic_tagging (10800, 2.1666626931428907, 2.1509264415502547)
answer_embedding (3800, 0.006472981699361158, 0.0014271877866323948)
offensive_classification (11300, 0.30720235626772047, 0.3670752235166729)
hate_speech (10300, 0.1661926252199337, 0.4726174551099539)
topic_tagging (10900, 2.1663267509937287, 2.15188439643383)
offensive_classification (11400, 0.3073185682054609, 0.3675756349749863)
hate_speech (10400, 0.1677717514531687, 0.4702060977788642)
topic_tagging (11000, 2.155299067854881, 2.1554286984205246)
offensive_classification (11500, 0.31079369687475267, 0.36745337963476776)
hate_speech (10500, 0.16485801998432725, 0.468794731345959)
answer_embedding (3900, 0.008034363525701301, 0.0014396500751826125)
offensive_classification (11600, 0.3126533259022981, 0.36926188483461736)
topic_tagging (11100, 2.151448705077171, 2.154451515555382)
ha

answer_embedding (5000, 0.005903036778770317, 0.0009013504896772098)
hate_speech (13400, 0.16802191724907606, 0.46924851995613426)
offensive_classification (15000, 0.31441679188609123, 0.3698551340866834)
topic_tagging (14300, 2.186197807431221, 2.1515809291601182)
hate_speech (13500, 0.16502064598258584, 0.4689200028879568)
offensive_classification (15100, 0.313313816793263, 0.36976561179198325)
topic_tagging (14400, 2.189738406419754, 2.1536105132102965)
hate_speech (13600, 0.16323315501678734, 0.46668797822948543)
offensive_classification (15200, 0.3146341502480209, 0.36821920130588115)
answer_embedding (5100, 0.006564745348200734, 0.0009014800261441622)
topic_tagging (14500, 2.183231855392456, 2.1527278275489805)
offensive_classification (15300, 0.3110458851531148, 0.3701896698269993)
hate_speech (13700, 0.16394593319064008, 0.4667296401085332)
title_embedding (3100, 0.00139360994171615, 0.0019097739948587078)
offensive_classification (15400, 0.3044290616102517, 0.367115726897493)


topic_tagging (17800, 2.1824084615707395, 2.1539759212732315)
answer_embedding (6200, 0.009769674659826517, 0.001614697830837878)
offensive_classification (18700, 0.3051500251032412, 0.3704289921410382)
hate_speech (16800, 0.1617199387969449, 0.4694915871331468)
topic_tagging (17900, 2.177040667116642, 2.157457383990288)
offensive_classification (18800, 0.3055203719120473, 0.3670030624456704)
hate_speech (16900, 0.15678635582793504, 0.46822660097386687)
topic_tagging (18000, 2.169976995885372, 2.15693929374218)
offensive_classification (18900, 0.3096648626308888, 0.36853075421229003)
title_embedding (3800, 0.0032910478915101644, 0.0026385871621678633)
hate_speech (17000, 0.15939191898796706, 0.4675443069031462)
answer_embedding (6300, 0.009415387339078485, 0.0016154532055423728)
topic_tagging (18100, 2.165211108148098, 2.159143750309944)
offensive_classification (19000, 0.30796684238500893, 0.36662237483076754)
hate_speech (17100, 0.1612131471009925, 0.4628446639319882)
topic_tagging (

topic_tagging (21300, 2.1737714489102364, 2.157955204129219)
hate_speech (20100, 0.16203031982854008, 0.4678200207538903)
title_embedding (4500, 0.0021829561695481162, 0.002903361873426182)
offensive_classification (22400, 0.29288884284347294, 0.3679971720036119)
topic_tagging (21400, 2.175842346727848, 2.155497883439064)
hate_speech (20200, 0.15893555088713765, 0.4662638076748699)
offensive_classification (22500, 0.3011291140243411, 0.3684398089442402)
topic_tagging (21500, 2.177907934486866, 2.1561089265346527)
answer_embedding (7500, 0.0065847054288948395, 0.002068989430315061)
offensive_classification (22600, 0.30879077917709946, 0.3688482387829572)
hate_speech (20300, 0.16231650223396718, 0.46382610278017816)
topic_tagging (21600, 2.172985918343067, 2.1554764119386673)
offensive_classification (22700, 0.3116874535754323, 0.36760769062303006)
hate_speech (20400, 0.16594716413132846, 0.4671075912937522)
topic_tagging (21700, 2.172341975390911, 2.1574740059375763)
offensive_classific

offensive_classification (26000, 0.2928419825527817, 0.37147751222364606)
hate_speech (23400, 0.1649509374788031, 0.4630768973864615)
topic_tagging (24900, 2.1336583322882654, 2.1555203582048414)
offensive_classification (26100, 0.28340920857526364, 0.3707345041837543)
hate_speech (23500, 0.1651472712298855, 0.4683913486450911)
topic_tagging (25000, 2.1350369423031808, 2.154915784358978)
offensive_classification (26200, 0.29222087892331183, 0.37304103122465315)
answer_embedding (8700, 0.008622934299846077, 0.002484652261574671)
topic_tagging (25100, 2.1376851359009743, 2.1578493411540984)
hate_speech (23600, 0.16135006509069352, 0.4685755140371621)
offensive_classification (26300, 0.2882648595701903, 0.3706368254777044)
topic_tagging (25200, 2.1430213246941565, 2.15948071539402)
title_embedding (5300, 0.0005360529641285634, 0.0017824644360553527)
offensive_classification (26400, 0.284875011684373, 0.3718603924456984)
hate_speech (23700, 0.16472413108777254, 0.4665870828675106)
topic_ta

offensive_classification (29800, 0.3075824235845357, 0.3705457953363657)
hate_speech (26600, 0.16668953408580273, 0.4733675545128062)
topic_tagging (28500, 2.1647827226519585, 2.160776441335678)
offensive_classification (29900, 0.31048799507692454, 0.36944813761115075)
hate_speech (26700, 0.16672392618004234, 0.47300246522482486)
title_embedding (6000, 1.5239086211730423e-05, 0.0016924740901819097)
offensive_classification (30000, 0.30707106275111434, 0.369168044231832)
topic_tagging (28600, 2.165578574359417, 2.1605790266990663)
answer_embedding (9900, 0.009304159333494063, 0.0026448339207622777)
offensive_classification (30100, 0.3100097400918603, 0.3688728286195546)
hate_speech (26800, 0.16813268810603768, 0.47085325730219485)
topic_tagging (28700, 2.1731706214547155, 2.158576914072037)
offensive_classification (30200, 0.3108792911022902, 0.3707105754148215)
hate_speech (26900, 0.16320092569757252, 0.47090830688271673)
topic_tagging (28800, 2.169216100513935, 2.1589389419555665)
off

title_embedding (6700, 0.0008587209444074335, 0.0017719364546058011)
topic_tagging (31900, 2.1477422339320182, 2.1563835631608965)
hate_speech (29900, 0.16277907500229777, 0.46447880803048613)
offensive_classification (33600, 0.30502225874364375, 0.3684753715954721)
topic_tagging (32000, 2.146263943135738, 2.151205974817276)
hate_speech (30000, 0.16536148769408465, 0.4648178242025897)
offensive_classification (33700, 0.30972021451592446, 0.369165937256068)
topic_tagging (32100, 2.1526360747218134, 2.1529098864793776)
answer_embedding (11100, 0.01189474589381395, 0.0010585876308880247)
offensive_classification (33800, 0.30921288718283174, 0.36700311298295857)
hate_speech (30100, 0.16474528014007955, 0.46889323528204113)
topic_tagging (32200, 2.1676226126551628, 2.1536593025922777)
offensive_classification (33900, 0.3025304340478033, 0.36986815388128164)
hate_speech (30200, 0.16205953252222388, 0.4661173339644447)
topic_tagging (32300, 2.1703980974555015, 2.1533682874441147)
offensive_cl

offensive_classification (37200, 0.29429930963367223, 0.36848413245752454)
hate_speech (33100, 0.16590218921843916, 0.4724375791000202)
topic_tagging (35500, 2.155434729218483, 2.154496677041054)
offensive_classification (37300, 0.2962052995935082, 0.37115142164751885)
hate_speech (33200, 0.15975384030584247, 0.47997972830105573)
topic_tagging (35600, 2.1489907494783402, 2.153614443182945)
offensive_classification (37400, 0.30040496837720276, 0.3700168251991272)
answer_embedding (12300, 0.006027670860676149, 0.0005583959121738506)
title_embedding (7500, 0.00990526510569713, 0.004144530532601823)
hate_speech (33300, 0.16304683756362648, 0.4753977723903954)
offensive_classification (37500, 0.31670346619188783, 0.3710020473320037)
topic_tagging (35700, 2.1479077578783037, 2.1543769134283064)
hate_speech (33400, 0.16330264656990767, 0.47897494031488896)
offensive_classification (37600, 0.3182410313375294, 0.3683877723645419)
topic_tagging (35800, 2.157006424188614, 2.1584103527069094)
hate

answer_embedding (13400, 0.00757203908132615, 0.0013120703583358502)
offensive_classification (41100, 0.2987020726390183, 0.3706783370561898)
hate_speech (36400, 0.15943783662468194, 0.4754394516106695)
title_embedding (8200, 0.0071449677113315565, 0.00787752013267993)
topic_tagging (38900, 2.1993523958325385, 2.1492444162368773)
offensive_classification (41200, 0.29609313322603703, 0.37126433654129504)
hate_speech (36500, 0.16392320158146323, 0.4736085735596716)
topic_tagging (39000, 2.1961177323460577, 2.148748997449875)
offensive_classification (41300, 0.29263269521296026, 0.3700232961848378)
hate_speech (36600, 0.163035824008286, 0.4766112518366426)
topic_tagging (39100, 2.199197069585323, 2.1485099858045578)
answer_embedding (13500, 0.007000572805988082, 0.0013119645952384537)
offensive_classification (41400, 0.2973712205197662, 0.37288020553439855)
hate_speech (36700, 0.16409252114780248, 0.47627512050420046)
topic_tagging (39200, 2.1849130373597143, 2.150812390804291)
offensive_

offensive_classification (44700, 0.31356273555196823, 0.36916357674077155)
topic_tagging (42500, 2.1612939016819, 2.1524757355451585)
hate_speech (39700, 0.16639127255603672, 0.46666337585262957)
offensive_classification (44800, 0.3116211967933923, 0.3712240726798773)
answer_embedding (14600, 0.007381881622326249, 0.0008076378189367546)
topic_tagging (42600, 2.1555597288012502, 2.1504168590307238)
offensive_classification (44900, 0.3149891924057156, 0.36869215190038085)
hate_speech (39800, 0.16706397483311594, 0.4631912312107161)
topic_tagging (42700, 2.152388387262821, 2.150660835623741)
offensive_classification (45000, 0.31460651502572, 0.36894458600506186)
hate_speech (39900, 0.165318002326414, 0.4693022911483422)
topic_tagging (42800, 2.1535444051623345, 2.1517849515676497)
offensive_classification (45100, 0.3096393280662596, 0.36789337246492504)
hate_speech (40000, 0.16737082713469864, 0.469973309581168)
answer_embedding (14700, 0.007419952271313173, 0.0007129325472162989)
offensi

offensive_classification (48500, 0.3120748592093587, 0.36916303118690846)
hate_speech (42900, 0.16309302341751755, 0.4729298951001838)
topic_tagging (46000, 2.142342292904854, 2.1564347416162493)
offensive_classification (48600, 0.32441344705969094, 0.3685498026460409)
answer_embedding (15800, 0.010715409364138265, 0.0005726281676974434)
hate_speech (43000, 0.1651173330070451, 0.47593909987341615)
offensive_classification (48700, 0.3185143758058548, 0.36866661557927727)
topic_tagging (46100, 2.141076487541199, 2.1544042874574663)
hate_speech (43100, 0.16681434939149767, 0.47197314887400715)
offensive_classification (48800, 0.3274546402413398, 0.36918209824338555)
topic_tagging (46200, 2.138476367354393, 2.154141428589821)
hate_speech (43200, 0.1635667192535475, 0.47252173427399247)
offensive_classification (48900, 0.3202070390805602, 0.37214837048947813)
title_embedding (9700, 0.0016454482734296217, 0.0014771408608386257)
topic_tagging (46300, 2.13423324406147, 2.1564611426591873)
answ

offensive_classification (52300, 0.315767888026312, 0.3699875185023993)
hate_speech (46100, 0.16695300018414855, 0.4767651303643361)
topic_tagging (49500, 2.1489118002653123, 2.1503446185588837)
offensive_classification (52400, 0.32069862218014894, 0.36765827211551366)
hate_speech (46200, 0.16590525492466987, 0.47403907880652696)
topic_tagging (49600, 2.146528850436211, 2.152561685323715)
offensive_classification (52500, 0.3268465829249471, 0.3712509999554604)
answer_embedding (17000, 0.007031105925907085, 0.0003722083733902699)
hate_speech (46300, 0.16707797652482986, 0.47059131309669466)
topic_tagging (49700, 2.144010755300522, 2.152602873444557)
offensive_classification (52600, 0.3250491052810103, 0.36815096639283)
hate_speech (46400, 0.1646502484716475, 0.47239783095289023)
title_embedding (10400, 0.005055965520230483, 0.0019122042753815234)
topic_tagging (49800, 2.146421212911606, 2.152349766731262)
offensive_classification (52700, 0.32792184373177585, 0.36827507344074545)
hate_sp

answer_embedding (18100, 0.010291839206881218, 0.0005936126191403037)
offensive_classification (56100, 0.29526485107652845, 0.3684586617313325)
topic_tagging (53000, 2.1471710830926893, 2.146135562300682)
hate_speech (49400, 0.16389358056802303, 0.46423782122600826)
offensive_classification (56200, 0.2941024401392788, 0.3669388511106372)
topic_tagging (53100, 2.149228514075279, 2.1512028406858446)
hate_speech (49500, 0.1621933842925355, 0.46555691384058445)
offensive_classification (56300, 0.2950382633190602, 0.3687081590630114)
topic_tagging (53200, 2.158233086824417, 2.1474657578468324)
answer_embedding (18200, 0.009532037835761696, 0.0005936052881136944)
offensive_classification (56400, 0.3025694064050913, 0.37001346457377077)
title_embedding (11100, 0.003738634775489113, 0.0027045445004770068)
hate_speech (49600, 0.15890704230125993, 0.46797167242784055)
topic_tagging (53300, 2.1470229768753053, 2.150845497369766)
offensive_classification (56500, 0.30123234586045144, 0.368084534093

topic_tagging (56500, 2.1705687604546546, 2.1539529625177383)
offensive_classification (59800, 0.3094193788934499, 0.37084169738180933)
hate_speech (52600, 0.16154425592487678, 0.47162865805998444)
topic_tagging (56600, 2.1722323256731033, 2.15612413418293)
offensive_classification (59900, 0.3035855361390859, 0.36896497905254366)
title_embedding (11800, 0.003002492328185463, 0.0026026945914025983)
hate_speech (52700, 0.16223336880235, 0.47142116258013994)
topic_tagging (56700, 2.1723814097642897, 2.159898281097412)
answer_embedding (19400, 0.012123678341133122, 7.811534029792533e-05)
offensive_classification (60000, 0.30442136874608694, 0.3711671991571784)
hate_speech (52800, 0.1621647839541547, 0.47294439144432543)
topic_tagging (56800, 2.1786773979663847, 2.1570212498903274)
offensive_classification (60100, 0.3086252774372697, 0.3669289132207632)
hate_speech (52900, 0.15947733500925823, 0.4735249821525067)
topic_tagging (56900, 2.1742085144519807, 2.159075587749481)
offensive_classif

topic_tagging (60000, 2.1741935414075853, 2.158861242890358)
title_embedding (12500, 0.00023239225582125033, 0.003437284922754855)
offensive_classification (63500, 0.32808171772025524, 0.37057620874978603)
hate_speech (55900, 0.15785169556178152, 0.473356684521772)
topic_tagging (60100, 2.1730019420385362, 2.1591933653354647)
offensive_classification (63600, 0.31799725551530716, 0.37236706759408117)
hate_speech (56000, 0.16202678148448468, 0.47237931062374267)
answer_embedding (20600, 0.004519658668150012, 3.795719315233725e-05)
topic_tagging (60200, 2.168034842252731, 2.1589945248365403)
offensive_classification (63700, 0.3174571094810963, 0.37262490786053243)
hate_speech (56100, 0.16283789004478605, 0.4698766723610461)
topic_tagging (60300, 2.1732006132602693, 2.1581148513555526)
offensive_classification (63800, 0.32379842704162004, 0.3749124106261879)
hate_speech (56200, 0.16468361558485775, 0.470463034898974)
topic_tagging (60400, 2.171895000934601, 2.157648131966591)
offensive_cla

title_embedding (13200, 0.008447997957923673, 0.0019171551870311484)
topic_tagging (63600, 2.179004191160202, 2.1540091841220854)
offensive_classification (67200, 0.31971353058889507, 0.3697307359613478)
hate_speech (59100, 0.1676111860126257, 0.47497814521566034)
topic_tagging (63700, 2.168129433095455, 2.15567745244503)
offensive_classification (67300, 0.31679375847801566, 0.36940324517712)
hate_speech (59200, 0.16391772093623877, 0.47399591213651)
answer_embedding (21800, 0.005276172817642939, 0.001501452185656623)
topic_tagging (63800, 2.1611167271733285, 2.1541247183084486)
offensive_classification (67400, 0.32266937493532893, 0.37058648397400973)
hate_speech (59300, 0.16840313820540906, 0.48103108757920565)
topic_tagging (63900, 2.153072913110256, 2.153525249838829)
offensive_classification (67500, 0.31976197662204503, 0.37129272979497907)
hate_speech (59400, 0.16730451278947295, 0.47595559527911246)
topic_tagging (64000, 2.1523368675112726, 2.154415150880814)
offensive_classific

hate_speech (62300, 0.16518601846322417, 0.4765979183502495)
topic_tagging (67100, 2.18082806879282, 2.1518161424398423)
offensive_classification (70900, 0.3021873683426529, 0.371359115678817)
hate_speech (62400, 0.16652403732948004, 0.4788525774367154)
answer_embedding (23000, 0.010752466213911377, 0.00054035608751408)
topic_tagging (67200, 2.1780809484124184, 2.1496443111896513)
offensive_classification (71000, 0.3068838954754174, 0.36923064313456416)
hate_speech (62500, 0.16428787244670093, 0.4748129552826285)
topic_tagging (67300, 2.169307857334614, 2.151517313122749)
offensive_classification (71100, 0.3104940412137657, 0.3712825303338468)
title_embedding (14000, 0.0016193295270146258, 0.006811377856365029)
hate_speech (62600, 0.16374961794074624, 0.4773642932223156)
offensive_classification (71200, 0.30269805730879307, 0.3677583325896412)
topic_tagging (67400, 2.167245902955532, 2.1524809911251066)
hate_speech (62700, 0.1648640982778743, 0.47590779039729386)
answer_embedding (2310

offensive_classification (74500, 0.33990713131055234, 0.3696991540752351)
hate_speech (65700, 0.16416569924913346, 0.47060970446746797)
topic_tagging (70600, 2.152465582430363, 2.152992525100708)
offensive_classification (74600, 0.3324488002303988, 0.36833252013847234)
hate_speech (65800, 0.16502538623288274, 0.4695678849956021)
title_embedding (14700, 9.446734564821924e-09, 0.0079464930757496)
topic_tagging (70700, 2.1431826978325845, 2.1512938470840455)
offensive_classification (74700, 0.338363045707345, 0.3691325324960053)
hate_speech (65900, 0.16269054556451737, 0.46683443112298845)
topic_tagging (70800, 2.1552820956110956, 2.1529589483737945)
offensive_classification (74800, 0.33758227541297675, 0.36896590965613724)
answer_embedding (24300, 0.009652224337804367, 0.0027590229143952334)
topic_tagging (70900, 2.160238512814045, 2.1515869100093843)
hate_speech (66000, 0.16298383902944624, 0.46737863020785153)
offensive_classification (74900, 0.3293904546350241, 0.36863158755004405)
to

title_embedding (15400, 3.7927495387002354e-08, 0.001533868798090173)
topic_tagging (74000, 2.1381474766731263, 2.151696304321289)
offensive_classification (78300, 0.32495496775209903, 0.3677970922533423)
hate_speech (69000, 0.16033100332319736, 0.46370827638823536)
topic_tagging (74100, 2.1459497138261794, 2.151911523938179)
offensive_classification (78400, 0.32499830033257604, 0.3686282941829413)
hate_speech (69100, 0.1593097014501691, 0.46711552076879886)
topic_tagging (74200, 2.1471176300644874, 2.151439163684845)
offensive_classification (78500, 0.3239145027659833, 0.3683072180394083)
answer_embedding (25500, 0.008494575516739928, 0.0010555567963022488)
topic_tagging (74300, 2.153222717225552, 2.151057322859764)
hate_speech (69200, 0.1607191317565739, 0.46802794103045015)
offensive_classification (78600, 0.3278965755738318, 0.3708820069562644)
topic_tagging (74400, 2.1514158008098603, 2.1529022492170333)
hate_speech (69300, 0.16061663918755947, 0.46973954488057645)
offensive_class

topic_tagging (77600, 2.16181421738863, 2.1569503132104875)
answer_embedding (26600, 0.0038051372118665695, 0.00018590062629841197)
hate_speech (72200, 0.16070380352530628, 0.4773376253610477)
offensive_classification (82100, 0.31174379456043244, 0.36815912144258617)
topic_tagging (77700, 2.1667704704403876, 2.1561820344924927)
hate_speech (72300, 0.16311258864682168, 0.47424447162356226)
offensive_classification (82200, 0.3099412647373974, 0.37115677693858745)
topic_tagging (77800, 2.177463499605656, 2.154770106077194)
hate_speech (72400, 0.16735358239430934, 0.4785940365195274)
offensive_classification (82300, 0.30133816291764376, 0.36979036796838044)
answer_embedding (26700, 0.0038136487512360193, 0.0001868109855625657)
topic_tagging (77900, 2.180971585929394, 2.1584980949163435)
offensive_classification (82400, 0.30310825372859834, 0.37123772424459456)
hate_speech (72500, 0.16769402959104626, 0.47878573343344033)
title_embedding (16200, 0.00405414458960906, 0.004266918349164218)
to

answer_embedding (27800, 0.0027381997573672086, 0.00046910722317375917)
topic_tagging (81100, 2.149470581293106, 2.1544854081869125)
hate_speech (75400, 0.166652532720007, 0.4699860304389149)
offensive_classification (85900, 0.3010655635111034, 0.3675663165710866)
topic_tagging (81200, 2.149536095619202, 2.1559385693073274)
hate_speech (75500, 0.1659267895789817, 0.4698100597122684)
offensive_classification (86000, 0.2964510026117787, 0.3679778074547648)
title_embedding (16900, 0.0007265240509306317, 0.0007672479824773184)
topic_tagging (81300, 2.149548888146877, 2.1601421463489534)
offensive_classification (86100, 0.2982477235896513, 0.36987134263291954)
hate_speech (75600, 0.1633122549885884, 0.4698885700255632)
answer_embedding (27900, 0.004649779404526301, 0.00047837224150840417)
topic_tagging (81400, 2.162170283138752, 2.1607233897447586)
offensive_classification (86200, 0.29608627886418254, 0.36735668548196554)
hate_speech (75700, 0.16559454671572893, 0.47230511823669075)
topic_t

offensive_classification (89500, 0.3055055788550526, 0.3710470917150378)
title_embedding (17600, 6.018301696598449e-06, 0.0007075046928028401)
topic_tagging (84700, 2.1705330576300623, 2.1526645426750184)
hate_speech (78600, 0.1632082933196798, 0.46711666775494814)
offensive_classification (89600, 0.3094578371271491, 0.3701044265702367)
topic_tagging (84800, 2.1639254553318024, 2.152830285310745)
hate_speech (78700, 0.16614095616526903, 0.4689010541867465)
offensive_classification (89700, 0.30767835543677213, 0.37296468460187315)
topic_tagging (84900, 2.166165890097618, 2.1540704782009126)
answer_embedding (29100, 0.006340099561255238, 0.0003773739716154774)
hate_speech (78800, 0.16821642825286837, 0.47344074756465854)
offensive_classification (89800, 0.30177383816614745, 0.3694634713381529)
topic_tagging (85000, 2.1639714019298553, 2.152262805700302)
hate_speech (78900, 0.16517676739115267, 0.472876054758206)
offensive_classification (89900, 0.3000607367455959, 0.37205791151896117)
to

offensive_classification (93200, 0.3159498983863741, 0.369593355698511)
hate_speech (81800, 0.16702024616859854, 0.4695573270479217)
topic_tagging (88200, 2.1642771171331407, 2.1534435921907424)
offensive_classification (93300, 0.3144092445950955, 0.37123278504796325)
answer_embedding (30300, 0.003230243619059649, 0.00020861854784237234)
hate_speech (81900, 0.16268836980778725, 0.468990128044039)
topic_tagging (88300, 2.168815845370293, 2.1531502261161806)
offensive_classification (93400, 0.3193950259536505, 0.3695077145639807)
hate_speech (82000, 0.16486287449020892, 0.47310866992734374)
topic_tagging (88400, 2.1766576639413833, 2.150680951833725)
offensive_classification (93500, 0.3341510605625808, 0.37034035990200936)
title_embedding (18400, 9.57435272038687e-06, 0.00135257628700362)
hate_speech (82100, 0.16437271212879567, 0.4740582541003823)
offensive_classification (93600, 0.32821565988659857, 0.37006889685057104)
topic_tagging (88500, 2.1609989968538286, 2.15285773229599)
answer

hate_speech (85000, 0.1625579811576754, 0.4659330852907151)
topic_tagging (91600, 2.152620336890221, 2.1537709296941756)
offensive_classification (97100, 0.3015469294656068, 0.3663417101725936)
hate_speech (85100, 0.16398207506723703, 0.4689358954494819)
topic_tagging (91700, 2.1470954196453094, 2.151065010547638)
answer_embedding (31500, 0.008824018929938617, 0.0005266345874447551)
offensive_classification (97200, 0.3043978402223438, 0.36747524406015875)
hate_speech (85200, 0.15901736041996628, 0.47026977165509015)
topic_tagging (91800, 2.151243016600609, 2.1511834502220153)
offensive_classification (97300, 0.29440718778036534, 0.3646464121155441)
hate_speech (85300, 0.15875649003591388, 0.47114082564599813)
title_embedding (19100, 0.00012939945133809029, 0.0011306455542347104)
topic_tagging (91900, 2.1583203622102736, 2.154054013490677)
offensive_classification (97400, 0.29961669339612124, 0.36506545439362525)
hate_speech (85400, 0.15920710139069708, 0.47082720016967505)
topic_taggin

topic_tagging (95100, 2.133057586669922, 2.152496018409729)
answer_embedding (32700, 0.013073925705406992, 0.0019218719672354503)
offensive_classification (100700, 0.31769385738670824, 0.3686369273811579)
hate_speech (88500, 0.16365954994410276, 0.46090487104747446)
topic_tagging (95200, 2.138498993396759, 2.154254529595375)
title_embedding (19800, 0.0034859803935869756, 0.003505048905023196)
offensive_classification (100800, 0.3103269215337932, 0.3703505011275411)
hate_speech (88600, 0.16300065691769122, 0.46184046189766376)
topic_tagging (95300, 2.1406813864707948, 2.1520265176296234)
offensive_classification (100900, 0.3067995309121907, 0.3695558934733272)
hate_speech (88700, 0.16531534873321652, 0.4627986212465912)
topic_tagging (95400, 2.1500180181264876, 2.1520501962900163)
offensive_classification (101000, 0.3054716398175806, 0.37114501191675664)
answer_embedding (32800, 0.01650107244279891, 0.0006301065098097282)
topic_tagging (95500, 2.155143175125122, 2.1531530681848525)
hate

offensive_classification (104200, 0.3065561095662415, 0.36785326384939254)
topic_tagging (98700, 2.1766916662454605, 2.157376430988312)
hate_speech (91800, 0.16594640444684775, 0.47227421788312496)
offensive_classification (104300, 0.3166177842412144, 0.36554038139618933)
answer_embedding (33900, 0.009302143151091107, 0.0040792160065554126)
topic_tagging (98800, 2.1689984256625174, 2.155230080842972)
offensive_classification (104400, 0.312053109658882, 0.3648257753457874)
hate_speech (91900, 0.16419059397000818, 0.47298494464717805)
topic_tagging (98900, 2.1611483617424967, 2.1547208708524703)
offensive_classification (104500, 0.3140988249089569, 0.36405697597377)
hate_speech (92000, 0.16616877509839834, 0.4729013952426612)
topic_tagging (99000, 2.157883425652981, 2.1553489565849304)
offensive_classification (104600, 0.31472593373246494, 0.36528493036143483)
answer_embedding (34000, 0.008949282442255452, 0.0038100634296130385)
hate_speech (92100, 0.16611568746808916, 0.47302484642528)


offensive_classification (108000, 0.3179791983570904, 0.3687125941477716)
hate_speech (95000, 0.16555977575480937, 0.4648330163629726)
answer_embedding (35100, 0.011531524441424218, 0.002638208137810246)
topic_tagging (102200, 2.159035922884941, 2.1560823695659637)
offensive_classification (108100, 0.31178790201991796, 0.3697544225715101)
hate_speech (95100, 0.16781998950988053, 0.46444466066453605)
topic_tagging (102300, 2.156656948566437, 2.1591488229036333)
offensive_classification (108200, 0.3035646324660629, 0.3672822793647647)
hate_speech (95200, 0.16553009756468237, 0.4692957168510184)
topic_tagging (102400, 2.1723898901939394, 2.158571473479271)
offensive_classification (108300, 0.3041138372402638, 0.3694760039560497)
answer_embedding (35200, 0.01108551431534264, 0.0027794054374418314)
hate_speech (95300, 0.16502426272816956, 0.46799471917189656)
title_embedding (21300, 0.0010691239629116302, 0.0044290925270195885)
topic_tagging (102500, 2.1637990568876266, 2.156547503232956)
o

topic_tagging (105700, 2.167421694755554, 2.1577419492006302)
hate_speech (98200, 0.1658832957642153, 0.4686026967344806)
offensive_classification (111700, 0.3085660402290523, 0.3710271620657295)
topic_tagging (105800, 2.1718904801607133, 2.1599697750806808)
answer_embedding (36300, 0.010912166705882298, 0.0004983354684947577)
offensive_classification (111800, 0.3013681168369949, 0.3681270713526756)
hate_speech (98300, 0.16467770743835716, 0.47110682854335756)
topic_tagging (105900, 2.167497029542923, 2.1567908366918562)
offensive_classification (111900, 0.30727102283760904, 0.3694337422121316)
title_embedding (22000, 0.0007419229447773143, 0.0012980089315206657)
hate_speech (98400, 0.16616411276347937, 0.4673182600932196)
topic_tagging (106000, 2.162390955090523, 2.1581787785291673)
offensive_classification (112000, 0.3125223795771599, 0.3683245530258864)
hate_speech (98500, 0.16487010839767754, 0.46861734041105957)
topic_tagging (106100, 2.1719415193796157, 2.156249085664749)
answer_

hate_speech (101400, 0.16235697794798762, 0.4697371347658336)
offensive_classification (115300, 0.2969470523148775, 0.3726027200240642)
topic_tagging (109300, 2.1480651315450667, 2.15713912153244)
hate_speech (101500, 0.16120202312339096, 0.4708154686419293)
answer_embedding (37500, 0.009893916973705206, 0.0012301885647784854)
offensive_classification (115400, 0.29571464297920463, 0.3703858724590391)
title_embedding (22700, 0.0012946137480708186, 0.001529835923527643)
topic_tagging (109400, 2.162507194161415, 2.1599758039712906)
offensive_classification (115500, 0.29772832058370113, 0.3716258481796831)
hate_speech (101600, 0.15667378101218493, 0.4740088169919327)
topic_tagging (109500, 2.1563613836765287, 2.155231202840805)
offensive_classification (115600, 0.3062912222370505, 0.3725646833758801)
hate_speech (101700, 0.15896574888005852, 0.4722147808894515)
topic_tagging (109600, 2.1692685017585753, 2.1552307398319246)
offensive_classification (115700, 0.3093978594392538, 0.37080685350

topic_tagging (112600, 2.1796788079738616, 2.1499436882734297)
title_embedding (23400, 0.000717431105661392, 0.0007507146598339384)
offensive_classification (119100, 0.31566591950319706, 0.37192627223953606)
hate_speech (104700, 0.1600493085803464, 0.4701633138377219)
topic_tagging (112700, 2.1907098021507263, 2.151972864627838)
offensive_classification (119200, 0.3171842390708625, 0.37333826306462287)
answer_embedding (38700, 0.006437391107942843, 0.0018681204460600789)
hate_speech (104800, 0.16169797189626842, 0.46838960322923956)
topic_tagging (112800, 2.180978369474411, 2.15355205655098)
offensive_classification (119300, 0.31719407813251016, 0.369010865021497)
hate_speech (104900, 0.160646250911057, 0.4660276940995827)
topic_tagging (112900, 2.1911208013296126, 2.1524554710388184)
offensive_classification (119400, 0.3152922495007515, 0.3711463009752333)
hate_speech (105000, 0.16270768731087445, 0.4724587350850925)
topic_tagging (113000, 2.187646608233452, 2.1513033072948455)
answer

hate_speech (107800, 0.16157268868014216, 0.47344050723593684)
offensive_classification (122800, 0.3120876188986003, 0.3709504524730146)
topic_tagging (116100, 2.1711700581908224, 2.1550437313318254)
answer_embedding (39900, 0.007112582912888604, 0.0031500358034011727)
offensive_classification (122900, 0.31135641373321415, 0.36910051342472433)
hate_speech (107900, 0.1594748565107584, 0.47356129269860686)
topic_tagging (116200, 2.170789873898029, 2.1561301938295365)
offensive_classification (123000, 0.314819378381595, 0.36904871140792966)
hate_speech (108000, 0.1623202447257936, 0.47363548756204543)
topic_tagging (116300, 2.1643267909884454, 2.1562507086992264)
offensive_classification (123100, 0.30975871823728085, 0.3679446167163551)
hate_speech (108100, 0.1662677676063031, 0.4749646061770618)
answer_embedding (40000, 0.008028150876642635, 0.0019108645519423182)
title_embedding (24200, 0.0035960912853337224, 0.0031518606666941723)
topic_tagging (116400, 2.179458851158619, 2.15744514334

hate_speech (111000, 0.16405755520053208, 0.4677169767767191)
topic_tagging (119600, 2.149828377127647, 2.15547365295887)
offensive_classification (126500, 0.3059510836210102, 0.36624755208939314)
hate_speech (111100, 0.16500115875340998, 0.4677061889795586)
answer_embedding (41100, 0.0032495244684717477, 0.0006460016062375078)
offensive_classification (126600, 0.3054121447857469, 0.3660620129220188)
topic_tagging (119700, 2.1554739108085634, 2.153769671678543)
title_embedding (24900, 0.0023421078911140944, 7.946174214916724e-06)
hate_speech (111200, 0.1627017314238474, 0.4698792402073741)
offensive_classification (126700, 0.3087714228313416, 0.3672670775167644)
topic_tagging (119800, 2.1546728994846345, 2.1572111043930056)
hate_speech (111300, 0.16479176982026547, 0.46807018185500054)
offensive_classification (126800, 0.3087600193321705, 0.3658799065165222)
topic_tagging (119900, 2.16037226498127, 2.1558698679208756)
answer_embedding (41200, 0.002320046363932953, 7.782231554153496e-05

topic_tagging (123000, 2.175861089348793, 2.1472056189775466)
hate_speech (114300, 0.16776118901278825, 0.4769863167302683)
answer_embedding (42300, 0.0037329183032017536, 0.0005850672587791452)
offensive_classification (130100, 0.29900147741660477, 0.36432036972790954)
topic_tagging (123100, 2.181847985744476, 2.1468441622257233)
hate_speech (114400, 0.16939707193057985, 0.4738799669435248)
offensive_classification (130200, 0.2978041165173054, 0.36520783583074806)
topic_tagging (123200, 2.179335522055626, 2.147544523358345)
hate_speech (114500, 0.16631601471547036, 0.472539024759084)
offensive_classification (130300, 0.3018341377992183, 0.3674761299751699)
topic_tagging (123300, 2.1769153057932855, 2.1497830353975296)
answer_embedding (42400, 0.002189768067835632, 0.0005851057053211095)
hate_speech (114600, 0.165454229648225, 0.4685150988725945)
offensive_classification (130400, 0.3053492410238832, 0.3663884369581938)
topic_tagging (123400, 2.1762285606265066, 2.1499023246765137)
titl

offensive_classification (133700, 0.30390771408751605, 0.36737597676180306)
topic_tagging (126500, 2.1805198771357537, 2.1582017834186553)
answer_embedding (43500, 0.0035702771004584312, 0.0010263655609798828)
offensive_classification (133800, 0.30556996507942674, 0.36932032578997315)
hate_speech (117600, 0.16350755076110363, 0.4717027166951448)
topic_tagging (126600, 2.1844860925078393, 2.1574764013290406)
offensive_classification (133900, 0.3049649535305798, 0.36988729803822934)
hate_speech (117700, 0.1647602126048878, 0.47245188846997915)
topic_tagging (126700, 2.185856990635395, 2.1551257524490355)
title_embedding (26400, 0.0018574319494039488, 0.0008377240320528063)
offensive_classification (134000, 0.3075007183179259, 0.36624587067775427)
topic_tagging (126800, 2.1793390008807183, 2.154070922136307)
hate_speech (117800, 0.16512729033641518, 0.47352775336429476)
offensive_classification (134100, 0.3051971565410495, 0.3658560406435281)
answer_embedding (43600, 0.0034887281504831884

hate_speech (120700, 0.16549686604272573, 0.46884450226463376)
topic_tagging (130100, 2.1844992510080337, 2.158520218729973)
offensive_classification (137400, 0.30512923943810166, 0.3701442596241832)
hate_speech (120800, 0.16405491478927434, 0.46650457153469327)
answer_embedding (44700, 0.01733392840603672, 0.001752515097066952)
offensive_classification (137500, 0.31041444402746854, 0.372726386167109)
topic_tagging (130200, 2.178654133558273, 2.1594069120883943)
title_embedding (27100, 1.4397115457276399e-07, 0.0017621844811835645)
offensive_classification (137600, 0.3080762275606394, 0.3691844029463828)
hate_speech (120900, 0.1588982539102435, 0.4679370300192386)
topic_tagging (130300, 2.179368844032288, 2.157943951010704)
offensive_classification (137700, 0.3124446502439678, 0.3699976812824607)
hate_speech (121000, 0.1596522230952978, 0.47023505418747663)
topic_tagging (130400, 2.171885972738266, 2.1591413558721544)
offensive_classification (137800, 0.3129879830479622, 0.371723402690

topic_tagging (133500, 2.1601345662474634, 2.1521427377462388)
hate_speech (123900, 0.15957921712007372, 0.47496791347209366)
offensive_classification (141100, 0.30854383114911615, 0.36923658263869585)
topic_tagging (133600, 2.164704120695591, 2.1503904250860213)
hate_speech (124000, 0.1612498882273212, 0.47660492865834386)
title_embedding (27800, 0.0019602654262560323, 0.0024089792670832066)
offensive_classification (141200, 0.3093662911709398, 0.36791877758689223)
topic_tagging (133700, 2.1676463939547537, 2.155136914372444)
hate_speech (124100, 0.1616108885286376, 0.4731003243541345)
offensive_classification (141300, 0.30897301002405586, 0.36801907143183055)
answer_embedding (45900, 0.007409471248299212, 0.0017071075154771872)
topic_tagging (133800, 2.1725361576676367, 2.151055594921112)
offensive_classification (141400, 0.31268191696517167, 0.36875461391545833)
hate_speech (124200, 0.1605811520749703, 0.4698016973258927)
topic_tagging (133900, 2.1804134390950205, 2.153123234629631)

answer_embedding (47000, 0.009960940876398337, 0.0010916167885155063)
topic_tagging (137000, 2.1895033396482466, 2.155646921277046)
offensive_classification (144700, 0.298924344426021, 0.3654216481298208)
hate_speech (127200, 0.15969181139254943, 0.4752296644290909)
topic_tagging (137100, 2.1870601887702943, 2.156366097211838)
offensive_classification (144800, 0.29650442478619515, 0.3651847411803901)
hate_speech (127300, 0.1620537137449719, 0.4779622260862961)
topic_tagging (137200, 2.1747709804177284, 2.1546908538341523)
offensive_classification (144900, 0.2861803215201944, 0.3666204843316227)
answer_embedding (47100, 0.011517153178724794, 0.0007307949546814543)
hate_speech (127400, 0.16510002145031466, 0.4768994116121903)
topic_tagging (137300, 2.1687184955477714, 2.159852635502815)
offensive_classification (145000, 0.2823708468209952, 0.3682015080023557)
hate_speech (127500, 0.16437657379033044, 0.47970750867109746)
topic_tagging (137400, 2.166226715505123, 2.154324998140335)
title_

offensive_classification (148300, 0.307746081136167, 0.3695551154538989)
hate_speech (130400, 0.1640335777681321, 0.47166376758925616)
topic_tagging (140500, 2.1730539192557337, 2.1551665802001954)
offensive_classification (148400, 0.30671830344200135, 0.3692124551087618)
hate_speech (130500, 0.16520577742345632, 0.4719126265961677)
topic_tagging (140600, 2.169897063076496, 2.155704001545906)
offensive_classification (148500, 0.30972549809515476, 0.3675156895443797)
hate_speech (130600, 0.16081122107617557, 0.4781697715111077)
answer_embedding (48300, 0.0035740328687629414, 0.0014492441176460864)
topic_tagging (140700, 2.172094558238983, 2.1586910808086395)
offensive_classification (148600, 0.3161689349897206, 0.36933630084991453)
title_embedding (29300, 1.3034633294181752e-05, 0.0036051213399047356)
hate_speech (130700, 0.16413237441144884, 0.47392886873800305)
offensive_classification (148700, 0.3188974792342633, 0.36647469649091363)
topic_tagging (140800, 2.1636103297472, 2.16160728

topic_tagging (143900, 2.1473714183568955, 2.1603356548547743)
offensive_classification (152000, 0.299337743120268, 0.3743687662538141)
hate_speech (133700, 0.16727428938262165, 0.47120824046619236)
topic_tagging (144000, 2.146077290415764, 2.159845570206642)
offensive_classification (152100, 0.2980142383407801, 0.37141095446981487)
title_embedding (30000, 0.0002724999263457581, 0.0004894500431592026)
hate_speech (133800, 0.16897802085801958, 0.4660595565317199)
offensive_classification (152200, 0.30263720735907557, 0.37250751577876506)
topic_tagging (144100, 2.1492712932825087, 2.160122564077377)
answer_embedding (49500, 0.006779965392834121, 0.0008200862521117722)
offensive_classification (152300, 0.2998807065654546, 0.3710034108553082)
hate_speech (133900, 0.16241862498410045, 0.47054531081393364)
topic_tagging (144200, 2.1412657104730606, 2.1608631014823914)
offensive_classification (152400, 0.303369686761871, 0.37108226621709767)
hate_speech (134000, 0.1662245324552059, 0.47078647

answer_embedding (50600, 0.012166277738742758, 0.001255014898009291)
offensive_classification (155700, 0.32688579995185135, 0.3672858370076865)
topic_tagging (147500, 2.1363172587156294, 2.1520144897699356)
hate_speech (136900, 0.16311576790269464, 0.46759062258619816)
offensive_classification (155800, 0.32977540784701703, 0.36755653331056237)
title_embedding (30700, 0.004856324990713114, 0.0018916346522615535)
topic_tagging (147600, 2.1467282752990724, 2.1523188940286637)
offensive_classification (155900, 0.3256071902178228, 0.3691952315792441)
hate_speech (137000, 0.16314101539831607, 0.4711866548070684)
topic_tagging (147700, 2.160333849430084, 2.1534252095222475)
offensive_classification (156000, 0.33356204107403753, 0.3674794482663274)
answer_embedding (50700, 0.013810548526747091, 0.0012550072841307634)
hate_speech (137100, 0.16352279570326209, 0.46780076017044486)
offensive_classification (156100, 0.3325649850461632, 0.3697534108050168)
topic_tagging (147800, 2.1582273684740065,

topic_tagging (150900, 2.1578647805452347, 2.153969088435173)
answer_embedding (51800, 0.004422135271699532, 0.0019225873777592075)
hate_speech (140000, 0.16248872539401055, 0.47979405214078724)
title_embedding (31400, 0.004857365046187437, 0.0004240934416753448)
offensive_classification (159500, 0.3235685289129615, 0.36964838655665516)
topic_tagging (151000, 2.162887477517128, 2.15624194419384)
hate_speech (140100, 0.1628762205336243, 0.4844603036576882)
offensive_classification (159600, 0.3262252186015248, 0.3671813174895942)
topic_tagging (151100, 2.1696770629882813, 2.1538304557800294)
hate_speech (140200, 0.15937437654007225, 0.4835780991492793)
offensive_classification (159700, 0.324307888366282, 0.3679403524603695)
topic_tagging (151200, 2.1749610011577607, 2.1566050391197207)
answer_embedding (51900, 0.004693296140624081, 0.0016405012188898667)
offensive_classification (159800, 0.3224772997200489, 0.36681489245593546)
hate_speech (140300, 0.15946223946660756, 0.4843877720730379

offensive_classification (163100, 0.31440894105657935, 0.37340898256748917)
hate_speech (143200, 0.1568952731722966, 0.47629532671160996)
topic_tagging (154400, 2.148585588812828, 2.1541446529626844)
answer_embedding (53000, 0.004309351487499433, 0.003860829868496316)
offensive_classification (163200, 0.31719794749841096, 0.37225424668192864)
hate_speech (143300, 0.15933631683234126, 0.4765466320384294)
topic_tagging (154500, 2.152459858417511, 2.155956632733345)
offensive_classification (163300, 0.33040755581483244, 0.37132138065621256)
hate_speech (143400, 0.16041359453927725, 0.4776008507218212)
topic_tagging (154600, 2.135355161309242, 2.1564083898067476)
offensive_classification (163400, 0.32724159356206656, 0.37138791344314814)
hate_speech (143500, 0.16175828063394873, 0.48230519456695764)
topic_tagging (154700, 2.1440092660188674, 2.1550206015110014)
answer_embedding (53100, 0.0025497894770149685, 0.003855065984044479)
offensive_classification (163500, 0.33292954696156085, 0.372

hate_speech (146400, 0.16185976672917604, 0.4754219442764297)
topic_tagging (157800, 2.17684533315897, 2.156512676477432)
offensive_classification (166800, 0.30239656878076493, 0.37210843730345367)
hate_speech (146500, 0.16133654069155454, 0.4733511637663469)
topic_tagging (157900, 2.165087168991566, 2.1558564792871477)
answer_embedding (54200, 0.007189462488083097, 0.0009883171144949795)
offensive_classification (166900, 0.3030242841411382, 0.3729537338092923)
topic_tagging (158000, 2.1668336760401727, 2.157264075875282)
hate_speech (146600, 0.16381501183845104, 0.47398129091132435)
offensive_classification (167000, 0.3056181499566883, 0.3742185909897089)
topic_tagging (158100, 2.1676926756501196, 2.1602690020799638)
hate_speech (146700, 0.16685564405098557, 0.4702157110320404)
offensive_classification (167100, 0.3031965693961829, 0.37160802153870465)
title_embedding (32900, 0.00046420550259056317, 0.004951594863507052)
topic_tagging (158200, 2.1720865994095804, 2.1577292881011965)
of

hate_speech (149600, 0.1626337905600667, 0.46839791484735904)
topic_tagging (161400, 2.1813951247930525, 2.1557919768095015)
offensive_classification (170400, 0.31662779736705127, 0.36604933711141346)
hate_speech (149700, 0.16692049343977122, 0.4741067164782435)
topic_tagging (161500, 2.1764411599636078, 2.156007534623146)
offensive_classification (170500, 0.3159356601331383, 0.36706454765051605)
answer_embedding (55400, 0.00898058091901152, 4.558706508073973e-05)
hate_speech (149800, 0.16602621623780578, 0.4723641965184361)
topic_tagging (161600, 2.182831114888191, 2.1583407155275345)
offensive_classification (170600, 0.3145391686111689, 0.37003897969052196)
hate_speech (149900, 0.16246865700744093, 0.4736524004386738)
title_embedding (33600, 0.0009909152060006844, 0.002999446301553779)
topic_tagging (161700, 2.1817392176389694, 2.1554882724285127)
offensive_classification (170700, 0.3178547281250358, 0.3674859544560313)
hate_speech (150000, 0.16470936582051218, 0.4734631891148165)
to

hate_speech (152800, 0.16703065256914124, 0.4792713994178921)
topic_tagging (164800, 2.153321147620678, 2.1562912250757216)
offensive_classification (174100, 0.30746421485207975, 0.36931426741555334)
hate_speech (152900, 0.16304912539198996, 0.47580950569733976)
answer_embedding (56600, 0.0063038286494115385, 0.0015004679471184383)
topic_tagging (164900, 2.158877821147442, 2.1572113901376726)
offensive_classification (174200, 0.31451934919320046, 0.36949582627415656)
hate_speech (153000, 0.1650304355127737, 0.47662776485830544)
title_embedding (34300, 0.0018419079451840248, 0.0017718758818507264)
offensive_classification (174300, 0.3158293330874294, 0.36789960936456917)
topic_tagging (165000, 2.159830675125122, 2.1551049292087554)
hate_speech (153100, 0.16543552007619292, 0.4766812793193385)
offensive_classification (174400, 0.3224484364409, 0.36895899871736765)
topic_tagging (165100, 2.1665882720947267, 2.1595733391046523)
answer_embedding (56700, 0.0025075463058484167, 0.001510442871

offensive_classification (177700, 0.30701345548406245, 0.3689147949889302)
title_embedding (35000, 0.001185462749947642, 0.0016078659447762633)
hate_speech (156100, 0.17037610979285092, 0.4714809368168935)
topic_tagging (168300, 2.1507074356079103, 2.1559892424345017)
offensive_classification (177800, 0.30589266007766125, 0.37223971378430726)
answer_embedding (57800, 0.004738607839882159, 0.001194201037972289)
hate_speech (156200, 0.16546318283118308, 0.4725302444519475)
offensive_classification (177900, 0.30691227910295127, 0.3687632668428123)
topic_tagging (168400, 2.1555340098142626, 2.153519157409668)
hate_speech (156300, 0.16824468857049943, 0.47403570885304364)
offensive_classification (178000, 0.30711374564096333, 0.3696744715124369)
topic_tagging (168500, 2.1657468415498733, 2.153733121395111)
hate_speech (156400, 0.16527896071691067, 0.47533088554162534)
offensive_classification (178100, 0.3014625014923513, 0.37246634300425646)
topic_tagging (168600, 2.183630789101124, 2.15641

topic_tagging (171700, 2.1612196373939514, 2.1540766649246215)
offensive_classification (181400, 0.3142613539285958, 0.3681646235063672)
hate_speech (159300, 0.16282277333177625, 0.4705946661187336)
topic_tagging (171800, 2.154199183821678, 2.153538930416107)
answer_embedding (59000, 0.002828619790563049, 0.002056196665723226)
offensive_classification (181500, 0.32068402495235204, 0.3670727622359991)
topic_tagging (171900, 2.162029892206192, 2.1524923696517946)
hate_speech (159400, 0.16436244015488774, 0.47075620786100625)
offensive_classification (181600, 0.31923951355740426, 0.3683460042737424)
topic_tagging (172000, 2.1572935715913775, 2.1524470944404603)
hate_speech (159500, 0.1585234442334622, 0.47661382020264864)
offensive_classification (181700, 0.3165212566368282, 0.3704104133956134)
topic_tagging (172100, 2.1444763213992117, 2.1531217111349106)
answer_embedding (59100, 0.004949305096891645, 0.002346526076670626)
hate_speech (159600, 0.1581025316324085, 0.4771346564851701)
offe

hate_speech (162400, 0.1629697246812284, 0.4730208540679887)
topic_tagging (175200, 2.1320000705718996, 2.156621706724167)
offensive_classification (185200, 0.3015614798236638, 0.3709723499491811)
hate_speech (162500, 0.15946429457888006, 0.4744214966902509)
topic_tagging (175300, 2.133047920703888, 2.1574760555028916)
offensive_classification (185300, 0.29486254511587323, 0.37381886687502264)
answer_embedding (60200, 0.011966830622538642, 0.0009468887727819721)
hate_speech (162600, 0.15852995104994624, 0.4763418280519545)
offensive_classification (185400, 0.29246403849311176, 0.37081920336931945)
topic_tagging (175400, 2.130368184864521, 2.1566380307674407)
title_embedding (36500, 0.00015824432924663824, 0.002224680617718453)
offensive_classification (185500, 0.29330181384272874, 0.3715269952192903)
hate_speech (162700, 0.1612744568567723, 0.4774562042225152)
topic_tagging (175500, 2.1312737513184548, 2.1546124210357664)
offensive_classification (185600, 0.2979640943985432, 0.37376762

title_embedding (37200, 0.0022273365937311544, 0.00100940839184133)
hate_speech (165600, 0.16066487655229866, 0.46585751470457765)
offensive_classification (188900, 0.30059680647216735, 0.36992991687357424)
topic_tagging (178700, 2.1349085891246795, 2.151318978190422)
hate_speech (165700, 0.16243220598623156, 0.46934569809492677)
answer_embedding (61400, 0.007612624364000633, 0.0009521119127360387)
offensive_classification (189000, 0.3012914594057947, 0.36670770560204985)
topic_tagging (178800, 2.1455172979831696, 2.150930724740028)
hate_speech (165800, 0.16082653400488198, 0.47132999314088375)
offensive_classification (189100, 0.2998543342519552, 0.3690701183900237)
topic_tagging (178900, 2.150422653079033, 2.152610228061676)
hate_speech (165900, 0.16155509198084472, 0.4710822892356664)
offensive_classification (189200, 0.30410253286734223, 0.3719849355984479)
topic_tagging (179000, 2.1543671083450318, 2.151697422504425)
answer_embedding (61500, 0.007126131985641147, 0.000953312253424

hate_speech (168800, 0.1607335098721087, 0.4671813261443749)
offensive_classification (192500, 0.3029404211677611, 0.3712514498643577)
answer_embedding (62600, 0.008705116930352814, 0.0007737470787848029)
topic_tagging (182200, 2.1512506449222566, 2.150922341942787)
offensive_classification (192600, 0.3019882995337248, 0.3700712741948664)
hate_speech (168900, 0.16248692203499376, 0.466468655818142)
topic_tagging (182300, 2.1552733681201937, 2.14984763276577)
offensive_classification (192700, 0.29743041188642383, 0.37009514747932554)
title_embedding (38000, 0.0007305056044141116, 0.0008983560752714861)
topic_tagging (182400, 2.147449554383755, 2.1508981685638426)
hate_speech (169000, 0.1661057624090463, 0.4696446024468169)
offensive_classification (192800, 0.29932158037647605, 0.37011060332879425)
topic_tagging (182500, 2.1494685420393944, 2.1499236886501314)
answer_embedding (62700, 0.008705118263999207, 0.0007734323388351516)
hate_speech (169100, 0.16575856294110417, 0.468242206252180

In [7]:
import pprint

from texture.processing import Document

# Ad-hoc probe queries used to eyeball the trained model's predictions.
# Every query is parsed with "<UNK>" as the first argument to Document.parse
# (presumably a placeholder for an unknown language/metadata field -- TODO
# confirm against texture.processing.Document.parse).
docs = [
    Document.parse("<UNK>", query)
    for query in (
        "faggot",
        "fuck",
        "porno",
        "porn",
        "porn videos",
        "porno videos",
        "videos",
        "watch movie",
        "buy clothes online",
        "buy clothes shopping",
        "bob dylan",
        "buy cool things",
        "listen to a song",
        "facebook",
        "recipe pizza",
        "programming python",
        "bruce springsteen",
        "john malkovich",
    )
]

# decode_docs returns a dict keyed by task name; in the recorded output the
# embedding task maps to a tensor with one row per document and the
# classification task maps to per-document lists of (label, score) pairs.
pprint.pprint(m.decode_docs(docs))

{'answer_embedding': Variable containing:
 5.6161e-01  5.3570e-01  9.3618e-01  ...   3.1751e-01 -1.5310e+00 -1.6545e-01
-1.7853e-01 -1.0787e-01  8.2820e-01  ...  -2.5292e-01 -6.8882e-01 -2.1772e-01
-1.4785e-01  5.3897e-02  5.3687e-01  ...  -4.7178e-01 -5.7985e-01 -2.6290e-01
                ...                   ⋱                   ...                
 1.9989e-01  1.7765e+00 -3.8585e-01  ...  -7.2101e-01 -1.6334e-01 -2.6821e-01
-4.4020e-01  1.2598e+00 -2.3462e-01  ...  -6.0701e-01  1.2705e-01 -1.7059e-01
 3.7433e-01  9.9518e-01 -3.8605e-01  ...  -6.5324e-01 -4.6318e-01 -2.7944e-01
[torch.FloatTensor of size 18x512]
,
 'hate_speech': [[('hate', 0.9608844518661499),
                  ('offensive', 0.03783681243658066),
                  ('non_offensive', 0.0012787628220394254)],
                 [('hate', 0.8911677598953247),
                  ('offensive', 0.10716559737920761),
                  ('non_offensive', 0.0016666718292981386)],
                 [('hate', 0.8763577938079834),
 

In [6]:
# Persist the trained multi-task model under model_data/latest_512/.
# The recorded output shows one "Saving <task>" line per registered task.
# NOTE(review): this cell's execution count (In [6]) is lower than that of the
# cell placed before it (In [7]), so the notebook was not run top to bottom --
# re-check with Restart Kernel -> Run All.
m.save_model("model_data/latest_512/")

Saving title_embedding
Saving answer_embedding
Saving offensive_classification
Saving topic_tagging
Saving hate_speech
