In [10]:
import json
import pandas as pd

In [11]:
# Raise pandas' display limits (row count, column count, output width);
# this helps when scrolling through a DataFrame in the notebook output.
for option_name, option_value in {
    'display.max_rows': 500,
    'display.max_columns': 500,
    'display.width': 1000,
}.items():
    pd.set_option(option_name, option_value)

In [20]:
def read_data(path, limiter):
    """
    Read at most `limiter` samples from a JSON Lines file.

    Args:
        path: path to dataset in jsonl file format
        limiter: maximum number of rows (samples) to read; if the file holds
            fewer samples, all of them are returned

    Returns:
        data: list of parsed samples, one per non-blank line, in file order

    Raises:
        json.JSONDecodeError: if a non-blank line is not valid JSON
    """
    data = []
    # JSON text is UTF-8 encoded, so do not depend on the platform's default
    # text encoding when opening the dataset.
    with open(path, encoding="utf-8") as file:
        for line in file:
            # Stop once enough samples were collected. Running out of lines
            # first simply ends the loop instead of raising StopIteration,
            # which is what calling next(file) past the end of the file did.
            if len(data) >= limiter:
                break
            # Blank lines (e.g. a trailing newline) carry no sample.
            if not line.strip():
                continue
            data.append(json.loads(line))
    return data


def transform_dll_imports(json_sample):
    """
    Build a flat presence map of the functions imported by one sample.

    Args:
        json_sample: one sample of dataset; its "imports" entry is read as a
            dict mapping a library name to an iterable of function names

    Returns:
        functions_dict: dict with one "<lowercased library name>-<function>"
            key per imported function, every value set to True

    Raises:
        KeyError: if json_sample has no "imports" entry
    """
    # Read from the argument. The previous code looked up a notebook-level
    # variable named `sample`, so the function ignored its input and failed
    # with NameError whenever that global did not exist.
    imports = json_sample["imports"]
    functions_dict = {}
    for library, functions in imports.items():
        prefix = library.lower() + "-"
        functions_dict.update({prefix + f_name: True for f_name in functions})
    return functions_dict


def transform_dict(json_dict):
    """
    Flatten a dict of lists into a single-level presence map.

    Args:
        json_dict: json dict whose values are lists of strings

    Returns:
        dict with one "<lowercased key>-<list item>" entry for every item of
        every list, each mapped to True
    """
    return {
        group.lower() + "-" + item: True
        for group, items in json_dict.items()
        for item in items
    }


def transform_list(json_list):
    """
    Turn a list of values into a presence map.

    Args:
        json_list: json list of (hashable) values

    Returns:
        dict that has every value of the list as a key, each mapped to True
    """
    return dict.fromkeys(json_list, True)


def flatten_json(y, separator=''):
    """
    Collapse a nested structure of dicts and lists into one flat dict.

    Args:
        y: json object (nested dicts / lists with scalar leaves)
        separator: string every generated key starts with. Despite its name
            it acts as a key prefix; path components are always joined
            with '_'.

    Returns:
        dict mapping each leaf's path to its value. Dict keys and list
        positions form the path components; the trailing character of the
        built path is dropped before it is used as a key.
    """
    flat = {}

    def _walk(node, prefix):
        node_type = type(node)
        if node_type is dict:
            for key, child in node.items():
                _walk(child, prefix + key + '_')
            return
        if node_type is list:
            for position, child in enumerate(node):
                _walk(child, prefix + str(position) + '_')
            return
        # Leaf value: strip the last character of the accumulated path
        # (the '_' appended by the enclosing container) to get the key.
        flat[prefix[:-1]] = node

    _walk(y, separator)
    return flat

In [14]:
# 1. Read 6000 rows of the JSON Lines dataset.
data_path = 'sample_data_6k.jsonl'
data = read_data(data_path, limiter=6000)

# 2. Turn every sample into one flat dict (one future DataFrame row).
#    An earlier "version 1" simply called flatten_json(sample) on the whole
#    sample; the per-section handling below is "version 2".
flatten_dataset = []
for sample in data:
    # Top-level fields are copied through unchanged.
    transformed = {
        field: sample[field]
        for field in ("label", "sha256", "md5", "appeared", "avclass")
    }
    # These two sections get a "<section>." key prefix, e.g. "histogram.0".
    for section in ('histogram', 'byteentropy'):
        transformed.update(flatten_json(sample[section], section + '.'))
    # Imports and exports become True-valued presence entries.
    transformed.update(transform_dict(sample["imports"]))
    transformed.update(transform_list(sample["exports"]))
    # The remaining sections are flattened without any key prefix.
    for section in ('general', 'strings', 'header', 'datadirectories'):
        transformed.update(flatten_json(sample[section]))

    flatten_dataset.append(transformed)

# 3. Build a DataFrame from the collected rows and display it.
df = pd.DataFrame(flatten_dataset)
df


Unnamed: 0,label,sha256,md5,appeared,avclass,histogram.0,histogram.1,histogram.2,histogram.3,histogram.4,histogram.5,histogram.6,histogram.7,histogram.8,histogram.9,histogram.10,histogram.11,histogram.12,histogram.13,histogram.14,histogram.15,histogram.16,histogram.17,histogram.18,histogram.19,histogram.20,histogram.21,histogram.22,histogram.23,histogram.24,histogram.25,histogram.26,histogram.27,histogram.28,histogram.29,histogram.30,histogram.31,histogram.32,histogram.33,histogram.34,histogram.35,histogram.36,histogram.37,histogram.38,histogram.39,histogram.40,histogram.41,histogram.42,histogram.43,histogram.44,histogram.45,histogram.46,histogram.47,histogram.48,histogram.49,histogram.50,histogram.51,histogram.52,histogram.53,histogram.54,histogram.55,histogram.56,histogram.57,histogram.58,histogram.59,histogram.60,histogram.61,histogram.62,histogram.63,histogram.64,histogram.65,histogram.66,histogram.67,histogram.68,histogram.69,histogram.70,histogram.71,histogram.72,histogram.73,histogram.74,histogram.75,histogram.76,histogram.77,histogram.78,histogram.79,histogram.80,histogram.81,histogram.82,histogram.83,histogram.84,histogram.85,histogram.86,histogram.87,histogram.88,histogram.89,histogram.90,histogram.91,histogram.92,histogram.93,histogram.94,histogram.95,histogram.96,histogram.97,histogram.98,histogram.99,histogram.100,histogram.101,histogram.102,histogram.103,histogram.104,histogram.105,histogram.106,histogram.107,histogram.108,histogram.109,histogram.110,histogram.111,histogram.112,histogram.113,histogram.114,histogram.115,histogram.116,histogram.117,histogram.118,histogram.119,histogram.120,histogram.121,histogram.122,histogram.123,histogram.124,histogram.125,histogram.126,histogram.127,histogram.128,histogram.129,histogram.130,histogram.131,histogram.132,histogram.133,histogram.134,histogram.135,histogram.136,histogram.137,histogram.138,histogram.139,histogram.140,histogram.141,histogram.142,histogram.143,histogram.144,histogram.145,histogram.146,histogr
am.147,histogram.148,histogram.149,histogram.150,histogram.151,histogram.152,histogram.153,histogram.154,histogram.155,histogram.156,histogram.157,histogram.158,histogram.159,histogram.160,histogram.161,histogram.162,histogram.163,histogram.164,histogram.165,histogram.166,histogram.167,histogram.168,histogram.169,histogram.170,histogram.171,histogram.172,histogram.173,histogram.174,histogram.175,histogram.176,histogram.177,histogram.178,histogram.179,histogram.180,histogram.181,histogram.182,histogram.183,histogram.184,histogram.185,histogram.186,histogram.187,histogram.188,histogram.189,histogram.190,histogram.191,histogram.192,histogram.193,histogram.194,histogram.195,histogram.196,histogram.197,histogram.198,histogram.199,histogram.200,histogram.201,histogram.202,histogram.203,histogram.204,histogram.205,histogram.206,histogram.207,histogram.208,histogram.209,histogram.210,histogram.211,histogram.212,histogram.213,histogram.214,histogram.215,histogram.216,histogram.217,histogram.218,histogram.219,histogram.220,histogram.221,histogram.222,histogram.223,histogram.224,histogram.225,histogram.226,histogram.227,histogram.228,histogram.229,histogram.230,histogram.231,histogram.232,histogram.233,histogram.234,histogram.235,histogram.236,histogram.237,histogram.238,histogram.239,histogram.240,histogram.241,histogram.242,histogram.243,histogram.244,...,PtInRegion,PtVisible,QueryFontAssocStatus,RealizePalette,RectInRegion,RectVisible,Rectangle,RemoveFontMemResourceEx,RemoveFontResourceA,RemoveFontResourceExA,RemoveFontResourceExW,RemoveFontResourceTracking,RemoveFontResourceW,ResetDCA,ResetDCW,ResizePalette,RestoreDC,RoundRect,STROBJ_bEnum,STROBJ_bEnumPositionsOnly,STROBJ_bGetAdvanceWidths,STROBJ_dwGetCodePage,STROBJ_vEnumStart,SaveDC,ScaleRgn,ScaleValues,ScaleViewportExtEx,ScaleWindowExtEx,ScriptGetFontAlternateGlyphs,ScriptGetFontFeatureTags,ScriptGetFontLanguageTags,ScriptGetFontScriptTags,ScriptItemizeOpenType,ScriptPlaceOpenType,ScriptPositionSingleGlyph,ScriptShapeOp
enType,ScriptSubstituteSingleGlyph,SelectBrushLocal,SelectClipPath,SelectClipRgn,SelectFontLocal,SelectObject,SelectPalette,SetAbortProc,SetArcDirection,SetBitmapAttributes,SetBitmapBits,SetBitmapDimensionEx,SetBkColor,SetBkMode,SetBoundsRect,SetBrushAttributes,SetBrushOrgEx,SetColorAdjustment,SetColorSpace,SetDCBrushColor,SetDCDpiScaleValue,SetDCPenColor,SetDIBColorTable,SetDIBits,SetDIBitsToDevice,SetDeviceGammaRamp,SetEnhMetaFileBits,SetFontEnumeration,SetGraphicsMode,SetICMMode,SetICMProfileA,SetICMProfileW,SetLayout,SetLayoutWidth,SetMagicColors,SetMapMode,SetMapperFlags,SetMetaFileBitsEx,SetMetaRgn,SetMiterLimit,SetOPMSigningKeyAndSequenceNumbers,SetPaletteEntries,SetPixel,SetPixelFormat,SetPixelV,SetPolyFillMode,SetROP2,SetRectRgn,SetRelAbs,SetStretchBltMode,SetSystemPaletteUse,SetTextAlign,SetTextCharacterExtra,SetTextColor,SetTextJustification,SetViewportExtEx,SetViewportOrgEx,SetVirtualResolution,SetWinMetaFileBits,SetWindowExtEx,SetWindowOrgEx,SetWorldTransform,StartDocA,StartDocW,StartFormPage,StartPage,StretchBlt,StretchDIBits,StrokeAndFillPath,StrokePath,SwapBuffers,TextOutA,TextOutW,TranslateCharsetInfo,UnloadNetworkFonts,UnrealizeObject,UpdateColors,UpdateICMRegKeyA,UpdateICMRegKeyW,WidenPath,XFORMOBJ_bApplyXform,XFORMOBJ_iGetXform,XLATEOBJ_cGetPalette,XLATEOBJ_hGetColorTransform,XLATEOBJ_iXlate,XLATEOBJ_piVector,bCreateDCW,bDeleteLDC,bInitSystemAndFontsDirectoriesW,bMakePathNameW,cGetTTFFromFOT,fpClosePrinter,gMaxGdiHandleCount,gW32PID,g_systemCallFilterId,gdiPlaySpoolStream,ghICM,hGetPEBHandle,pGdiDevCaps,pGdiSharedHandleTable,pGdiSharedMemory,pldcGet,semDxTrimNotification,vSetPldc,msvbvm60.dll-ordinal703,Create360SafeEngine,CreateCloudEngine,CreateCloudEngineLocker,CreateFileReportLog,CreatePlugin2,CreatePlugin3,CreatePlugin4,CreatePlugin5,CreateQuarantine,CreateTrustZone,ForceMerge360Log,GetModErrCode,IsSupportFeature,msi.dll-ordinal87,msi.dll-ordinal136,shlwapi.dll-PathGetDriveNumberA,wininet.dll-InternetGetCookieExA,qbsenderror20.dll-UDSetProdI
nfo,qbsenderror20.dll-UDAddFile,qbsenderror20.dll-AddCustomStrObject,qbsenderror20.dll-UDSetNonUIMode,qbsenderror20.dll-UDSetMemDump,qbsenderror20.dll-UDSetErrorCode,qbsenderror20.dll-UDSetErrorMsg,qbsenderror20.dll-UDIsValidData,qbsenderror20.dll-??0UploadData@@QAE@XZ,qbsenderror20.dll-?SetInfo@ReportInfo@@QAEABV1@ABV1@@Z,qbsenderror20.dll-UDSendDataReport,?GetData@CustomDWORDObject@@QBE?BKXZ,?GetData@CustomHexObject@@QBE?BKXZ,?GetData@CustomStrObject@@QBEPBDXZ,?GetDataDir@ProdInfo@@QBEPBDXZ,?GetDataInitFlags@UploadData@@UBEIXZ,?GetDescr@CustomObject@@QBEPBDXZ,?GetEmail@ReportInfo@@QBEPBDXZ,?GetEnvInfo@UploadData@@UBEPBVEnvInfo@@XZ,?GetErrorCode@ErrorData@@UAE?BKXZ,?GetErrorCode@ReportInfo@@QBE?BKXZ,?GetErrorCode@UploadData@@UAE?BKXZ,?GetErrorSeverity@ErrorData@@UBEKXZ,?GetErrorTime@UploadData@@UBE?BVCTime@ATL@@XZ,?GetErrorType@ErrorData@@UBE?AW4ERROR_TYPE@@XZ,?GetExceptionAddress@UEErrorData@@UBEQAXXZ,?GetExceptionDesc@UEErrorData@@UBEPBDXZ,?GetExceptionPointers@UploadData@@QBEPAU_EXCEPTION_POINTERS@@XZ,?GetFileDescriptionList@UploadData@@UAEXABVCStringArray@@@Z,?GetFileDescriptionList@UploadData@@UBEABVCStringArray@@XZ,?GetFileList@UploadData@@UBEABVCStringArray@@XZ,?GetHasSolution@ErrorData@@UBEHXZ,?GetLastSystemError@ErrorData@@UBEKXZ,?GetMdpFileName@UploadData@@UBEABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@XZ,?GetMessageText@ReportInfo@@QBEPBDXZ,?GetOsInfo@UploadData@@UBEPBVOsInfo@@XZ,?GetPayloadSize@UploadData@@UAE?BIXZ,?GetPayloadXmlFileName@UploadData@@UBEABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@XZ,?GetProcessorInfo@UploadData@@UBEPBVProcessorInfo@@XZ,?GetProdID@ProdInfo@@QBE?BIXZ,?GetProdName@ProdInfo@@QBEPBDXZ,?GetProdRelease@ProdInfo@@QBEPBDXZ,?GetProdVersion@ProdInfo@@QBEPBDXZ,?GetProgDir@ProdInfo@@QBEPBDXZ,?GetReportInfo@UploadData@@UBEPBVReportInfo@@XZ,?GetReportSeverity@ReportInfo@@QBE?BIXZ,?GetReportTimeStamp@ReportInfo@@QBEABVCTime@ATL@@XZ,?GetReportType@ReportInfo@@QBE?BW4REPORT_TYPE@@XZ,?GetReportType@UploadD
ata@@QBE?BW4REPORT_TYPE@@XZ,?GetReportXmlFileName@UploadData@@UBEABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@XZ,?GetReportXmlString@UploadData@@UAEPBDXZ,?GetStrData@CustomObject@@UBEPBDXZ,?GetSubProdName@ProdInfo@@QBEPBDXZ,?SetDataDir@ProdInfo@@QAEPBDPBD@Z,?SetEmail@ReportInfo@@QAEPBDPBD@Z,?SetErrorCode@ReportInfo@@QAE?BKK@Z,?SetErrorSeverity@ErrorData@@QAEXK@Z,?SetErrorTime@UploadData@@UAEABVCTime@ATL@@ABV23@@Z,?SetErrorTime@UploadData@@UAEABVCTime@ATL@@PBV23@@Z,?SetErrorType@ErrorData@@QAEXW4ERROR_TYPE@@@Z,?SetExceptionAddress@UEErrorData@@UAEXPAX@Z,?SetExceptionPointers@UploadData@@UAEXPAU_EXCEPTION_POINTERS@@@Z,?SetFileList@UploadData@@UAEXABVCStringArray@@@Z,?SetHasSolution@ErrorData@@QAEXH@Z,?SetMdpFileName@UploadData@@UAEXV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@@Z,?SetMessageText@ReportInfo@@QAEPBDPBD@Z,?SetPayloadSize@UploadData@@UAEXI@Z,?SetPayloadXmlFileName@UploadData@@UAEXABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@@Z,?SetProdID@ProdInfo@@QAEXI@Z,?SetProdName@ProdInfo@@QAEPBDPBD@Z,?SetProdRelease@ProdInfo@@QAEPBDPBD@Z,?SetProdVersion@ProdInfo@@QAEPBDPBD@Z,?SetProgDir@ProdInfo@@QAEPBDPBD@Z,?SetReportInfo@UploadData@@UAEABVReportInfo@@ABV2@@Z,?SetReportSeverity@ReportInfo@@QAE?BII@Z,?SetReportTimeStamp@ReportInfo@@QAEABVCTime@ATL@@ABV23@@Z,?SetReportTimeStamp@ReportInfo@@QAEABVCTime@ATL@@PBV23@@Z,?SetReportType@ReportInfo@@QAE?BW4REPORT_TYPE@@W42@@Z,?SetReportXmlFileName@UploadData@@UAEXABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@@Z,?SetSubProdName@ProdInfo@@QAEPBDPBD@Z,?_exception_code@UEErrorData@@UBE?BKXZ,api-ms-win-crt-stdio-l1-1-0.dll-freopen,_cgo_panic,_cgo_topofstack,callbackTrampoline,commitHookTrampoline,compareTrampoline,crosscall2,doneTrampoline,rollbackHookTrampoline,stepTrampoline,updateHookTrampoline
0,0,0abb4fda7d5b13801d63bee53e5e256be43e141faa077a...,63956d6417f8f43357d9a8e79e52257e,2006-12,,45521,13095,12167,12496,12429,11709,11864,12057,12881,11798,11802,11783,12029,12081,11756,12532,11980,11628,11504,11715,11809,12414,11779,11708,11956,11622,11859,11775,11717,11507,11873,11781,12015,11690,11676,11782,11820,11859,12025,11786,11731,11445,11556,11676,12057,11636,11669,11903,12004,11741,11833,12329,11778,11859,11806,11586,11775,11885,11863,12047,11869,12077,11724,12037,13129,11931,12101,12202,11956,12625,11877,11804,11999,11869,11578,11591,11933,12020,11695,11915,12565,11755,11597,12224,11786,11709,12321,12325,11671,11624,11573,11879,11578,11802,12060,11792,11527,12248,11703,11793,12143,12701,12071,11871,12582,12346,12303,11892,12190,12011,11826,12261,12139,11913,11994,12155,13023,13136,11897,12164,12228,11972,11916,11951,12061,12243,12009,12266,12655,12023,11819,12283,11882,12303,11751,11888,11976,12472,11622,13260,11969,12127,11735,12024,11592,11699,11604,11657,11974,11714,11918,11815,11851,11806,11710,11590,11835,11971,11757,11874,11813,11834,11610,11723,11988,11714,11774,12021,11816,11834,11607,11829,11665,11641,11722,11869,11864,11784,11528,11733,11923,11749,11972,11721,11977,11712,11772,11721,11891,11796,11991,12200,12432,11643,11877,12040,11874,11804,11932,12179,11940,11764,11743,11653,11854,11800,12092,12021,11969,11931,11890,11982,11956,11710,11792,12095,11749,11815,11722,11825,11846,11804,11567,11926,11839,11814,11921,11981,11910,11640,11681,12030,12822,12105,12001,12008,12180,11862,11992,11888,12211,12155,11734,11819,12154,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,0,c9cafff8a596ba8a80bafb4ba8ae6f2ef3329d95b85f15...,6f7bde7a1126debf0cc359a54953efc1,2007-01,,93059,15789,2871,3005,4107,1771,2918,4312,4610,903,1184,956,3099,1128,1639,2669,3139,1070,1723,1328,3020,3593,1224,975,2642,895,823,1147,1546,1871,674,747,3381,658,711,907,3378,1540,656,668,1058,706,627,1011,1027,763,933,561,1284,667,760,2781,1066,1342,795,624,1204,1762,671,1812,911,937,614,589,1688,1134,722,1179,1582,5502,1471,890,1272,814,603,612,1182,2361,999,814,5117,1308,1012,3143,1275,1720,2645,2662,1126,818,730,1171,1246,1714,1269,1189,1889,3521,717,1655,2032,4198,1584,1043,4606,2505,3264,663,1899,1252,2273,2974,1766,609,2614,2331,7378,5705,1200,1304,1067,887,608,563,1314,1769,742,684,1414,1506,664,4512,1594,5409,727,602,1764,5609,679,10251,1011,5446,554,526,2908,499,505,500,726,570,541,474,758,516,538,447,1580,1782,515,487,871,879,473,579,806,843,488,521,785,460,554,625,698,528,548,635,936,843,531,566,795,1420,713,673,1046,580,534,694,751,960,713,549,3999,1308,1389,1304,1600,461,1081,1877,1205,1197,680,563,944,495,608,516,1029,745,742,745,925,508,1022,837,1277,551,558,813,1000,619,599,537,1534,805,616,697,1407,568,529,552,4924,1415,585,1705,2668,538,598,620,1521,651,518,969,1453,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,0,eac8ddb4970f8af985742973d6f0e06902d42a3684d791...,7520c8f9534ca818726a4feaebf49e2b,2007-02,,45369,2560,1233,1542,4234,515,613,1542,1841,212,631,172,903,189,170,1302,985,456,362,497,499,1285,122,81,286,146,274,457,309,129,84,117,709,98,212,91,553,117,117,108,212,104,61,727,195,101,179,89,924,363,410,2355,455,1015,291,354,535,546,413,790,438,596,510,466,2188,2121,411,295,1941,1520,289,255,303,287,86,120,340,417,222,186,2208,713,525,956,385,577,957,793,310,156,67,221,145,283,1144,324,125,319,90,234,280,806,2809,187,927,321,1132,147,380,561,400,831,770,57,418,401,1454,1491,185,2827,666,248,88,139,218,391,117,757,1757,310,107,787,572,1158,279,388,2198,873,67,2583,170,926,121,413,127,52,482,53,85,73,152,44,161,1979,533,54,80,63,39,35,983,236,49,175,106,154,174,28,153,64,337,66,104,63,47,53,111,34,89,53,95,55,43,206,364,70,31,87,476,46,80,397,1325,234,489,235,265,37,181,365,201,303,77,100,2047,39,72,107,219,79,65,69,156,30,276,180,254,45,33,127,161,210,106,54,304,46,36,146,205,82,71,99,1145,672,127,557,2133,188,47,155,954,296,197,577,471,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,0,7f513818bcc276c531af2e641c597744da807e21cc1160...,e435a536968941854bcec3b902c439f6,2007-02,,21315,9641,9332,9358,9598,9220,9146,9382,9365,9116,9178,9255,9503,9173,9095,9190,9381,9200,9176,9073,9098,9190,9140,9039,9188,9066,9079,9114,9209,9015,9132,9164,9778,9064,9189,9088,9400,9150,9007,9213,9248,9035,8897,8989,9260,9047,9055,9169,9403,9463,9239,9724,9091,9143,9119,9178,9014,9101,9114,9296,9124,9008,9090,9188,10427,9299,9203,9480,9399,9650,9222,9324,9153,8957,9121,9073,9179,9328,9011,9068,9483,9098,9329,9335,9042,9502,9425,9211,9089,9397,9299,9221,9236,9486,8962,9204,9029,9304,9360,9192,9541,9611,9366,9310,9441,9492,9362,9267,9253,9276,9374,9422,9200,9097,9220,9328,9829,9509,9480,9280,9203,9180,9175,9065,9157,9200,9214,9349,9343,9138,9115,9663,9139,9358,9074,9071,9065,9755,9174,11133,9090,9562,9006,9076,9144,8916,9039,9219,9086,9123,8824,9220,9054,9248,9130,8995,9036,9075,9017,9331,9236,9260,9062,9156,8970,9317,9113,9157,9188,9031,9074,9059,9170,9092,9216,9057,9361,9154,9176,9321,9163,9143,9107,9094,9206,9427,9219,9187,9206,9138,9175,9050,9809,9161,9002,9737,9368,9140,9114,9362,9124,9069,9102,9089,9421,8855,9288,9056,9251,9201,9270,9166,9062,9125,8968,9095,9333,8971,9158,9068,9058,9147,9178,9095,9422,9262,9156,9064,9066,9225,9100,9125,10073,9366,9267,9557,9119,9136,9250,9212,9563,9170,9289,9195,9170,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,0,ca65e1c387a4cc9e7d8a8ce12bf1bcf9f534c9032b9d95...,e93049e2df82ab26f35ad0049173cb14,2007-02,,23539,6015,5214,4727,4892,4649,4367,5299,5625,4361,4446,4892,4695,5005,4493,5703,4982,4504,4230,4094,4462,4626,4273,4313,4229,4308,4372,4349,4294,4433,4245,4291,4926,4311,4325,4346,4447,4338,4264,4295,4253,4388,4272,4246,4427,4472,4369,4298,4396,4271,4316,4547,4300,4429,4263,4395,4265,4343,4291,4440,4376,4442,4266,4334,4354,4509,4382,4542,4471,4839,4456,4304,4457,4598,4360,4325,4328,4330,4251,4405,4957,4369,4461,4739,4454,4584,4732,4465,4465,4393,4380,4458,4422,4359,4329,4337,4353,4749,4353,4484,4684,4989,4539,4322,4487,4563,4773,4236,4693,4395,4695,4613,4457,4212,4729,4530,5252,4934,4465,4397,4318,4294,4179,4390,4472,4336,4396,4405,4648,4207,4310,4834,4399,4806,4405,4286,4249,4558,4477,5222,4409,4781,4273,4246,4350,4250,4440,4407,4347,4386,4283,4283,4365,4193,4194,4230,4079,4137,4264,4251,4319,4433,4429,4263,4390,4390,4309,4279,4238,4309,4349,4330,4327,4287,4354,4269,4387,4225,4385,4220,4359,4238,4340,4338,4289,4306,4276,4320,4237,4329,4392,4346,4765,4403,4462,4401,4259,4321,4506,4360,4336,4335,4416,4353,4233,4171,4275,4189,4357,4287,4412,4251,4352,4178,4222,4300,4569,4115,4253,4194,4338,4326,4197,4212,4294,4378,4291,4293,4388,4374,4296,4297,4790,4327,4177,4476,4471,4220,4290,4303,4382,4183,4265,4465,4469,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,
...,...
5995,1,d9e6f5f080da1fc279144d67d1daf7c375c46d14eb2dd9...,bd42f6cc6cfe536bf73d53d7ef8ad303,2018-09,sivis,64674,2331,1273,1508,1368,582,727,1225,1036,601,752,551,917,615,738,1583,705,817,476,725,617,978,590,587,539,588,508,682,839,888,1333,2266,6728,382,575,1068,977,457,433,959,389,524,486,620,622,741,935,817,716,916,813,867,700,865,746,824,973,923,1345,460,1063,1605,1560,2914,1574,876,538,780,902,1125,752,1216,631,717,548,568,744,822,829,1602,1221,835,927,1109,844,691,900,1141,913,611,876,1158,989,822,1922,1636,587,1425,794,1375,1151,2252,726,876,1054,1485,804,895,1362,1040,1480,2556,1225,989,1508,1647,2373,3410,573,637,1218,1121,1765,2267,745,2120,2256,3937,686,780,560,1417,526,728,463,1097,835,784,646,1626,549,998,940,2334,539,698,663,846,507,560,501,639,470,456,507,660,600,664,1004,2106,580,698,462,659,583,590,769,1426,852,806,691,826,959,1228,948,2770,729,1062,499,550,497,768,657,1431,1104,630,1797,443,850,2559,1376,3201,1048,807,575,1084,1013,657,805,2024,779,685,410,681,1144,534,433,1487,590,450,647,1332,1061,974,1693,3045,944,559,522,1070,868,1481,1515,3103,984,789,854,1732,802,579,508,1365,898,1470,1606,4152,1048,819,1578,3156,1105,1585,904,1314,1446,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5996,1,58841e48cfb4b80eda32ebe7da0a5c001f3da07f781dc8...,191c5fe8d4a1eaa8ff093ab8273de13e,2018-09,benjamin,10232,4849,4813,4701,4854,4933,4694,4713,4925,4816,4805,4912,4854,4816,4939,4836,4887,4741,4720,4849,4927,4785,4809,4871,4805,4834,5051,4741,4800,4688,4727,4823,4918,4771,4809,4776,4976,4725,4804,4743,4724,4839,4990,4905,4872,4789,4768,4847,4756,4801,4797,5007,4824,4832,4757,4712,4840,4795,4748,4884,4798,4676,4949,4762,4852,4859,4697,4823,4771,4838,4786,4793,4785,4627,4824,4865,4863,4636,4846,4698,4810,4712,4883,4706,4778,4707,4820,4796,4824,4748,4937,4871,4709,4820,4839,4765,4774,4775,4706,4875,4907,4850,4878,4859,4951,4844,4798,4759,4871,4695,4810,4735,4818,4830,4805,4771,5004,4896,4841,4993,4799,4852,4883,4795,4656,4810,4765,4654,4796,4827,4792,4857,4706,4807,4793,4973,4890,4927,4829,4887,4773,4854,4830,4781,4802,4808,4802,4875,4870,4695,4862,4794,4750,4948,4742,4801,4898,4694,4757,4914,4704,4784,4629,4748,4847,4836,4832,4846,4772,4800,4662,4738,4811,4729,4789,4794,4841,4909,4931,4721,4778,4728,4820,4813,4762,4841,4697,4835,4797,4701,4818,4744,4856,4848,4765,4853,4747,4937,4698,4712,4760,4796,4813,4866,4660,4840,4830,4830,4745,4782,4888,4891,4945,4812,4796,4746,4760,4854,4800,4823,4756,4822,4705,4845,4665,4890,4857,4663,4814,4752,4803,4874,4822,4756,4702,4870,4870,4724,4856,4878,4828,4852,4893,4839,4847,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5997,0,9a4c4f36530c1cd52765085e274bba5be47814153476f8...,f23415c8ac5c8fc9859c5c97b1347c8f,2018-09,,40352,8912,7835,7813,8687,7444,7700,7501,9307,7408,7435,7478,8541,7642,7421,8047,8036,7304,7191,7421,7626,7478,7195,7410,7564,7424,7288,7416,7648,7445,7472,7450,7635,7158,7085,7292,8347,7095,7253,7423,7357,7261,7201,7537,7502,7264,7355,7237,7343,7304,7322,8098,7477,7550,7308,7516,7509,7709,7553,8139,7421,7639,7338,7580,7586,9460,7787,7507,7707,8988,8013,7600,7454,7308,7252,7438,7431,9045,7721,7648,8194,7578,7183,7933,7446,7747,8207,7843,7368,7907,7449,7769,7691,7928,8201,7964,7167,7346,7274,7461,7691,7946,7650,7469,7577,7569,7927,7342,7639,7546,7842,7726,7465,7448,7749,7755,9011,9286,7622,7776,7464,7530,7534,7642,7739,7930,7879,7662,7608,7246,7341,9109,7407,8023,7291,7429,7468,9660,7345,12899,7317,9473,7585,7523,7337,7433,7235,7554,7240,7388,7239,7385,7206,7456,7348,7488,7329,7516,7398,7673,7177,7317,7372,7470,7437,7530,7198,7495,7397,7395,7343,7360,7438,7335,7433,7433,7373,7477,7262,7479,7356,7596,7617,7790,8043,7481,7532,7629,7716,7501,7543,7610,8098,7880,7739,8103,7621,7383,7989,8063,7544,7796,7502,7597,8087,7637,7674,7704,7444,7538,7480,7400,7429,7427,7366,7541,7534,7454,7400,7767,7443,7747,7432,7755,7735,7355,7348,7500,7720,7643,7726,7582,10361,8417,7450,8112,7994,7648,7649,7854,8166,7746,7687,7709,7793,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5998,1,7c19bcb1167c75daaffaf3363b12ea3156db7db4fe74ff...,9591ee24bd997e627e7ce167a81c40e2,2018-09,btcon,35245,26083,19383,18614,19014,19500,17352,19830,21803,26672,16930,17008,17210,16900,15872,15743,18341,18102,21524,18295,20475,16373,20870,18683,22632,20742,19342,16527,19819,17243,17250,17859,23248,24357,17157,14551,19055,21548,17607,19092,22355,25339,18073,16507,17717,20891,16704,16744,18885,23170,16829,15589,15983,15876,14630,14404,17686,16209,16309,15820,16838,14085,16166,16058,21884,18013,17241,13711,16286,16523,16448,15194,18829,17923,17906,16725,15194,14815,16105,15761,17099,18055,16184,14281,15567,15675,14536,16619,16508,17801,18576,15873,15697,14559,15632,18187,19691,16526,15640,12606,14827,15166,15041,13431,16423,16270,14385,15483,16494,13975,15057,15521,16272,17259,16319,13648,18041,15248,14224,17546,19265,16680,16967,15890,18385,16190,16652,24061,26605,19096,19469,16614,20605,17925,17638,20761,23545,22075,22593,19589,17353,18215,17008,15549,19109,19044,22447,17130,19740,21377,19608,20074,20604,21373,19960,16218,18408,20068,16367,17763,18672,18347,19436,14194,15531,17570,14387,15006,17592,17787,16908,16265,16395,17214,16134,14940,17056,16433,16072,14020,14983,16085,14696,16593,19924,17649,17309,16689,17295,16660,15604,17878,19605,18587,19345,16304,17179,17292,17063,16800,18027,21319,18544,19323,18289,18052,17416,15567,17347,17336,16521,17003,17306,16010,16555,17267,19074,18952,16156,14957,17499,16872,16272,17574,18088,17892,17764,15978,16488,16626,16152,15910,19551,19491,17430,18012,16717,16651,17827,17074,16652,16427,17277,16282,15143,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,True,True,True,True,True,True,True,True,True,True


In [15]:
# Preview the leading rows of the flattened DataFrame built above.
df.head()

Unnamed: 0,label,sha256,md5,appeared,avclass,histogram.0,histogram.1,histogram.2,histogram.3,histogram.4,histogram.5,histogram.6,histogram.7,histogram.8,histogram.9,histogram.10,histogram.11,histogram.12,histogram.13,histogram.14,histogram.15,histogram.16,histogram.17,histogram.18,histogram.19,histogram.20,histogram.21,histogram.22,histogram.23,histogram.24,histogram.25,histogram.26,histogram.27,histogram.28,histogram.29,histogram.30,histogram.31,histogram.32,histogram.33,histogram.34,histogram.35,histogram.36,histogram.37,histogram.38,histogram.39,histogram.40,histogram.41,histogram.42,histogram.43,histogram.44,histogram.45,histogram.46,histogram.47,histogram.48,histogram.49,histogram.50,histogram.51,histogram.52,histogram.53,histogram.54,histogram.55,histogram.56,histogram.57,histogram.58,histogram.59,histogram.60,histogram.61,histogram.62,histogram.63,histogram.64,histogram.65,histogram.66,histogram.67,histogram.68,histogram.69,histogram.70,histogram.71,histogram.72,histogram.73,histogram.74,histogram.75,histogram.76,histogram.77,histogram.78,histogram.79,histogram.80,histogram.81,histogram.82,histogram.83,histogram.84,histogram.85,histogram.86,histogram.87,histogram.88,histogram.89,histogram.90,histogram.91,histogram.92,histogram.93,histogram.94,histogram.95,histogram.96,histogram.97,histogram.98,histogram.99,histogram.100,histogram.101,histogram.102,histogram.103,histogram.104,histogram.105,histogram.106,histogram.107,histogram.108,histogram.109,histogram.110,histogram.111,histogram.112,histogram.113,histogram.114,histogram.115,histogram.116,histogram.117,histogram.118,histogram.119,histogram.120,histogram.121,histogram.122,histogram.123,histogram.124,histogram.125,histogram.126,histogram.127,histogram.128,histogram.129,histogram.130,histogram.131,histogram.132,histogram.133,histogram.134,histogram.135,histogram.136,histogram.137,histogram.138,histogram.139,histogram.140,histogram.141,histogram.142,histogram.143,histogram.144,histogram.145,histogram.146,histogr
am.147,histogram.148,histogram.149,histogram.150,histogram.151,histogram.152,histogram.153,histogram.154,histogram.155,histogram.156,histogram.157,histogram.158,histogram.159,histogram.160,histogram.161,histogram.162,histogram.163,histogram.164,histogram.165,histogram.166,histogram.167,histogram.168,histogram.169,histogram.170,histogram.171,histogram.172,histogram.173,histogram.174,histogram.175,histogram.176,histogram.177,histogram.178,histogram.179,histogram.180,histogram.181,histogram.182,histogram.183,histogram.184,histogram.185,histogram.186,histogram.187,histogram.188,histogram.189,histogram.190,histogram.191,histogram.192,histogram.193,histogram.194,histogram.195,histogram.196,histogram.197,histogram.198,histogram.199,histogram.200,histogram.201,histogram.202,histogram.203,histogram.204,histogram.205,histogram.206,histogram.207,histogram.208,histogram.209,histogram.210,histogram.211,histogram.212,histogram.213,histogram.214,histogram.215,histogram.216,histogram.217,histogram.218,histogram.219,histogram.220,histogram.221,histogram.222,histogram.223,histogram.224,histogram.225,histogram.226,histogram.227,histogram.228,histogram.229,histogram.230,histogram.231,histogram.232,histogram.233,histogram.234,histogram.235,histogram.236,histogram.237,histogram.238,histogram.239,histogram.240,histogram.241,histogram.242,histogram.243,histogram.244,...,PtInRegion,PtVisible,QueryFontAssocStatus,RealizePalette,RectInRegion,RectVisible,Rectangle,RemoveFontMemResourceEx,RemoveFontResourceA,RemoveFontResourceExA,RemoveFontResourceExW,RemoveFontResourceTracking,RemoveFontResourceW,ResetDCA,ResetDCW,ResizePalette,RestoreDC,RoundRect,STROBJ_bEnum,STROBJ_bEnumPositionsOnly,STROBJ_bGetAdvanceWidths,STROBJ_dwGetCodePage,STROBJ_vEnumStart,SaveDC,ScaleRgn,ScaleValues,ScaleViewportExtEx,ScaleWindowExtEx,ScriptGetFontAlternateGlyphs,ScriptGetFontFeatureTags,ScriptGetFontLanguageTags,ScriptGetFontScriptTags,ScriptItemizeOpenType,ScriptPlaceOpenType,ScriptPositionSingleGlyph,ScriptShapeOp
enType,ScriptSubstituteSingleGlyph,SelectBrushLocal,SelectClipPath,SelectClipRgn,SelectFontLocal,SelectObject,SelectPalette,SetAbortProc,SetArcDirection,SetBitmapAttributes,SetBitmapBits,SetBitmapDimensionEx,SetBkColor,SetBkMode,SetBoundsRect,SetBrushAttributes,SetBrushOrgEx,SetColorAdjustment,SetColorSpace,SetDCBrushColor,SetDCDpiScaleValue,SetDCPenColor,SetDIBColorTable,SetDIBits,SetDIBitsToDevice,SetDeviceGammaRamp,SetEnhMetaFileBits,SetFontEnumeration,SetGraphicsMode,SetICMMode,SetICMProfileA,SetICMProfileW,SetLayout,SetLayoutWidth,SetMagicColors,SetMapMode,SetMapperFlags,SetMetaFileBitsEx,SetMetaRgn,SetMiterLimit,SetOPMSigningKeyAndSequenceNumbers,SetPaletteEntries,SetPixel,SetPixelFormat,SetPixelV,SetPolyFillMode,SetROP2,SetRectRgn,SetRelAbs,SetStretchBltMode,SetSystemPaletteUse,SetTextAlign,SetTextCharacterExtra,SetTextColor,SetTextJustification,SetViewportExtEx,SetViewportOrgEx,SetVirtualResolution,SetWinMetaFileBits,SetWindowExtEx,SetWindowOrgEx,SetWorldTransform,StartDocA,StartDocW,StartFormPage,StartPage,StretchBlt,StretchDIBits,StrokeAndFillPath,StrokePath,SwapBuffers,TextOutA,TextOutW,TranslateCharsetInfo,UnloadNetworkFonts,UnrealizeObject,UpdateColors,UpdateICMRegKeyA,UpdateICMRegKeyW,WidenPath,XFORMOBJ_bApplyXform,XFORMOBJ_iGetXform,XLATEOBJ_cGetPalette,XLATEOBJ_hGetColorTransform,XLATEOBJ_iXlate,XLATEOBJ_piVector,bCreateDCW,bDeleteLDC,bInitSystemAndFontsDirectoriesW,bMakePathNameW,cGetTTFFromFOT,fpClosePrinter,gMaxGdiHandleCount,gW32PID,g_systemCallFilterId,gdiPlaySpoolStream,ghICM,hGetPEBHandle,pGdiDevCaps,pGdiSharedHandleTable,pGdiSharedMemory,pldcGet,semDxTrimNotification,vSetPldc,msvbvm60.dll-ordinal703,Create360SafeEngine,CreateCloudEngine,CreateCloudEngineLocker,CreateFileReportLog,CreatePlugin2,CreatePlugin3,CreatePlugin4,CreatePlugin5,CreateQuarantine,CreateTrustZone,ForceMerge360Log,GetModErrCode,IsSupportFeature,msi.dll-ordinal87,msi.dll-ordinal136,shlwapi.dll-PathGetDriveNumberA,wininet.dll-InternetGetCookieExA,qbsenderror20.dll-UDSetProdI
nfo,qbsenderror20.dll-UDAddFile,qbsenderror20.dll-AddCustomStrObject,qbsenderror20.dll-UDSetNonUIMode,qbsenderror20.dll-UDSetMemDump,qbsenderror20.dll-UDSetErrorCode,qbsenderror20.dll-UDSetErrorMsg,qbsenderror20.dll-UDIsValidData,qbsenderror20.dll-??0UploadData@@QAE@XZ,qbsenderror20.dll-?SetInfo@ReportInfo@@QAEABV1@ABV1@@Z,qbsenderror20.dll-UDSendDataReport,?GetData@CustomDWORDObject@@QBE?BKXZ,?GetData@CustomHexObject@@QBE?BKXZ,?GetData@CustomStrObject@@QBEPBDXZ,?GetDataDir@ProdInfo@@QBEPBDXZ,?GetDataInitFlags@UploadData@@UBEIXZ,?GetDescr@CustomObject@@QBEPBDXZ,?GetEmail@ReportInfo@@QBEPBDXZ,?GetEnvInfo@UploadData@@UBEPBVEnvInfo@@XZ,?GetErrorCode@ErrorData@@UAE?BKXZ,?GetErrorCode@ReportInfo@@QBE?BKXZ,?GetErrorCode@UploadData@@UAE?BKXZ,?GetErrorSeverity@ErrorData@@UBEKXZ,?GetErrorTime@UploadData@@UBE?BVCTime@ATL@@XZ,?GetErrorType@ErrorData@@UBE?AW4ERROR_TYPE@@XZ,?GetExceptionAddress@UEErrorData@@UBEQAXXZ,?GetExceptionDesc@UEErrorData@@UBEPBDXZ,?GetExceptionPointers@UploadData@@QBEPAU_EXCEPTION_POINTERS@@XZ,?GetFileDescriptionList@UploadData@@UAEXABVCStringArray@@@Z,?GetFileDescriptionList@UploadData@@UBEABVCStringArray@@XZ,?GetFileList@UploadData@@UBEABVCStringArray@@XZ,?GetHasSolution@ErrorData@@UBEHXZ,?GetLastSystemError@ErrorData@@UBEKXZ,?GetMdpFileName@UploadData@@UBEABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@XZ,?GetMessageText@ReportInfo@@QBEPBDXZ,?GetOsInfo@UploadData@@UBEPBVOsInfo@@XZ,?GetPayloadSize@UploadData@@UAE?BIXZ,?GetPayloadXmlFileName@UploadData@@UBEABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@XZ,?GetProcessorInfo@UploadData@@UBEPBVProcessorInfo@@XZ,?GetProdID@ProdInfo@@QBE?BIXZ,?GetProdName@ProdInfo@@QBEPBDXZ,?GetProdRelease@ProdInfo@@QBEPBDXZ,?GetProdVersion@ProdInfo@@QBEPBDXZ,?GetProgDir@ProdInfo@@QBEPBDXZ,?GetReportInfo@UploadData@@UBEPBVReportInfo@@XZ,?GetReportSeverity@ReportInfo@@QBE?BIXZ,?GetReportTimeStamp@ReportInfo@@QBEABVCTime@ATL@@XZ,?GetReportType@ReportInfo@@QBE?BW4REPORT_TYPE@@XZ,?GetReportType@UploadD
ata@@QBE?BW4REPORT_TYPE@@XZ,?GetReportXmlFileName@UploadData@@UBEABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@XZ,?GetReportXmlString@UploadData@@UAEPBDXZ,?GetStrData@CustomObject@@UBEPBDXZ,?GetSubProdName@ProdInfo@@QBEPBDXZ,?SetDataDir@ProdInfo@@QAEPBDPBD@Z,?SetEmail@ReportInfo@@QAEPBDPBD@Z,?SetErrorCode@ReportInfo@@QAE?BKK@Z,?SetErrorSeverity@ErrorData@@QAEXK@Z,?SetErrorTime@UploadData@@UAEABVCTime@ATL@@ABV23@@Z,?SetErrorTime@UploadData@@UAEABVCTime@ATL@@PBV23@@Z,?SetErrorType@ErrorData@@QAEXW4ERROR_TYPE@@@Z,?SetExceptionAddress@UEErrorData@@UAEXPAX@Z,?SetExceptionPointers@UploadData@@UAEXPAU_EXCEPTION_POINTERS@@@Z,?SetFileList@UploadData@@UAEXABVCStringArray@@@Z,?SetHasSolution@ErrorData@@QAEXH@Z,?SetMdpFileName@UploadData@@UAEXV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@@Z,?SetMessageText@ReportInfo@@QAEPBDPBD@Z,?SetPayloadSize@UploadData@@UAEXI@Z,?SetPayloadXmlFileName@UploadData@@UAEXABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@@Z,?SetProdID@ProdInfo@@QAEXI@Z,?SetProdName@ProdInfo@@QAEPBDPBD@Z,?SetProdRelease@ProdInfo@@QAEPBDPBD@Z,?SetProdVersion@ProdInfo@@QAEPBDPBD@Z,?SetProgDir@ProdInfo@@QAEPBDPBD@Z,?SetReportInfo@UploadData@@UAEABVReportInfo@@ABV2@@Z,?SetReportSeverity@ReportInfo@@QAE?BII@Z,?SetReportTimeStamp@ReportInfo@@QAEABVCTime@ATL@@ABV23@@Z,?SetReportTimeStamp@ReportInfo@@QAEABVCTime@ATL@@PBV23@@Z,?SetReportType@ReportInfo@@QAE?BW4REPORT_TYPE@@W42@@Z,?SetReportXmlFileName@UploadData@@UAEXABV?$CStringT@DV?$StrTraitMFC@DV?$ChTraitsCRT@D@ATL@@@@@ATL@@@Z,?SetSubProdName@ProdInfo@@QAEPBDPBD@Z,?_exception_code@UEErrorData@@UBE?BKXZ,api-ms-win-crt-stdio-l1-1-0.dll-freopen,_cgo_panic,_cgo_topofstack,callbackTrampoline,commitHookTrampoline,compareTrampoline,crosscall2,doneTrampoline,rollbackHookTrampoline,stepTrampoline,updateHookTrampoline
0,0,0abb4fda7d5b13801d63bee53e5e256be43e141faa077a...,63956d6417f8f43357d9a8e79e52257e,2006-12,,45521,13095,12167,12496,12429,11709,11864,12057,12881,11798,11802,11783,12029,12081,11756,12532,11980,11628,11504,11715,11809,12414,11779,11708,11956,11622,11859,11775,11717,11507,11873,11781,12015,11690,11676,11782,11820,11859,12025,11786,11731,11445,11556,11676,12057,11636,11669,11903,12004,11741,11833,12329,11778,11859,11806,11586,11775,11885,11863,12047,11869,12077,11724,12037,13129,11931,12101,12202,11956,12625,11877,11804,11999,11869,11578,11591,11933,12020,11695,11915,12565,11755,11597,12224,11786,11709,12321,12325,11671,11624,11573,11879,11578,11802,12060,11792,11527,12248,11703,11793,12143,12701,12071,11871,12582,12346,12303,11892,12190,12011,11826,12261,12139,11913,11994,12155,13023,13136,11897,12164,12228,11972,11916,11951,12061,12243,12009,12266,12655,12023,11819,12283,11882,12303,11751,11888,11976,12472,11622,13260,11969,12127,11735,12024,11592,11699,11604,11657,11974,11714,11918,11815,11851,11806,11710,11590,11835,11971,11757,11874,11813,11834,11610,11723,11988,11714,11774,12021,11816,11834,11607,11829,11665,11641,11722,11869,11864,11784,11528,11733,11923,11749,11972,11721,11977,11712,11772,11721,11891,11796,11991,12200,12432,11643,11877,12040,11874,11804,11932,12179,11940,11764,11743,11653,11854,11800,12092,12021,11969,11931,11890,11982,11956,11710,11792,12095,11749,11815,11722,11825,11846,11804,11567,11926,11839,11814,11921,11981,11910,11640,11681,12030,12822,12105,12001,12008,12180,11862,11992,11888,12211,12155,11734,11819,12154,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,0,c9cafff8a596ba8a80bafb4ba8ae6f2ef3329d95b85f15...,6f7bde7a1126debf0cc359a54953efc1,2007-01,,93059,15789,2871,3005,4107,1771,2918,4312,4610,903,1184,956,3099,1128,1639,2669,3139,1070,1723,1328,3020,3593,1224,975,2642,895,823,1147,1546,1871,674,747,3381,658,711,907,3378,1540,656,668,1058,706,627,1011,1027,763,933,561,1284,667,760,2781,1066,1342,795,624,1204,1762,671,1812,911,937,614,589,1688,1134,722,1179,1582,5502,1471,890,1272,814,603,612,1182,2361,999,814,5117,1308,1012,3143,1275,1720,2645,2662,1126,818,730,1171,1246,1714,1269,1189,1889,3521,717,1655,2032,4198,1584,1043,4606,2505,3264,663,1899,1252,2273,2974,1766,609,2614,2331,7378,5705,1200,1304,1067,887,608,563,1314,1769,742,684,1414,1506,664,4512,1594,5409,727,602,1764,5609,679,10251,1011,5446,554,526,2908,499,505,500,726,570,541,474,758,516,538,447,1580,1782,515,487,871,879,473,579,806,843,488,521,785,460,554,625,698,528,548,635,936,843,531,566,795,1420,713,673,1046,580,534,694,751,960,713,549,3999,1308,1389,1304,1600,461,1081,1877,1205,1197,680,563,944,495,608,516,1029,745,742,745,925,508,1022,837,1277,551,558,813,1000,619,599,537,1534,805,616,697,1407,568,529,552,4924,1415,585,1705,2668,538,598,620,1521,651,518,969,1453,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,0,eac8ddb4970f8af985742973d6f0e06902d42a3684d791...,7520c8f9534ca818726a4feaebf49e2b,2007-02,,45369,2560,1233,1542,4234,515,613,1542,1841,212,631,172,903,189,170,1302,985,456,362,497,499,1285,122,81,286,146,274,457,309,129,84,117,709,98,212,91,553,117,117,108,212,104,61,727,195,101,179,89,924,363,410,2355,455,1015,291,354,535,546,413,790,438,596,510,466,2188,2121,411,295,1941,1520,289,255,303,287,86,120,340,417,222,186,2208,713,525,956,385,577,957,793,310,156,67,221,145,283,1144,324,125,319,90,234,280,806,2809,187,927,321,1132,147,380,561,400,831,770,57,418,401,1454,1491,185,2827,666,248,88,139,218,391,117,757,1757,310,107,787,572,1158,279,388,2198,873,67,2583,170,926,121,413,127,52,482,53,85,73,152,44,161,1979,533,54,80,63,39,35,983,236,49,175,106,154,174,28,153,64,337,66,104,63,47,53,111,34,89,53,95,55,43,206,364,70,31,87,476,46,80,397,1325,234,489,235,265,37,181,365,201,303,77,100,2047,39,72,107,219,79,65,69,156,30,276,180,254,45,33,127,161,210,106,54,304,46,36,146,205,82,71,99,1145,672,127,557,2133,188,47,155,954,296,197,577,471,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,0,7f513818bcc276c531af2e641c597744da807e21cc1160...,e435a536968941854bcec3b902c439f6,2007-02,,21315,9641,9332,9358,9598,9220,9146,9382,9365,9116,9178,9255,9503,9173,9095,9190,9381,9200,9176,9073,9098,9190,9140,9039,9188,9066,9079,9114,9209,9015,9132,9164,9778,9064,9189,9088,9400,9150,9007,9213,9248,9035,8897,8989,9260,9047,9055,9169,9403,9463,9239,9724,9091,9143,9119,9178,9014,9101,9114,9296,9124,9008,9090,9188,10427,9299,9203,9480,9399,9650,9222,9324,9153,8957,9121,9073,9179,9328,9011,9068,9483,9098,9329,9335,9042,9502,9425,9211,9089,9397,9299,9221,9236,9486,8962,9204,9029,9304,9360,9192,9541,9611,9366,9310,9441,9492,9362,9267,9253,9276,9374,9422,9200,9097,9220,9328,9829,9509,9480,9280,9203,9180,9175,9065,9157,9200,9214,9349,9343,9138,9115,9663,9139,9358,9074,9071,9065,9755,9174,11133,9090,9562,9006,9076,9144,8916,9039,9219,9086,9123,8824,9220,9054,9248,9130,8995,9036,9075,9017,9331,9236,9260,9062,9156,8970,9317,9113,9157,9188,9031,9074,9059,9170,9092,9216,9057,9361,9154,9176,9321,9163,9143,9107,9094,9206,9427,9219,9187,9206,9138,9175,9050,9809,9161,9002,9737,9368,9140,9114,9362,9124,9069,9102,9089,9421,8855,9288,9056,9251,9201,9270,9166,9062,9125,8968,9095,9333,8971,9158,9068,9058,9147,9178,9095,9422,9262,9156,9064,9066,9225,9100,9125,10073,9366,9267,9557,9119,9136,9250,9212,9563,9170,9289,9195,9170,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,0,ca65e1c387a4cc9e7d8a8ce12bf1bcf9f534c9032b9d95...,e93049e2df82ab26f35ad0049173cb14,2007-02,,23539,6015,5214,4727,4892,4649,4367,5299,5625,4361,4446,4892,4695,5005,4493,5703,4982,4504,4230,4094,4462,4626,4273,4313,4229,4308,4372,4349,4294,4433,4245,4291,4926,4311,4325,4346,4447,4338,4264,4295,4253,4388,4272,4246,4427,4472,4369,4298,4396,4271,4316,4547,4300,4429,4263,4395,4265,4343,4291,4440,4376,4442,4266,4334,4354,4509,4382,4542,4471,4839,4456,4304,4457,4598,4360,4325,4328,4330,4251,4405,4957,4369,4461,4739,4454,4584,4732,4465,4465,4393,4380,4458,4422,4359,4329,4337,4353,4749,4353,4484,4684,4989,4539,4322,4487,4563,4773,4236,4693,4395,4695,4613,4457,4212,4729,4530,5252,4934,4465,4397,4318,4294,4179,4390,4472,4336,4396,4405,4648,4207,4310,4834,4399,4806,4405,4286,4249,4558,4477,5222,4409,4781,4273,4246,4350,4250,4440,4407,4347,4386,4283,4283,4365,4193,4194,4230,4079,4137,4264,4251,4319,4433,4429,4263,4390,4390,4309,4279,4238,4309,4349,4330,4327,4287,4354,4269,4387,4225,4385,4220,4359,4238,4340,4338,4289,4306,4276,4320,4237,4329,4392,4346,4765,4403,4462,4401,4259,4321,4506,4360,4336,4335,4416,4353,4233,4171,4275,4189,4357,4287,4412,4251,4352,4178,4222,4300,4569,4115,4253,4194,4338,4326,4197,4212,4294,4378,4291,4293,4388,4374,4296,4297,4790,4327,4177,4476,4471,4220,4290,4303,4382,4183,4265,4465,4469,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [1]:
# Show the dimensions of `df` as a (rows, columns) tuple.
# NOTE(review): relies on `df` being built by an earlier cell; the saved
# NameError suggests this cell was last run on a fresh kernel -- re-run the
# notebook top to bottom to confirm.
df.shape

NameError: name 'df' is not defined

In [19]:
# Inspect the column labels of `df` (pandas abbreviates the repr for very wide frames).
df.columns

Index(['label', 'sha256', 'md5', 'appeared', 'avclass', 'histogram.0', 'histogram.1', 'histogram.2', 'histogram.3', 'histogram.4',
       ...
       '_cgo_panic', '_cgo_topofstack', 'callbackTrampoline', 'commitHookTrampoline', 'compareTrampoline', 'crosscall2', 'doneTrampoline', 'rollbackHookTrampoline', 'stepTrampoline', 'updateHookTrampoline'], dtype='object', length=239191)

In [16]:
# Keep every row, but only the columns whose label begins with "header".
header = df.loc[:, [label.startswith("header") for label in df.columns]]

In [17]:
# Preview the first rows (pandas default: 5) of the "header"-prefixed column subset.
header.head()

Unnamed: 0,header_word
0,
1,
2,
3,
4,
