In [2]:
import json
import pandas as pd


def read_data(path, limiter):
    """
    Args:
        path: path to dataset in jsonl file format
        limiter: number of rows

    Returns:
        data: json dict, where every line is one sample as json
    """
    with open(path) as file:
        data = [json.loads(next(file)) for x in range(limiter)]
    return data


def transform_dll_imports(json_sample):
    """
    Args:
        json_sample: one sample of dataset

    Returns:
        functions_dict: dict with all dll functions name with value True
    """
    imports = sample["imports"]
    functions_dict = {}
    for key in imports.keys():
        functions = imports[key]
        functions_with_values = {key.lower() + "-" + f_name: True for f_name in functions}
        functions_dict.update(functions_with_values)
    return functions_dict


def transform_dict(json_dict):
    """
    Args:
        json_dict: json dict with nested key-value, where value is list

    Returns:
        functions_dict: dict with value as a key and default value True
    """
    result_dict = {}
    for key in json_dict.keys():
        keys = json_dict[key]
        values_with_default = {key.lower() + "-" + f_name: True for f_name in keys}
        result_dict.update(values_with_default)
    return result_dict


def transform_list(json_list):
    """
    Args:
        json_list: json list of values

    Returns:
        functions_dict: dict with all dll functions name with value True
    """
    result_dict = {}
    result_dict.update({i: True for i in json_list})
    return result_dict


def flatten_json(y, separator=''):
    """
    Args:
        y: json object
        separator: separator

    Returns:
        functions_dict: dict with flatten values
    """
    out = {}

    def flatten(x, name=separator):
        if type(x) is dict:
            for a in x:
                flatten(x[a], name + a + '_')
        elif type(x) is list:
            i = 0
            for a in x:
                flatten(a, name + str(i) + '_')
                i += 1
        else:
            out[name[:-1]] = x

    flatten(y)
    return out


# 1. read datas
data_path = '/sample_data_6k.jsonl'
data = read_data(data_path, limiter=2)
# 2. iterate over dataset
flatten_dataset = []
for sample in data:
    # version 1 dummy way
    # flat = flatten_json(sample)
    # flatten_dataset.append(flat)
    # collect transformed values for each sample

    # version 2
    transformed = {}
    transformed.update({"label": sample['label']})
    transformed.update({"sha256": sample['sha256']})
    transformed.update({"md5": sample['md5']})
    transformed.update({"appeared": sample['appeared']})
    transformed.update({"avclass": sample['avclass']})
    transformed.update(flatten_json(sample['histogram'], 'histogram.'))
    transformed.update(flatten_json(sample['byteentropy'], 'byteentropy.'))
    transformed.update(transform_dict(sample["imports"]))
    transformed.update(transform_list(sample["exports"]))
    transformed.update(flatten_json(sample['general']))
    transformed.update(flatten_json(sample['strings']))
    transformed.update(flatten_json(sample['header']))
    transformed.update(flatten_json(sample['datadirectories']))

    # here we fill with transform data
    flatten_dataset.append(transformed)

# change all transformed dataset to dataframe object
df = pd.DataFrame(flatten_dataset)
df


FileNotFoundError: [Errno 2] No such file or directory: '/sample_data_6k.jsonl'

In [3]:
import json
import pandas as pd

In [16]:
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)
pd.set_option('display.width', 1000)
pd.set_option('display.float_format', '{:.2f}'.format)

In [17]:
def read_data(path, limiter):
    """
    Args:
        path: path to dataset in jsonl file format
        limiter: number of rows

    Returns:
        data: json dict, where every line is one sample as json
    """
    with open(path) as file:
        data = [json.loads(next(file)) for x in range(limiter)]
    return data


def transform_dll_imports(json_sample):
    """
    Args:
        json_sample: one sample of dataset

    Returns:
        functions_dict: dict with all dll functions name with value True
    """
    imports = sample["imports"]
    functions_dict = {}
    for key in imports.keys():
        functions = imports[key]
        functions_with_values = {key.lower() + "-" + f_name: True for f_name in functions}
        functions_dict.update(functions_with_values)
    return functions_dict


def transform_dict(json_dict):
    """
    Args:
        json_dict: json dict with nested key-value, where value is list

    Returns:
        functions_dict: dict with value as a key and default value True
    """
    result_dict = {}
    for key in json_dict.keys():
        keys = json_dict[key]
        values_with_default = {key.lower() + "-" + f_name: True for f_name in keys}
        result_dict.update(values_with_default)
    return result_dict


def transform_list(json_list):
    """
    Args:
        json_list: json list of values

    Returns:
        functions_dict: dict with all dll functions name with value True
    """
    result_dict = {}
    result_dict.update({i: True for i in json_list})
    return result_dict


def flatten_json(y, separator=''):
    """
    Args:
        y: json object
        separator: separator

    Returns:
        functions_dict: dict with flatten values
    """
    out = {}

    def flatten(x, name=separator):
        if type(x) is dict:
            for a in x:
                flatten(x[a], name + a + '_')
        elif type(x) is list:
            i = 0
            for a in x:
                flatten(a, name + str(i) + '_')
                i += 1
        else:
            out[name[:-1]] = x

    flatten(y)
    return out



In [5]:
# 1. read datas
data_path = 'sample_data_6k.jsonl'
data = read_data(data_path, limiter=6000)
# 2. iterate over dataset
flatten_dataset = []

In [6]:
data[0]['section']['sections']

[{'name': '.text',
  'size': 26624,
  'entropy': 6.532239617101003,
  'vsize': 26134,
  'props': ['CNT_CODE', 'MEM_EXECUTE', 'MEM_READ']},
 {'name': '.rdata',
  'size': 6656,
  'entropy': 5.433081641309689,
  'vsize': 6216,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ']},
 {'name': '.data',
  'size': 512,
  'entropy': 1.7424160994148217,
  'vsize': 172468,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ', 'MEM_WRITE']},
 {'name': '.rsro',
  'size': 0,
  'entropy': -0.0,
  'vsize': 135168,
  'props': ['CNT_UNINITIALIZED_DATA', 'MEM_READ', 'MEM_WRITE']},
 {'name': '.rsrc',
  'size': 27648,
  'entropy': 5.020929764194735,
  'vsize': 28672,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ']}]

In [13]:
flatten_dataset = []
for sample in data:
    
    transformed = {}
    transformed.update({"label": sample['label']})
    transformed.update(flatten_json(sample['section']['sections']))
    
    flatten_dataset.append(transformed)

# change all transformed dataset to dataframe object
df = pd.DataFrame(flatten_dataset)
df

Unnamed: 0,label,0_name,0_size,0_entropy,0_vsize,0_props_0,0_props_1,0_props_2,1_name,1_size,...,29_props_2,29_props_3,30_name,30_size,30_entropy,30_vsize,30_props_0,30_props_1,30_props_2,30_props_3
0,0,.text,26624.0,6.532240,26134.0,CNT_CODE,MEM_EXECUTE,MEM_READ,.rdata,6656.0,...,,,,,,,,,,
1,0,.text,455680.0,6.822879,455304.0,CNT_CODE,MEM_EXECUTE,MEM_READ,.data,8192.0,...,,,,,,,,,,
2,0,.text,81920.0,6.459014,80594.0,CNT_CODE,MEM_EXECUTE,MEM_READ,.data,4096.0,...,,,,,,,,,,
3,0,CODE,36864.0,6.599333,36628.0,CNT_CODE,MEM_EXECUTE,MEM_READ,DATA,1024.0,...,,,,,,,,,,
4,0,.text,34304.0,6.591424,33908.0,CNT_CODE,MEM_EXECUTE,MEM_READ,.data,1024.0,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5995,1,.code,1841.0,5.338839,1841.0,CNT_CODE,MEM_EXECUTE,MEM_READ,.text,6552.0,...,,,,,,,,,,
5996,1,CODE,90624.0,7.996807,204800.0,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,DATA,1536.0,...,,,,,,,,,,
5997,0,.text,104448.0,6.610239,104384.0,CNT_CODE,MEM_EXECUTE,MEM_READ,.rdata,17920.0,...,,,,,,,,,,
5998,1,,2886656.0,7.985471,6692864.0,CNT_INITIALIZED_DATA,MEM_EXECUTE,MEM_READ,.rsrc,81920.0,...,,,,,,,,,,


In [19]:
df

Unnamed: 0,label,0_name,0_size,0_entropy,0_vsize,0_props_0,0_props_1,0_props_2,1_name,1_size,1_entropy,1_vsize,1_props_0,1_props_1,2_name,2_size,2_entropy,2_vsize,2_props_0,2_props_1,2_props_2,3_name,3_size,3_entropy,3_vsize,3_props_0,3_props_1,3_props_2,4_name,4_size,4_entropy,4_vsize,4_props_0,4_props_1,1_props_2,5_name,5_size,5_entropy,5_vsize,5_props_0,5_props_1,5_props_2,6_name,6_size,6_entropy,6_vsize,6_props_0,6_props_1,6_props_2,7_name,7_size,7_entropy,7_vsize,7_props_0,7_props_1,7_props_2,0_props_3,1_props_3,4_props_2,8_name,8_size,8_entropy,8_vsize,8_props_0,8_props_1,8_props_2,3_props_3,2_props_3,4_props_3,4_props_4,3_props_4,9_name,9_size,9_entropy,9_vsize,9_props_0,9_props_1,9_props_2,0_props_4,1_props_4,5_props_3,6_props_3,7_props_3,0_props_5,0_props_6,0_props_7,0_props_8,0_props_9,0_props_10,0_props_11,0_props_12,0_props_13,0_props_14,1_props_5,1_props_6,1_props_7,1_props_8,1_props_9,1_props_10,1_props_11,1_props_12,1_props_13,2_props_4,2_props_5,2_props_6,2_props_7,2_props_8,3_props_5,3_props_6,3_props_7,3_props_8,3_props_9,4_props_5,4_props_6,4_props_7,4_props_8,4_props_9,4_props_10,4_props_11,4_props_12,4_props_13,2_props_9,2_props_10,2_props_11,2_props_12,2_props_13,5_props_4,10_name,10_size,10_entropy,10_vsize,10_props_0,10_props_1,10_props_2,7_props_4,6_props_4,3_props_10,3_props_11,3_props_12,5_props_5,5_props_6,5_props_7,5_props_8,5_props_9,5_props_10,5_props_11,5_props_12,6_props_5,6_props_6,6_props_7,6_props_8,6_props_9,6_props_10,6_props_11,6_props_12,6_props_13,7_props_5,7_props_6,7_props_7,7_props_8,7_props_9,7_props_10,7_props_11,7_props_12,7_props_13,8_props_3,8_props_4,8_props_5,8_props_6,8_props_7,8_props_8,8_props_9,8_props_10,8_props_11,8_props_12,8_props_13,9_props_3,9_props_4,9_props_5,9_props_6,9_props_7,9_props_8,9_props_9,9_props_10,9_props_11,9_props_12,9_props_13,2_props_14,5_props_13,5_props_14,5_props_15,10_props_3,10_props_4,10_props_5,10_props_6,10_props_7,10_props_8,10_props_9,10_props_10,10_props_11,10_props_12,10_props_13,3_props_13,11_name,11_size,11_entropy,11_vsize,11_props_0,11_props_1,11_props_2,11_props_3,11_props_4,11_props_5,11_props_6,11_props_7,11_props_8,11_props_9,12_name,12_size,12_entropy,12_vsize,12_props_0,12_props_1,12_props_2,12_props_3,12_props_4,12_props_5,12_props_6,12_props_7,12_props_8,12_props_9,13_name,13_size,13_entropy,13_vsize,13_props_0,13_props_1,13_props_2,13_props_3,13_props_4,13_props_5,13_props_6,13_props_7,13_props_8,13_props_9,14_name,14_size,14_entropy,14_vsize,14_props_0,14_props_1,14_props_2,14_props_3,14_props_4,14_props_5,14_props_6,14_props_7,14_props_8,14_props_9,15_name,15_size,15_entropy,15_vsize,15_props_0,15_props_1,15_props_2,15_props_3,15_props_4,15_props_5,15_props_6,15_props_7,15_props_8,15_props_9,16_name,16_size,16_entropy,16_vsize,16_props_0,16_props_1,16_props_2,16_props_3,16_props_4,16_props_5,16_props_6,16_props_7,16_props_8,16_props_9,13_props_10,13_props_11,13_props_12,13_props_13,14_props_10,14_props_11,14_props_12,4_props_14,4_props_15,11_props_10,11_props_11,11_props_12,11_props_13,12_props_10,12_props_11,12_props_12,12_props_13,17_name,17_size,17_entropy,17_vsize,17_props_0,17_props_1,17_props_2,17_props_3,17_props_4,17_props_5,17_props_6,17_props_7,17_props_8,17_props_9,1_props_14,1_props_15,3_props_14,3_props_15,18_name,18_size,18_entropy,18_vsize,18_props_0,18_props_1,18_props_2,18_props_3,19_name,19_size,19_entropy,19_vsize,19_props_0,19_props_1,19_props_2,19_props_3,20_name,20_size,20_entropy,20_vsize,20_props_0,20_props_1,20_props_2,20_props_3,21_name,21_size,21_entropy,21_vsize,21_props_0,21_props_1,21_props_2,21_props_3,22_name,22_size,22_entropy,22_vsize,22_props_0,22_props_1,22_props_2,22_props_3,23_name,23_size,23_entropy,23_vsize,23_props_0,23_props_1,23_props_2,23_props_3,24_name,24_size,24_entropy,24_vsize,24_props_0,24_props_1,24_props_2,24_props_3,25_name,25_size,25_entropy,25_vsize,25_props_0,25_props_1,25_props_2,25_props_3,0_props_15,0_props_16,18_props_4,18_props_5,18_props_6,18_props_7,18_props_8,18_props_9,19_props_4,19_props_5,19_props_6,19_props_7,19_props_8,19_props_9,20_props_4,20_props_5,20_props_6,20_props_7,20_props_8,20_props_9,16_props_10,16_props_11,16_props_12,16_props_13,8_props_14,26_name,26_size,26_entropy,26_vsize,26_props_0,26_props_1,26_props_2,26_props_3,27_name,27_size,27_entropy,27_vsize,27_props_0,27_props_1,27_props_2,27_props_3,28_name,28_size,28_entropy,28_vsize,28_props_0,28_props_1,28_props_2,28_props_3,29_name,29_size,29_entropy,29_vsize,29_props_0,29_props_1,29_props_2,29_props_3,30_name,30_size,30_entropy,30_vsize,30_props_0,30_props_1,30_props_2,30_props_3
0,0,.text,26624.00,6.53,26134.00,CNT_CODE,MEM_EXECUTE,MEM_READ,.rdata,6656.00,5.43,6216.00,CNT_INITIALIZED_DATA,MEM_READ,.data,512.00,1.74,172468.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.rsro,0.00,-0.00,135168.00,CNT_UNINITIALIZED_DATA,MEM_READ,MEM_WRITE,.rsrc,27648.00,5.02,28672.00,CNT_INITIALIZED_DATA,MEM_READ,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,0,.text,455680.00,6.82,455304.00,CNT_CODE,MEM_EXECUTE,MEM_READ,.data,8192.00,6.20,19856.00,CNT_INITIALIZED_DATA,MEM_READ,.rsrc,39424.00,3.69,38992.00,CNT_INITIALIZED_DATA,MEM_READ,,,,,,,,,,,,,,,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,0,.text,81920.00,6.46,80594.00,CNT_CODE,MEM_EXECUTE,MEM_READ,.data,4096.00,1.59,1332.00,CNT_INITIALIZED_DATA,MEM_READ,.rsrc,81920.00,5.12,81920.00,CNT_INITIALIZED_DATA,MEM_READ,,.reloc,8192.00,6.81,6580.00,CNT_INITIALIZED_DATA,MEM_DISCARDABLE,MEM_READ,,,,,,,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,0,CODE,36864.00,6.60,36628.00,CNT_CODE,MEM_EXECUTE,MEM_READ,DATA,1024.00,4.13,584.00,CNT_INITIALIZED_DATA,MEM_READ,BSS,0.00,-0.00,3636.00,MEM_READ,MEM_WRITE,,.idata,2560.00,4.65,2370.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.tls,0.00,-0.00,8.00,MEM_READ,MEM_WRITE,MEM_WRITE,.rdata,512.00,2.05,24.00,CNT_INITIALIZED_DATA,MEM_SHARED,MEM_READ,.reloc,0.00,-0.00,2176.00,CNT_INITIALIZED_DATA,MEM_SHARED,MEM_READ,.rsrc,10240.00,4.34,10240.00,CNT_INITIALIZED_DATA,MEM_SHARED,MEM_READ,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,0,.text,34304.00,6.59,33908.00,CNT_CODE,MEM_EXECUTE,MEM_READ,.data,1024.00,4.10,7180.00,CNT_INITIALIZED_DATA,MEM_READ,.rsrc,1116672.00,7.99,1118208.00,CNT_INITIALIZED_DATA,MEM_READ,,,,,,,,,,,,,,,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5995,1,.code,1841.00,5.34,1841.00,CNT_CODE,MEM_EXECUTE,MEM_READ,.text,6552.00,6.19,6552.00,CNT_CODE,MEM_EXECUTE,.rdata,28.00,1.77,28.00,CNT_INITIALIZED_DATA,MEM_READ,,.data,1960.00,4.98,1960.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.rsrc,700.00,5.07,700.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_READ,.NewSec,4096.00,0.53,4096.00,CNT_CODE,MEM_EXECUTE,CNT_INITIALIZED_DATA,,,,,,,,,,,,,,,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,CNT_UNINITIALIZED_DATA,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,MEM_READ,,,,,,,,,,,,,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5996,1,CODE,90624.00,8.00,204800.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,DATA,1536.00,6.60,4096.00,CNT_INITIALIZED_DATA,MEM_READ,BSS,0.00,-0.00,4096.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.idata,3584.00,7.39,12288.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.tls,0.00,-0.00,4096.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.rdata,512.00,0.20,4096.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.reloc,0.00,-0.00,16384.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.rsrc,30720.00,7.88,94208.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,,,MEM_WRITE,.aspack,6144.00,6.29,8192.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,,,,,,.data,0.00,-0.00,4096.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5997,0,.text,104448.00,6.61,104384.00,CNT_CODE,MEM_EXECUTE,MEM_READ,.rdata,17920.00,4.45,17552.00,CNT_INITIALIZED_DATA,MEM_READ,.data,12800.00,1.38,23144.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,.sxdata,512.00,0.81,4.00,CNT_INITIALIZED_DATA,LNK_INFO,MEM_READ,.rsrc,3072.00,3.71,2672.00,CNT_INITIALIZED_DATA,MEM_READ,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5998,1,,2886656.00,7.99,6692864.00,CNT_INITIALIZED_DATA,MEM_EXECUTE,MEM_READ,.rsrc,81920.00,8.00,81920.00,CNT_INITIALIZED_DATA,MEM_READ,.idata,512.00,1.28,4096.00,CNT_INITIALIZED_DATA,MEM_READ,MEM_WRITE,,512.00,0.26,2424832.00,CNT_INITIALIZED_DATA,MEM_EXECUTE,MEM_READ,qbhbfumh,1555456.00,7.96,1556480.00,CNT_INITIALIZED_DATA,MEM_EXECUTE,MEM_WRITE,fihqeqes,512.00,3.90,4096.00,CNT_INITIALIZED_DATA,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,,MEM_WRITE,,MEM_READ,,,,,,,,MEM_WRITE,,MEM_WRITE,,,,,,,,,,,,MEM_WRITE,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [11]:
frame.head()

Unnamed: 0,0_name,0_size,0_entropy,0_vsize,0_props_0,0_props_1,0_props_2,0_props_3,0_props_4,0_props_5,...,0_props_7,0_props_8,0_props_9,0_props_10,0_props_11,0_props_12,0_props_13,0_props_14,0_props_15,0_props_16
0,.text,26624.0,6.53224,26134.0,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,...,,,,,,,,,,
1,.text,455680.0,6.822879,455304.0,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,...,,,,,,,,,,
2,.text,81920.0,6.459014,80594.0,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,...,,,,,,,,,,
3,CODE,36864.0,6.599333,36628.0,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,...,,,,,,,,,,
4,.text,34304.0,6.591424,33908.0,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,...,,,,,,,,,,


In [12]:
df.shape

(6000, 450)

In [10]:
frame = df.loc[:,df.columns.str.startswith('0')]

In [45]:
frame[frame['0_name']=='.text']

Unnamed: 0,0_name,0_size,0_entropy,0_vsize,0_props_0,0_props_1,0_props_2,0_props_3,0_props_4,0_props_5,0_props_6,0_props_7,0_props_8,0_props_9,0_props_10,0_props_11,0_props_12,0_props_13,0_props_14,0_props_15,0_props_16
0,.text,26624.00,6.53,26134.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,
1,.text,455680.00,6.82,455304.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,
2,.text,81920.00,6.46,80594.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,
4,.text,34304.00,6.59,33908.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,
5,.text,8704.00,6.27,8259.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
5990,.text,1706496.00,7.19,1706326.00,CNT_CODE,MEM_LOCKED,MEM_READ,MEM_WRITE,,,,,,,,,,,,,
5993,.text,2559488.00,6.52,2559196.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,
5994,.text,0.00,-0.00,96153.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,
5997,.text,104448.00,6.61,104384.00,CNT_CODE,MEM_EXECUTE,MEM_READ,,,,,,,,,,,,,,


In [None]:
for s

In [29]:
df.columns

Index(['0_name', '0_size', '0_entropy', '0_vsize', '0_props_0', '0_props_1',
       '0_props_2', '1_name', '1_size', '1_entropy', '1_vsize', '1_props_0',
       '1_props_1', '2_name', '2_size', '2_entropy', '2_vsize', '2_props_0',
       '2_props_1', '2_props_2', '3_name', '3_size', '3_entropy', '3_vsize',
       '3_props_0', '3_props_1', '3_props_2', '4_name', '4_size', '4_entropy',
       '4_vsize', '4_props_0', '4_props_1', '1_props_2'],
      dtype='object')

In [33]:
# this helps with scrolling df
pd.set_option('display.max_rows', 500)
pd.set_option('display.max_columns', 500)
pd.set_option('display.width', 1000)
pd.set_option('display.float_format', '{:.2f}'.format)

In [26]:
import json
import pandas as pd
import csv

def read_data(path, limiter):
    """
    Args:
        path: path to dataset in jsonl file format
        limiter: number of rows

    Returns:
        data: json dict, where every line is one sample as json
    """
    with open(path) as file:
        data = [json.loads(next(file)) for x in range(limiter)]
    return data


def transform_dll_imports(json_sample):
    """
    Args:
        json_sample: one sample of dataset

    Returns:
        functions_dict: dict with all dll functions name with value True
    """
    imports = sample["imports"]
    functions_dict = {}
    for key in imports.keys():
        functions = imports[key]
        functions_with_values = {key.lower() + "-" + f_name: True for f_name in functions}
        functions_dict.update(functions_with_values)
    return functions_dict


def transform_dict(json_dict):
    """
    Args:
        json_dict: json dict with nested key-value, where value is list

    Returns:
        functions_dict: dict with value as a key and default value True
    """
    result_dict = {}
    for key in json_dict.keys():
        keys = json_dict[key]
        values_with_default = {key.lower() + "-" + f_name: True for f_name in keys}
        result_dict.update(values_with_default)
    return result_dict


def transform_list(json_list):
    """
    Args:
        json_list: json list of values

    Returns:
        functions_dict: dict with all dll functions name with value True
    """
    result_dict = {}
    result_dict.update({i: True for i in json_list})
    return result_dict


def flatten_json(y, separator=''):
    """
    Args:
        y: json object
        separator: separator

    Returns:
        functions_dict: dict with flatten values
    """
    out = {}

    def flatten(x, name=separator):
        if type(x) is dict:
            for a in x:
                flatten(x[a], name + a + '_')
        elif type(x) is list:
            i = 0
            for a in x:
                flatten(a, name + str(i) + '_')
                i += 1
        else:
            out[name[:-1]] = x

    flatten(y)
    return out

# Extract "sha256", "md5", "appeared", "label" and "avclass" columns to a flat form

def get_simple_column(sample, columns = ["sha256", "md5", "appeared", "label", "avclass"]):
    '''
    input:
        data: variable with dataset
        columns: list of names extracted columns
    output:
        final_list: list of dicts, one list's element is a one sample of dataset
    '''
    simple_dict = {}
    simple_dict.update({column:sample[column] for column in columns})
    return simple_dict

# Extraction columns with list: "histogram", "byteentropy", "exports"

def get_simple_list_from_column(sample, columns = ["histogram", "byteentropy", "exports"]):

    '''
    input:
        data: variable with dataset
        columns: name of extracted columns (str)
    output:
        final_list: list of dicts, one list's element is a one sample of dataset
    '''
  
    dict_exports = {}
    dict_others = {}
    dict_final = {}

    for column in columns:
        if column == "exports":
            dict_exports.update({column+"_"+str(v).lower():True for v in sample[column]})
        else:
            dict_others.update({column+"_"+str(i):n for i, n in enumerate(sample[column])})             
                
    dict_final.update(dict_others)
    dict_final.update(dict_exports)
               
    return dict_final


# Extraction IMPORTS, GENERAL and STRINGS columns

def get_features_from_dict_column(sample, columns = "imports"):
    '''
    input:
            data
            columns
    output:
            functions_with_valuex
    '''
    dict_final = {}
    temp1 = {}
    temp2 = {}
    temp3 = {}

    feature = sample[columns]
    for key in feature.keys():
        content = feature[key]
        if (isinstance(content, list) and len(content)!=0):
            if not isinstance(content[0], str):
                temp1.update({columns +"_"+key.lower() + "-" + str(i):cont for i, cont in enumerate(content)})
            else:
                temp2.update({columns +"_"+ key.lower() + "-" + str(cont).lower():True for cont in content})
        else:
            temp3.update({columns+"_"+key:content})

    dict_final.update(temp1)   
    dict_final.update(temp2) 
    dict_final.update(temp3) 
    return dict_final

# Extraction HEADER column

def get_features_from_header(sample):
    '''
    input:
        data: data
    output:
        list_final: list of dicts
    '''    
    headers = sample["header"]
    dict_lists = {}
    dict_others = {}
    dict_final = {}

    for h in headers.keys():   
        temp = headers[h]      
        for k in temp.keys():  

            if isinstance(temp[k], list):
                dict_lists.update({"header_"+h.lower()+"_"+k.lower()+"_"+str(t).lower():True for t in temp[k]}) 
            else:
                dict_others.update({"header_"+h.lower()+"_"+k.lower():temp[k]})

    dict_final.update(dict_lists)    
    dict_final.update(dict_others)
    return dict_final


# Extraction Section column

def get_features_from_section(sample):

    '''
    input:
        data: data
    output:
        list_final: list of dicts
    '''  
    section_entry = sample['section']['entry']    # .text
    section_sections = sample['section']['sections']
    dict_lists_sections = {}
    dict_others_sections = {}
    dict_final = {}

    for part in section_sections:
        name = part['name']
        for position in ['size', 'entropy', 'vsize', 'props']:
            if position == 'props':
                dict_lists_sections.update({"section_"+section_entry.lower()+"_sections"+name.lower()+"_"+position+"_"+str(element).lower():True for element in part[position]})
            else:
                dict_others_sections.update({"section_"+section_entry.lower()+"_sections"+name.lower()+"_"+position:part[position]})
    dict_final.update(dict_lists_sections)
    dict_final.update(dict_others_sections)
    return dict_final


# Extraction DATADIRECTORIES column

def get_features_from_datadirectories(sample):
    '''
    input:
        data: data
    output:
        sum_others_datadir: list of dicts
    '''  

    dict_others_datadir = {}
    datadir = sample["datadirectories"]

    for element in datadir:
        element_name = element['name']
        for position in ['size', 'virtual_address']:
            dict_others_datadir.update({"datadirectories_"+element_name+"_"+position:element[position]})
    return dict_others_datadir



def write_csv(csv_file_path, sample_list):
    """
    Args:
        csv_file_path: destination path of csv file
        sample_list: list of dicts 
    """
    all_keys = set().union(*(d.keys() for d in flatten_dataset))    

    try:
        with open(csv_file_path, 'w') as csvfile:
            writer = csv.DictWriter(csvfile, fieldnames=all_keys)
            writer.writeheader()
            for data in flatten_dataset:
                writer.writerow(data)
    except IOError:
        print("I/O error")


In [27]:

# 1. read datas
data_path = 'sample_data_6k.jsonl'
data = read_data(data_path, limiter=500)

In [47]:
data[0]['header']

{'coff': {'timestamp': 1124149349,
  'machine': 'I386',
  'characteristics': ['CHARA_32BIT_MACHINE',
   'RELOCS_STRIPPED',
   'EXECUTABLE_IMAGE',
   'LINE_NUMS_STRIPPED',
   'LOCAL_SYMS_STRIPPED']},
 'optional': {'subsystem': 'WINDOWS_GUI',
  'dll_characteristics': [],
  'magic': 'PE32',
  'major_image_version': 0,
  'minor_image_version': 0,
  'major_linker_version': 7,
  'minor_linker_version': 10,
  'major_operating_system_version': 4,
  'minor_operating_system_version': 0,
  'major_subsystem_version': 4,
  'minor_subsystem_version': 0,
  'sizeof_code': 26624,
  'sizeof_headers': 1024,
  'sizeof_heap_commit': 4096}}

In [50]:

# 2. iterate over dataset
flatten_dataset = []
for sample in data:
    # version 1 dummy way
    # flat = flatten_json(sample)
    # flatten_dataset.append(flat)
    # collect transformed values for each sample

    # version 2
    transformed = {}

#     transformed.update(get_simple_column(sample))
#     transformed.update(get_simple_list_from_column(sample))
#     transformed.update(get_features_from_dict_column(sample, columns = "strings"))
#     transformed.update(get_features_from_dict_column(sample, columns = "general"))
#     transformed.update(get_features_from_dict_column(sample, columns = "imports"))
    transformed.update(get_features_from_header(sample))
#    transformed.update(get_features_from_section(sample))
#    transformed.update(get_features_from_datadirectories(sample))


    # here we fill with transform data
    flatten_dataset.append(transformed)


all_keys = set().union(*(d.keys() for d in flatten_dataset))    



In [51]:
df= pd.DataFrame(flatten_dataset)

In [52]:
df.head()

Unnamed: 0,header_coff_characteristics_chara_32bit_machine,header_coff_characteristics_relocs_stripped,header_coff_characteristics_executable_image,header_coff_characteristics_line_nums_stripped,header_coff_characteristics_local_syms_stripped,header_coff_timestamp,header_coff_machine,header_optional_subsystem,header_optional_magic,header_optional_major_image_version,header_optional_minor_image_version,header_optional_major_linker_version,header_optional_minor_linker_version,header_optional_major_operating_system_version,header_optional_minor_operating_system_version,header_optional_major_subsystem_version,header_optional_minor_subsystem_version,header_optional_sizeof_code,header_optional_sizeof_headers,header_optional_sizeof_heap_commit,header_coff_characteristics_aggressive_ws_trim,header_optional_dll_characteristics_terminal_server_aware,header_coff_characteristics_debug_stripped,header_coff_characteristics_bytes_reversed_lo,header_coff_characteristics_bytes_reversed_hi,header_coff_characteristics_removable_run_from_swap,header_optional_dll_characteristics_no_seh,header_coff_characteristics_dll,header_coff_characteristics_large_address_aware,header_optional_dll_characteristics_dynamic_base,header_coff_characteristics_net_run_from_swap,header_optional_dll_characteristics_nx_compat,header_optional_dll_characteristics_wdm_driver
0,True,True,True,True,True,1124149349,I386,WINDOWS_GUI,PE32,0,0,7,10,4,0,4,0,26624,1024,4096,,,,,,,,,,,,,
1,True,True,True,True,True,1091600092,I386,WINDOWS_GUI,PE32,21315,20512,7,10,5,1,4,0,455680,1024,4096,True,True,,,,,,,,,,,
2,True,,True,True,,892092777,I386,WINDOWS_GUI,PE32,5,0,6,0,5,0,4,0,80896,1024,4096,,,True,,,,,,,,,,
3,True,True,True,True,True,708992537,I386,WINDOWS_GUI,PE32,0,0,2,25,1,0,4,0,36864,1024,4096,,,,True,True,,,,,,,,
4,True,True,True,True,True,938258311,I386,WINDOWS_GUI,PE32,5,0,5,12,5,0,4,0,34304,1536,4096,,True,True,,,,,,,,,,


In [46]:
data[150]['section']['entry']

'.text'

In [43]:
data[1]['section']['sections']

[{'name': '.text',
  'size': 455680,
  'entropy': 6.822879297636897,
  'vsize': 455304,
  'props': ['CNT_CODE', 'MEM_EXECUTE', 'MEM_READ']},
 {'name': '.data',
  'size': 8192,
  'entropy': 6.2046997042859555,
  'vsize': 19856,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ', 'MEM_WRITE']},
 {'name': '.rsrc',
  'size': 39424,
  'entropy': 3.6912241130964434,
  'vsize': 38992,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ']}]

In [42]:
data[13]['label']

0

In [38]:
data[1]['section']['sections']

[{'name': '.text',
  'size': 455680,
  'entropy': 6.822879297636897,
  'vsize': 455304,
  'props': ['CNT_CODE', 'MEM_EXECUTE', 'MEM_READ']},
 {'name': '.data',
  'size': 8192,
  'entropy': 6.2046997042859555,
  'vsize': 19856,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ', 'MEM_WRITE']},
 {'name': '.rsrc',
  'size': 39424,
  'entropy': 3.6912241130964434,
  'vsize': 38992,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ']}]

In [39]:
data[113]['section']['sections']

[{'name': '.text',
  'size': 61440,
  'entropy': 5.457595399705385,
  'vsize': 60837,
  'props': ['CNT_CODE', 'MEM_EXECUTE', 'MEM_READ']},
 {'name': '.data',
  'size': 4096,
  'entropy': -0.0,
  'vsize': 2060,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ', 'MEM_WRITE']},
 {'name': '.rsrc',
  'size': 4096,
  'entropy': 3.480594315356002,
  'vsize': 2732,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_READ']},
 {'name': '.reloc',
  'size': 16384,
  'entropy': 2.7788766335175183,
  'vsize': 13352,
  'props': ['CNT_INITIALIZED_DATA', 'MEM_DISCARDABLE', 'MEM_READ']}]

In [37]:
df.head()

Unnamed: 0,section_.text_sections.text_props_cnt_code,section_.text_sections.text_props_mem_execute,section_.text_sections.text_props_mem_read,section_.text_sections.rdata_props_cnt_initialized_data,section_.text_sections.rdata_props_mem_read,section_.text_sections.data_props_cnt_initialized_data,section_.text_sections.data_props_mem_read,section_.text_sections.data_props_mem_write,section_.text_sections.rsro_props_cnt_uninitialized_data,section_.text_sections.rsro_props_mem_read,section_.text_sections.rsro_props_mem_write,section_.text_sections.rsrc_props_cnt_initialized_data,section_.text_sections.rsrc_props_mem_read,section_.text_sections.text_size,section_.text_sections.text_entropy,section_.text_sections.text_vsize,section_.text_sections.rdata_size,section_.text_sections.rdata_entropy,section_.text_sections.rdata_vsize,section_.text_sections.data_size,section_.text_sections.data_entropy,section_.text_sections.data_vsize,section_.text_sections.rsro_size,section_.text_sections.rsro_entropy,section_.text_sections.rsro_vsize,section_.text_sections.rsrc_size,section_.text_sections.rsrc_entropy,section_.text_sections.rsrc_vsize,section_.text_sections.reloc_props_cnt_initialized_data,section_.text_sections.reloc_props_mem_discardable,section_.text_sections.reloc_props_mem_read,section_.text_sections.reloc_size,section_.text_sections.reloc_entropy,section_.text_sections.reloc_vsize,section_code_sectionscode_props_cnt_code,section_code_sectionscode_props_mem_execute,section_code_sectionscode_props_mem_read,section_code_sectionsdata_props_cnt_initialized_data,section_code_sectionsdata_props_mem_read,section_code_sectionsdata_props_mem_write,section_code_sectionsbss_props_mem_read,section_code_sectionsbss_props_mem_write,section_code_sections.idata_props_cnt_initialized_data,section_code_sections.idata_props_mem_read,section_code_sections.idata_props_mem_write,section_code_sections.tls_props_mem_read,section_code_sections.tls_props_mem_write,section_code_sections.rdata_props_cnt_initialized_data,section_code_sections.rdata_props_mem_shared,section_code_sections.rdata_props_mem_read,section_code_sections.reloc_props_cnt_initialized_data,section_code_sections.reloc_props_mem_shared,section_code_sections.reloc_props_mem_read,section_code_sections.rsrc_props_cnt_initialized_data,section_code_sections.rsrc_props_mem_shared,section_code_sections.rsrc_props_mem_read,section_code_sectionscode_size,section_code_sectionscode_entropy,section_code_sectionscode_vsize,section_code_sectionsdata_size,section_code_sectionsdata_entropy,section_code_sectionsdata_vsize,section_code_sectionsbss_size,section_code_sectionsbss_entropy,section_code_sectionsbss_vsize,section_code_sections.idata_size,section_code_sections.idata_entropy,section_code_sections.idata_vsize,section_code_sections.tls_size,section_code_sections.tls_entropy,section_code_sections.tls_vsize,section_code_sections.rdata_size,section_code_sections.rdata_entropy,section_code_sections.rdata_vsize,section_code_sections.reloc_size,section_code_sections.reloc_entropy,section_code_sections.reloc_vsize,section_code_sections.rsrc_size,section_code_sections.rsrc_entropy,section_code_sections.rsrc_vsize,section_upx0_sectionsupx0_props_cnt_uninitialized_data,section_upx0_sectionsupx0_props_mem_execute,section_upx0_sectionsupx0_props_mem_read,section_upx0_sectionsupx0_props_mem_write,section_upx0_sectionsupx1_props_cnt_initialized_data,section_upx0_sectionsupx1_props_mem_execute,section_upx0_sectionsupx1_props_mem_read,section_upx0_sectionsupx1_props_mem_write,section_upx0_sections.rsrc_props_cnt_initialized_data,section_upx0_sections.rsrc_props_mem_read,section_upx0_sections.rsrc_props_mem_write,section_upx0_sectionsupx0_size,section_upx0_sectionsupx0_entropy,section_upx0_sectionsupx0_vsize,section_upx0_sectionsupx1_size,section_upx0_sectionsupx1_entropy,section_upx0_sectionsupx1_vsize,section_upx0_sections.rsrc_size,section_upx0_sections.rsrc_entropy,section_upx0_sections.rsrc_vsize,section_.text_sections.inject_props_cnt_code,section_.text_sections.inject_props_mem_execute,section_.text_sections.inject_props_mem_read,section_.text_sections.inject_props_mem_write,section_.text_sections.inject_size,section_.text_sections.inject_entropy,section_.text_sections.inject_vsize,section__sections.text_props_cnt_initialized_data,section__sections.text_props_mem_read,section__sections.text_props_mem_write,section__sectionscodeseg_props_cnt_initialized_data,section__sectionscodeseg_props_mem_read,section__sectionscodeseg_props_mem_write,section__sections.rdata_props_cnt_initialized_data,section__sections.rdata_props_mem_read,section__sections.rdata_props_mem_write,section__sections.data_props_cnt_initialized_data,section__sections.data_props_mem_read,section__sections.data_props_mem_write,section__sectionsdataseg_props_cnt_initialized_data,section__sectionsdataseg_props_mem_read,section__sectionsdataseg_props_mem_write,section__sections.cms_t_props_cnt_initialized_data,section__sections.cms_t_props_mem_read,section__sections.cms_t_props_mem_write,section__sections.cms_d_props_cnt_initialized_data,section__sections.cms_d_props_mem_read,section__sections.cms_d_props_mem_write,section__sections.idata_props_cnt_initialized_data,section__sections.idata_props_mem_read,section__sections.idata_props_mem_write,section__sections.rsrc_props_cnt_initialized_data,section__sections.rsrc_props_mem_read,section__sections.rsrc_props_mem_write,section__sections.text_size,section__sections.text_entropy,section__sections.text_vsize,section__sectionscodeseg_size,section__sectionscodeseg_entropy,section__sectionscodeseg_vsize,section__sections.rdata_size,section__sections.rdata_entropy,section__sections.rdata_vsize,section__sections.data_size,section__sections.data_entropy,section__sections.data_vsize,section__sectionsdataseg_size,section__sectionsdataseg_entropy,section__sectionsdataseg_vsize,section__sections.cms_t_size,section__sections.cms_t_entropy,section__sections.cms_t_vsize,section__sections.cms_d_size,section__sections.cms_d_entropy,section__sections.cms_d_vsize,section__sections.idata_size,section__sections.idata_entropy,section__sections.idata_vsize,section__sections.rsrc_size,section__sections.rsrc_entropy,section__sections.rsrc_vsize,section_.text_sections.ndata_props_cnt_uninitialized_data,section_.text_sections.ndata_props_mem_read,section_.text_sections.ndata_props_mem_write,section_.text_sections.ndata_size,section_.text_sections.ndata_entropy,section_.text_sections.ndata_vsize,section_.text_sections.sxdata_props_cnt_initialized_data,section_.text_sections.sxdata_props_lnk_info,section_.text_sections.sxdata_props_mem_read,section_.text_sections.sxdata_props_mem_write,section_.text_sections.sxdata_size,section_.text_sections.sxdata_entropy,section_.text_sections.sxdata_vsize,section_.data_sections.text_props_cnt_code,section_.data_sections.text_props_mem_execute,section_.data_sections.text_props_mem_read,section_.data_sections.rdata_props_cnt_initialized_data,section_.data_sections.rdata_props_mem_read,section_.data_sections.data_props_cnt_initialized_data,section_.data_sections.data_props_mem_read,section_.data_sections.data_props_mem_write,section_.data_sections.rsrc_props_cnt_initialized_data,section_.data_sections.rsrc_props_mem_read,section_.data_sections.text_size,section_.data_sections.text_entropy,section_.data_sections.text_vsize,section_.data_sections.rdata_size,section_.data_sections.rdata_entropy,section_.data_sections.rdata_vsize,section_.data_sections.data_size,section_.data_sections.data_entropy,section_.data_sections.data_vsize,section_.data_sections.rsrc_size,section_.data_sections.rsrc_entropy,section_.data_sections.rsrc_vsize,section_.text_sections_winzip__props_cnt_initialized_data,section_.text_sections_winzip__props_mem_discardable,section_.text_sections_winzip__props_mem_read,section_.text_sections_winzip__size,section_.text_sections_winzip__entropy,section_.text_sections_winzip__vsize,section_.text_sections.text_props_mem_not_paged,section_.text_sections.rdata_props_mem_not_paged,section_.text_sections.data_props_mem_not_paged,section_.text_sections.pdata_props_cnt_initialized_data,section_.text_sections.pdata_props_mem_not_paged,section_.text_sections.pdata_props_mem_read,section_.text_sectionsinit_props_cnt_code,section_.text_sectionsinit_props_mem_discardable,section_.text_sectionsinit_props_mem_write,section_.text_sectionsinit_props_mem_execute,section_.text_sectionsinit_props_mem_read,section_.text_sections.rsrc_props_mem_discardable,section_.text_sections.pdata_size,section_.text_sections.pdata_entropy,section_.text_sections.pdata_vsize,section_.text_sectionsinit_size,section_.text_sectionsinit_entropy,section_.text_sectionsinit_vsize,section__sections.reloc_props_cnt_initialized_data,section__sections.reloc_props_mem_read,section__sections.reloc_props_mem_write,section__sections.aspack_props_cnt_initialized_data,section__sections.aspack_props_mem_read,section__sections.aspack_props_mem_write,section__sections.reloc_size,section__sections.reloc_entropy,section__sections.reloc_vsize,section__sections.aspack_size,section__sections.aspack_entropy,section__sections.aspack_vsize,section_.text_sections.text_props_mem_write,section_.text_sections.rsrc_props_mem_not_cached,section_.text_sections.rsrc_props_mem_write,section_.text_sections.rsrc_props_mem_not_paged,section__sectionscode_props_cnt_initialized_data,section__sectionscode_props_mem_read,section__sectionscode_props_mem_write,section__sectionsdata_props_cnt_initialized_data,section__sectionsdata_props_mem_read,section__sectionsdata_props_mem_write,section__sectionsbss_props_cnt_initialized_data,section__sectionsbss_props_mem_read,section__sectionsbss_props_mem_write,section__sections.tls_props_cnt_initialized_data,section__sections.tls_props_mem_read,section__sections.tls_props_mem_write,section__sectionscode_size,section__sectionscode_entropy,...,section_.text_sections.sdata_entropy,section_.text_sections.sdata_vsize,section_.text_sections.bss_props_cnt_uninitialized_data,section_.text_sections.bss_props_mem_read,section_.text_sections.bss_props_mem_write,section_.text_sections.edata_props_cnt_initialized_data,section_.text_sections.edata_props_mem_read,section_.text_sections.bss_size,section_.text_sections.bss_entropy,section_.text_sections.bss_vsize,section_.text_sections.edata_size,section_.text_sections.edata_entropy,section_.text_sections.edata_vsize,section_.text_sections.tls_props_cnt_initialized_data,section_.text_sections.tls_props_mem_read,section_.text_sections.tls_props_mem_write,section_.text_sections.tls_size,section_.text_sections.tls_entropy,section_.text_sections.tls_vsize,section_.text_sections.rdata_props_cnt_code,section_.text_sections.idata_props_cnt_code,section_.text_sectionsrtfout_p_props_cnt_code,section_.text_sectionsrtfout_p_props_mem_execute,section_.text_sectionsrtfout_p_props_mem_read,section_.text_sectionsrtfout_p_size,section_.text_sectionsrtfout_p_entropy,section_.text_sectionsrtfout_p_vsize,section_.text_sections.data1_props_cnt_initialized_data,section_.text_sections.data1_props_mem_read,section_.text_sections.data1_props_mem_write,section_.text_sections.data1_size,section_.text_sections.data1_entropy,section_.text_sections.data1_vsize,section_.text_sections.text_props_align_1bytes,section_.text_sections.text_props_align_4bytes,section_.text_sections.text_props_align_8bytes,section_.text_sections.text_props_align_16bytes,section_.text_sections.text_props_align_32bytes,section_.text_sections.text_props_align_64bytes,section_.text_sections.text_props_align_256bytes,section_.text_sections.text_props_align_1024bytes,section_.text_sections.text_props_align_2048bytes,section_.text_sections.text_props_align_4096bytes,section_.text_sections.text_props_align_8192bytes,section_.text_sections.data_props_align_2bytes,section_.text_sections.data_props_align_16bytes,section_.text_sections.data_props_align_4bytes,section_.text_sections.data_props_align_8bytes,section_.text_sections.data_props_align_32bytes,section_.text_sections.data_props_align_64bytes,section_.text_sections.data_props_align_512bytes,section_.text_sections.data_props_align_1024bytes,section_.text_sections.data_props_align_2048bytes,section_.text_sections.data_props_align_4096bytes,section_.text_sections.data_props_align_8192bytes,section_.text_sections.rdata_props_align_8bytes,section_.text_sections.rdata_props_align_64bytes,section_.text_sections.rdata_props_align_16bytes,section_.text_sections.rdata_props_align_32bytes,section_.text_sections.rdata_props_align_2048bytes,section_.text_sections.rdata_props_align_4096bytes,section_.text_sections.rdata_props_align_8192bytes,section_.text_sections.bss_props_align_8bytes,section_.text_sections.bss_props_align_64bytes,section_.text_sections.bss_props_align_16bytes,section_.text_sections.bss_props_align_32bytes,section_.text_sections.bss_props_align_2048bytes,section_.text_sections.bss_props_align_4096bytes,section_.text_sections.bss_props_align_8192bytes,section_.text_sections.idata_props_align_1bytes,section_.text_sections.idata_props_align_16bytes,section_.text_sections.idata_props_align_2bytes,section_.text_sections.idata_props_align_4bytes,section_.text_sections.idata_props_align_32bytes,section_.text_sections.idata_props_align_64bytes,section_.text_sections.idata_props_align_256bytes,section_.text_sections.idata_props_align_512bytes,section_.text_sections.idata_props_align_1024bytes,section_.text_sections.idata_props_align_4096bytes,section_.text_sections.idata_props_align_8192bytes,section_code_sections.edata_props_cnt_initialized_data,section_code_sections.edata_props_mem_shared,section_code_sections.edata_props_mem_read,section_code_sections.edata_size,section_code_sections.edata_entropy,section_code_sections.edata_vsize,section_.text_sections.bss_props_mem_shared,section_.text_sections.edata_props_mem_shared,section_.text_sections.sharedd_props_cnt_initialized_data,section_.text_sections.sharedd_props_mem_shared,section_.text_sections.sharedd_props_mem_read,section_.text_sections.sharedd_props_mem_write,section_.text_sections.sharedd_size,section_.text_sections.sharedd_entropy,section_.text_sections.sharedd_vsize,section_.text_sections.text_props_align_2bytes,section_.text_sections.text_props_align_512bytes,section_.text_sections.rdata_props_align_1bytes,section_.text_sections.rdata_props_align_2bytes,section_.text_sections.rdata_props_align_4bytes,section_.text_sections.rdata_props_align_256bytes,section_.text_sections.rdata_props_align_512bytes,section_.text_sections.rdata_props_align_1024bytes,section_.text_sections.data_props_align_1bytes,section_.text_sections.data_props_align_256bytes,section_.text_sectionsnexdic_props_cnt_initialized_data,section_.text_sectionsnexdic_props_mem_shared,section_.text_sectionsnexdic_props_mem_read,section_.text_sectionsnexdic_props_mem_write,section_.text_sectionsnexdic_size,section_.text_sectionsnexdic_entropy,section_.text_sectionsnexdic_vsize,section_.text_sections.stab_props_lnk_remove,section_.text_sections.stab_props_mem_discardable,section_.text_sections.stab_props_mem_read,section_.text_sections.stabstr_props_lnk_remove,section_.text_sections.stabstr_props_mem_discardable,section_.text_sections.stabstr_props_mem_read,section_.text_sections.stab_size,section_.text_sections.stab_entropy,section_.text_sections.stab_vsize,section_.text_sections.stabstr_size,section_.text_sections.stabstr_entropy,section_.text_sections.stabstr_vsize,section_.text_sections.itext_props_cnt_code,section_.text_sections.itext_props_mem_execute,section_.text_sections.itext_props_mem_read,section_.text_sections.itext_size,section_.text_sections.itext_entropy,section_.text_sections.itext_vsize,section_.text_sections _props_cnt_initialized_data,section_.text_sections _props_mem_discardable,section_.text_sections _props_mem_read,section_.text_sections _size,section_.text_sections _entropy,section_.text_sections _vsize,section_.text_sections.shared_props_cnt_initialized_data,section_.text_sections.shared_props_mem_shared,section_.text_sections.shared_props_mem_read,section_.text_sections.shared_props_mem_write,section_.text_sections.shared_size,section_.text_sections.shared_entropy,section_.text_sections.shared_vsize,section_code_sections.rsrc_props_mem_write,section__sections.edata_props_cnt_initialized_data,section__sections.edata_props_mem_read,section__sections.edata_props_mem_write,section__sections.edata_size,section__sections.edata_entropy,section__sections.edata_vsize,section_.text_sectionspagelk_props_cnt_code,section_.text_sectionspagelk_props_mem_execute,section_.text_sectionspagelk_props_mem_read,section_.text_sectionspageipmc_props_cnt_code,section_.text_sectionspageipmc_props_mem_execute,section_.text_sectionspageipmc_props_mem_read,section_.text_sectionspagelk_size,section_.text_sectionspagelk_entropy,section_.text_sectionspagelk_vsize,section_.text_sectionspageipmc_size,section_.text_sectionspageipmc_entropy,section_.text_sectionspageipmc_vsize,section_.text_sections.reloc_props_mem_shared,section_.text_sections.reloc_props_mem_not_paged,section_.text_sections_ldata_props_cnt_initialized_data,section_.text_sections_ldata_props_mem_not_paged,section_.text_sections_ldata_props_mem_read,section_.text_sections_ldata_props_mem_write,section_.text_sections_ldata_size,section_.text_sections_ldata_entropy,section_.text_sections_ldata_vsize,section_.text_sections.hkt_props_cnt_initialized_data,section_.text_sections.hkt_props_mem_shared,section_.text_sections.hkt_props_mem_read,section_.text_sections.hkt_props_mem_write,section_.text_sections.hkt_size,section_.text_sections.hkt_entropy,section_.text_sections.hkt_vsize,section_.text_sections_props_cnt_initialized_data,section_.text_sections_props_mem_read,section_.text_sections_props_mem_write,section_.text_sections_size,section_.text_sections_entropy,section_.text_sections_vsize,section__sections.data_props_mem_execute,section_.text_sections.edata_props_mem_write,section_.text_sections.reloc_props_mem_write,section_.text_sections.init_t_props_cnt_code,section_.text_sections.init_t_props_mem_execute,section_.text_sections.init_t_props_mem_read,section_.text_sections.init_d_props_cnt_initialized_data,section_.text_sections.init_d_props_mem_read,section_.text_sections.init_d_props_mem_write,section_.text_sections.init_t_size,section_.text_sections.init_t_entropy,section_.text_sections.init_t_vsize,section_.text_sections.init_d_size,section_.text_sections.init_d_entropy,section_.text_sections.init_d_vsize,section_.text_sectionsshared_props_cnt_initialized_data,section_.text_sectionsshared_props_mem_shared,section_.text_sectionsshared_props_mem_read,section_.text_sectionsshared_props_mem_write,section_.text_sectionsshared_size,section_.text_sectionsshared_entropy,section_.text_sectionsshared_vsize,section_.text_sectionslexmark_props_cnt_initialized_data,section_.text_sectionslexmark_props_mem_shared,section_.text_sectionslexmark_props_mem_read,section_.text_sectionslexmark_props_mem_write,section_.text_sectionslexmark_size,section_.text_sectionslexmark_entropy,section_.text_sectionslexmark_vsize,section_.text_sectionsconst_props_cnt_initialized_data,section_.text_sectionsconst_props_mem_read,section_.text_sectionsconst_props_mem_write,section_.text_sectionsconst_size,section_.text_sectionsconst_entropy,section_.text_sectionsconst_vsize,section_.text_sectionspagesrp0_props_cnt_code,section_.text_sectionspagesrp0_props_mem_execute,section_.text_sectionspagesrp0_props_mem_read,section_.text_sectionspageser_props_cnt_code,section_.text_sectionspageser_props_mem_execute,section_.text_sectionspageser_props_mem_read,section_.text_sectionspagesrp0_size,section_.text_sectionspagesrp0_entropy,section_.text_sectionspagesrp0_vsize,section_.text_sectionspageser_size,section_.text_sectionspageser_entropy,section_.text_sectionspageser_vsize,section_.data_sections.data_props_mem_execute,section_.data_sections.rsrc_props_mem_discardable,section_.data_sections.reloc_props_cnt_initialized_data,section_.data_sections.reloc_props_mem_discardable,section_.data_sections.reloc_props_mem_read,section_.data_sections.reloc_size,section_.data_sections.reloc_entropy,section_.data_sections.reloc_vsize,section_.text_sections.orpc_props_cnt_code,section_.text_sections.orpc_props_mem_execute,section_.text_sections.orpc_props_mem_read,section_.text_sections.orpc_size,section_.text_sections.orpc_entropy,section_.text_sections.orpc_vsize,section__sections.its_props_cnt_initialized_data,section__sections.its_props_mem_read,section__sections.its_size,section__sections.its_entropy,section__sections.its_vsize
0,True,True,True,True,True,True,True,True,True,True,True,True,True,26624.0,6.53,26134.0,6656.0,5.43,6216.0,512.0,1.74,172468.0,0.0,-0.0,135168.0,27648.0,5.02,28672.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,True,True,True,,,True,True,True,,,,True,True,455680.0,6.82,455304.0,,,,8192.0,6.2,19856.0,,,,39424.0,3.69,38992.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,True,True,True,,,True,True,True,,,,True,True,81920.0,6.46,80594.0,,,,4096.0,1.59,1332.0,,,,81920.0,5.12,81920.0,True,True,True,8192.0,6.81,6580.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,True,36864.0,6.6,36628.0,1024.0,4.13,584.0,0.0,-0.0,3636.0,2560.0,4.65,2370.0,0.0,-0.0,8.0,512.0,2.05,24.0,0.0,-0.0,2176.0,10240.0,4.34,10240.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,True,True,True,,,True,True,True,,,,True,True,34304.0,6.59,33908.0,,,,1024.0,4.1,7180.0,,,,1116672.0,7.99,1118208.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,...,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [53]:
len(all_keys)

33

In [None]:
#save to csv file
csv_file = "flatten_sample_data_6k.csv"
write_csv(csv_file, flatten_dataset)    

# read in chunks
for chunk in pd.read_csv(csv_file, chunksize=10):
    pass

# change all transformed dataset to dataframe object
df = pd.DataFrame(flatten_dataset)
df    