# ***Embedding for JSON File Format***

**Importing Libraries**

In [None]:
import os
import pandas as pd
import json
from gensim.models import Word2Vec

**Flattening the JSON Structure into a Dictionary**

In [None]:
def flatten_json(json_data, parent_key='', sep='_'):
    """Flatten nested JSON-like data into a single-level dictionary.

    Nested dict keys and list indices are joined with ``sep`` to form the
    flattened key, e.g. ``{"a": [{"b": 1}, 2]}`` becomes
    ``{"a_0_b": 1, "a_1": 2}``.

    Args:
        json_data: A dict or list (possibly nested) as produced by
            ``json.load``. Any other top-level value yields an empty dict.
        parent_key: Prefix for every generated key. When empty, no leading
            separator is emitted.
        sep: String placed between the path components of a key.

    Returns:
        dict: Maps each flattened key path to its scalar leaf value. Empty
        nested dicts/lists contribute no entries.
    """
    flattened = {}

    # Lists and dicts are walked the same way; only the source of the
    # (key, child) pairs differs. List indices are stringified so that a
    # top-level list produces string keys like "0_id".
    if isinstance(json_data, list):
        children = ((str(index), item) for index, item in enumerate(json_data))
    elif isinstance(json_data, dict):
        children = json_data.items()
    else:
        # A bare scalar at this level has no key of its own to be stored under.
        return flattened

    for k, v in children:
        # Only prepend the separator when there is a prefix, so top-level
        # keys never start with ``sep``.
        new_key = f"{parent_key}{sep}{k}" if parent_key else k
        if isinstance(v, (dict, list)):
            flattened.update(flatten_json(v, new_key, sep=sep))
        else:
            # Scalar leaf, including scalars that sit directly inside a list.
            flattened[new_key] = v
    return flattened

**Load and tokenize the JSON Data**

In [None]:
# Location of the input JSON file.
# NOTE(review): the space before ".json" is kept exactly as in the original
# path; confirm it matches the real file name.
JSON_PATH = '/content/entries .json'

# JSON text is UTF-8 by specification, so pass the encoding explicitly instead
# of relying on the platform's locale default.
with open(JSON_PATH, 'r', encoding='utf-8') as file:
    json_data = json.load(file)

# Collapse the nested structure into one {key path: leaf value} mapping.
flattened_data = flatten_json(json_data)

# One token list per leaf value: the value is stringified and split on
# whitespace. These lists are the "sentences" used for Word2Vec training.
tokenized_values = [str(value).split() for value in flattened_data.values()]

**Word2Vec Model**

In [None]:
# Word2Vec training is stochastic. A fixed seed plus a single worker thread
# makes a Restart & Run All produce the same vectors; with several workers
# thread scheduling makes the result non-deterministic even with a seed.
# NOTE(review): per the gensim docs, reproducibility across interpreter
# launches may additionally require setting PYTHONHASHSEED; raise `workers`
# again if training speed matters more than reproducibility.
EMBEDDING_SEED = 42

word2vec_model = Word2Vec(
    sentences=tokenized_values,
    vector_size=100,
    window=5,
    min_count=1,  # keep every token, even those seen only once
    seed=EMBEDDING_SEED,
    workers=1,
)

**Embed the JSON data**

In [None]:
# Map every flattened key to the list of vectors of its value's tokens.
# Each vector is converted to a plain Python list via .tolist().
keyed_vectors = word2vec_model.wv  # hoisted: looked up once, not per token
embedded_data = {}
for key, value in flattened_data.items():
    embedded_data[key] = [
        keyed_vectors[token].tolist()
        for token in str(value).split()
        if token in keyed_vectors  # skip tokens absent from the vocabulary
    ]

# Printing every full vector for every key floods the notebook's output
# channel ("IOPub data rate exceeded"), so show a bounded preview only.
# The complete result remains available in `embedded_data`.
PREVIEW_KEYS = 5   # number of keys to display
PREVIEW_DIMS = 5   # leading vector components shown per token

shown = min(PREVIEW_KEYS, len(embedded_data))
print(f"{len(embedded_data)} keys embedded; previewing the first {shown}")
for key in list(embedded_data)[:PREVIEW_KEYS]:
    vectors = embedded_data[key]
    heads = [vector[:PREVIEW_DIMS] for vector in vectors]
    print(f"{key}: {len(vectors)} token vector(s); first {PREVIEW_DIMS} dims each: {heads}")

_0_id: [[0.008819193579256535, 0.009432656690478325, -0.0028205036651343107, -0.0015043020248413086, -0.008250120095908642, -0.003927330952137709, 0.0051549687050282955, -0.008171328343451023, -0.008025224320590496, 0.00976634956896305, -0.006456476636230946, -0.00808517262339592, -0.0002922606363426894, 0.008770891465246677, 0.00787956453859806, 0.00456105126067996, 0.0058943224139511585, -0.00531628867611289, -0.006255603861063719, 0.002990707056596875, -0.0032164526637643576, -0.008933127857744694, -0.0037389767821878195, -0.0028751767240464687, 0.00800730474293232, -0.009373288601636887, -0.009802430868148804, -0.008336734026670456, 0.008286266587674618, 0.008808650076389313, 0.00966937281191349, 0.004385281819850206, -0.0041794623248279095, 0.005467738024890423, -0.008252531290054321, -0.0010532188462093472, -0.0013999271905049682, -0.0003101909242104739, 0.007564955856651068, 0.008037124760448933, 0.006408277899026871, -0.0008861327078193426, -0.007897970266640186, 0.005802259314

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)




_30_children1_0_children1_children1_1_properties_value: [[-0.0025087667163461447, -0.00590265728533268, 0.007483337074518204, -0.007259732577949762, -0.008966119028627872, -0.0017895937198773026, -0.008367436937987804, 0.00039020777330733836, 0.0019457340240478516, -0.002469483530148864, -0.006448009982705116, -0.0003211796283721924, -0.0010985040571540594, 0.003493361407890916, 0.008127013221383095, 0.005855571012943983, 0.008440988138318062, -0.00896817073225975, 0.009442486800253391, -0.002365756081417203, 0.00869705155491829, 0.0023846172261983156, 0.0035852408036589622, -0.009581687860190868, -0.009486453607678413, 0.008983921259641647, -0.002896767808124423, 0.00281641841866076, 0.006419443059712648, -0.00029992699273861945, 0.00972189661115408, -0.001033714972436428, -0.009672874584794044, -0.007054847665131092, -0.0010431563714519143, -0.008674900978803635, 0.007421448361128569, 0.0036193334963172674, -0.008746946230530739, 0.008479722775518894, 0.008929639123380184, 0.0058473

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)



_54_children1_0_children1_type: [[-0.007139015011489391, 0.0012410306371748447, -0.007176716346293688, -0.002244618022814393, 0.003719303524121642, 0.0058331238105893135, 0.0011981832794845104, 0.002102731494233012, -0.00411039125174284, 0.007225333247333765, -0.006307041738182306, 0.004647215828299522, -0.008219973184168339, 0.002036467893049121, -0.004977052100002766, -0.004247688222676516, -0.00310898432508111, 0.005655208602547646, 0.005798400845378637, -0.00497464882209897, 0.0007733309175819159, -0.00849577784538269, 0.007809805683791637, 0.009257291443645954, -0.002742327516898513, 0.0008002233225852251, 0.0007466519018635154, 0.0054778847843408585, -0.008606079034507275, 0.0005844557308591902, 0.006869422271847725, 0.00223159440793097, 0.001124676433391869, -0.009322155267000198, 0.008482366800308228, -0.0062641273252666, -0.0029923736583441496, 0.003493787022307515, -0.0007726275944150984, 0.001411291304975748, 0.001781991682946682, -0.006828899495303631, -0.009724811650812626

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)



_81_children1_0_children1_children1_1_children1_children1_2_id: [[0.0032612967770546675, 0.0038488400168716908, -0.004360328894108534, 0.004116593394428492, -0.0015540659660473466, 0.0066056144423782825, 0.0022023285273462534, -0.004771326668560505, -0.002990058623254299, 0.003898794762790203, -0.007507839240133762, -0.00028927208040840924, -0.006948058493435383, -0.001972370082512498, -0.004602249711751938, -0.007516201585531235, -0.0005739426705986261, -0.00700906990095973, 0.0042680371552705765, -0.005853351205587387, 0.004736538976430893, -0.004396481439471245, -0.0023111761547625065, 0.005985764320939779, -0.005289333872497082, -0.00460043316707015, -0.000694003130774945, -0.007385375443845987, 0.0036670733243227005, 0.0030507624614983797, -0.009289225563406944, 0.005797078832983971, -0.006312825717031956, -0.0028881193138659, 0.0016203188570216298, -0.0033329438883811235, 0.004958817735314369, -0.0017442500684410334, -0.0067719281651079655, 0.0014547728933393955, 0.00828100554645

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)




_157_children1_1_children1_children1_0_children1_children1_0_id: [[0.003074519569054246, -0.0049097537994384766, 5.381822484196164e-05, 0.002191477920860052, -0.003554413327947259, -0.007692720741033554, -0.0028630150482058525, 0.007893434725701809, -0.009304029867053032, -0.003767931368201971, -0.0014633977552875876, 0.0001384150964440778, 6.314158235909417e-05, -0.0008022511028684676, 0.007008830085396767, 0.006027070339769125, 0.0011788379633799195, -0.003802783554419875, -0.0025205970741808414, -0.002358261262997985, 0.0038734746631234884, -0.009240193292498589, 0.004516522865742445, -1.9787550627370365e-05, 0.0011769389966502786, 0.009114238433539867, -0.00011669635568978265, -0.0010315275285393, 0.0030958415009081364, -0.004578212276101112, -0.0004660928389057517, 0.0025108205154538155, 0.005895794834941626, 0.005711306352168322, 0.006953151430934668, -0.002624663058668375, 0.0029416538309305906, 0.0034148383419960737, -0.009218377992510796, 0.008996396325528622, 0.0042757000774

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)

