In [11]:
import pandas as pd
import numpy as np
from pathlib import Path
import spacy

In [None]:
!python -m spacy download en_core_web_sm

# Fetching Data 

In [195]:
entities = pd.read_csv('data/entities.tsv',sep = '\t')
entities.head()

Unnamed: 0,filename,mark,label,offset1,offset2,span,code
0,es-S0212-71992007000100007-1,T1,ENFERMEDAD,40,61,arterial hypertension,38341003
1,es-S0212-71992007000100007-1,T2,ENFERMEDAD,66,79,polyarthrosis,36186002
2,es-S0212-71992007000100007-1,T3,ENFERMEDAD,1682,1698,pleural effusion,60046008
3,es-S0212-71992007000100007-1,T4,ENFERMEDAD,1859,1875,pleural effusion,60046008
4,es-S0212-71992007000100007-1,T5,ENFERMEDAD,1626,1648,lower lobe atelectasis,46621007


In [205]:
text_path = 'data/text/'
text_files = list(Path(text_path).glob('*.txt'))

In [206]:
file_text = {}

for file in text_files:
    file = str(file)
    with open(file, "r", encoding="UTF-8") as f:
        file_name = file[len(text_path):-4]
        file_text.update({file_name: f.read()})

text_files = [str(text_file)[len(text_path):-4] for text_file in text_files]

# Sentence Splitting & Tokenization

In [208]:
nlp = spacy.load("en_core_web_sm")

In [209]:
def tokenize(file_name):
    text = file_text[file_name]
    doc = nlp(text)
    sentence_ids = []
    tokens = []
    for i, sent in enumerate(doc.sents):
        sentence_ids.append(i)
        tokens.append([(tk.text, tk.idx) for tk in sent])
    return sentence_ids, tokens

# Converting Spans to IOB Format

In [266]:
def get_bio_tags(tokens, entities):
    tags = []
    curr_entity = None
    for token in tokens:
        if len(entities):
            nxt_entity = entities[0]
            start, end, lbl = nxt_entity[0], nxt_entity[1], nxt_entity[2]
            if token[1] >= start and (token[1] + len(token)) <= end:
                if curr_entity:
                    tags.append('I-' + lbl)
                else:
                    tags.append('B-' + lbl)
                    curr_entity = nxt_entity
                if (token[1] + len(token)) >= end:
                    curr_entity = None
                    entities.pop(0)
            else:
                if token[1] >= end:
                    print(entities.pop(0))
                tags.append('O')
                curr_entity = None
        else:
            tags.append('O')
    return tags

In [267]:
file_info = ['text', 'entities', 'tags', 'sentence_ids', 'tokens']

In [268]:
res = {}
for info in file_info:
    res[info] = []
    for file_num in range(len(text_files)):
        if info == 'text':
            res[info].append("")
        else:
            res[info].append([])
        
file_idx = {}
for idx, file in enumerate(text_files):
    file_idx[file] = idx
        
for entity in entities.itertuples():
    file = entity[1]
    idx = file_idx[file]
    if res['text'][idx] == "":
        res['text'][idx] = file_text[file]
        res['sentence_ids'][idx], res['tokens'][idx] = tokenize(file)
    # entity -> offset1, offset2, label, span
    res['entities'][idx].append([entity[4], entity[5], entity[3], entity[6]])
    
for idx, file in enumerate(text_files):
    text = file_text[file_name]
    doc = nlp(text)
    ents = res['entities'][idx].copy()
    for i in res['sentence_ids'][idx]:
        res['tags'][idx].append(get_bio_tags(res['tokens'][idx][i], ents))

[238, 264, 'ENFERMEDAD', 'severe respiratory failure']
[280, 297, 'ENFERMEDAD', "Potter's Syndrome"]
[302, 324, 'ENFERMEDAD', 'severe oligohydramnios']
[556, 568, 'ENFERMEDAD', 'micrognathia']
[1057, 1062, 'ENFERMEDAD', 'cysts']
[1907, 1912, 'ENFERMEDAD', 'cysts']
[2004, 2009, 'ENFERMEDAD', 'cysts']
[2158, 2163, 'ENFERMEDAD', 'cysts']
[2262, 2267, 'ENFERMEDAD', 'cysts']
[2332, 2337, 'ENFERMEDAD', 'cysts']
[2252, 2267, 'ENFERMEDAD', 'medullary cysts']
[1004, 1021, 'ENFERMEDAD', 'cystic formations']
[23, 45, 'ENFERMEDAD', 'allergic to penicillin']
[87, 99, 'ENFERMEDAD', 'endocarditis']
[475, 510, 'ENFERMEDAD', 'pulmonary and inguinal adenopathies']
[976, 995, 'ENFERMEDAD', 'acute renal failure']
[532, 537, 'ENFERMEDAD', 'cysts']
[754, 767, 'ENFERMEDAD', 'cystic lesion']
[964, 992, 'ENFERMEDAD', 'bilateral renal lymphangioma']
[481, 488, 'ENFERMEDAD', 'lesions']
[847, 881, 'ENFERMEDAD', 'left renal cell there was a lesion']
[738, 747, 'ENFERMEDAD', 'haematoma']
[1291, 1310, 'ENFERMEDAD', 

[189, 205, 'ENFERMEDAD', 'ischaemic stroke']
[101, 113, 'ENFERMEDAD', 'hypertensive']
[1001, 1020, 'ENFERMEDAD', 'acute renal failure']
[1506, 1528, 'ENFERMEDAD', 'emphysematous cystitis']
[1761, 1780, 'ENFERMEDAD', 'choledocholithiasis']
[2015, 2035, 'ENFERMEDAD', 'obstructive jaundice']
[2343, 2363, 'ENFERMEDAD', 'obstructive jaundice']
[2040, 2062, 'ENFERMEDAD', 'emphysematous cystitis']
[2315, 2337, 'ENFERMEDAD', 'emphysematous cystitis']
[2453, 2469, 'ENFERMEDAD', 'bile duct stones']
[2908, 2915, 'ENFERMEDAD', 'lesions']
[70, 91, 'ENFERMEDAD', 'arterial hypertension']
[96, 116, 'ENFERMEDAD', 'hypercholesterolemia']
[182, 201, 'ENFERMEDAD', 'nephrogenic anaemia']
[254, 283, 'ENFERMEDAD', 'secondary hyperparathyroidism']
[653, 670, 'ENFERMEDAD', 'diabetes mellitus']
[1369, 1390, 'ENFERMEDAD', 'peri-graft collection']
[1827, 1837, 'ENFERMEDAD', 'lymphocele']
[1916, 1926, 'ENFERMEDAD', 'lymphocele']
[1882, 1891, 'ENFERMEDAD', 'infection']
[2163, 2173, 'ENFERMEDAD', 'lymphocele']
[58, 

[201, 223, 'ENFERMEDAD', 'pulmonary tuberculosis']
[228, 265, 'ENFERMEDAD', 'chronic obstructive pulmonary disease']
[731, 744, 'ENFERMEDAD', 'cystic lesion']
[1816, 1845, 'ENFERMEDAD', 'dysplastic right lower kidney']
[1851, 1881, 'ENFERMEDAD', 'partial agenesis of the ureter']
[2044, 2057, 'ENFERMEDAD', 'cystic lesion']
[2208, 2219, 'ENFERMEDAD', 'cystic mass']
[2465, 2476, 'ENFERMEDAD', 'cystic mass']
[2558, 2569, 'ENFERMEDAD', 'cystic mass']
[2784, 2820, 'ENFERMEDAD', 'mucinous cystadenoma of the appendix']
[2639, 2655, 'ENFERMEDAD', 'dilated appendix']
[3175, 3192, 'ENFERMEDAD', 'abdominal lesions']
[322, 335, 'ENFERMEDAD', 'penile trauma']
[668, 698, 'ENFERMEDAD', 'priapism of prolonged duration']
[727, 745, 'ENFERMEDAD', 'high-flow priapism']
[668, 676, 'ENFERMEDAD', 'priapism']
[737, 745, 'ENFERMEDAD', 'priapism']
[846, 890, 'ENFERMEDAD', 'irreversible damage to the corpora cavernosa']
[1855, 1882, 'ENFERMEDAD', 'myeloproliferative syndrome']
[1952, 1977, 'ENFERMEDAD', 'chronic

[428, 454, 'ENFERMEDAD', 'transient ischaemic attack']
[521, 539, 'ENFERMEDAD', 'cardiac arrhythmia']
[543, 565, 'ENFERMEDAD', 'valvular heart disease']
[585, 608, 'ENFERMEDAD', 'thromboembolic episodes']
[630, 647, 'ENFERMEDAD', 'urinary lithiasis']
[697, 710, 'ENFERMEDAD', 'cocaine abuse']
[726, 742, 'ENFERMEDAD', 'hepatitis B or C']
[347, 359, 'ENFERMEDAD', 'Hypertension']
[1551, 1577, 'ENFERMEDAD', 'acute myocardial ischaemia']
[1868, 1885, 'ENFERMEDAD', 'aortic dilatation']
[1889, 1910, 'ENFERMEDAD', 'renal artery aneurysm']
[1568, 1577, 'ENFERMEDAD', 'ischaemia']
[1789, 1798, 'ENFERMEDAD', 'ischaemia']
[2460, 2480, 'ENFERMEDAD', 'valvular vegetations']
[2502, 2523, 'ENFERMEDAD', 'myocardial dyskinesia']
[2709, 2778, 'ENFERMEDAD', 'macro/microaneurysms or alterations of the main renal artery or aorta']
[2816, 2850, 'ENFERMEDAD', 'prothrombotic and vascular disease']
[3263, 3275, 'ENFERMEDAD', 'hypertension']
[3143, 3151, 'ENFERMEDAD', 'embolism']
[3173, 3189, 'ENFERMEDAD', 'system

[116, 125, 'ENFERMEDAD', 'neoplasia']
[406, 416, 'ENFERMEDAD', 'meningitis']
[438, 468, 'ENFERMEDAD', 'permanent neurological deficit']
[905, 922, 'ENFERMEDAD', 'testicular tumour']
[997, 1007, 'ENFERMEDAD', 'metastases']
[1166, 1182, 'ENFERMEDAD', 'classic seminoma']
[1196, 1232, 'ENFERMEDAD', 'infiltrate the albuginea or the cord']
[1252, 1282, 'ENFERMEDAD', 'vascular or lymphatic invasion']
[1473, 1482, 'ENFERMEDAD', 'neoplasia']
[1686, 1695, 'ENFERMEDAD', 'Neoplasia']
[2326, 2342, 'ENFERMEDAD', 'classic seminoma']
[2293, 2342, 'ENFERMEDAD', 'abdominal adenopathic relapse of classic seminoma']
[283, 301, 'ENFERMEDAD', 'hepatosplenomegaly']
[972, 982, 'ENFERMEDAD', 'metastasis']
[1006, 1035, 'ENFERMEDAD', 'multiple pulmonary metastases']
[1049, 1065, 'ENFERMEDAD', 'pleural effusion']
[1025, 1035, 'ENFERMEDAD', 'metastases']
[1200, 1222, 'ENFERMEDAD', 'metastatic involvement']
[1366, 1388, 'ENFERMEDAD', 'metastatic involvement']
[1273, 1289, 'ENFERMEDAD', 'pleural effusion']
[1426, 14

[65, 75, 'ENFERMEDAD', 'varicocele']
[598, 608, 'ENFERMEDAD', 'varicocele']
[979, 994, 'ENFERMEDAD', 'bone metastases']
[1588, 1613, 'ENFERMEDAD', 'renal fibromyxoid sarcoma']
[1452, 1463, 'ENFERMEDAD', 'tumour mass']
[2636, 2698, 'ENFERMEDAD', 'abdominal and retroperitoneal recurrence of high-grade sarcoma']
[2716, 2728, 'ENFERMEDAD', 'fibrosarcoma']
[36, 57, 'ENFERMEDAD', 'arterial hypertension']
[62, 90, 'ENFERMEDAD', 'benign prostatic hyperplasia']
[407, 432, 'ENFERMEDAD', 'retrovesical hydatid cyst']
[155, 176, 'ENFERMEDAD', 'arterial hypertension']
[244, 258, 'ENFERMEDAD', 'duodenal ulcus']
[299, 335, 'ENFERMEDAD', 'infrarenal abdominal aortic aneurysm']
[549, 566, 'ENFERMEDAD', 'horseshoe kidneys']
[327, 335, 'ENFERMEDAD', 'aneurysm']
[739, 747, 'ENFERMEDAD', 'aneurysm']
[1172, 1180, 'ENFERMEDAD', 'aneurysm']
[1376, 1385, 'ENFERMEDAD', 'aneurysms']
[1575, 1583, 'ENFERMEDAD', 'aneurysm']
[1557, 1583, 'ENFERMEDAD', 'infrarenal aortic aneurysm']
[2186, 2207, 'ENFERMEDAD', 'aneurysm

[112, 184, 'ENFERMEDAD', 'Acute coronary syndrome with ST-segment elevation in the anterior aspect']
[283, 354, 'ENFERMEDAD', 'lesion in the middle portion of the anterior descending coronary artery']
[635, 647, 'ENFERMEDAD', 'haematemesis']
[818, 838, 'ENFERMEDAD', 'Mallory Weiss lesion']
[47, 69, 'ENFERMEDAD', 'pulmonary tuberculosis']
[71, 88, 'ENFERMEDAD', 'bladder carcinoma']
[167, 184, 'ENFERMEDAD', 'diabetes mellitus']
[186, 207, 'ENFERMEDAD', 'arterial hypertension']
[212, 226, 'ENFERMEDAD', 'hyperuricaemia']
[398, 407, 'ENFERMEDAD', 'skin rash']
[559, 562, 'ENFERMEDAD', 'NET']
[688, 707, 'ENFERMEDAD', 'respiratory failure']
[746, 757, 'ENFERMEDAD', 'hypotension']
[852, 864, 'ENFERMEDAD', 'skin lesions']
[44, 67, 'ENFERMEDAD', 'acute coronary syndrome']
[263, 278, 'ENFERMEDAD', 'cerebral oedema']
[763, 771, 'ENFERMEDAD', 'asystole']
[901, 909, 'ENFERMEDAD', 'Asystole']
[1133, 1150, 'ENFERMEDAD', 'bronchoaspiration']
[69, 74, 'ENFERMEDAD', 'burns']
[163, 168, 'ENFERMEDAD', 'burn

[23, 85, 'ENFERMEDAD', 'stage 4 CKD secondary to hepatorenal polycystic kidney disease']
[48, 85, 'ENFERMEDAD', 'hepatorenal polycystic kidney disease']
[118, 139, 'ENFERMEDAD', 'arterial hypertension']
[141, 165, 'ENFERMEDAD', 'type 2 diabetes mellitus']
[167, 181, 'ENFERMEDAD', 'hyperuricaemia']
[183, 196, 'ENFERMEDAD', 'dyslipidaemia']
[201, 238, 'ENFERMEDAD', 'chronic obstructive pulmonary disease']
[263, 275, 'ENFERMEDAD', 'advanced CKD']
[1388, 1412, 'ENFERMEDAD', 'indirect inguinal hernia']
[1397, 1412, 'ENFERMEDAD', 'inguinal hernia']
[1559, 1574, 'ENFERMEDAD', 'inguinal hernia']
[825, 839, 'ENFERMEDAD', 'genital oedema']
[1589, 1610, 'ENFERMEDAD', 'peritoneovaginal duct']
[60, 79, 'ENFERMEDAD', 'hypertensive crises']
[1220, 1261, 'ENFERMEDAD', 'paraganglioma of the organ of Zuckerkandl']
[1220, 1233, 'ENFERMEDAD', 'paraganglioma']
[1455, 1472, 'ENFERMEDAD', 'intracaval tumour']
[1733, 1746, 'ENFERMEDAD', 'paraganglioma']
[46, 65, 'ENFERMEDAD', 'alcoholic hepatitis']
[126, 144,

[42, 45, 'ENFERMEDAD', 'PNH']
[215, 222, 'ENFERMEDAD', 'anaemia']
[197, 222, 'ENFERMEDAD', 'severe haemolytic anaemia']
[622, 648, 'ENFERMEDAD', 'repeated haemolytic crises']
[929, 932, 'ENFERMEDAD', 'PNH']
[859, 886, 'ENFERMEDAD', 'subcortical lacunar lesions']
[879, 886, 'ENFERMEDAD', 'lesions']
[1050, 1057, 'ENFERMEDAD', 'anaemia']
[54, 68, 'ENFERMEDAD', 'kyphoscoliosis']
[112, 126, 'ENFERMEDAD', 'diverticulosis']
[155, 205, 'ENFERMEDAD', 'peritonitis secondary to perforated diverticulitis']
[180, 205, 'ENFERMEDAD', 'perforated diverticulitis']
[279, 303, 'ENFERMEDAD', 'entero-cutaneous fistula']
[1331, 1350, 'ENFERMEDAD', 'acute renal failure']
[1379, 1392, 'ENFERMEDAD', 'hyponatraemia']
[1397, 1410, 'ENFERMEDAD', 'hyperkalaemia']
[1352, 1370, 'ENFERMEDAD', 'metabolic acidosis']
[1435, 1462, 'ENFERMEDAD', 'acute adrenal insufficiency']
[1441, 1462, 'ENFERMEDAD', 'adrenal insufficiency']
[1318, 1329, 'ENFERMEDAD', 'dehydration']
[1834, 1856, 'ENFERMEDAD', 'intestinal obstruction']
[

[87, 105, 'ENFERMEDAD', 'Metabolic Diseases']
[163, 180, 'ENFERMEDAD', 'metabolic disease']
[261, 273, 'ENFERMEDAD', 'microcephaly']
[278, 303, 'ENFERMEDAD', 'severe mental retardation']
[363, 383, 'ENFERMEDAD', 'cardiac malformation']
[702, 734, 'ENFERMEDAD', 'mild-moderate mental retardation']
[1114, 1117, 'ENFERMEDAD', 'PKU']
[1166, 1196, 'ENFERMEDAD', 'disorders of pterin metabolism']
[1429, 1444, 'ENFERMEDAD', 'phenylketonuria']
[1596, 1599, 'ENFERMEDAD', 'PKU']
[2464, 2467, 'ENFERMEDAD', 'PKU']
[404, 411, 'ENFERMEDAD', 'anaemia']
[87, 100, 'ENFERMEDAD', 'gastric ulcer']
[210, 225, 'ENFERMEDAD', 'alkaline reflux']
[312, 334, 'ENFERMEDAD', 'intestinal obstruction']
[346, 358, 'ENFERMEDAD', 'malnutrition']
[364, 387, 'ENFERMEDAD', 'severe hypoalbuminaemia']
[486, 505, 'ENFERMEDAD', 'immobility syndrome']
[651, 658, 'ENFERMEDAD', 'anaemia']
[760, 795, 'ENFERMEDAD', 'severe protein-calorie malnutrition']
[990, 998, 'ENFERMEDAD', 'anasarca']
[783, 795, 'ENFERMEDAD', 'malnutrition']
[10

[183, 211, 'ENFERMEDAD', 'upper respiratory infections']
[261, 285, 'ENFERMEDAD', 'infectious mononucleosis']
[504, 521, 'ENFERMEDAD', 'nasal obstruction']
[1835, 1844, 'ENFERMEDAD', 'sinusitis']
[2087, 2096, 'ENFERMEDAD', 'sinusitis']
[1849, 1859, 'ENFERMEDAD', 'meningitis']
[2152, 2178, 'ENFERMEDAD', 'cavernous sinus thrombosis']
[2181, 2193, 'ENFERMEDAD', 'encephalitis']
[2302, 2319, 'ENFERMEDAD', 'acute sinusopathy']
[2355, 2364, 'ENFERMEDAD', 'sinusitis']
[87, 112, 'ENFERMEDAD', 'gastro-oesophageal reflux']
[117, 135, 'ENFERMEDAD', 'incompetent cardia']
[345, 360, 'ENFERMEDAD', 'nephrolithiasis']
[516, 527, 'ENFERMEDAD', 'renal colic']
[883, 897, 'ENFERMEDAD', 'hydronephrosis']
[1761, 1775, 'ENFERMEDAD', 'hydronephrosis']
[2924, 2941, 'ENFERMEDAD', 'testicular tumour']
[210, 216, 'ENFERMEDAD', 'smoker']
[249, 259, 'ENFERMEDAD', 'ex-drinker']
[1848, 1855, 'ENFERMEDAD', 'lesions']
[1781, 1787, 'ENFERMEDAD', 'lesion']
[2738, 2744, 'ENFERMEDAD', 'lesion']
[1098, 1117, 'ENFERMEDAD', 'c

[36, 39, 'ENFERMEDAD', 'SLE']
[949, 952, 'ENFERMEDAD', 'SLE']
[44, 69, 'ENFERMEDAD', 'antiphospholipid syndrome']
[462, 477, 'ENFERMEDAD', 'lymphadenopathy']
[425, 443, 'ENFERMEDAD', 'hepatosplenomegaly']
[626, 644, 'ENFERMEDAD', 'hepatosplenomegaly']
[668, 675, 'ENFERMEDAD', 'lesions']
[465, 481, 'ENFERMEDAD', 'bronchial asthma']
[437, 443, 'ENFERMEDAD', 'smoker']
[1385, 1412, 'ENFERMEDAD', 'severe pericardial effusion']
[1392, 1412, 'ENFERMEDAD', 'pericardial effusion']
[1254, 1266, 'ENFERMEDAD', 'cardiomegaly']
[2003, 2023, 'ENFERMEDAD', 'pericardial effusion']
[2917, 2943, 'ENFERMEDAD', 'bilateral pleural effusion']
[3838, 3855, 'ENFERMEDAD', 'acute lung damage']
[3891, 3924, 'ENFERMEDAD', 'diffuse interstitial lung disease']
[4026, 4048, 'ENFERMEDAD', 'eosinophilic pneumonia']
[4498, 4524, 'ENFERMEDAD', 'bilateral pleural effusion']
[4489, 4524, 'ENFERMEDAD', 'moderate bilateral pleural effusion']
[4720, 4734, 'ENFERMEDAD', 'adenocarcinoma']
[4824, 4838, 'ENFERMEDAD', 'adenocarcin

[308, 317, 'ENFERMEDAD', 'exotropia']
[699, 702, 'ENFERMEDAD', 'AOC']
[334, 354, 'ENFERMEDAD', 'horizontal nystagmus']
[982, 985, 'ENFERMEDAD', 'AOC']
[355, 373, 'ENFERMEDAD', 'epileptic seizures']
[1059, 1083, 'ENFERMEDAD', 'Topamax toxic phenomenon']
[51, 75, 'ENFERMEDAD', 'bilateral loss of vision']
[213, 221, 'ENFERMEDAD', 'epilepsy']
[354, 379, 'ENFERMEDAD', 'bilateral central scotoma']
[402, 423, 'ENFERMEDAD', 'bilateral maculopathy']
[61, 75, 'ENFERMEDAD', 'loss of vision']
[158, 171, 'ENFERMEDAD', 'brachydactyly']
[407, 425, 'ENFERMEDAD', 'monocular diplopia']
[417, 425, 'ENFERMEDAD', 'diplopia']
[634, 661, 'ENFERMEDAD', 'bilateral iridophacodonesis']
[685, 702, 'ENFERMEDAD', 'microspherophakia']
[1057, 1072, 'ENFERMEDAD', 'angular closure']
[1205, 1213, 'ENFERMEDAD', 'diplopia']
[1429, 1448, 'ENFERMEDAD', 'glaucomatous damage']
[1636, 1648, 'ENFERMEDAD', 'spherophakia']
[1667, 1680, 'ENFERMEDAD', 'brachydactyly']
[204, 229, 'ENFERMEDAD', 'angina on slight exertion']
[536, 564,

[203, 228, 'ENFERMEDAD', 'autoimmune Evans syndrome']
[536, 566, 'ENFERMEDAD', 'posterior subcapsular cataract']
[628, 723, 'ENFERMEDAD', 'neurosensory and retinal pigment epithelium detachment (RPE) in the posterior pole of both eyes']
[558, 566, 'ENFERMEDAD', 'cataract']
[951, 962, 'ENFERMEDAD', 'detachments']
[780, 787, 'ENFERMEDAD', 'lesions']
[879, 886, 'ENFERMEDAD', 'lesions']
[1461, 1508, 'ENFERMEDAD', 'diffuse large B-cell lymphoma with CD20+ marker']
[1482, 1490, 'ENFERMEDAD', 'lymphoma']
[1578, 1586, 'ENFERMEDAD', 'lymphoma']
[1978, 1986, 'ENFERMEDAD', 'lymphoma']
[2231, 2239, 'ENFERMEDAD', 'cataract']
[2159, 2170, 'ENFERMEDAD', 'detachments']
[1161, 1181, 'ENFERMEDAD', 'persistent diarrhoea']
[42, 52, 'ENFERMEDAD', 'chickenpox']
[579, 587, 'ENFERMEDAD', 'vitritis']
[609, 618, 'ENFERMEDAD', 'retinitis']
[850, 859, 'ENFERMEDAD', 'retinitis']
[897, 915, 'ENFERMEDAD', 'retinal vasculitis']
[1195, 1211, 'ENFERMEDAD', 'retinal necrosis']
[1433, 1441, 'ENFERMEDAD', 'vitritis']
[203

[671, 694, 'ENFERMEDAD', 'bilateral hypernephroma']
[808, 840, 'ENFERMEDAD', 'pancreatic neuroendocrine tumour']
[136, 147, 'ENFERMEDAD', 'VHL disease']
[542, 548, 'ENFERMEDAD', 'lesion']
[1012, 1034, 'ENFERMEDAD', 'subretinal haemorrhage']
[1065, 1085, 'ENFERMEDAD', 'vitreous haemorrhage']
[1358, 1372, 'ENFERMEDAD', 'macular oedema']
[1223, 1229, 'ENFERMEDAD', 'lesion']
[1435, 1441, 'ENFERMEDAD', 'lesion']
[1588, 1594, 'ENFERMEDAD', 'lesion']
[203, 211, 'ENFERMEDAD', 'glaucoma']
[363, 375, 'ENFERMEDAD', 'microcorneas']
[630, 647, 'ENFERMEDAD', 'mild micrognathia']
[652, 708, 'ENFERMEDAD', 'syndactyly of the fourth and fifth fingers of both hands']
[422, 442, 'ENFERMEDAD', 'horizontal nystagmus']
[120, 129, 'ENFERMEDAD', 'nystagmus']
[433, 442, 'ENFERMEDAD', 'nystagmus']
[566, 586, 'ENFERMEDAD', 'narrow nasal pyramid']
[592, 607, 'ENFERMEDAD', 'narrow nostrils']
[612, 628, 'ENFERMEDAD', 'thin nasal wings']
[57, 71, 'ENFERMEDAD', 'blurred vision']
[826, 832, 'ENFERMEDAD', 'sprain']
[87,

[562, 568, 'ENFERMEDAD', 'trauma']
[60, 77, 'ENFERMEDAD', 'cloacal exstrophy']
[258, 275, 'ENFERMEDAD', 'pubic eventration']
[286, 299, 'ENFERMEDAD', 'scar sequelae']
[264, 275, 'ENFERMEDAD', 'eventration']
[307, 336, 'ENFERMEDAD', 'incontinent urinary reservoir']
[1581, 1592, 'ENFERMEDAD', 'eventration']
[1912, 1927, 'ENFERMEDAD', 'pubic diastasis']
[48, 65, 'ENFERMEDAD', 'cloacal exstrophy']
[1044, 1060, 'ENFERMEDAD', 'abdominal defect']
[1587, 1594, 'ENFERMEDAD', 'keloids']
[1538, 1585, 'ENFERMEDAD', 'Persistent residual oedema of the cervical flap']
[717, 743, 'ENFERMEDAD', 'generalised polyneuropathy']
[1035, 1055, 'ENFERMEDAD', 'pulmonary herniation']
[1352, 1361, 'ENFERMEDAD', 'pneumonia']
[325, 339, 'ENFERMEDAD', 'surgical wound']
[47, 83, 'ENFERMEDAD', 'left facial abscess of dental origin']
[509, 556, 'ENFERMEDAD', 'severe dysplasia of the temporomandibular joint']
[672, 699, 'ENFERMEDAD', 'maxillomandibular ankylosis']
[1093, 1114, 'ENFERMEDAD', 'chronic osteomyelitis']
[46,

[1374, 1389, 'ENFERMEDAD', 'bone metastasis']
[1374, 1420, 'ENFERMEDAD', 'bone metastasis of medullary thyroid carcinoma']
[322, 331, 'ENFERMEDAD', 'neoplasia']
[223, 253, 'ENFERMEDAD', 'generalised lytic bone lesions']
[1873, 1890, 'ENFERMEDAD', 'thyroid pathology']
[2241, 2256, 'ENFERMEDAD', 'bone metastases']
[245, 256, 'ENFERMEDAD', 'tumour mass']
[143, 149, 'ENFERMEDAD', 'tumour']
[245, 251, 'ENFERMEDAD', 'tumour']
[307, 313, 'ENFERMEDAD', 'tumour']
[392, 403, 'ENFERMEDAD', 'tumour mass']
[392, 398, 'ENFERMEDAD', 'tumour']
[497, 546, 'ENFERMEDAD', 'involvement of the sinus and pyelocaliceal system']
[937, 973, 'ENFERMEDAD', 'desmoplastic small round cell tumour']
[967, 973, 'ENFERMEDAD', 'tumour']
[1864, 1870, 'ENFERMEDAD', 'tumour']
[2186, 2202, 'ENFERMEDAD', 'liver metastasis']
[2091, 2097, 'ENFERMEDAD', 'tumour']
[2175, 2181, 'ENFERMEDAD', 'tumour']
[80, 94, 'ENFERMEDAD', 'lung carcinoma']
[96, 105, 'ENFERMEDAD', 'Sinusitis']
[612, 625, 'ENFERMEDAD', 'polypoid mass']
[122, 152,

[961, 980, 'ENFERMEDAD', 'ciliated liver cyst']
[77, 93, 'ENFERMEDAD', 'breast carcinoma']
[516, 564, 'ENFERMEDAD', 'cystic formations throughout the pancreatic cell']
[741, 763, 'ENFERMEDAD', 'pancreatic cystadenoma']
[1055, 1088, 'ENFERMEDAD', 'giant cystadenoma of the pancreas']
[863, 868, 'ENFERMEDAD', 'cysts']
[152, 182, 'ENFERMEDAD', 'adenocarcinoma of the prostate']
[1039, 1055, 'ENFERMEDAD', 'hypoalbuminaemia']
[1760, 1775, 'ENFERMEDAD', 'actinic colitis']
[1107, 1120, 'ENFERMEDAD', 'malabsorption']
[1972, 1987, 'ENFERMEDAD', 'lymphadenopathy']
[2498, 2515, 'ENFERMEDAD', 'actinic enteritis']
[3373, 3390, 'ENFERMEDAD', 'actinic enteritis']
[109, 116, 'ENFERMEDAD', 'obesity']
[156, 174, 'ENFERMEDAD', 'spinal cord injury']
[319, 340, 'ENFERMEDAD', 'arterial hypertension']
[188, 204, 'ENFERMEDAD', 'accident at work']
[1524, 1542, 'ENFERMEDAD', 'vitamin deficiency']
[18, 24, 'ENFERMEDAD', 'smoker']
[117, 134, 'ENFERMEDAD', 'biliary lithiasis']
[161, 183, 'ENFERMEDAD', 'Gastric adeno

[67, 74, 'ENFERMEDAD', 'smoking']
[212, 234, 'ENFERMEDAD', 'uterine polymyomatosis']
[407, 420, 'ENFERMEDAD', 'hiatal hernia']
[990, 1004, 'ENFERMEDAD', 'primary tumour']
[1783, 1798, 'ENFERMEDAD', 'lymphadenopathy']
[1870, 1885, 'ENFERMEDAD', 'lymphadenopathy']
[2010, 2022, 'ENFERMEDAD', 'splenic cyst']
[2191, 2209, 'ENFERMEDAD', 'oat-cell carcinoma']
[2232, 2248, 'ENFERMEDAD', 'pleural invasion']
[1971, 1997, 'ENFERMEDAD', 'bilobular liver metastases']
[2547, 2566, 'ENFERMEDAD', 'celiac adenopathies']
[2630, 2648, 'ENFERMEDAD', 'oat-cell carcinoma']
[1390, 1409, 'ENFERMEDAD', 'tonic-clonic crisis']
[558, 592, 'ENFERMEDAD', 'foreign bodies in the mesogastrium']
[28, 31, 'ENFERMEDAD', 'CKD']
[36, 50, 'ENFERMEDAD', 'hypothyroidism']
[129, 142, 'ENFERMEDAD', 'acute abdomen']
[148, 160, 'ENFERMEDAD', 'septic shock']
[298, 315, 'ENFERMEDAD', 'ischaemic colitis']
[155, 160, 'ENFERMEDAD', 'shock']
[422, 427, 'ENFERMEDAD', 'shock']
[321, 329, 'ENFERMEDAD', 'hepatoma']
[653, 668, 'ENFERMEDAD',

[28, 41, 'ENFERMEDAD', 'active smoker']
[555, 576, 'ENFERMEDAD', 'oesophageal carcinoma']
[652, 658, 'ENFERMEDAD', 'lesion']
[135, 161, 'ENFERMEDAD', 'intrahepatic cystic tumour']
[679, 685, 'ENFERMEDAD', 'lesion']
[820, 826, 'ENFERMEDAD', 'lesion']
[912, 918, 'ENFERMEDAD', 'lesion']
[1090, 1105, 'ENFERMEDAD', 'mucinous tumour']
[1176, 1194, 'ENFERMEDAD', 'cystadenocarcinoma']
[1398, 1426, 'ENFERMEDAD', 'intracystic polypoid lesions']
[1484, 1502, 'ENFERMEDAD', 'cystadenocarcinoma']
[1470, 1502, 'ENFERMEDAD', 'mucosecretory cystadenocarcinoma']
[33, 47, 'ENFERMEDAD', 'drug allergies']
[76, 97, 'ENFERMEDAD', 'arterial hypertension']
[99, 123, 'ENFERMEDAD', 'type 2 diabetes mellitus']
[125, 152, 'ENFERMEDAD', 'chronic atrial fibrillation']
[157, 176, 'ENFERMEDAD', "Alzheimer's disease"]
[211, 225, 'ENFERMEDAD', 'coffee grounds']
[484, 497, 'ENFERMEDAD', 'hiatal hernia']
[812, 825, 'ENFERMEDAD', 'actinomycosis']
[661, 667, 'ENFERMEDAD', 'lesion']
[575, 593, 'ENFERMEDAD', 'hypoplastic uter

[265, 282, 'ENFERMEDAD', 'neurofibromatosis']
[167, 173, 'ENFERMEDAD', 'lesion']
[314, 330, 'ENFERMEDAD', 'facial asymmetry']
[991, 1014, 'ENFERMEDAD', 'neurofibromatous lesion']
[527, 539, 'ENFERMEDAD', 'absent teeth']
[502, 514, 'ENFERMEDAD', 'malocclusion']
[516, 525, 'ENFERMEDAD', 'diastemas']
[642, 648, 'ENFERMEDAD', 'lesion']
[1008, 1014, 'ENFERMEDAD', 'lesion']
[1133, 1154, 'ENFERMEDAD', 'mandibular hypoplasia']
[1082, 1101, 'ENFERMEDAD', 'retained element 23']
[1197, 1220, 'ENFERMEDAD', 'neurofibromatous lesion']
[1427, 1444, 'ENFERMEDAD', 'neurofibromatosis']
[1214, 1220, 'ENFERMEDAD', 'lesion']
[1255, 1261, 'ENFERMEDAD', 'lesion']
[1610, 1616, 'ENFERMEDAD', 'lesion']
[352, 362, 'ENFERMEDAD', 'strabismus']
[331, 337, 'ENFERMEDAD', 'lesion']
[509, 528, 'ENFERMEDAD', 'fibrous haemangioma']
[30, 43, 'ENFERMEDAD', 'facial trauma']
[112, 136, 'ENFERMEDAD', 'displaced angle fracture']
[99, 105, 'ENFERMEDAD', 'lesion']
[128, 136, 'ENFERMEDAD', 'fracture']
[158, 164, 'ENFERMEDAD', 'le

[136, 142, 'ENFERMEDAD', 'trauma']
[1634, 1648, 'ENFERMEDAD', 'nodular lesion']
[265, 280, 'ENFERMEDAD', 'renal lithiasis']
[285, 306, 'ENFERMEDAD', 'arterial hypertension']
[772, 781, 'ENFERMEDAD', 'carcinoma']
[76, 82, 'ENFERMEDAD', 'tumour']
[1155, 1161, 'ENFERMEDAD', 'tumour']
[1454, 1478, 'ENFERMEDAD', 'neoplastic proliferation']
[2300, 2309, 'ENFERMEDAD', 'carcinoma']
[2095, 2101, 'ENFERMEDAD', 'tumour']
[2643, 2660, 'ENFERMEDAD', 'tumour recurrence']
[2664, 2674, 'ENFERMEDAD', 'metastasis']
[2643, 2649, 'ENFERMEDAD', 'tumour']
[280, 296, 'ENFERMEDAD', 'malar hypoplasia']
[491, 511, 'ENFERMEDAD', 'maxillary hypoplasia']
[338, 369, 'ENFERMEDAD', 'dysmorphia of the nasal pyramid']
[1781, 1847, 'ENFERMEDAD', 'pseudoaneurysm and its dependence on the internal maxillary artery']
[234, 241, 'ENFERMEDAD', 'anxiety']
[172, 181, 'ENFERMEDAD', 'deformity']
[653, 668, 'ENFERMEDAD', 'parietal lesion']
[585, 605, 'ENFERMEDAD', 'intracranial lesions']
[685, 702, 'ENFERMEDAD', 'fibrous dysplasi

[79, 104, 'ENFERMEDAD', 'gastrointestinal bleeding']
[124, 144, 'ENFERMEDAD', 'mitral valve disease']
[252, 271, 'ENFERMEDAD', 'intestinal bleeding']
[521, 540, 'ENFERMEDAD', 'intestinal bleeding']
[299, 329, 'ENFERMEDAD', 'severe iron deficiency anaemia']
[631, 646, 'ENFERMEDAD', 'angiodysplasias']
[957, 972, 'ENFERMEDAD', 'angiodysplasias']
[1040, 1055, 'ENFERMEDAD', 'angiodysplasias']
[1034, 1055, 'ENFERMEDAD', 'ileal angiodysplasias']
[1264, 1271, 'ENFERMEDAD', 'lesions']
[1848, 1877, 'ENFERMEDAD', 'severe pulmonary hypertension']
[2080, 2105, 'ENFERMEDAD', 'pulmonary thromboembolism']
[47, 53, 'ENFERMEDAD', 'smoker']
[106, 140, 'ENFERMEDAD', 'chronic hepatitis C genotype 1a/1c']
[175, 183, 'ENFERMEDAD', 'fibrosis']
[114, 125, 'ENFERMEDAD', 'hepatitis C']
[303, 314, 'ENFERMEDAD', 'hepatitis C']
[831, 838, 'ENFERMEDAD', 'anxiety']
[1651, 1669, 'ENFERMEDAD', 'Acute pancreatitis']
[124, 137, 'ENFERMEDAD', 'hypoglycaemia']
[206, 235, 'ENFERMEDAD', 'urinary infectious conditions']
[445,

[156, 161, 'ENFERMEDAD', 'obese']
[116, 130, 'ENFERMEDAD', 'polyneuropathy']
[1105, 1127, 'ENFERMEDAD', 'respiratory depression']
[96, 112, 'ENFERMEDAD', 'chorioamnionitis']
[416, 434, 'ENFERMEDAD', 'hepatosplenomegaly']
[665, 683, 'ENFERMEDAD', 'hepatosplenomegaly']
[2415, 2437, 'ENFERMEDAD', 'right pleural effusion']
[817, 839, 'ENFERMEDAD', 'vascular malformations']
[687, 694, 'ENFERMEDAD', 'lesions']
[1196, 1211, 'ENFERMEDAD', 'foetal distress']
[2258, 2282, 'ENFERMEDAD', 'thromboembolic phenomena']
[1079, 1082, 'ENFERMEDAD', 'ALL']
[63, 80, 'ENFERMEDAD', 'thyroglossal cyst']
[116, 123, 'ENFERMEDAD', 'obesity']
[326, 374, 'ENFERMEDAD', 'laterocervical and submandibular lymphadenopathy']
[376, 388, 'ENFERMEDAD', 'splenomegaly']
[408, 420, 'ENFERMEDAD', 'hepatomegaly']
[761, 794, 'ENFERMEDAD', 'haematological neoplastic process']
[1441, 1444, 'ENFERMEDAD', 'ALL']
[2491, 2494, 'ENFERMEDAD', 'all']
[2849, 2852, 'ENFERMEDAD', 'all']
[66, 75, 'ENFERMEDAD', 'ex-smoker']
[103, 127, 'ENFERM

[286, 311, 'ENFERMEDAD', 'severe metabolic acidosis']
[313, 325, 'ENFERMEDAD', 'hypokalaemia']
[330, 349, 'ENFERMEDAD', 'acute renal failure']
[149, 155, 'ENFERMEDAD', 'wounds']
[473, 479, 'ENFERMEDAD', 'wounds']
[777, 783, 'ENFERMEDAD', 'wounds']
[1134, 1168, 'ENFERMEDAD', 'intraparotid arteriovenous fistula']
[1696, 1711, 'ENFERMEDAD', 'vascular lesion']
[2357, 2399, 'ENFERMEDAD', 'occlusion of the internal maxillary artery']
[191, 249, 'ENFERMEDAD', 'penetrating wound at the level of the submandibular region']
[1901, 1916, 'ENFERMEDAD', 'intraoral wound']
[1987, 2006, 'ENFERMEDAD', 'submandibular wound']
[2114, 2128, 'ENFERMEDAD', 'pneumocephalus']
[2310, 2331, 'ENFERMEDAD', 'neurological disorder']
[2427, 2473, 'ENFERMEDAD', 'conductive hearing loss of 60% in the left ear']
[103, 125, 'ENFERMEDAD', 'hyperemesis gravidarum']
[212, 228, 'ENFERMEDAD', 'ocular proptosis']
[393, 399, 'ENFERMEDAD', 'trauma']
[439, 451, 'ENFERMEDAD', 'exophthalmos']
[457, 470, 'ENFERMEDAD', 'hypophthalmos

[753, 765, 'ENFERMEDAD', 'skin lesions']
[1796, 1813, 'ENFERMEDAD', 'hepatitis B and C']
[1759, 1763, 'ENFERMEDAD', 'lues']
[3837, 3858, 'ENFERMEDAD', 'vasculitis infarction']
[241, 264, 'ENFERMEDAD', 'squamous cell carcinoma']
[445, 468, 'ENFERMEDAD', 'squamous cell carcinoma']
[1026, 1038, 'ENFERMEDAD', 'haematemesis']
[54, 86, 'ENFERMEDAD', 'generalised tonic-clonic seizure']
[917, 945, 'ENFERMEDAD', 'cocaine metabolites in urine']
[1121, 1144, 'ENFERMEDAD', 'regular cannabis smoker']
[1176, 1187, 'ENFERMEDAD', 'cocaine use']
[96, 114, 'ENFERMEDAD', 'infectious process']
[205, 217, 'ENFERMEDAD', 'metrorrhagia']
[1113, 1136, 'ENFERMEDAD', 'hypercalcaemic syndrome']
[1608, 1625, 'ENFERMEDAD', 'uterine neoplasia']
[1731, 1749, 'ENFERMEDAD', 'Douglas pouch mass']
[1755, 1781, 'ENFERMEDAD', 'peritoneal tumour implants']
[1786, 1806, 'ENFERMEDAD', 'pulmonary metastases']
[1891, 1927, 'ENFERMEDAD', 'recurrence of her neoplastic disease']
[44, 75, 'ENFERMEDAD', 'repeated respiratory infecti

[37, 58, 'ENFERMEDAD', 'ulcerative pancolitis']
[439, 460, 'ENFERMEDAD', 'ulcerative pancolitis']
[68, 84, 'ENFERMEDAD', 'corticodependent']
[150, 180, 'ENFERMEDAD', 'cytomegalovirus superinfection']
[272, 296, 'ENFERMEDAD', 'diarrhoea with red blood']
[331, 362, 'ENFERMEDAD', 'chronic iron deficiency anaemia']
[53, 81, 'ENFERMEDAD', 'Laurence-Moon-Biell syndrome']
[94, 106, 'ENFERMEDAD', 'hypogonadism']
[112, 119, 'ENFERMEDAD', 'obesity']
[121, 139, 'ENFERMEDAD', 'mental retardation']
[141, 152, 'ENFERMEDAD', 'polydactyly']
[154, 174, 'ENFERMEDAD', 'retinitis pigmentosa']
[179, 192, 'ENFERMEDAD', 'renal failure']
[312, 329, 'ENFERMEDAD', 'venous thrombosis']
[531, 542, 'ENFERMEDAD', 'peritonitis']
[712, 723, 'ENFERMEDAD', 'peritonitis']
[547, 573, 'ENFERMEDAD', 'severe hyperparathyroidism']
[816, 847, 'ENFERMEDAD', 'staphylococcal tunnel infection']
[1033, 1079, 'ENFERMEDAD', 'peritoneal eventration at the catheter orifice']
[1109, 1170, 'ENFERMEDAD', 'sclerosis and calcification of t

[340, 354, 'ENFERMEDAD', 'polyhydramnios']
[1306, 1324, 'ENFERMEDAD', 'metabolic acidosis']
[1767, 1783, 'ENFERMEDAD', 'nephrocalcinosis']
[2250, 2266, 'ENFERMEDAD', 'nephrocalcinosis']
[337, 356, 'ENFERMEDAD', 'mesenteric adenitis']
[686, 736, 'ENFERMEDAD', 'mild-moderate dilatation of the right renal pelvis']
[808, 839, 'ENFERMEDAD', 'pyeloureteral junction stenosis']
[854, 876, 'ENFERMEDAD', 'intestinal obstruction']
[1216, 1222, 'ENFERMEDAD', 'cystic']
[1498, 1525, 'ENFERMEDAD', 'intra-abdominal cystic mass']
[1514, 1520, 'ENFERMEDAD', 'cystic']
[1828, 1834, 'ENFERMEDAD', 'cystic']
[1900, 1906, 'ENFERMEDAD', 'cystic']
[2431, 2460, 'ENFERMEDAD', 'mesenteric cystic lymphagioma']
[2468, 2492, 'ENFERMEDAD', 'multiseptate cystic mass']
[2442, 2448, 'ENFERMEDAD', 'cystic']
[2481, 2487, 'ENFERMEDAD', 'cystic']
[86, 102, 'ENFERMEDAD', 'vaginal bleeding']
[391, 403, 'ENFERMEDAD', 'sexual abuse']
[553, 565, 'ENFERMEDAD', 'sexual abuse']
[805, 817, 'ENFERMEDAD', 'sexual abuse']
[516, 536, 'EN

[721, 750, 'ENFERMEDAD', 'amyotrophic lateral sclerosis']
[752, 755, 'ENFERMEDAD', 'ALS']
[974, 985, 'ENFERMEDAD', 'paraparesis']
[1281, 1314, 'ENFERMEDAD', 'Muscle atrophy in both quadriceps']
[1880, 1883, 'ENFERMEDAD', 'ALS']
[2009, 2012, 'ENFERMEDAD', 'ALS']
[2564, 2572, 'ENFERMEDAD', 'myopathy']
[2592, 2600, 'ENFERMEDAD', 'myopathy']
[2659, 2667, 'ENFERMEDAD', 'myopathy']
[2592, 2642, 'ENFERMEDAD', 'myopathy with bulbar and pelvic girdle involvement']
[2644, 2667, 'ENFERMEDAD', 'inclusion body myopathy']
[2383, 2392, 'ENFERMEDAD', 'dysphagia']
[2314, 2325, 'ENFERMEDAD', 'paraparesis']
[2305, 2325, 'ENFERMEDAD', 'proximal paraparesis']
[2352, 2381, 'ENFERMEDAD', 'muscle atrophy of both thighs']
[2772, 2803, 'ENFERMEDAD', 'primary skeletal muscle disease']
[3129, 3136, 'ENFERMEDAD', 'aphonia']
[3207, 3210, 'ENFERMEDAD', 'ALS']
[3162, 3182, 'ENFERMEDAD', 'motor neuron disease']
[3408, 3438, 'ENFERMEDAD', 'septic shock of urinary origin']
[3579, 3596, 'ENFERMEDAD', 'adaptive disorder']

[52, 66, 'ENFERMEDAD', 'drug allergies']
[116, 143, 'ENFERMEDAD', 'vertebral and rib fractures']
[161, 180, 'ENFERMEDAD', "Dupuytren's disease"]
[256, 276, 'ENFERMEDAD', 'hypercholesterolemia']
[281, 295, 'ENFERMEDAD', 'hyperuricaemia']
[297, 314, 'ENFERMEDAD', 'active alcoholism']
[316, 322, 'ENFERMEDAD', 'smoker']
[655, 671, 'ENFERMEDAD', 'prostate adenoma']
[1059, 1115, 'ENFERMEDAD', 'vascular calcifications in both hypochondrium and pelvis']
[1469, 1498, 'ENFERMEDAD', 'ureteral pseudodiverticulosis']
[1588, 1602, 'ENFERMEDAD', 'stress bladder']
[1677, 1692, 'ENFERMEDAD', 'bladder tumours']
[1775, 1822, 'ENFERMEDAD', 'superficial urothelial carcinoma of the bladder']
[452, 463, 'ENFERMEDAD', 'brucellosis']
[656, 673, 'ENFERMEDAD', 'orchiepididymitis']
[890, 896, 'ENFERMEDAD', 'goitre']
[1257, 1271, 'ENFERMEDAD', 'varicose veins']
[2478, 2492, 'ENFERMEDAD', 'microabscesses']
[2516, 2533, 'ENFERMEDAD', 'orchiepididymitis']
[2516, 2555, 'ENFERMEDAD', 'orchiepididymitis secondary to Bru

[85, 97, 'ENFERMEDAD', 'metrorrhagia']
[118, 142, 'ENFERMEDAD', 'gynaecological pathology']
[297, 307, 'ENFERMEDAD', 'leiomyomas']
[388, 421, 'ENFERMEDAD', 'repeated urinary tract infections']
[596, 616, 'ENFERMEDAD', 'urothelial dysplasia']
[748, 757, 'ENFERMEDAD', 'neoplasia']
[1482, 1494, 'ENFERMEDAD', 'desmoid cyst']
[2334, 2343, 'ENFERMEDAD', 'neoplasia']
[1832, 1848, 'ENFERMEDAD', 'cystic formation']
[1995, 2050, 'ENFERMEDAD', 'grade III papillary neoplasm of transitional epithelium']
[2195, 2246, 'ENFERMEDAD', 'tumour infiltrates the muscular wall of the bladder']
[221, 234, 'ENFERMEDAD', 'heart failure']
[251, 270, 'ENFERMEDAD', 'atrial fibrillation']
[291, 310, 'ENFERMEDAD', 'urological diseases']
[667, 689, 'ENFERMEDAD', 'microscopic haematuria']
[1038, 1050, 'ENFERMEDAD', 'pyonephrosis']
[1625, 1661, 'ENFERMEDAD', 'dilatation of the pyelocaliceal tree']
[1666, 1704, 'ENFERMEDAD', 'marked atrophy of the renal parenchyma']
[1849, 1916, 'ENFERMEDAD', 'abcedification of the rena

[52, 79, 'ENFERMEDAD', 'chronic atrial fibrillation']
[93, 121, 'ENFERMEDAD', 'massive intestinal ischaemia']
[417, 436, 'ENFERMEDAD', "Parkinson's disease"]
[575, 603, 'ENFERMEDAD', 'community-acquired pneumonia']
[669, 699, 'ENFERMEDAD', 'catheter-associated infections']
[701, 710, 'ENFERMEDAD', 'infection']
[344, 356, 'ENFERMEDAD', 'hepatomegaly']
[90, 96, 'ENFERMEDAD', 'lesion']
[412, 418, 'ENFERMEDAD', 'lesion']
[670, 687, 'ENFERMEDAD', 'aortic elongation']
[914, 958, 'ENFERMEDAD', 'thickening of the oesophago-gastric junction']
[1010, 1023, 'ENFERMEDAD', 'liver lesions']
[1094, 1117, 'ENFERMEDAD', 'neoplasia of the cardia']
[796, 810, 'ENFERMEDAD', 'adenocarcinoma']
[1135, 1149, 'ENFERMEDAD', 'adenocarcinoma']
[1193, 1207, 'ENFERMEDAD', 'adenocarcinoma']
[1174, 1207, 'ENFERMEDAD', 'metastatic gastric adenocarcinoma']
[1436, 1442, 'ENFERMEDAD', 'tumour']
[1519, 1556, 'ENFERMEDAD', 'tumours of the gastrointestinal tract']
[1601, 1624, 'ENFERMEDAD', 'haematological toxicity']
[1630,

In [269]:
file_no = 1
sentence_no = 1

In [270]:
res['tokens'][file_no][sentence_no]

[('The', 139),
 ('first', 143),
 ('of', 149),
 ('the', 152),
 ('corpses', 156),
 (',', 163),
 ('corresponding', 165),
 ('to', 179),
 ('the', 182),
 ('female', 186),
 (',', 192),
 ('was', 194),
 ('referred', 198),
 ('with', 207),
 ('the', 212),
 ('clinical', 216),
 ('judgement', 225),
 ('of', 235),
 ('severe', 238),
 ('respiratory', 245),
 ('failure', 257),
 ('with', 265),
 ('suspected', 270),
 ('Potter', 280),
 ("'s", 286),
 ('Syndrome', 289),
 ('and', 298),
 ('severe', 302),
 ('oligohydramnios', 309),
 (';', 324),
 ('she', 326),
 ('was', 330),
 ('born', 334),
 ('by', 339),
 ('emergency', 342),
 ('caesarean', 352),
 ('section', 362),
 ('due', 370),
 ('to', 374),
 ('breech', 377),
 ('presentation', 384),
 ('and', 397),
 ('the', 401),
 ('Apgar', 405),
 ('test', 411),
 ('was', 416),
 ('1/3/7', 420),
 (';', 425),
 ('minutes', 427),
 ('later', 435),
 ('she', 441),
 ('died', 445),
 ('.', 449)]

In [271]:
res['tags'][file_no][sentence_no]

['O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'B-ENFERMEDAD',
 'I-ENFERMEDAD',
 'I-ENFERMEDAD',
 'O',
 'O',
 'B-ENFERMEDAD',
 'I-ENFERMEDAD',
 'I-ENFERMEDAD',
 'O',
 'B-ENFERMEDAD',
 'I-ENFERMEDAD',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O',
 'O']

In [272]:
res['sentence_ids'][file_no]

[0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15]

In [273]:
res['entities'][file_no]

[[238, 264, 'ENFERMEDAD', 'severe respiratory failure'],
 [280, 297, 'ENFERMEDAD', "Potter's Syndrome"],
 [302, 324, 'ENFERMEDAD', 'severe oligohydramnios'],
 [556, 568, 'ENFERMEDAD', 'micrognathia'],
 [1057, 1062, 'ENFERMEDAD', 'cysts'],
 [1907, 1912, 'ENFERMEDAD', 'cysts'],
 [2004, 2009, 'ENFERMEDAD', 'cysts'],
 [2158, 2163, 'ENFERMEDAD', 'cysts'],
 [2262, 2267, 'ENFERMEDAD', 'cysts'],
 [2332, 2337, 'ENFERMEDAD', 'cysts'],
 [2252, 2267, 'ENFERMEDAD', 'medullary cysts'],
 [1004, 1021, 'ENFERMEDAD', 'cystic formations']]

In [274]:
res['text'][file_no]

"Two newborns, male and female from the same mother, died at 10 and 45 minutes of life respectively, and underwent post-mortem examination. The first of the corpses, corresponding to the female, was referred with the clinical judgement of severe respiratory failure with suspected Potter's Syndrome and severe oligohydramnios; she was born by emergency caesarean section due to breech presentation and the Apgar test was 1/3/7; minutes later she died. External examination revealed a subcyanotic colour, triangular facies with mongoloid parpebral fissures, micrognathia, broad nasal root and prominent occiput. The abdomen, globular, hard and slightly dented, allowed the palpation of two large masses occupying both renal fossae and hemiabdomenes. When the cavities were opened, the presence of two large renal masses measuring 10 x 8 x 5.5 cm and 12 x 8 x 6 cm with weights of 190 and 235 g respectively, stood out. Although the renal silhouette could be discerned, the surface, dented, showed nume