## Import and Data Load

In [None]:
import pandas as pd
import numpy as np
import json
import requests

## PubTator

In [None]:
def pubtator_generate_struct(pubt_data):
    """Extract the chemical mentions from a list of PubTator annotations.

    Args:
        pubt_data: Iterable of annotation dicts. Each one is read through
            ``['infons']['type']`` and, for chemicals, ``['text']`` and
            ``['locations'][0]`` (its ``'offset'`` and ``'length'``).

    Returns:
        A list with one ``{'text': ..., 'location': {'start': ..., 'end': ...}}``
        dict per annotation whose type is ``"Chemical"``, in input order.
        ``end`` is ``offset + length`` of the first listed location.
    """
    def _first_span(annotation):
        # Only the first entry of 'locations' is used; any others are ignored.
        first = annotation['locations'][0]
        return {'start': first['offset'],
                'end': first['offset'] + first['length']}

    return [
        {'text': annotation['text'], 'location': _first_span(annotation)}
        for annotation in pubt_data
        if annotation['infons']['type'] == "Chemical"
    ]

In [None]:
import time

def pubtator_process(id, timeout=30, delay=0.6, verbose=False):
    """Fetch PubTator3 annotations for one PMID and return its chemical mentions.

    Args:
        id: PubMed identifier interpolated into the request URL. The name
            shadows the ``id`` builtin; it is kept so existing callers work.
        timeout: Seconds to wait for the HTTP response before giving up.
        delay: Seconds to sleep after the request, spacing out successive calls.
        verbose: When True, also display the raw annotation list (requires an
            IPython/Jupyter session, which provides ``display``).

    Returns:
        The list built by ``pubtator_generate_struct`` from the annotations of
        the second passage, or an empty list when the response contains no
        document or fewer than two passages.

    Raises:
        requests.HTTPError: If the server answers with an error status.
        requests.Timeout: If no response arrives within ``timeout`` seconds.
    """
    url = f"https://www.ncbi.nlm.nih.gov/research/pubtator3-api/publications/export/biocjson?pmids={id}&full=true"
    # Print before the request so a failing PMID can be identified in the output.
    print(id)
    # A timeout keeps one stalled connection from hanging a whole batch run.
    res = requests.get(url, timeout=timeout)
    # Fail loudly on HTTP errors instead of trying to parse an error page.
    res.raise_for_status()
    documents = res.json()['PubTator3']

    # Only working with abstracts.
    # NOTE(review): assumes passage index 1 is the abstract (index 0 presumably
    # the title) -- confirm against the API; selecting by passage type would be
    # more robust than a fixed position.
    passages = documents[0]['passages'] if documents else []
    if len(passages) > 1:
        pubt_annot = passages[1]['annotations']
        if verbose:
            display(pubt_annot)
        pubt_res = pubtator_generate_struct(pubt_annot)
    else:
        # No document or no second passage: nothing to annotate.
        pubt_res = []

    time.sleep(delay)

    return pubt_res

In [None]:
# Quick check of pubtator_process on a single PMID.
pubtator_process(11036042)

11036042


[{'id': '12',
  'infons': {'identifier': 'MESH:D012293',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D012293'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D012293',
   'biotype': 'chemical',
   'name': 'Rifampin',
   'accession': '@CHEMICAL_Rifampin'},
  'text': 'rifampin',
  'locations': [{'offset': 117, 'length': 8}]},
 {'id': '13',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'locations': [{'offset': 147, 'length': 21}]},
 {'id': '14',
  'infons': {'identifier': 'MESH:C100307',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C100307'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C100307',
   'biotype': 'chemical',
   'name': 'streptolydigin',
   'accession': '@CHEMICAL_streptolydigin'},
  'text': 'streptolydigin',
  'locations': [{

[{'text': 'rifampin', 'location': {'start': 117, 'end': 125}},
 {'text': 'streptolydigin', 'location': {'start': 408, 'end': 422}},
 {'text': 'sorangicin A.', 'location': {'start': 427, 'end': 440}},
 {'text': 'thiolutin', 'location': {'start': 454, 'end': 463}},
 {'text': 'holomycin', 'location': {'start': 465, 'end': 474}},
 {'text': 'corallopyronin A', 'location': {'start': 476, 'end': 492}},
 {'text': 'ripostatin A', 'location': {'start': 498, 'end': 510}}]

## Procesar Dataset Positivo

In [None]:
# Load the positive dataset and keep only the rows that have an abstract.
pos_df = pd.read_excel("/content/DatasetPositivo.xlsx").dropna(subset=['Abstract'])
pos_df

Unnamed: 0,PMC_ID,PMID,Title,Abstract,T5,Alpaca,LaMini,Score,Answer,Unnamed: 9
0,101622.0,11036042.0,RNA polymerase inhibitors with activity agains...,A collection of rifampin-resistant mutants of ...,<pad> yes</s>,Yes,Yes.,3,YES,
1,10187937.0,37192172.0,Streptothricin F is a bactericidal antibiotic ...,The streptothricin natural product mixture (al...,<pad> yes</s>,yes,The context does not provide information on wh...,2.5,YES,
2,1162199.0,6258580.0,Interaction of pseudomonic acid A with Escheri...,Sodium pseudomonate was shown to be a powerful...,<pad> yes</s>,Yes.,The context describes the active inhibition an...,3,YES,
3,1251517.0,16189117.0,"Efficacy of telavancin (TD-6424), a rapidly ba...","The efficacy of telavancin, a bactericidal lip...",<pad> yes</s>,Yes,Yes.,3,YES,
4,1482072.0,13681272.0,Pharmacology of methicillin.,The pharmacology of a new antibiotic methicill...,<pad> yes</s>,antimicrobial,Yes.,2.5,YES,
...,...,...,...,...,...,...,...,...,...,...
106,89784.0,10722483.0,Pefloxacin-induced achilles tendon toxicity in...,Despite a relatively low incidence of serious ...,<pad> no</s>,Yes,No.,1,NO,
107,8984893.0,35411221.0,Antibiotic heliomycin and its water-soluble 4-...,Bladder cancer is one of the most frequent can...,<pad> yes</s>,Yes; no,Yes.,2.5,YES,
108,90866.0,11709337.0,Target preference of 15 quinolones against Sta...,The antibacterial activities and target inhibi...,<pad> yes</s>,Yes,No.,2,YES,
109,9225766.0,35723082.0,Re-establishing the utility of tetracycline-cl...,The progressive increase in antibiotic resista...,<pad> yes</s>,Yes,Yes.,3,YES,


In [None]:
# PMIDs are loaded as floats; cast them to integers so they are interpolated
# into the PubTator request URL without a trailing ".0".
pos_df = pos_df.astype({'PMID': int})
pos_df

Unnamed: 0,PMC_ID,PMID,Title,Abstract,T5,Alpaca,LaMini,Score,Answer,Unnamed: 9
0,101622.0,11036042,RNA polymerase inhibitors with activity agains...,A collection of rifampin-resistant mutants of ...,<pad> yes</s>,Yes,Yes.,3,YES,
1,10187937.0,37192172,Streptothricin F is a bactericidal antibiotic ...,The streptothricin natural product mixture (al...,<pad> yes</s>,yes,The context does not provide information on wh...,2.5,YES,
2,1162199.0,6258580,Interaction of pseudomonic acid A with Escheri...,Sodium pseudomonate was shown to be a powerful...,<pad> yes</s>,Yes.,The context describes the active inhibition an...,3,YES,
3,1251517.0,16189117,"Efficacy of telavancin (TD-6424), a rapidly ba...","The efficacy of telavancin, a bactericidal lip...",<pad> yes</s>,Yes,Yes.,3,YES,
4,1482072.0,13681272,Pharmacology of methicillin.,The pharmacology of a new antibiotic methicill...,<pad> yes</s>,antimicrobial,Yes.,2.5,YES,
...,...,...,...,...,...,...,...,...,...,...
106,89784.0,10722483,Pefloxacin-induced achilles tendon toxicity in...,Despite a relatively low incidence of serious ...,<pad> no</s>,Yes,No.,1,NO,
107,8984893.0,35411221,Antibiotic heliomycin and its water-soluble 4-...,Bladder cancer is one of the most frequent can...,<pad> yes</s>,Yes; no,Yes.,2.5,YES,
108,90866.0,11709337,Target preference of 15 quinolones against Sta...,The antibacterial activities and target inhibi...,<pad> yes</s>,Yes,No.,2,YES,
109,9225766.0,35723082,Re-establishing the utility of tetracycline-cl...,The progressive increase in antibiotic resista...,<pad> yes</s>,Yes,Yes.,3,YES,


In [None]:
# Annotate every article: one PubTator request per PMID, with the resulting
# list of chemical mentions stored in a new 'PubTator' column.
pos_df['PubTator'] = pos_df['PMID'].map(pubtator_process)

11036042


[{'id': '12',
  'infons': {'identifier': 'MESH:D012293',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D012293'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D012293',
   'biotype': 'chemical',
   'name': 'Rifampin',
   'accession': '@CHEMICAL_Rifampin'},
  'text': 'rifampin',
  'locations': [{'offset': 117, 'length': 8}]},
 {'id': '13',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'locations': [{'offset': 147, 'length': 21}]},
 {'id': '14',
  'infons': {'identifier': 'MESH:C100307',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C100307'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C100307',
   'biotype': 'chemical',
   'name': 'streptolydigin',
   'accession': '@CHEMICAL_streptolydigin'},
  'text': 'streptolydigin',
  'locations': [{

37192172


[{'id': '12630',
  'infons': {'identifier': '470',
   'type': 'Species',
   'valid': True,
   'normalized': [470],
   'database': 'ncbi_taxonomy',
   'normalized_id': 470,
   'biotype': 'species',
   'name': '470',
   'accession': None},
  'text': 'Acinetobacter baumannii',
  'locations': [{'offset': 615, 'length': 23}]},
 {'id': '12632',
  'infons': {'identifier': 'tmVar:p|SUB|S||F;VariantGroup:9',
   'type': 'Variant',
   'valid': False,
   'subtype': 'ProteinMutation',
   'database': 'litvar',
   'rsids': [],
   'normalized': [],
   'normalized_id': None,
   'biotype': 'variant'},
  'text': 'S-F',
  'locations': [{'offset': 1008, 'length': 3}]},
 {'id': '12633',
  'infons': {'identifier': 'tmVar:p|Allele|S|16;VariantGroup:2',
   'type': 'Variant',
   'valid': False,
   'subtype': 'ProteinMutation',
   'database': 'litvar',
   'rsids': [],
   'normalized': [],
   'normalized_id': None,
   'biotype': 'variant'},
  'text': '16S',
  'locations': [{'offset': 1396, 'length': 3}]},
 {'id':

6258580


[{'id': '26',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'Sodium pseudomonate',
  'locations': [{'offset': 85, 'length': 19}]},
 {'id': '27',
  'infons': {'identifier': '37762',
   'type': 'Species',
   'valid': True,
   'normalized': [37762],
   'database': 'ncbi_taxonomy',
   'normalized_id': 37762,
   'biotype': 'species',
   'name': '37762',
   'accession': None},
  'text': 'Escherichia coli B',
  'locations': [{'offset': 157, 'length': 18}]},
 {'id': '28',
  'infons': {'identifier': 'MESH:D007532',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D007532'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007532',
   'biotype': 'chemical',
   'name': 'Isoleucine',
   'accession': '@CHEMICAL_Isoleucine'},
  'text': 'isoleucine',
  'locations': [{'offset': 310, 'length': 10}]},
 {'id': '29',
  'infons': {'identifier': 'MESH:D007532',
   'type': 'Chemical',
   'valid': True,
   '

16189117


[{'id': '29',
  'infons': {'identifier': 'MESH:C487637',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C487637'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C487637',
   'biotype': 'chemical',
   'name': 'telavancin',
   'accession': '@CHEMICAL_telavancin'},
  'text': 'telavancin',
  'locations': [{'offset': 213, 'length': 10}]},
 {'id': '30',
  'infons': {'identifier': 'MESH:D000077427',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000077427'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D000077427',
   'biotype': 'chemical',
   'name': 'Lipoglycopeptides',
   'accession': '@CHEMICAL_Lipoglycopeptides'},
  'text': 'lipoglycopeptide',
  'locations': [{'offset': 240, 'length': 16}]},
 {'id': '31',
  'infons': {'identifier': 'MESH:D014640',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014640'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014640',
   'biotype': 'chemical',
   'name': 'Vancomycin',
   'accession': '@CHEMICAL_Va

13681272


[{'id': '8',
  'infons': {'identifier': 'MESH:D008712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008712',
   'biotype': 'chemical',
   'name': 'Methicillin',
   'accession': '@CHEMICAL_Methicillin'},
  'text': 'methicillin',
  'locations': [{'offset': 66, 'length': 11}]},
 {'id': '9',
  'infons': {'identifier': 'MESH:D008712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008712',
   'biotype': 'chemical',
   'name': 'Methicillin',
   'accession': '@CHEMICAL_Methicillin'},
  'text': '6(2:6-dimethoxybenzamido)-penicillanic acid',
  'locations': [{'offset': 79, 'length': 43}]},
 {'id': '10',
  'infons': {'identifier': 'MESH:D010400',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D010400'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D010400',
   'biotype': 'chemical',
   'name': 'Penicillin G',
   'accession': '@CHEM

5847736


[{'id': '7',
  'infons': {'identifier': 'MESH:D002512',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002512'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002512',
   'biotype': 'chemical',
   'name': 'Cephalothin',
   'accession': '@CHEMICAL_Cephalothin'},
  'text': 'cephalothin',
  'locations': [{'offset': 209, 'length': 11}]},
 {'id': '8',
  'infons': {'identifier': 'MESH:D002512',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002512'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002512',
   'biotype': 'chemical',
   'name': 'Cephalothin',
   'accession': '@CHEMICAL_Cephalothin'},
  'text': 'cephalothin',
  'locations': [{'offset': 562, 'length': 11}]},
 {'id': '9',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'Pseudomonas spp',
  'locations': [{'offset': 711, 'length': 15}]},
 {'id': '10',
  'infons': {'identifier': 'MESH:D002512',
   'type': 'Chemical',
   'valid': True,


4901344


[{'id': '14',
  'infons': {'identifier': '9606',
   'type': 'Species',
   'valid': True,
   'normalized': [9606],
   'database': 'ncbi_taxonomy',
   'normalized_id': 9606,
   'biotype': 'species',
   'name': '9606',
   'accession': None},
  'text': 'patients',
  'locations': [{'offset': 143, 'length': 8}]},
 {'id': '15',
  'infons': {'identifier': 'MESH:D029481',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D029481'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D029481',
   'biotype': 'disease',
   'name': 'Bronchitis Chronic',
   'accession': '@DISEASE_Bronchitis_Chronic'},
  'text': 'chronic bronchitis',
  'locations': [{'offset': 174, 'length': 18}]},
 {'id': '16',
  'infons': {'identifier': 'MESH:D014295',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014295'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014295',
   'biotype': 'chemical',
   'name': 'Trimethoprim',
   'accession': '@CHEMICAL_Trimethoprim'},
  'text': 'trimethoprim',
  'locati

8726004


[{'id': '39',
  'infons': {'identifier': 'MESH:C082896',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C082896'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C082896',
   'biotype': 'chemical',
   'name': 'epiroprim',
   'accession': '@CHEMICAL_epiroprim'},
  'text': 'Epiroprim',
  'locations': [{'offset': 119, 'length': 9}]},
 {'id': '40',
  'infons': {'identifier': 'MESH:C082896',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C082896'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C082896',
   'biotype': 'chemical',
   'name': 'epiroprim',
   'accession': '@CHEMICAL_epiroprim'},
  'text': 'EPM',
  'locations': [{'offset': 130, 'length': 3}]},
 {'id': '41',
  'infons': {'identifier': 'MESH:C082896',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C082896'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C082896',
   'biotype': 'chemical',
   'name': 'epiroprim',
   'accession': '@CHEMICAL_epiroprim'},
  'text': 'Ro 11-8958',
  'locati

2552910


[{'id': '20',
  'infons': {'identifier': 'MESH:D017576',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D017576'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D017576',
   'biotype': 'chemical',
   'name': 'Daptomycin',
   'accession': '@CHEMICAL_Daptomycin'},
  'text': 'daptomycin',
  'locations': [{'offset': 146, 'length': 10}]},
 {'id': '21',
  'infons': {'identifier': 'MESH:D014640',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014640'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014640',
   'biotype': 'chemical',
   'name': 'Vancomycin',
   'accession': '@CHEMICAL_Vancomycin'},
  'text': 'vancomycin',
  'locations': [{'offset': 258, 'length': 10}]},
 {'id': '22',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'gram-positive bacteria',
  'locations': [{'offset': 279, 'length': 22}]},
 {'id': '23',
  'infons': {'identifier': '1578',
   'type': 'Species',
   'valid': True,
   'n

17220414


[{'id': '20',
  'infons': {'identifier': '196914',
   'type': 'Species',
   'valid': True,
   'normalized': [196914],
   'database': 'ncbi_taxonomy',
   'normalized_id': 196914,
   'biotype': 'species',
   'name': '196914',
   'accession': None},
  'text': 'Actinoplanes friuliensis',
  'locations': [{'offset': 128, 'length': 24}]},
 {'id': '21',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'lipopeptide antibiotic',
  'locations': [{'offset': 166, 'length': 22}]},
 {'id': '22',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'friulimicin',
  'locations': [{'offset': 189, 'length': 11}]},
 {'id': '23',
  'infons': {'identifier': 'MESH:D005227',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D005227'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D005227',
   'biotype': 'chemical',
   'name': '

6941742


[{'id': '36',
  'infons': {'identifier': 'MESH:D015281',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D015281'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D015281',
   'biotype': 'chemical',
   'name': 'Cefmenoxime',
   'accession': '@CHEMICAL_Cefmenoxime'},
  'text': 'cefmenoxime',
  'locations': [{'offset': 125, 'length': 11}]},
 {'id': '37',
  'infons': {'identifier': 'MESH:D015281',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D015281'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D015281',
   'biotype': 'chemical',
   'name': 'Cefmenoxime',
   'accession': '@CHEMICAL_Cefmenoxime'},
  'text': 'SCE-1365',
  'locations': [{'offset': 138, 'length': 8}]},
 {'id': '38',
  'infons': {'identifier': 'MESH:D002511',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002511'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002511',
   'biotype': 'chemical',
   'name': 'Cephalosporins',
   'accession': '@CHEMICAL_Cephalosporins'},
  'text

5481218


[{'id': '37',
  'infons': {'identifier': 'MESH:D005436',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D005436'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D005436',
   'biotype': 'chemical',
   'name': 'Floxacillin',
   'accession': '@CHEMICAL_Floxacillin'},
  'text': 'Flucloxacillin',
  'locations': [{'offset': 102, 'length': 14}]},
 {'id': '38',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'isoxazole penicillin',
  'locations': [{'offset': 124, 'length': 20}]},
 {'id': '39',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'locations': [{'offset': 199, 'length': 21}]},
 {'id': '40',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   '

6289734


[{'id': '28',
  'infons': {'identifier': 'MESH:D002443',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002443'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002443',
   'biotype': 'chemical',
   'name': 'Ceftriaxone',
   'accession': '@CHEMICAL_Ceftriaxone'},
  'text': 'ceftriaxone',
  'locations': [{'offset': 80, 'length': 11}]},
 {'id': '29',
  'infons': {'identifier': 'MESH:D002443',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002443'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002443',
   'biotype': 'chemical',
   'name': 'Ceftriaxone',
   'accession': '@CHEMICAL_Ceftriaxone'},
  'text': 'Ceftriaxone',
  'locations': [{'offset': 163, 'length': 11}]},
 {'id': '30',
  'infons': {'identifier': '543',
   'type': 'Species',
   'valid': True,
   'normalized': [543],
   'database': 'ncbi_taxonomy',
   'normalized_id': 543,
   'biotype': 'species',
   'name': '543',
   'accession': None},
  'text': 'Enterobacteriaceae',
  'locations': [{'offset

6821456


[{'id': '14',
  'infons': {'identifier': '287',
   'type': 'Species',
   'valid': True,
   'normalized': [287],
   'database': 'ncbi_taxonomy',
   'normalized_id': 287,
   'biotype': 'species',
   'name': '287',
   'accession': None},
  'text': 'Pseudomonas aeruginosa',
  'locations': [{'offset': 68, 'length': 22}]},
 {'id': '15',
  'infons': {'identifier': 'MESH:D002228',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002228'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002228',
   'biotype': 'chemical',
   'name': 'Carbenicillin',
   'accession': '@CHEMICAL_Carbenicillin'},
  'text': 'carbenicillin',
  'locations': [{'offset': 133, 'length': 13}]},
 {'id': '16',
  'infons': {'identifier': 'MESH:D008997',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008997'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008997',
   'biotype': 'chemical',
   'name': 'Monobactams',
   'accession': '@CHEMICAL_Monobactams'},
  'text': 'beta-lactam antibiotic',
  '

6295263


[{'id': '37',
  'infons': {'identifier': 'MESH:D009675',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D009675'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009675',
   'biotype': 'chemical',
   'name': 'Novobiocin',
   'accession': '@CHEMICAL_Novobiocin'},
  'text': 'Novobiocin',
  'locations': [{'offset': 123, 'length': 10}]},
 {'id': '38',
  'infons': {'identifier': 'MESH:C004628',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C004628'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C004628',
   'biotype': 'chemical',
   'name': 'coumermycin',
   'accession': '@CHEMICAL_coumermycin'},
  'text': 'coumermycin A1',
  'locations': [{'offset': 135, 'length': 14}]},
 {'id': '39',
  'infons': {'identifier': 'MESH:C006260',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C006260'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C006260',
   'biotype': 'chemical',
   'name': 'clorobiocin',
   'accession': '@CHEMICAL_clorobiocin'},
  'text':

14217764


[{'id': '17',
  'infons': {'identifier': 'MESH:D008034',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008034'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008034',
   'biotype': 'chemical',
   'name': 'Lincomycin',
   'accession': '@CHEMICAL_Lincomycin'},
  'text': 'lincomycin',
  'locations': [{'offset': 170, 'length': 10}]},
 {'id': '18',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'Streptomyces lincolnensis var.',
  'locations': [{'offset': 195, 'length': 30}]},
 {'id': '19',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'lincolnensis',
  'locations': [{'offset': 226, 'length': 12}]},
 {'id': '20',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'staphylococci',
  'locations': [{'offset': 348, 'length': 13}]},
 {'id': '21',
  'infons': {'i

16528813


[{'id': '36183',
  'infons': {'identifier': 'MESH:D010406',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D010406'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D010406',
   'biotype': 'chemical',
   'name': 'Penicillins',
   'accession': '@CHEMICAL_Penicillins'},
  'text': 'penicillin',
  'locations': [{'offset': 177, 'length': 10}]}]

15406368


[{'id': '971',
  'infons': {'identifier': 'MESH:D014449',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014449'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014449',
   'biotype': 'chemical',
   'name': 'Tyrothricin',
   'accession': '@CHEMICAL_Tyrothricin'},
  'text': 'tyrothricin',
  'locations': [{'offset': 538, 'length': 11}]},
 {'id': '972',
  'infons': {'identifier': 'MESH:D014449',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014449'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014449',
   'biotype': 'chemical',
   'name': 'Tyrothricin',
   'accession': '@CHEMICAL_Tyrothricin'},
  'text': 'tyrothricin',
  'locations': [{'offset': 425, 'length': 11}]},
 {'id': '973',
  'infons': {'identifier': 'MESH:D014449',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014449'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014449',
   'biotype': 'chemical',
   'name': 'Tyrothricin',
   'accession': '@CHEMICAL_Tyrothricin'},
  'tex

17764469


[{'id': '10',
  'infons': {'identifier': 'MESH:D003141',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D003141'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D003141',
   'biotype': 'disease',
   'name': 'Communicable Diseases',
   'accession': '@DISEASE_Communicable_Diseases'},
  'text': 'infectious disease',
  'locations': [{'offset': 133, 'length': 18}]},
 {'id': '11',
  'infons': {'identifier': 'MESH:D013881',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D013881'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D013881',
   'biotype': 'chemical',
   'name': 'Thioridazine',
   'accession': '@CHEMICAL_Thioridazine'},
  'text': 'Thioridazine',
  'locations': [{'offset': 228, 'length': 12}]},
 {'id': '12',
  'infons': {'identifier': 'MESH:C031637',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C031637'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C031637',
   'biotype': 'chemical',
   'name': 'phenothiazine',
   'accession': '@CHEM

17938194


[{'id': '51',
  'infons': {'identifier': 'MESH:C530475',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C530475'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C530475',
   'biotype': 'chemical',
   'name': '7-(7-amino-7-methyl-5-azaspiro(2.4)heptan-5-yl)-6-fluoro-1-(2-fluoro-1-cyclopropyl)-1 4-dihydro-8-methoxy-4-oxo-3-quinolinecarboxylic acid',
   'accession': '@CHEMICAL_7_(7_amino_7_methyl_5_azaspiro(2.4)heptan_5_yl)_6_fluoro_1_(2_fluoro_1_cyclopropyl)_1_4_dihydro_8_methoxy_4_oxo_3_quinolinecarboxylic_acid'},
  'text': 'DC-159a',
  'locations': [{'offset': 81, 'length': 7}]},
 {'id': '52',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': '8-methoxy fluoroquinolone',
  'locations': [{'offset': 98, 'length': 25}]},
 {'id': '53',
  'infons': {'type': 'Disease',
   'valid': False,
   'normalized_id': None,
   'biotype': 'disease'},
  'text': 'staphylococci',
  'locations': [{'offset'

18180358


[{'id': '9',
  'infons': {'identifier': 'MESH:C587495',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C587495'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C587495',
   'biotype': 'chemical',
   'name': 'AR-709',
   'accession': '@CHEMICAL_AR_709'},
  'text': 'AR-709',
  'locations': [{'offset': 103, 'length': 6}]},
 {'id': '10',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'diaminopyrimidine antibiotic',
  'locations': [{'offset': 119, 'length': 28}]},
 {'id': '11',
  'infons': {'identifier': 'MESH:D012141',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D012141'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D012141',
   'biotype': 'disease',
   'name': 'Respiratory Tract Infections',
   'accession': '@DISEASE_Respiratory_Tract_Infections'},
  'text': 'upper and lower respiratory tract infections',
  'locations': [{'offset': 209, 'length': 44}]},
 {'id': '12

18472972


[{'id': '23335',
  'infons': {'identifier': '64146',
   'type': 'Gene',
   'ncbi_homologene': '69354',
   'valid': True,
   'normalized': [64146],
   'database': 'ncbi_gene',
   'normalized_id': 64146,
   'biotype': 'gene',
   'name': 'PDF',
   'accession': '@GENE_PDF'},
  'text': 'peptide deformylase',
  'locations': [{'offset': 374, 'length': 19}]},
 {'id': '23336',
  'infons': {'identifier': '64146',
   'type': 'Gene',
   'ncbi_homologene': '69354',
   'valid': True,
   'normalized': [64146],
   'database': 'ncbi_gene',
   'normalized_id': 64146,
   'biotype': 'gene',
   'name': 'PDF',
   'accession': '@GENE_PDF'},
  'text': 'peptide deformylase',
  'locations': [{'offset': 496, 'length': 19}]},
 {'id': '23337',
  'infons': {'identifier': '64146',
   'type': 'Gene',
   'ncbi_homologene': '69354',
   'valid': True,
   'normalized': [64146],
   'database': 'ncbi_gene',
   'normalized_id': 64146,
   'biotype': 'gene',
   'name': 'PDF',
   'accession': '@GENE_PDF'},
  'text': 'peptide d

2014970


[{'id': '37',
  'infons': {'identifier': 'MESH:C068217',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C068217'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C068217',
   'biotype': 'chemical',
   'name': 'PD 131628',
   'accession': '@CHEMICAL_PD_131628'},
  'text': 'PD 131628',
  'locations': [{'offset': 94, 'length': 9}]},
 {'id': '38',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'aminopyrrolidine',
  'locations': [{'offset': 113, 'length': 16}]},
 {'id': '39',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'fluorocyclopropyl naphthyridine quinolone',
  'locations': [{'offset': 142, 'length': 41}]},
 {'id': '40',
  'infons': {'identifier': '1314',
   'type': 'Species',
   'valid': True,
   'normalized': [1314],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1314,
   'biotype': 's

1332594


[{'id': '55',
  'infons': {'identifier': 'MESH:C078052',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C078052'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C078052',
   'biotype': 'chemical',
   'name': 'pazufloxacin',
   'accession': '@CHEMICAL_pazufloxacin'},
  'text': 'T-3761',
  'locations': [{'offset': 77, 'length': 6}]},
 {'id': '56',
  'infons': {'identifier': 'MESH:D024841',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D024841'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D024841',
   'biotype': 'chemical',
   'name': 'Fluoroquinolones',
   'accession': '@CHEMICAL_Fluoroquinolones'},
  'text': 'fluoroquinolone',
  'locations': [{'offset': 91, 'length': 15}]},
 {'id': '57',
  'infons': {'identifier': 'MESH:D010078',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D010078'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D010078',
   'biotype': 'chemical',
   'name': 'Oxazines',
   'accession': '@CHEMICAL_Oxazines'},
  'text

1482147


[{'id': '34',
  'infons': {'identifier': 'MESH:D000077731',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000077731'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D000077731',
   'biotype': 'chemical',
   'name': 'Meropenem',
   'accession': '@CHEMICAL_Meropenem'},
  'text': 'meropenem',
  'locations': [{'offset': 160, 'length': 9}]},
 {'id': '35',
  'infons': {'identifier': 'MESH:D000077731',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000077731'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D000077731',
   'biotype': 'chemical',
   'name': 'Meropenem',
   'accession': '@CHEMICAL_Meropenem'},
  'text': 'ICI 194,660',
  'locations': [{'offset': 171, 'length': 11}]},
 {'id': '36',
  'infons': {'identifier': 'MESH:C069520',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C069520'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C069520',
   'biotype': 'chemical',
   'name': 'ICI 213689',
   'accession': '@CHEMICAL_ICI_213689'},
  't

4914633


[]

4308412


[{'id': '9',
  'infons': {'identifier': 'MESH:C100307',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C100307'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C100307',
   'biotype': 'chemical',
   'name': 'streptolydigin',
   'accession': '@CHEMICAL_streptolydigin'},
  'text': 'Streptolydigin',
  'locations': [{'offset': 34, 'length': 14}]},
 {'id': '10',
  'infons': {'identifier': 'MESH:C023808',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C023808'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C023808',
   'biotype': 'chemical',
   'name': 'rifamycin SV',
   'accession': '@CHEMICAL_rifamycin_SV'},
  'text': 'rifamycin',
  'locations': [{'offset': 53, 'length': 9}]},
 {'id': '11',
  'infons': {'identifier': 'MESH:C100307',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C100307'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C100307',
   'biotype': 'chemical',
   'name': 'streptolydigin',
   'accession': '@CHEMICAL_streptolydigin'}

19015359


[{'id': '10',
  'infons': {'identifier': 'MESH:D064704',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D064704'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D064704',
   'biotype': 'chemical',
   'name': 'Levofloxacin',
   'accession': '@CHEMICAL_Levofloxacin'},
  'text': 'levofloxacin',
  'locations': [{'offset': 171, 'length': 12}]},
 {'id': '11',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'CHP-105',
  'locations': [{'offset': 214, 'length': 7}]},
 {'id': '12',
  'infons': {'identifier': 'MESH:D064704',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D064704'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D064704',
   'biotype': 'chemical',
   'name': 'Levofloxacin',
   'accession': '@CHEMICAL_Levofloxacin'},
  'text': 'levofloxacin',
  'locations': [{'offset': 367, 'length': 12}]},
 {'id': '13',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'v

19114678


[{'id': '24',
  'infons': {'identifier': 'MESH:C074191',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C074191'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C074191',
   'biotype': 'chemical',
   'name': 'prulifloxacin',
   'accession': '@CHEMICAL_prulifloxacin'},
  'text': 'Prulifloxacin',
  'locations': [{'offset': 163, 'length': 13}]},
 {'id': '25',
  'infons': {'identifier': 'MESH:C074190',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C074190'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C074190',
   'biotype': 'chemical',
   'name': 'ulifloxacin',
   'accession': '@CHEMICAL_ulifloxacin'},
  'text': 'ulifloxacin',
  'locations': [{'offset': 193, 'length': 11}]},
 {'id': '26',
  'infons': {'identifier': 'MESH:D024841',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D024841'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D024841',
   'biotype': 'chemical',
   'name': 'Fluoroquinolones',
   'accession': '@CHEMICAL_Fluoroquinolo

19451282


[{'id': '16',
  'infons': {'identifier': 'MESH:C520838',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C520838'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C520838',
   'biotype': 'chemical',
   'name': 'EDP 420',
   'accession': '@CHEMICAL_EDP_420'},
  'text': 'EDP-420',
  'locations': [{'offset': 113, 'length': 7}]},
 {'id': '17',
  'infons': {'identifier': 'MESH:C520838',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C520838'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C520838',
   'biotype': 'chemical',
   'name': 'EDP 420',
   'accession': '@CHEMICAL_EDP_420'},
  'text': 'EP-013420',
  'locations': [{'offset': 136, 'length': 9}]},
 {'id': '18',
  'infons': {'identifier': 'MESH:C520838',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C520838'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C520838',
   'biotype': 'chemical',
   'name': 'EDP 420',
   'accession': '@CHEMICAL_EDP_420'},
  'text': 'S-013420',
  'locations': [{'o

19105177


[{'id': '25',
  'infons': {'identifier': 'MESH:D014756',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014756'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014756',
   'biotype': 'chemical',
   'name': 'Viomycin',
   'accession': '@CHEMICAL_Viomycin'},
  'text': 'Viomycin',
  'locations': [{'offset': 101, 'length': 8}]},
 {'id': '26',
  'infons': {'identifier': 'MESH:D002207',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002207'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002207',
   'biotype': 'chemical',
   'name': 'Capreomycin',
   'accession': '@CHEMICAL_Capreomycin'},
  'text': 'capreomycin',
  'locations': [{'offset': 114, 'length': 11}]},
 {'id': '27',
  'infons': {'identifier': 'MESH:C015563',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C015563'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C015563',
   'biotype': 'chemical',
   'name': 'tuberactinomycin',
   'accession': '@CHEMICAL_tuberactinomycin'},
  'text':

19738021


[{'id': '11',
  'infons': {'identifier': 'MESH:D014217',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014217'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014217',
   'biotype': 'chemical',
   'name': 'Troleandomycin',
   'accession': '@CHEMICAL_Troleandomycin'},
  'text': 'triacetyloleandomycin',
  'locations': [{'offset': 169, 'length': 21}]},
 {'id': '12',
  'infons': {'identifier': 'MESH:C059646',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C059646'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C059646',
   'biotype': 'chemical',
   'name': 'mycalamide A',
   'accession': '@CHEMICAL_mycalamide_A'},
  'text': 'mycalamide A',
  'locations': [{'offset': 195, 'length': 12}]},
 {'id': '13',
  'infons': {'identifier': '2238',
   'type': 'Species',
   'valid': True,
   'normalized': [2238],
   'database': 'ncbi_taxonomy',
   'normalized_id': 2238,
   'biotype': 'species',
   'name': '2238',
   'accession': None},
  'text': 'Haloarcula marismortu

6931548


[{'id': '28',
  'infons': {'identifier': 'MESH:C015537',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C015537'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C015537',
   'biotype': 'chemical',
   'name': 'thienamycin',
   'accession': '@CHEMICAL_thienamycin'},
  'text': 'thienamycin',
  'locations': [{'offset': 180, 'length': 11}]},
 {'id': '29',
  'infons': {'identifier': 'MESH:D015378',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D015378'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D015378',
   'biotype': 'chemical',
   'name': 'Imipenem',
   'accession': '@CHEMICAL_Imipenem'},
  'text': 'N-formimidoyl thienamycin',
  'locations': [{'offset': 193, 'length': 25}]},
 {'id': '30',
  'infons': {'identifier': 'MESH:D015378',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D015378'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D015378',
   'biotype': 'chemical',
   'name': 'Imipenem',
   'accession': '@CHEMICAL_Imipenem'},
  'text

21194422


[]

21464247


[{'id': '45',
  'infons': {'identifier': 'MESH:C556453',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C556453'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C556453',
   'biotype': 'chemical',
   'name': 'MX-2401',
   'accession': '@CHEMICAL_MX_2401'},
  'text': 'MX-2401',
  'locations': [{'offset': 77, 'length': 7}]},
 {'id': '46',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'calcium-dependent lipopeptide antibiotic',
  'locations': [{'offset': 104, 'length': 40}]},
 {'id': '47',
  'infons': {'identifier': 'MESH:C004423',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C004423'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C004423',
   'biotype': 'chemical',
   'name': 'amphomycin',
   'accession': '@CHEMICAL_amphomycin'},
  'text': 'amphomycin',
  'locations': [{'offset': 158, 'length': 10}]},
 {'id': '48',
  'infons': {'identifier': 'MESH:D016908',
   'ty

22460279


[{'id': '4976',
  'infons': {'identifier': 'MESH:D001424',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D001424'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D001424',
   'biotype': 'disease',
   'name': 'Bacterial Infections',
   'accession': '@DISEASE_Bacterial_Infections'},
  'text': 'bacterial infections',
  'locations': [{'offset': 333, 'length': 20}]},
 {'id': '4977',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'infections',
  'locations': [{'offset': 195, 'length': 10}]}]

21768509


[{'id': '12',
  'infons': {'identifier': 'MESH:D002207',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002207'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002207',
   'biotype': 'chemical',
   'name': 'Capreomycin',
   'accession': '@CHEMICAL_Capreomycin'},
  'text': 'Capreomycin',
  'locations': [{'offset': 92, 'length': 11}]},
 {'id': '13',
  'infons': {'identifier': 'MESH:D014756',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014756'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014756',
   'biotype': 'chemical',
   'name': 'Viomycin',
   'accession': '@CHEMICAL_Viomycin'},
  'text': 'viomycin',
  'locations': [{'offset': 142, 'length': 8}]},
 {'id': '14',
  'infons': {'identifier': '1773',
   'type': 'Species',
   'valid': True,
   'normalized': [1773],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1773,
   'biotype': 'species',
   'name': '1773',
   'accession': None},
  'text': 'Mycobacterium tuberculosis',
  'locations': [{'offs

14742198


[{'id': '44',
  'infons': {'identifier': 'MESH:C461664',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C461664'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C461664',
   'biotype': 'chemical',
   'name': 'NB 2001',
   'accession': '@CHEMICAL_NB_2001'},
  'text': 'NB2001',
  'locations': [{'offset': 253, 'length': 6}]},
 {'id': '45',
  'infons': {'identifier': 'MESH:C482454',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C482454'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C482454',
   'biotype': 'chemical',
   'name': 'NB 2030',
   'accession': '@CHEMICAL_NB_2030'},
  'text': 'NB2030',
  'locations': [{'offset': 264, 'length': 6}]},
 {'id': '46',
  'infons': {'identifier': 'MESH:D002511',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002511'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002511',
   'biotype': 'chemical',
   'name': 'Cephalosporins',
   'accession': '@CHEMICAL_Cephalosporins'},
  'text': 'cephalosporin',
  'l

22346533


[{'id': '26',
  'infons': {'identifier': 'MESH:D002981',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002981'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002981',
   'biotype': 'chemical',
   'name': 'Clindamycin',
   'accession': '@CHEMICAL_Clindamycin'},
  'text': 'clindamycin',
  'locations': [{'offset': 172, 'length': 11}]},
 {'id': '27',
  'infons': {'identifier': 'MESH:D002981',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002981'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002981',
   'biotype': 'chemical',
   'name': 'Clindamycin',
   'accession': '@CHEMICAL_Clindamycin'},
  'text': 'clindamycin',
  'locations': [{'offset': 364, 'length': 11}]},
 {'id': '28',
  'infons': {'identifier': 'MESH:D002981',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002981'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002981',
   'biotype': 'chemical',
   'name': 'Clindamycin',
   'accession': '@CHEMICAL_Clindamycin'},
  'text':

22232283


[{'id': '35',
  'infons': {'identifier': '43767',
   'type': 'Species',
   'valid': True,
   'normalized': [43767],
   'database': 'ncbi_taxonomy',
   'normalized_id': 43767,
   'biotype': 'species',
   'name': '43767',
   'accession': None},
  'text': 'Rhodococcus equi',
  'locations': [{'offset': 109, 'length': 16}]},
 {'id': '36',
  'infons': {'type': 'Disease',
   'valid': False,
   'normalized_id': None,
   'biotype': 'disease'},
  'text': 'rhodococcosis',
  'locations': [{'offset': 147, 'length': 13}]},
 {'id': '37',
  'infons': {'identifier': 'MESH:D007153',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007153'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007153',
   'biotype': 'disease',
   'name': 'Immunologic Deficiency Syndromes',
   'accession': '@DISEASE_Immunologic_Deficiency_Syndromes'},
  'text': 'immunodeficient',
  'locations': [{'offset': 204, 'length': 15}]},
 {'id': '38',
  'infons': {'identifier': '9606',
   'type': 'Species',
   'valid': True

22710113


[{'id': '29',
  'infons': {'identifier': 'MESH:D008712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008712',
   'biotype': 'chemical',
   'name': 'Methicillin',
   'accession': '@CHEMICAL_Methicillin'},
  'text': 'methicillin',
  'locations': [{'offset': 116, 'length': 11}]},
 {'id': '30',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'locations': [{'offset': 138, 'length': 21}]},
 {'id': '31',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'MRSA',
  'locations': [{'offset': 161, 'length': 4}]},
 {'id': '32',
  'infons': {'identifier': 'MESH:D047090',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D047090'],
   'databas

3060240


[{'id': '39',
  'infons': {'identifier': 'MESH:D047090',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D047090'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D047090',
   'biotype': 'chemical',
   'name': 'beta-Lactams',
   'accession': '@CHEMICAL_beta_Lactams'},
  'text': 'beta-lactam',
  'locations': [{'offset': 139, 'length': 11}]},
 {'id': '40',
  'infons': {'identifier': 'MESH:D047090',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D047090'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D047090',
   'biotype': 'chemical',
   'name': 'beta-Lactams',
   'accession': '@CHEMICAL_beta_Lactams'},
  'text': 'beta-lactam',
  'locations': [{'offset': 173, 'length': 11}]},
 {'id': '41',
  'infons': {'identifier': 'MESH:D010406',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D010406'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D010406',
   'biotype': 'chemical',
   'name': 'Penicillins',
   'accession': '@CHEMICAL_Penicillins'},
  'te

23476724


[{'id': '20',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'Muraminomicin',
  'locations': [{'offset': 106, 'length': 13}]},
 {'id': '21',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'lipopeptidyl nucleoside antibiotic',
  'locations': [{'offset': 125, 'length': 34}]},
 {'id': '22',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'Streptosporangium amethystogenes SANK 60709',
  'locations': [{'offset': 172, 'length': 43}]},
 {'id': '23',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'A-90289',
  'locations': [{'offset': 278, 'length': 7}]},
 {'id': '24',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None

23295920


[{'id': '20',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'infections',
  'locations': [{'offset': 157, 'length': 10}]},
 {'id': '21',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'infections',
  'locations': [{'offset': 254, 'length': 10}]},
 {'id': '22',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'oxaborole',
  'locations': [{'offset': 761, 'length': 9}]},
 {'id': '23',
  'infons': {'identifier': 'MESH:D001895',
   'type': 'Chemical',
   'valid'

23741637


[{'id': '9023',
  'infons': {'identifier': '1423',
   'type': 'Species',
   'valid': True,
   'normalized': [1423],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1423,
   'biotype': 'species',
   'name': '1423',
   'accession': None},
  'text': 'Bacillus subtilis',
  'locations': [{'offset': 1013, 'length': 17}]},
 {'id': '9024',
  'infons': {'identifier': '1931',
   'type': 'Species',
   'valid': True,
   'normalized': [1931],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1931,
   'biotype': 'species',
   'name': '1931',
   'accession': None},
  'text': 'Streptomyces sp',
  'locations': [{'offset': 178, 'length': 15}]},
 {'id': '9025',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'alpha2-Rhodomycin II',
  'locations': [{'offset': 1064, 'length': 20}]},
 {'id': '9026',
  'infons': {'identifier': '1924',
   'type': 'Species',
   'valid': True,
   'normalized': [1924],
   'database': '

5132096


[{'id': '23',
  'infons': {'identifier': 'MESH:D002514',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002514'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002514',
   'biotype': 'chemical',
   'name': 'Cephapirin',
   'accession': '@CHEMICAL_Cephapirin'},
  'text': 'Cephapirin',
  'locations': [{'offset': 45, 'length': 10}]},
 {'id': '24',
  'infons': {'identifier': 'MESH:D002511',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002511'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002511',
   'biotype': 'chemical',
   'name': 'Cephalosporins',
   'accession': '@CHEMICAL_Cephalosporins'},
  'text': 'cephalosporin',
  'locations': [{'offset': 77, 'length': 13}]},
 {'id': '25',
  'infons': {'identifier': 'MESH:D002512',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002512'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002512',
   'biotype': 'chemical',
   'name': 'Cephalothin',
   'accession': '@CHEMICAL_Cephalothin'},
  'tex

24100496


[{'id': '24',
  'infons': {'identifier': '1311',
   'type': 'Species',
   'valid': True,
   'normalized': [1311],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1311,
   'biotype': 'species',
   'name': '1311',
   'accession': None},
  'text': 'Streptococcus agalactiae',
  'locations': [{'offset': 178, 'length': 24}]},
 {'id': '25',
  'infons': {'identifier': 'MESH:D016470',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D016470'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D016470',
   'biotype': 'disease',
   'name': 'Bacteremia',
   'accession': '@DISEASE_Bacteremia'},
  'text': 'bacteremia',
  'locations': [{'offset': 227, 'length': 10}]},
 {'id': '26',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'invasive infections',
  'locations': [

24097668


[{'id': '43',
  'infons': {'identifier': 'MESH:D056486',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D056486'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D056486',
   'biotype': 'disease',
   'name': 'Chemical and Drug Induced Liver Injury',
   'accession': '@DISEASE_Chemical_and_Drug_Induced_Liver_Injury'},
  'text': 'Idiosyncratic drug-induced liver injury',
  'locations': [{'offset': 115, 'length': 39}]},
 {'id': '44',
  'infons': {'identifier': 'MESH:D056486',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D056486'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D056486',
   'biotype': 'disease',
   'name': 'Chemical and Drug Induced Liver Injury',
   'accession': '@DISEASE_Chemical_and_Drug_Induced_Liver_Injury'},
  'text': 'IDILI',
  'locations': [{'offset': 156, 'length': 5}]},
 {'id': '45',
  'infons': {'identifier': '9606',
   'type': 'Species',
   'valid': True,
   'normalized': [9606],
   'database': 'ncbi_taxonomy',
   'normalized_id': 9

24121552


[{'id': '7045',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'MAC13772',
  'locations': [{'offset': 895, 'length': 8}]},
 {'id': '7046',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'MAC13772',
  'locations': [{'offset': 744, 'length': 8}]},
 {'id': '7047',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'MAC168425',
  'locations': [{'offset': 769, 'length': 9}]},
 {'id': '7048',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'MAC173979',
  'locations': [{'offset': 730, 'length': 9}]},
 {'id': '7049',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  '

24637688


[{'id': '16',
  'infons': {'identifier': '1314',
   'type': 'Species',
   'valid': True,
   'normalized': [1314],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1314,
   'biotype': 'species',
   'name': '1314',
   'accession': None},
  'text': 'Streptococcus pyogenes',
  'locations': [{'offset': 467, 'length': 22}]},
 {'id': '17',
  'infons': {'identifier': '1314',
   'type': 'Species',
   'valid': True,
   'normalized': [1314],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1314,
   'biotype': 'species',
   'name': '1314',
   'accession': None},
  'text': 'S. pyogenes',
  'locations': [{'offset': 666, 'length': 11}]},
 {'id': '18',
  'infons': {'identifier': '1314',
   'type': 'Species',
   'valid': True,
   'normalized': [1314],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1314,
   'biotype': 'species',
   'name': '1314',
   'accession': None},
  'text': 'S. pyogenes',
  'locations': [{'offset': 895, 'length': 11}]},
 {'id': '19',
  'infons': {'identifier': '1314',
 

23931281


[{'id': '19',
  'infons': {'identifier': 'MESH:C010327',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C010327'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C010327',
   'biotype': 'chemical',
   'name': 'salinomycin',
   'accession': '@CHEMICAL_salinomycin'},
  'text': 'Salinomycin',
  'locations': [{'offset': 77, 'length': 11}]},
 {'id': '20',
  'infons': {'identifier': 'MESH:D009369',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D009369'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009369',
   'biotype': 'disease',
   'name': 'Neoplasms',
   'accession': '@DISEASE_Neoplasms'},
  'text': 'cancer',
  'locations': [{'offset': 176, 'length': 6}]},
 {'id': '21',
  'infons': {'identifier': 'MESH:D009369',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D009369'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009369',
   'biotype': 'disease',
   'name': 'Neoplasms',
   'accession': '@DISEASE_Neoplasms'},
  'text': 'cancer',
  'locatio

25170230


[{'id': '38',
  'infons': {'identifier': 'MESH:D005664',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D005664'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D005664',
   'biotype': 'chemical',
   'name': 'Furazolidone',
   'accession': '@CHEMICAL_Furazolidone'},
  'text': 'furazolidone',
  'locations': [{'offset': 128, 'length': 12}]},
 {'id': '39',
  'infons': {'identifier': '210',
   'type': 'Species',
   'valid': True,
   'normalized': [210],
   'database': 'ncbi_taxonomy',
   'normalized_id': 210,
   'biotype': 'species',
   'name': '210',
   'accession': None},
  'text': 'Helicobacter pylori',
  'locations': [{'offset': 191, 'length': 19}]},
 {'id': '40',
  'infons': {'identifier': '210',
   'type': 'Species',
   'valid': True,
   'normalized': [210],
   'database': 'ncbi_taxonomy',
   'normalized_id': 210,
   'biotype': 'species',
   'name': '210',
   'accession': None},
  'text': 'H. pylori',
  'locations': [{'offset': 212, 'length': 9}]},
 {'id': '41',
  'in

25199778


[{'id': '36',
  'infons': {'identifier': '9606',
   'type': 'Species',
   'valid': True,
   'normalized': [9606],
   'database': 'ncbi_taxonomy',
   'normalized_id': 9606,
   'biotype': 'species',
   'name': '9606',
   'accession': None},
  'text': 'human',
  'locations': [{'offset': 165, 'length': 5}]},
 {'id': '37',
  'infons': {'identifier': '1672',
   'type': 'Gene',
   'ncbi_homologene': '88476',
   'valid': True,
   'normalized': [1672],
   'database': 'ncbi_gene',
   'normalized_id': 1672,
   'biotype': 'gene',
   'name': 'DEFB1',
   'accession': '@GENE_DEFB1'},
  'text': 'hBD-1',
  'locations': [{'offset': 187, 'length': 5}]},
 {'id': '38',
  'infons': {'identifier': '1673',
   'type': 'Gene',
   'ncbi_homologene': '122147',
   'valid': True,
   'normalized': [1673],
   'database': 'ncbi_gene',
   'normalized_id': 1673,
   'biotype': 'gene',
   'name': 'DEFB4A',
   'accession': '@GENE_DEFB4A'},
  'text': 'hBD-2',
  'locations': [{'offset': 197, 'length': 5}]},
 {'id': '39',
  '

25199777


[{'id': '10',
  'infons': {'identifier': '470',
   'type': 'Species',
   'valid': True,
   'normalized': [470],
   'database': 'ncbi_taxonomy',
   'normalized_id': 470,
   'biotype': 'species',
   'name': '470',
   'accession': None},
  'text': 'Acinetobacter baumannii',
  'locations': [{'offset': 180, 'length': 23}]},
 {'id': '11',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'MDRAB',
  'locations': [{'offset': 205, 'length': 5}]},
 {'id': '12',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'infection',
  'locations': [{'offset': 284, 'length': 9}]},
 {'id': '13',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'MDRAB',
  'locations

1103722


[{'id': '17',
  'infons': {'identifier': 'MESH:D000617',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000617'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D000617',
   'biotype': 'chemical',
   'name': 'Aminoglycosides',
   'accession': '@CHEMICAL_Aminoglycosides'},
  'text': 'aminoglycoside',
  'locations': [{'offset': 213, 'length': 14}]},
 {'id': '18',
  'infons': {'identifier': 'MESH:D005839',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D005839'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D005839',
   'biotype': 'chemical',
   'name': 'Gentamicins',
   'accession': '@CHEMICAL_Gentamicins'},
  'text': 'gentamicin',
  'locations': [{'offset': 241, 'length': 10}]},
 {'id': '19',
  'infons': {'identifier': 'MESH:D012853',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D012853'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D012853',
   'biotype': 'chemical',
   'name': 'Sisomicin',
   'accession': '@CHEMICAL_Sisomicin'},
  '

1259401


[{'id': '24',
  'infons': {'identifier': 'MESH:D002436',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002436'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002436',
   'biotype': 'chemical',
   'name': 'Cefatrizine',
   'accession': '@CHEMICAL_Cefatrizine'},
  'text': 'BL-S640',
  'locations': [{'offset': 177, 'length': 7}]},
 {'id': '25',
  'infons': {'identifier': 'MESH:D002436',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002436'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002436',
   'biotype': 'chemical',
   'name': 'Cefatrizine',
   'accession': '@CHEMICAL_Cefatrizine'},
  'text': 'cefatrizine',
  'locations': [{'offset': 186, 'length': 11}]},
 {'id': '26',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'locations': [{'off

25561334


[{'id': '12',
  'infons': {'identifier': 'MESH:D013407',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D013407'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D013407',
   'biotype': 'chemical',
   'name': 'Sulbactam',
   'accession': '@CHEMICAL_Sulbactam'},
  'text': 'Sulbactam',
  'locations': [{'offset': 113, 'length': 9}]},
 {'id': '13',
  'infons': {'identifier': '470',
   'type': 'Species',
   'valid': True,
   'normalized': [470],
   'database': 'ncbi_taxonomy',
   'normalized_id': 470,
   'biotype': 'species',
   'name': '470',
   'accession': None},
  'text': 'Acinetobacter baumannii',
  'locations': [{'offset': 241, 'length': 23}]},
 {'id': '14',
  'infons': {'identifier': 'MESH:D013407',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D013407'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D013407',
   'biotype': 'chemical',
   'name': 'Sulbactam',
   'accession': '@CHEMICAL_Sulbactam'},
  'text': 'sulbactam',
  'locations': [{'offset': 286,

25644122


[]

4680803


[{'id': '15',
  'infons': {'identifier': 'MESH:D001710',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D001710'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D001710',
   'biotype': 'chemical',
   'name': 'Biotin',
   'accession': '@CHEMICAL_Biotin'},
  'text': 'biotin',
  'locations': [{'offset': 111, 'length': 6}]},
 {'id': '16',
  'infons': {'identifier': '47763',
   'type': 'Species',
   'valid': True,
   'normalized': [47763],
   'database': 'ncbi_taxonomy',
   'normalized_id': 47763,
   'biotype': 'species',
   'name': '47763',
   'accession': None},
  'text': 'Streptomyces lydicus',
  'locations': [{'offset': 158, 'length': 20}]},
 {'id': '17',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'beta-methyldethiobiotin',
  'locations': [{'offset': 180, 'length': 23}]},
 {'id': '18',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': 

4597739


[{'id': '16',
  'infons': {'identifier': 'MESH:D013455',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D013455'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D013455',
   'biotype': 'chemical',
   'name': 'Sulfur',
   'accession': '@CHEMICAL_Sulfur'},
  'text': 'sulfur',
  'locations': [{'offset': 103, 'length': 6}]},
 {'id': '17',
  'infons': {'identifier': 'MESH:C006361',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C006361'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C006361',
   'biotype': 'chemical',
   'name': 'acetopyrrothine',
   'accession': '@CHEMICAL_acetopyrrothine'},
  'text': 'thiolutin',
  'locations': [{'offset': 132, 'length': 9}]},
 {'id': '18',
  'infons': {'identifier': '4932',
   'type': 'Species',
   'valid': True,
   'normalized': [4932],
   'database': 'ncbi_taxonomy',
   'normalized_id': 4932,
   'biotype': 'species',
   'name': '4932',
   'accession': None},
  'text': 'Saccharomyces cerevisiae',
  'locations': [{'offset

26168713


[{'id': '20755',
  'infons': {'identifier': 'MESH:C000599190',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C000599190'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C000599190',
   'biotype': 'chemical',
   'name': 'zoliflodacin',
   'accession': '@CHEMICAL_zoliflodacin'},
  'text': 'ETX0914',
  'locations': [{'offset': 922, 'length': 7}]},
 {'id': '20756',
  'infons': {'identifier': 'MESH:D006069',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D006069'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D006069',
   'biotype': 'disease',
   'name': 'Gonorrhea',
   'accession': '@DISEASE_Gonorrhea'},
  'text': 'gonorrhea',
  'locations': [{'offset': 1430, 'length': 9}]},
 {'id': '20757',
  'infons': {'identifier': 'MESH:C000599190',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C000599190'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C000599190',
   'biotype': 'chemical',
   'name': 'zoliflodacin',
   'accession': '@CHEMICAL_zoliflod

26033735


[{'id': '29',
  'infons': {'identifier': 'MESH:C037689',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C037689'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C037689',
   'biotype': 'chemical',
   'name': 'benzamide',
   'accession': '@CHEMICAL_benzamide'},
  'text': 'benzamide',
  'locations': [{'offset': 201, 'length': 9}]},
 {'id': '30',
  'infons': {'identifier': 'MESH:C531944',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C531944'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C531944',
   'biotype': 'chemical',
   'name': 'PC190723',
   'accession': '@CHEMICAL_PC190723'},
  'text': 'PC190723',
  'locations': [{'offset': 226, 'length': 8}]},
 {'id': '31',
  'infons': {'identifier': 'MESH:C531944',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C531944'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C531944',
   'biotype': 'chemical',
   'name': 'PC190723',
   'accession': '@CHEMICAL_PC190723'},
  'text': 'PC190723',
  'locatio

26190576


[{'id': '14',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'CBR',
  'locations': [{'offset': 86, 'length': 3}]},
 {'id': '15',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'hydroxamidines',
  'locations': [{'offset': 90, 'length': 14}]},
 {'id': '16',
  'infons': {'identifier': 'MESH:D011720',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D011720'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D011720',
   'biotype': 'chemical',
   'name': 'Pyrazoles',
   'accession': '@CHEMICAL_Pyrazoles'},
  'text': 'pyrazoles',
  'locations': [{'offset': 252, 'length': 9}]},
 {'id': '17',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'hydroxamidines',
  'locations': [{'offset': 348, 'length': 14}]},
 {'id': '18'

26144346


[{'id': '7',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': '1,2,4-oxadiazole antibiotics',
  'locations': [{'offset': 141, 'length': 28}]},
 {'id': '8',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'locations': [{'offset': 312, 'length': 21}]},
 {'id': '9',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'S. aureus',
  'locations': [{'offset': 576, 'length': 9}]},
 {'id': '10',
  'infons': {'identifier': 'MESH:D008712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008712',
   'biotype': 'chemical',
   'name': 'Methicillin',
   'accession': '@CHE

25995221


[{'id': '28',
  'infons': {'identifier': 'MESH:D000198',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000198'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D000198',
   'biotype': 'chemical',
   'name': 'Spectinomycin',
   'accession': '@CHEMICAL_Spectinomycin'},
  'text': 'spectinomycin',
  'locations': [{'offset': 142, 'length': 13}]},
 {'id': '29',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': "N-benzyl-substituted 3'-(R)-3'-aminomethyl-3'-hydroxy spectinomycins",
  'locations': [{'offset': 367, 'length': 68}]},
 {'id': '30',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'aminomethyl spectinomycin',
  'locations': [{'offset': 498, 'length': 25}]},
 {'id': '31',
  'infons': {'identifier': 'MESH:D000198',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000198'],
   'databa

26625295


[{'id': '12',
  'infons': {'identifier': 'MESH:D005227',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D005227'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D005227',
   'biotype': 'chemical',
   'name': 'Fatty Acids',
   'accession': '@CHEMICAL_Fatty_Acids'},
  'text': 'fatty-acid',
  'locations': [{'offset': 159, 'length': 10}]},
 {'id': '13',
  'infons': {'identifier': 'MESH:D014376',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D014376'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014376',
   'biotype': 'disease',
   'name': 'Tuberculosis',
   'accession': '@DISEASE_Tuberculosis'},
  'text': 'tuberculosis',
  'locations': [{'offset': 263, 'length': 12}]},
 {'id': '14',
  'infons': {'identifier': 'MESH:D007538',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D007538'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007538',
   'biotype': 'chemical',
   'name': 'Isoniazid',
   'accession': '@CHEMICAL_Isoniazid'},
  'text': 'iso

26391612


[]

5697054


[{'id': '10',
  'infons': {'identifier': 'MESH:D014295',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014295'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014295',
   'biotype': 'chemical',
   'name': 'Trimethoprim',
   'accession': '@CHEMICAL_Trimethoprim'},
  'text': 'Trimethoprim',
  'locations': [{'offset': 47, 'length': 12}]},
 {'id': '11',
  'infons': {'identifier': 'MESH:C030985',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C030985'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C030985',
   'biotype': 'chemical',
   'name': 'purine',
   'accession': '@CHEMICAL_purine'},
  'text': 'purine',
  'locations': [{'offset': 120, 'length': 6}]},
 {'id': '12',
  'infons': {'identifier': 'MESH:D013449',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D013449'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D013449',
   'biotype': 'chemical',
   'name': 'Sulfonamides',
   'accession': '@CHEMICAL_Sulfonamides'},
  'text': 'sulphonami

27029317


[{'id': '6502',
  'infons': {'identifier': 'MESH:D023303',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D023303'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D023303',
   'biotype': 'chemical',
   'name': 'Oxazolidinones',
   'accession': '@CHEMICAL_Oxazolidinones'},
  'text': 'oxazolidinones',
  'locations': [{'offset': 1226, 'length': 14}]},
 {'id': '6503',
  'infons': {'identifier': 'MESH:D055666',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D055666'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D055666',
   'biotype': 'chemical',
   'name': 'Lipopeptides',
   'accession': '@CHEMICAL_Lipopeptides'},
  'text': 'lipopeptides',
  'locations': [{'offset': 1328, 'length': 12}]},
 {'id': '6504',
  'infons': {'identifier': 'MESH:D018942',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D018942'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D018942',
   'biotype': 'chemical',
   'name': 'Macrolides',
   'accession': '@CHEMICAL_Macro

26921428


[{'id': '36',
  'infons': {'identifier': 'MESH:D001424',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D001424'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D001424',
   'biotype': 'disease',
   'name': 'Bacterial Infections',
   'accession': '@DISEASE_Bacterial_Infections'},
  'text': 'bacterial',
  'locations': [{'offset': 188, 'length': 9}]},
 {'id': '37',
  'infons': {'identifier': 'MESH:D008712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008712',
   'biotype': 'chemical',
   'name': 'Methicillin',
   'accession': '@CHEMICAL_Methicillin'},
  'text': 'methicillin',
  'locations': [{'offset': 260, 'length': 11}]},
 {'id': '38',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'l

26907184


[{'id': '35',
  'infons': {'identifier': 'MESH:D000077727',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000077727'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D000077727',
   'biotype': 'chemical',
   'name': 'Ertapenem',
   'accession': '@CHEMICAL_Ertapenem'},
  'text': 'ertapenem',
  'locations': [{'offset': 180, 'length': 9}]},
 {'id': '36',
  'infons': {'identifier': 'MESH:D018805',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D018805'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D018805',
   'biotype': 'disease',
   'name': 'Sepsis',
   'accession': '@DISEASE_Sepsis'},
  'text': 'bloodstream infections',
  'locations': [{'offset': 211, 'length': 22}]},
 {'id': '37',
  'infons': {'identifier': 'MESH:D018805',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D018805'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D018805',
   'biotype': 'disease',
   'name': 'Sepsis',
   'accession': '@DISEASE_Sepsis'},
  'text': 'BSI',
  'lo

27215369


[{'id': '16767',
  'infons': {'identifier': 'MESH:D064420',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D064420'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D064420',
   'biotype': 'disease',
   'name': 'Drug-Related Side Effects and Adverse Reactions',
   'accession': '@DISEASE_Drug_Related_Side_Effects_and_Adverse_Reactions'},
  'text': 'toxicity',
  'locations': [{'offset': 913, 'length': 8}]},
 {'id': '16768',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'avarofloxacin',
  'locations': [{'offset': 1000, 'length': 13}]},
 {'id': '16769',
  'infons': {'identifier': 'MESH:C560572',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C560572'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C560572',
   'biotype': 'chemical',
   'name': 'finafloxacin',
   'accession': '@CHEMICAL_finafloxacin'},
  'text': 'finafloxacin',
  'locations': [{'offset': 1029, 'length': 1

27340469


[{'id': '3',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'Muraymycins',
  'locations': [{'offset': 145, 'length': 11}]},
 {'id': '4',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'muraymycins',
  'locations': [{'offset': 513, 'length': 11}]},
 {'id': '5',
  'infons': {'identifier': 'MESH:D014529',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014529'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014529',
   'biotype': 'chemical',
   'name': 'Uridine',
   'accession': '@CHEMICAL_Uridine'},
  'text': 'uridine',
  'locations': [{'offset': 220, 'length': 7}]},
 {'id': '6',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'muraymycin',
  'locations': [{'offset': 621, 'length': 10}]},
 {'id': '7',
  'in

27208767


[{'id': '6',
  'infons': {'identifier': 'MESH:D047090',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D047090'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D047090',
   'biotype': 'chemical',
   'name': 'beta-Lactams',
   'accession': '@CHEMICAL_beta_Lactams'},
  'text': 'beta-lactam',
  'locations': [{'offset': 206, 'length': 11}]},
 {'id': '7',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'BL-BLI',
  'locations': [{'offset': 244, 'length': 6}]},
 {'id': '8',
  'infons': {'identifier': 'MESH:C000594038',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C000594038'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C000594038',
   'biotype': 'chemical',
   'name': 'ceftolozane tazobactam drug combination',
   'accession': '@CHEMICAL_ceftolozane_tazobactam_drug_combination'},
  'text': 'ceftolozane-tazobactam',
  'locations': [{'offset': 266, 'length': 22}]},
 {'id'

26289137


[]

28487682


[{'id': '28746',
  'infons': {'identifier': '7091',
   'type': 'Species',
   'valid': True,
   'normalized': [7091],
   'database': 'ncbi_taxonomy',
   'normalized_id': 7091,
   'biotype': 'species',
   'name': '7091',
   'accession': None},
  'text': 'silkworms',
  'locations': [{'offset': 493, 'length': 9}]},
 {'id': '28747',
  'infons': {'identifier': 'MESH:D008712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008712',
   'biotype': 'chemical',
   'name': 'Methicillin',
   'accession': '@CHEMICAL_Methicillin'},
  'text': 'methicillin',
  'locations': [{'offset': 363, 'length': 11}]},
 {'id': '28748',
  'infons': {'identifier': '1280',
   'type': 'Species',
   'valid': True,
   'normalized': [1280],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1280,
   'biotype': 'species',
   'name': '1280',
   'accession': None},
  'text': 'Staphylococcus aureus',
  'locations': [{'offset': 385, 'length': 21}]},
 {'

4383870


[{'id': '14',
  'infons': {'identifier': 'MESH:D004318',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D004318'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D004318',
   'biotype': 'chemical',
   'name': 'Doxycycline',
   'accession': '@CHEMICAL_Doxycycline'},
  'text': 'Doxycycline',
  'locations': [{'offset': 74, 'length': 11}]},
 {'id': '15',
  'infons': {'identifier': 'MESH:D004318',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D004318'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D004318',
   'biotype': 'chemical',
   'name': 'Doxycycline',
   'accession': '@CHEMICAL_Doxycycline'},
  'text': 'alpha-6-deoxy-oxytetracycline',
  'locations': [{'offset': 87, 'length': 29}]},
 {'id': '16',
  'infons': {'identifier': '629395',
   'type': 'Species',
   'valid': True,
   'normalized': [629395],
   'database': 'ncbi_taxonomy',
   'normalized_id': 629395,
   'biotype': 'species',
   'name': '629395',
   'accession': None},
  'text': 'bacteria',
  'lo

29401640


[{'id': '9708',
  'infons': {'identifier': '7153',
   'type': 'Gene',
   'ncbi_homologene': '830',
   'valid': True,
   'normalized': [7153],
   'database': 'ncbi_gene',
   'normalized_id': 7153,
   'biotype': 'gene',
   'name': 'TOP2A',
   'accession': '@GENE_TOP2A'},
  'text': 'DNA gyrase',
  'locations': [{'offset': 1837, 'length': 10}]},
 {'id': '9709',
  'infons': {'identifier': '7153',
   'type': 'Gene',
   'ncbi_homologene': '830',
   'valid': True,
   'normalized': [7153],
   'database': 'ncbi_gene',
   'normalized_id': 7153,
   'biotype': 'gene',
   'name': 'TOP2A',
   'accession': '@GENE_TOP2A'},
  'text': 'DNA gyrase',
  'locations': [{'offset': 398, 'length': 10}]},
 {'id': '9710',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'NBTIs',
  'locations': [{'offset': 1587, 'length': 5}]},
 {'id': '9711',
  'infons': {'identifier': '629395',
   'type': 'Species',
   'valid': True,
   'norma

29339384


[{'id': '16',
  'infons': {'identifier': 'MESH:D008070',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008070'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008070',
   'biotype': 'chemical',
   'name': 'Lipopolysaccharides',
   'accession': '@CHEMICAL_Lipopolysaccharides'},
  'text': 'lipopolysaccharides',
  'locations': [{'offset': 229, 'length': 19}]},
 {'id': '17',
  'infons': {'identifier': 'MESH:D010743',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D010743'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D010743',
   'biotype': 'chemical',
   'name': 'Phospholipids',
   'accession': '@CHEMICAL_Phospholipids'},
  'text': 'phospholipids',
  'locations': [{'offset': 250, 'length': 13}]},
 {'id': '18',
  'infons': {'identifier': '13877144',
   'type': 'Gene',
   'valid': True,
   'normalized': [13877144],
   'database': 'ncbi_gene',
   'normalized_id': 13877144,
   'biotype': 'gene',
   'name': 'HUS41_pIII0012',
   'accession': '@GENE_HUS41_PII

29600576


[{'id': '38',
  'infons': {'identifier': 'MESH:D002437',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002437'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002437',
   'biotype': 'chemical',
   'name': 'Cefazolin',
   'accession': '@CHEMICAL_Cefazolin'},
  'text': 'cefazolin',
  'locations': [{'offset': 238, 'length': 9}]},
 {'id': '39',
  'infons': {'identifier': 'MESH:D010406',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D010406'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D010406',
   'biotype': 'chemical',
   'name': 'Penicillins',
   'accession': '@CHEMICAL_Penicillins'},
  'text': 'penicillin',
  'locations': [{'offset': 271, 'length': 10}]},
 {'id': '40',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'ASP',
  'locations': [{'offset': 283, 'length': 3}]},
 {'id': '41',
  'infons': {'type': 'Disease',
   'valid': False,
   'normalized_id': None,
 

30869693


[{'id': '19',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'Thiotetronate',
  'locations': [{'offset': 96, 'length': 13}]},
 {'id': '20',
  'infons': {'identifier': 'MESH:C035068',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C035068'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C035068',
   'biotype': 'chemical',
   'name': 'thiolactomycin',
   'accession': '@CHEMICAL_thiolactomycin'},
  'text': 'thiolactomycin',
  'locations': [{'offset': 149, 'length': 14}]},
 {'id': '21',
  'infons': {'identifier': 'MESH:C037482',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C037482'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C037482',
   'biotype': 'chemical',
   'name': 'thiotetromycin',
   'accession': '@CHEMICAL_thiotetromycin'},
  'text': 'thiotetromycin',
  'locations': [{'offset': 165, 'length': 14}]},
 {'id': '22',
  'infons': {'identifier': '-',
   'type':

30858223


[{'id': '31',
  'infons': {'type': 'Disease',
   'valid': False,
   'normalized_id': None,
   'biotype': 'disease'},
  'text': 'ESBLs',
  'locations': [{'offset': 377, 'length': 5}]},
 {'id': '32',
  'infons': {'identifier': 'MESH:C000656730',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C000656730'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C000656730',
   'biotype': 'chemical',
   'name': 'enmetazobactam',
   'accession': '@CHEMICAL_enmetazobactam'},
  'text': 'AAI101',
  'locations': [{'offset': 542, 'length': 6}]},
 {'id': '33',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'penicillanic acid sulfone beta-lactamase inhibitor',
  'locations': [{'offset': 560, 'length': 50}]},
 {'id': '34',
  'infons': {'identifier': 'MESH:D000078142',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D000078142'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D000078142',
  

29396290


[{'id': '20',
  'infons': {'identifier': 'MESH:C013629',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C013629'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C013629',
   'biotype': 'chemical',
   'name': 'octapeptin antibiotics',
   'accession': '@CHEMICAL_octapeptin_antibiotics'},
  'text': 'octapeptins',
  'locations': [{'offset': 327, 'length': 11}]},
 {'id': '21',
  'infons': {'identifier': 'MESH:D055666',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D055666'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D055666',
   'biotype': 'chemical',
   'name': 'Lipopeptides',
   'accession': '@CHEMICAL_Lipopeptides'},
  'text': 'lipopeptides',
  'locations': [{'offset': 351, 'length': 12}]},
 {'id': '22',
  'infons': {'identifier': 'MESH:C013629',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C013629'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C013629',
   'biotype': 'chemical',
   'name': 'octapeptin antibiotics',
   'accession':

31064143


[{'id': '27392',
  'infons': {'identifier': 'MESH:D061065',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D061065'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D061065',
   'biotype': 'chemical',
   'name': 'Polyketides',
   'accession': '@CHEMICAL_Polyketides'},
  'text': 'polyketides',
  'locations': [{'offset': 601, 'length': 11}]},
 {'id': '27393',
  'infons': {'identifier': 'MESH:D061065',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D061065'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D061065',
   'biotype': 'chemical',
   'name': 'Polyketides',
   'accession': '@CHEMICAL_Polyketides'},
  'text': 'polyketides',
  'locations': [{'offset': 561, 'length': 11}]},
 {'id': '27394',
  'infons': {'identifier': 'MESH:D002784',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D002784'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D002784',
   'biotype': 'chemical',
   'name': 'Cholesterol',
   'accession': '@CHEMICAL_Cholesterol'},


31303992


[{'id': '11',
  'infons': {'identifier': 'MESH:D009428',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D009428'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009428',
   'biotype': 'chemical',
   'name': 'Netilmicin',
   'accession': '@CHEMICAL_Netilmicin'},
  'text': 'netilmicin',
  'locations': [{'offset': 128, 'length': 10}]},
 {'id': '12',
  'infons': {'identifier': 'MESH:D009428',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D009428'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009428',
   'biotype': 'chemical',
   'name': 'Netilmicin',
   'accession': '@CHEMICAL_Netilmicin'},
  'text': 'netilmicin',
  'locations': [{'offset': 217, 'length': 10}]},
 {'id': '13',
  'infons': {'identifier': 'MESH:C010686',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C010686'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C010686',
   'biotype': 'chemical',
   'name': 'benzeneboronic acid',
   'accession': '@CHEMICAL_benzeneboronic_acid'},

32435426


[{'id': '1540',
  'infons': {'identifier': 'MESH:D011691',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D011691'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D011691',
   'biotype': 'chemical',
   'name': 'Puromycin',
   'accession': '@CHEMICAL_Puromycin'},
  'text': 'puromycin',
  'locations': [{'offset': 1206, 'length': 9}]},
 {'id': '1541',
  'infons': {'identifier': 'MESH:D011691',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D011691'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D011691',
   'biotype': 'chemical',
   'name': 'Puromycin',
   'accession': '@CHEMICAL_Puromycin'},
  'text': 'Puromycin',
  'locations': [{'offset': 698, 'length': 9}]},
 {'id': '1542',
  'infons': {'identifier': 'MESH:D011691',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D011691'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D011691',
   'biotype': 'chemical',
   'name': 'Puromycin',
   'accession': '@CHEMICAL_Puromycin'},
  'text': 'Puromycin

32636816


[{'id': '27598',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'IMB-H4',
  'locations': [{'offset': 1065, 'length': 6}]},
 {'id': '27599',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'infection disease',
  'locations': [{'offset': 238, 'length': 17}]},
 {'id': '27600',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'IMB-H4',
  'locations': [{'offset': 1174, 'length': 6}]},
 {'id': '27601',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'IMB-H4',
  'locations': [{'offset': 889, 'length': 6}]},
 {'

32917596


[{'id': '24255',
  'infons': {'identifier': 'MESH:D013203',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D013203'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D013203',
   'biotype': 'disease',
   'name': 'Staphylococcal Infections',
   'accession': '@DISEASE_Staphylococcal_Infections'},
  'text': 'MRSA infections',
  'locations': [{'offset': 223, 'length': 15}]}]

32712655


[]

32978140


[{'id': '46',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'Nonribosomal peptides',
  'locations': [{'offset': 125, 'length': 21}]},
 {'id': '47',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'NRPs',
  'locations': [{'offset': 148, 'length': 4}]},
 {'id': '48',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'Brevibacillus spp',
  'locations': [{'offset': 322, 'length': 17}]},
 {'id': '49',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'NRPs',
  'locations': [{'offset': 362, 'length': 4}]},
 {'id': '50',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'bogorol',
  

33412557


[{'id': '5499',
  'infons': {'identifier': 'MESH:D009547',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D009547'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009547',
   'biotype': 'chemical',
   'name': 'Nifurtimox',
   'accession': '@CHEMICAL_Nifurtimox'},
  'text': 'Nifurtimox',
  'locations': [{'offset': 209, 'length': 10}]},
 {'id': '5500',
  'infons': {'identifier': '9606',
   'type': 'Species',
   'valid': True,
   'normalized': [9606],
   'database': 'ncbi_taxonomy',
   'normalized_id': 9606,
   'biotype': 'species',
   'name': '9606',
   'accession': None},
  'text': 'patients',
  'locations': [{'offset': 1242, 'length': 8}]},
 {'id': '5501',
  'infons': {'identifier': 'MESH:D014355',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D014355'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014355',
   'biotype': 'disease',
   'name': 'Chagas Disease',
   'accession': '@DISEASE_Chagas_Disease'},
  'text': 'Chagas disease',
  'locations': [{'of

33627412


[{'id': '4393',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'infections',
  'locations': [{'offset': 1730, 'length': 10}]},
 {'id': '4394',
  'infons': {'identifier': '91347',
   'type': 'Species',
   'valid': True,
   'normalized': [91347],
   'database': 'ncbi_taxonomy',
   'normalized_id': 91347,
   'biotype': 'species',
   'name': '91347',
   'accession': None},
  'text': 'Enterobacterales',
  'locations': [{'offset': 451, 'length': 16}]},
 {'id': '4395',
  'infons': {'type': 'Disease',
   'valid': False,
   'normalized_id': None,
   'biotype': 'disease'},
  'text': 'nephrotoxicity',
  'locations': [{'offset': 1383, 'length': 14}]},
 {'id': '4396',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239']

32658473


[{'id': '22665',
  'infons': {'identifier': '7872529',
   'type': 'Gene',
   'valid': True,
   'normalized': [7872529],
   'database': 'ncbi_gene',
   'normalized_id': 7872529,
   'biotype': 'gene',
   'name': 'ampC',
   'accession': '@GENE_AMPC'},
  'text': 'beta-lactamase',
  'locations': [{'offset': 798, 'length': 14}]},
 {'id': '22666',
  'infons': {'identifier': '7872529',
   'type': 'Gene',
   'valid': True,
   'normalized': [7872529],
   'database': 'ncbi_gene',
   'normalized_id': 7872529,
   'biotype': 'gene',
   'name': 'ampC',
   'accession': '@GENE_AMPC'},
  'text': 'beta-Lactamase',
  'locations': [{'offset': 389, 'length': 14}]},
 {'id': '22667',
  'infons': {'identifier': 'MESH:D016905',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D016905'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D016905',
   'biotype': 'disease',
   'name': 'Gram-Negative Bacterial Infections',
   'accession': '@DISEASE_Gram_Negative_Bacterial_Infections'},
  'text': 'Gram-negat

33917912


[{'id': '14285',
  'infons': {'identifier': 'MESH:D014634',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014634'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014634',
   'biotype': 'chemical',
   'name': 'Valinomycin',
   'accession': '@CHEMICAL_Valinomycin'},
  'text': 'valinomycin',
  'locations': [{'offset': 665, 'length': 11}]},
 {'id': '14286',
  'infons': {'identifier': 'MESH:D014634',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014634'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014634',
   'biotype': 'chemical',
   'name': 'Valinomycin',
   'accession': '@CHEMICAL_Valinomycin'},
  'text': 'valinomycin',
  'locations': [{'offset': 991, 'length': 11}]},
 {'id': '14287',
  'infons': {'identifier': 'MESH:D014634',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014634'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014634',
   'biotype': 'chemical',
   'name': 'Valinomycin',
   'accession': '@CHEMICAL_Valinomycin'},


33996753


[{'id': '34785',
  'infons': {'identifier': 'MESH:C539430',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C539430'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C539430',
   'biotype': 'chemical',
   'name': 'cefilavancin',
   'accession': '@CHEMICAL_cefilavancin'},
  'text': 'TD-1792',
  'locations': [{'offset': 625, 'length': 7}]},
 {'id': '34786',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'DSTA4637S',
  'locations': [{'offset': 1233, 'length': 9}]},
 {'id': '34787',
  'infons': {'identifier': 'MESH:D016470',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D016470'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D016470',
   'biotype': 'disease',
   'name': 'Bacteremia',
   'accession': '@DISEASE_Bacteremia'},
  'text': 'bacteremia',
  'locations': [{'offset': 1299, 'length': 10}]},
 {'id': '34788',
  'infons': {'identifier': 'MESH:C000619733',
   'type': 'C

34191513


[{'id': '4047',
  'infons': {'identifier': '7872529',
   'type': 'Gene',
   'valid': True,
   'normalized': [7872529],
   'database': 'ncbi_gene',
   'normalized_id': 7872529,
   'biotype': 'gene',
   'name': 'ampC',
   'accession': '@GENE_AMPC'},
  'text': 'beta-lactamase',
  'locations': [{'offset': 250, 'length': 14}]},
 {'id': '4048',
  'infons': {'identifier': '7872529',
   'type': 'Gene',
   'valid': True,
   'normalized': [7872529],
   'database': 'ncbi_gene',
   'normalized_id': 7872529,
   'biotype': 'gene',
   'name': 'ampC',
   'accession': '@GENE_AMPC'},
  'text': 'beta-lactamase',
  'locations': [{'offset': 302, 'length': 14}]},
 {'id': '4049',
  'infons': {'identifier': '7872529',
   'type': 'Gene',
   'valid': True,
   'normalized': [7872529],
   'database': 'ncbi_gene',
   'normalized_id': 7872529,
   'biotype': 'gene',
   'name': 'ampC',
   'accession': '@GENE_AMPC'},
  'text': 'beta-lactamase',
  'locations': [{'offset': 1040, 'length': 14}]},
 {'id': '4050',
  'infon

33875545


[]

32084340


[{'id': '8',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'Hub',
  'locations': [{'offset': 393, 'length': 3}]},
 {'id': '9',
  'infons': {'identifier': 'MESH:C000717882',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C000717882'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C000717882',
   'biotype': 'chemical',
   'name': 'SU 3327',
   'accession': '@CHEMICAL_SU_3327'},
  'text': 'halicin',
  'locations': [{'offset': 397, 'length': 7}]},
 {'id': '10',
  'infons': {'identifier': '1773',
   'type': 'Species',
   'valid': True,
   'normalized': [1773],
   'database': 'ncbi_taxonomy',
   'normalized_id': 1773,
   'biotype': 'species',
   'name': '1773',
   'accession': None},
  'text': 'Mycobacterium tuberculosis',
  'locations': [{'offset': 561, 'length': 26}]},
 {'id': '11',
  'infons': {'identifier': 'MESH:D015780',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['

34452252


[{'id': '29003',
  'infons': {'identifier': 'MESH:D015363',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D015363'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D015363',
   'biotype': 'chemical',
   'name': 'Quinolones',
   'accession': '@CHEMICAL_Quinolones'},
  'text': 'quinolones',
  'locations': [{'offset': 419, 'length': 10}]},
 {'id': '29004',
  'infons': {'identifier': 'MESH:C480202',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C480202'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C480202',
   'biotype': 'chemical',
   'name': 'zabofloxacin',
   'accession': '@CHEMICAL_zabofloxacin'},
  'text': 'zabofloxacin',
  'locations': [{'offset': 1005, 'length': 12}]},
 {'id': '29005',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'delafoxacin',
  'locations': [{'offset': 911, 'length': 11}]},
 {'id': '29006',
  'infons': {'identifier': 'MESH:D015363',
   't

34436264


[{'id': '33930',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'desertomycin H.',
  'locations': [{'offset': 1414, 'length': 15}]},
 {'id': '33931',
  'infons': {'identifier': 'MESH:D007239',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D007239'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D007239',
   'biotype': 'disease',
   'name': 'Infections',
   'accession': '@DISEASE_Infections'},
  'text': 'infections',
  'locations': [{'offset': 145, 'length': 10}]},
 {'id': '33932',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'macrolactone',
  'locations': [{'offset': 1380, 'length': 12}]},
 {'id': '33933',
  'infons': {'identifier': 'MESH:D014640',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D014640'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D014640',
   'biotype': '

34895348


[]

33657598


[{'id': '21',
  'infons': {'identifier': 'MESH:C508887',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C508887'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C508887',
   'biotype': 'chemical',
   'name': 'retapamulin',
   'accession': '@CHEMICAL_retapamulin'},
  'text': 'Retapamulin',
  'locations': [{'offset': 115, 'length': 11}]},
 {'id': '22',
  'infons': {'identifier': 'MESH:D016712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D016712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D016712',
   'biotype': 'chemical',
   'name': 'Mupirocin',
   'accession': '@CHEMICAL_Mupirocin'},
  'text': 'mupirocin',
  'locations': [{'offset': 172, 'length': 9}]},
 {'id': '23',
  'infons': {'identifier': 'MESH:D008712',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008712'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D008712',
   'biotype': 'chemical',
   'name': 'Methicillin',
   'accession': '@CHEMICAL_Methicillin'},
  'text': 'methi

35009233


[{'id': '20070',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'SurgihoneyRO',
  'locations': [{'offset': 1697, 'length': 12}]},
 {'id': '20071',
  'infons': {'identifier': 'MESH:C016240',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C016240'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C016240',
   'biotype': 'chemical',
   'name': 'polycaprolactone',
   'accession': '@CHEMICAL_polycaprolactone'},
  'text': 'polycaprolactone',
  'locations': [{'offset': 911, 'length': 16}]},
 {'id': '20072',
  'infons': {'identifier': 'MESH:D011108',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D011108'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D011108',
   'biotype': 'chemical',
   'name': 'Polymers',
   'accession': '@CHEMICAL_Polymers'},
  'text': 'polymer',
  'locations': [{'offset': 1302, 'length': 7}]},
 {'id': '20073',
  'infons': {'identifier': 'MESH:D007239',

35100868


[]

34969066


[]

10049250


[{'id': '44',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'CL 188,624',
  'locations': [{'offset': 95, 'length': 10}]},
 {'id': '45',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'CL 190,294',
  'locations': [{'offset': 107, 'length': 10}]},
 {'id': '46',
  'infons': {'identifier': 'MESH:C119421',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['C119421'],
   'database': 'ncbi_mesh',
   'normalized_id': 'C119421',
   'biotype': 'chemical',
   'name': 'CL 191121',
   'accession': '@CHEMICAL_CL_191121'},
  'text': 'CL 191,121',
  'locations': [{'offset': 123, 'length': 10}]},
 {'id': '47',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'aminomethyl tetrahydrofuranyl (THF)-1 beta-methylcarbapenems',
  'locat

10722483


[{'id': '25',
  'infons': {'identifier': 'MESH:D024841',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D024841'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D024841',
   'biotype': 'chemical',
   'name': 'Fluoroquinolones',
   'accession': '@CHEMICAL_Fluoroquinolones'},
  'text': 'fluoroquinolones',
  'locations': [{'offset': 196, 'length': 16}]},
 {'id': '26',
  'infons': {'identifier': 'MESH:D024841',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D024841'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D024841',
   'biotype': 'chemical',
   'name': 'Fluoroquinolones',
   'accession': '@CHEMICAL_Fluoroquinolones'},
  'text': 'fluoroquinolone',
  'locations': [{'offset': 221, 'length': 15}]},
 {'id': '27',
  'infons': {'identifier': 'MESH:D015366',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D015366'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D015366',
   'biotype': 'chemical',
   'name': 'Pefloxacin',
   'accession': '@CHEMI

35411221


[{'id': '41',
  'infons': {'identifier': 'MESH:D001749',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D001749'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D001749',
   'biotype': 'disease',
   'name': 'Urinary Bladder Neoplasms',
   'accession': '@DISEASE_Urinary_Bladder_Neoplasms'},
  'text': 'Bladder cancer',
  'locations': [{'offset': 152, 'length': 14}]},
 {'id': '42',
  'infons': {'identifier': 'MESH:D009369',
   'type': 'Disease',
   'valid': True,
   'normalized': ['D009369'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009369',
   'biotype': 'disease',
   'name': 'Neoplasms',
   'accession': '@DISEASE_Neoplasms'},
  'text': 'cancers',
  'locations': [{'offset': 195, 'length': 7}]},
 {'id': '43',
  'infons': {'identifier': '23411',
   'type': 'Gene',
   'ncbi_homologene': '56556',
   'valid': True,
   'normalized': [23411],
   'database': 'ncbi_gene',
   'normalized_id': 23411,
   'biotype': 'gene',
   'name': 'SIRT1',
   'accession': '@GENE_SIRT1'},
 

11709337


[{'id': '32',
  'infons': {'identifier': 'MESH:D015363',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D015363'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D015363',
   'biotype': 'chemical',
   'name': 'Quinolones',
   'accession': '@CHEMICAL_Quinolones'},
  'text': 'quinolones',
  'locations': [{'offset': 180, 'length': 10}]},
 {'id': '33',
  'infons': {'type': 'Species',
   'valid': False,
   'normalized_id': None,
   'biotype': 'species'},
  'text': 'Staphylococcus aureus MS5935',
  'locations': [{'offset': 283, 'length': 28}]},
 {'id': '34',
  'infons': {'identifier': 'MESH:D009643',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D009643'],
   'database': 'ncbi_mesh',
   'normalized_id': 'D009643',
   'biotype': 'chemical',
   'name': 'Norfloxacin',
   'accession': '@CHEMICAL_Norfloxacin'},
  'text': 'norfloxacin',
  'locations': [{'offset': 330, 'length': 11}]},
 {'id': '35',
  'infons': {'identifier': 'MESH:C062127',
   'type': 'Chemical',
   'v

35723082


[]

36290043


[{'id': '37931',
  'infons': {'identifier': '562',
   'type': 'Species',
   'valid': True,
   'normalized': [562],
   'database': 'ncbi_taxonomy',
   'normalized_id': 562,
   'biotype': 'species',
   'name': '562',
   'accession': None},
  'text': 'Escherichia coli',
  'locations': [{'offset': 1638, 'length': 16}]},
 {'id': '37932',
  'infons': {'identifier': '4932',
   'type': 'Species',
   'valid': True,
   'normalized': [4932],
   'database': 'ncbi_taxonomy',
   'normalized_id': 4932,
   'biotype': 'species',
   'name': '4932',
   'accession': None},
  'text': 'yeast',
  'locations': [{'offset': 865, 'length': 5}]},
 {'id': '37933',
  'infons': {'identifier': '-',
   'type': 'Chemical',
   'valid': False,
   'normalized_id': None,
   'biotype': 'chemical'},
  'text': 'IMB-0042',
  'locations': [{'offset': 1118, 'length': 8}]},
 {'id': '37934',
  'infons': {'identifier': 'MESH:D008070',
   'type': 'Chemical',
   'valid': True,
   'normalized': ['D008070'],
   'database': 'ncbi_mesh',

In [None]:
# Show the rows whose 'PubTator' entry is empty (length below 1).
pos_df[ pos_df['PubTator'].str.len() < 1 ]

Unnamed: 0,PMC_ID,PMID,Title,Abstract,T5,Alpaca,LaMini,Score,Answer,Unnamed: 9,PubTator
25,2466982.0,4914633,Cephalexin--a new oral antibiotic.,"The pharmacology, antimicrobial activity and c...",<pad> yes</s>,Yes,Yes.,3.0,YES,,[]
33,3024282.0,21194422,An open randomized clinical trial in comparing...,Several studies have demonstrated the efficacy...,<pad> yes</s>,No; yes,Yes. For AS + SMP FDC; the same drugs are used...,2.5,YES,,[]
35,3167646.0,22460279,Host defence peptides: antimicrobial and immun...,The rapidly increasing incidence of multidrug-...,<pad> yes</s>,Yes,Yes.,3.0,YES,,[]
57,4359184.0,25644122,Pharmacokinetics of cefozopran by single and m...,Cefozopran is a parenteral cephalosporin with ...,<pad> yes</s>,Yes,Yes.,3.0,YES,,[]
66,4675762.0,26391612,In Vitro Activity of Oral Cephalosporins (Cefp...,The global emergence of pathogens of urinary-t...,<pad> yes</s>,Yes,Yes.,3.0,YES,,[]
74,5042094.0,26289137,Evidence for the use of demeclocycline in the ...,Hyponatraemia (HN) is the most common electrol...,<pad> no</s>,Yes; yes,No.,1.0,NO,,[]
87,7467700.0,32917596,Globally deimmunized lysostaphin evades human ...,There is a critical need for novel therapies t...,<pad> yes</s>,yes,No.,2.0,YES,,[]
88,7566547.0,32712655,"High in vitro activity of DIS-73285, a novel a...",The rising incidence of antimicrobial resistan...,<pad> yes</s>,yes,Yes.,3.0,YES,,[]
96,8316002.0,33875545,Inhibition of Escherichia coli Lipoprotein Dia...,Lipoprotein diacylglyceryl transferase (Lgt) c...,<pad> yes</s>,Yes,Yes.,3.0,YES,,[]
100,8665510.0,34895348,A fresh look at the role of spiramycin in prev...,We aimed to investigate the effect of antepart...,<pad> yes</s>,Yes.,Yes.,3.0,YES,,[]


In [None]:
def pubtator_process(id):
    """Fetch the PubTator3 annotations of one publication's abstract.

    Downloads the BioC-JSON export for the given PMID, keeps the passages
    whose ``infons['type']`` is ``'abstract'``, merges their annotations and
    hands them to ``pubtator_generate_struct``.

    Parameters
    ----------
    id : int or str
        PubMed identifier interpolated into the request URL.

    Returns
    -------
    list of dict
        The structures produced by ``pubtator_generate_struct``, ordered by
        ``location['start']``. Empty when the response holds no document or
        the abstract passages carry no annotations.

    Raises
    ------
    requests.HTTPError
        If the API answers with a 4xx/5xx status.
    requests.Timeout
        If the API does not answer within the timeout.
    """
    url = f"https://www.ncbi.nlm.nih.gov/research/pubtator3-api/publications/export/biocjson?pmids={id}&full=true"
    # Print first so the failing PMID is visible even when the request raises.
    print(id)
    try:
        # A timeout keeps one stalled connection from hanging the whole run.
        res = requests.get(url, timeout=30)
        # Fail loudly on an error status instead of parsing an error page.
        res.raise_for_status()
        documents = res.json().get('PubTator3') or []
    finally:
        # Pause after every request, successful or not
        # (presumably to stay under the API rate limit -- TODO confirm).
        time.sleep(0.6)

    if not documents:
        return []

    # Only working with abstracts; an abstract may span several passages,
    # so flatten the annotations of all of them into one list.
    abstract_annotations = [
        annotation
        for passage in documents[0].get('passages', [])
        if passage.get('infons', {}).get('type') == 'abstract'
        for annotation in passage.get('annotations', [])
    ]
    pubt_res = pubtator_generate_struct(abstract_annotations)

    return sorted(pubt_res, key=lambda d: d['location']['start'])

In [None]:
# Display pos_df to inspect the 'PubTator' column.
pos_df

Unnamed: 0,PMC_ID,PMID,Title,Abstract,T5,Alpaca,LaMini,Score,Answer,Unnamed: 9,PubTator
0,101622.0,11036042,RNA polymerase inhibitors with activity agains...,A collection of rifampin-resistant mutants of ...,<pad> yes</s>,Yes,Yes.,3,YES,,"[{'text': 'rifampin', 'location': {'start': 11..."
1,10187937.0,37192172,Streptothricin F is a bactericidal antibiotic ...,The streptothricin natural product mixture (al...,<pad> yes</s>,yes,The context does not provide information on wh...,2.5,YES,,"[{'text': 'steptolidine', 'location': {'start'..."
2,1162199.0,6258580,Interaction of pseudomonic acid A with Escheri...,Sodium pseudomonate was shown to be a powerful...,<pad> yes</s>,Yes.,The context describes the active inhibition an...,3,YES,,"[{'text': 'Sodium pseudomonate', 'location': {..."
3,1251517.0,16189117,"Efficacy of telavancin (TD-6424), a rapidly ba...","The efficacy of telavancin, a bactericidal lip...",<pad> yes</s>,Yes,Yes.,3,YES,,"[{'text': 'telavancin', 'location': {'start': ..."
4,1482072.0,13681272,Pharmacology of methicillin.,The pharmacology of a new antibiotic methicill...,<pad> yes</s>,antimicrobial,Yes.,2.5,YES,,"[{'text': 'methicillin', 'location': {'start':..."
...,...,...,...,...,...,...,...,...,...,...,...
106,89784.0,10722483,Pefloxacin-induced achilles tendon toxicity in...,Despite a relatively low incidence of serious ...,<pad> no</s>,Yes,No.,1,NO,,"[{'text': 'fluoroquinolones', 'location': {'st..."
107,8984893.0,35411221,Antibiotic heliomycin and its water-soluble 4-...,Bladder cancer is one of the most frequent can...,<pad> yes</s>,Yes; no,Yes.,2.5,YES,,"[{'text': 'water', 'location': {'start': 483, ..."
108,90866.0,11709337,Target preference of 15 quinolones against Sta...,The antibacterial activities and target inhibi...,<pad> yes</s>,Yes,No.,2,YES,,"[{'text': 'quinolones', 'location': {'start': ..."
109,9225766.0,35723082,Re-establishing the utility of tetracycline-cl...,The progressive increase in antibiotic resista...,<pad> yes</s>,Yes,Yes.,3,YES,,[]


In [None]:
def collapse_pubtator(row):
    """Return the distinct annotation texts of one 'PubTator' cell.

    Parameters
    ----------
    row : iterable of dict
        Annotation structures, each carrying a ``'text'`` key.

    Returns
    -------
    list
        Every text exactly once, in order of first appearance in ``row``.
    """
    # dict.fromkeys de-duplicates while keeping insertion order; going through
    # a set would yield a hash-dependent order that changes between runs.
    return list(dict.fromkeys(d['text'] for d in row))

# Add a column holding, for each row, the list that collapse_pubtator
# builds from that row's 'PubTator' cell, then display the frame.
pos_df['PubTator_simplified'] = pos_df['PubTator'].apply(collapse_pubtator)
pos_df

Unnamed: 0,PMC_ID,PMID,Title,Abstract,T5,Alpaca,LaMini,Score,Answer,Unnamed: 9,PubTator,PubTator_simplified
0,101622.0,11036042,RNA polymerase inhibitors with activity agains...,A collection of rifampin-resistant mutants of ...,<pad> yes</s>,Yes,Yes.,3,YES,,"[{'text': 'rifampin', 'location': {'start': 11...","[corallopyronin A, streptolydigin, sorangicin ..."
1,10187937.0,37192172,Streptothricin F is a bactericidal antibiotic ...,The streptothricin natural product mixture (al...,<pad> yes</s>,yes,The context does not provide information on wh...,2.5,YES,,"[{'text': 'steptolidine', 'location': {'start'...","[guanine, streptothricin, streptothricin D, st..."
2,1162199.0,6258580,Interaction of pseudomonic acid A with Escheri...,Sodium pseudomonate was shown to be a powerful...,<pad> yes</s>,Yes.,The context describes the active inhibition an...,3,YES,,"[{'text': 'Sodium pseudomonate', 'location': {...","[isoleucine, [14C]isoleucine, Sodium [9'-3H]ps..."
3,1251517.0,16189117,"Efficacy of telavancin (TD-6424), a rapidly ba...","The efficacy of telavancin, a bactericidal lip...",<pad> yes</s>,Yes,Yes.,3,YES,,"[{'text': 'telavancin', 'location': {'start': ...","[vancomycin, lipoglycopeptide, methicillin, te..."
4,1482072.0,13681272,Pharmacology of methicillin.,The pharmacology of a new antibiotic methicill...,<pad> yes</s>,antimicrobial,Yes.,2.5,YES,,"[{'text': 'methicillin', 'location': {'start':...","[penicillin G., penicillin G, methicillin, 6(2..."
...,...,...,...,...,...,...,...,...,...,...,...,...
106,89784.0,10722483,Pefloxacin-induced achilles tendon toxicity in...,Despite a relatively low incidence of serious ...,<pad> no</s>,Yes,No.,1,NO,,"[{'text': 'fluoroquinolones', 'location': {'st...","[radiosulfate, fluoroquinolones, Pefloxacin, N..."
107,8984893.0,35411221,Antibiotic heliomycin and its water-soluble 4-...,Bladder cancer is one of the most frequent can...,<pad> yes</s>,Yes; no,Yes.,2.5,YES,,"[{'text': 'water', 'location': {'start': 483, ...","[4-(tert-butylamino)methyl, water, heliomycin,..."
108,90866.0,11709337,Target preference of 15 quinolones against Sta...,The antibacterial activities and target inhibi...,<pad> yes</s>,Yes,No.,2,YES,,"[{'text': 'quinolones', 'location': {'start': ...","[ofloxacin, Type III quinolones, II quinolones..."
109,9225766.0,35723082,Re-establishing the utility of tetracycline-cl...,The progressive increase in antibiotic resista...,<pad> yes</s>,Yes,Yes.,3,YES,,[],[]


In [None]:
# Write the selected columns to 'DatasetPositivo.xlsx', leaving out the index.
# NOTE(review): 'PubTator' and 'PubTator_simplified' hold Python lists; they are
# presumably stored as their string representation -- confirm before reading back.
pos_df.to_excel('DatasetPositivo.xlsx', columns=["PMC_ID","PMID","Title","Abstract","PubTator","PubTator_simplified"], index=False)