In [1]:
import sys

from adeft import available_shortforms
from adeft.disambiguate import load_disambiguator
from adeft_indra.s3 import model_to_s3

In [2]:
# Load one disambiguator per entry in adeft's `available_shortforms`,
# keyed by the shortform it was loaded for.
disambiguators = dict(
    (name, load_disambiguator(name)) for name in available_shortforms
)

In [3]:
# For every loaded model, pull out its `grounding_dict` attribute so all
# groundings can be inspected side by side, keyed by shortform.
grounding_dicts = {
    name: disambiguators[name].grounding_dict for name in disambiguators
}

In [4]:
# Display the grounding dictionaries of all loaded models at once. The
# rendered output is very long because every shortform is included.
# NOTE(review): this looks like a scan for identifiers with inconsistent
# namespace prefixes (e.g. 'CHEBI:...' vs 'CHEBI:CHEBI:...') - confirm.
grounding_dicts

{'PC': {'PC': {'phosphatidylcholine': 'CHEBI:CHEBI:64482',
   'cancer': 'ungrounded',
   'cells': 'ungrounded',
   'protein c': 'HGNC:9451',
   'preconditioning': 'ungrounded',
   'pyruvate carboxylase': 'HGNC:8636',
   'phosphocholine': 'ungrounded',
   'phosphorylcholine': 'ungrounded',
   'protein carbonyl': 'MESH:D050050',
   'es li': 'ungrounded',
   'principal component': 'ungrounded',
   'peritoneal carcinomatosis': 'ungrounded',
   'platelet concentrations': 'ungrounded',
   'complex': 'ungrounded',
   'phosphatidyl choline': 'CHEBI:CHEBI:64482',
   'cortex': 'ungrounded',
   'control': 'ungrounded',
   'care': 'ungrounded',
   'carcinoma': 'ungrounded',
   'pericytes': 'ungrounded',
   'phycocyanin': 'ungrounded',
   'portland cement': 'ungrounded',
   'polycarbonate': 'ungrounded',
   'plastocyanin': 'ungrounded',
   'pachyonychia congenita': 'ungrounded',
   'phosphocitrate': 'ungrounded',
   'protein content': 'ungrounded',
   'phytochelatin': 'ungrounded',
   'photonic cry

In [5]:
# Bind the four models of interest to their own names in one step.
BP_disamb, PS_disamb, PA_disamb, MB_disamb = (
    disambiguators[key] for key in ('BP', 'PS', 'PA', 'MB')
)

In [6]:
# Show the BP groundings as loaded, before any modification is applied.
BP_disamb.grounding_dict

{'BP': {'blood pressure': 'MESH:D001794',
  'benzo a pyrene': 'CHEBI:29865',
  'bullous pemphigoid': 'ungrounded',
  'bisphosphonate': 'MESH:D004164',
  'binding potential': 'ungrounded',
  'bipolar disorder': 'ungrounded',
  'n butylidenephthalide': 'ungrounded',
  'black phosphorus': 'ungrounded',
  'brevipedicellus': 'ungrounded',
  'protein': 'ungrounded',
  'bacterial production': 'ungrounded',
  'benzophenone': 'ungrounded',
  'rcas': 'ungrounded',
  'bipolar': 'ungrounded',
  'biological process': 'ungrounded',
  'point': 'ungrounded',
  'butylparaben': 'ungrounded',
  'benzoyl peroxide': 'ungrounded',
  'brachial plexus': 'ungrounded'}}

In [7]:
# Rewrite the identifier 'CHEBI:29865' to 'CHEBI:CHEBI:29865' in the BP model.
# The doubled prefix matches the form other models already use
# (e.g. 'CHEBI:CHEBI:64482' in the PC groundings displayed earlier).
BP_disamb.modify_groundings(new_groundings={'CHEBI:29865': 'CHEBI:CHEBI:29865'})

In [8]:
# Re-display the BP groundings after the modification to check that
# 'benzo a pyrene' now carries the rewritten identifier.
BP_disamb.grounding_dict

{'BP': {'blood pressure': 'MESH:D001794',
  'benzo a pyrene': 'CHEBI:CHEBI:29865',
  'bullous pemphigoid': 'ungrounded',
  'bisphosphonate': 'MESH:D004164',
  'binding potential': 'ungrounded',
  'bipolar disorder': 'ungrounded',
  'n butylidenephthalide': 'ungrounded',
  'black phosphorus': 'ungrounded',
  'brevipedicellus': 'ungrounded',
  'protein': 'ungrounded',
  'bacterial production': 'ungrounded',
  'benzophenone': 'ungrounded',
  'rcas': 'ungrounded',
  'bipolar': 'ungrounded',
  'biological process': 'ungrounded',
  'point': 'ungrounded',
  'butylparaben': 'ungrounded',
  'benzoyl peroxide': 'ungrounded',
  'brachial plexus': 'ungrounded'}}

In [9]:
# Show the model's identifier -> name table to check that it is keyed by the
# rewritten identifier as well.
BP_disamb.names

{'CHEBI:CHEBI:29865': 'benzo[a]pyrene',
 'MESH:D001794': 'Blood Pressure',
 'MESH:D004164': 'Diphosphonates'}

In [13]:
# Smoke test: run the model on a short benzo[a]pyrene-flavoured string and
# inspect the returned grounding, name and per-grounding values.
# NOTE(review): this cell carries execution count 13, i.e. it was last run
# after the cells numbered 10-12 that appear below it. On a top-to-bottom run
# it executes against the locally modified model, before the reload.
BP_disamb.disambiguate('benzo benzo pyrene chemical wow')

('CHEBI:CHEBI:29865',
 'benzo[a]pyrene',
 {'CHEBI:CHEBI:29865': 0.9875054329190245,
  'MESH:D001794': 0.008616123995984281,
  'MESH:D004164': 0.0025408888748896835,
  'ungrounded': 0.001337554210101759})

In [10]:
# Hand the modified BP model to adeft_indra's `model_to_s3`.
# NOTE(review): presumably this overwrites the published model in the S3
# bucket that `adeft.download` reads from - an external, non-reversible side
# effect; confirm before re-running this cell.
model_to_s3(BP_disamb)

In [11]:
!python -m adeft.download --update

100% [......................................................] 1181008 / 1181008

In [12]:
# Replace the in-memory BP disambiguator with a freshly loaded one.
# NOTE(review): presumably meant to pick up the model files refreshed by the
# download step above - confirm that load_disambiguator reads the updated copy.
BP_disamb = load_disambiguator('BP')

In [30]:
# Take the phrase -> identifier mapping for the 'MB' shortform out of the
# MB model's grounding dictionary.
grounding_map = MB_disamb.grounding_dict['MB']

In [31]:
# List the identifiers in the MB mapping that start with 'CHEBI'. Only the
# values matter here, so iterate over them directly.
[grounding for grounding in grounding_map.values() if grounding.startswith('CHEBI')]

['CHEBI:6872']

In [32]:
# Build the old -> new identifier mapping from the model's own groundings
# instead of transcribing it by hand. Every identifier with a single 'CHEBI:'
# prefix is mapped to the doubled 'CHEBI:CHEBI:' form. Identifiers that
# already start with 'CHEBI:CHEBI:' are skipped, so the mapping comes out
# empty once the groundings have been corrected.
new_groundings = {
    grounding: 'CHEBI:' + grounding
    for grounding in grounding_map.values()
    if grounding.startswith('CHEBI:')
    and not grounding.startswith('CHEBI:CHEBI:')
}

In [33]:
# Apply the identifier rewrite held in `new_groundings` to the MB model.
MB_disamb.modify_groundings(new_groundings=new_groundings)

In [34]:
# Display the MB groundings after the modification to check that
# 'methylene blue' now carries the rewritten identifier.
MB_disamb.grounding_dict

{'MB': {'methylene blue': 'CHEBI:CHEBI:6872',
  'medulloblastoma': 'ungrounded',
  'mushroom body': 'ungrounded',
  'microbubbles': 'ungrounded',
  'molecular beacon': 'ungrounded',
  'sio 2': 'ungrounded',
  'myocardial bridge': 'ungrounded',
  'maneb': 'ungrounded',
  'multibacillary': 'ungrounded',
  'mitochondrial biogenesis': 'ungrounded',
  'myoblasts': 'ungrounded',
  'multiband': 'ungrounded',
  'b': 'ungrounded',
  'hfc diet or the hfc diet supplemented with monobutyrin at 1 g kg diet 0 · 1 mb mb at 5 g kg diet': 'ungrounded',
  'major bleeding': 'ungrounded',
  'mibolerone': 'ungrounded',
  'maternal behavior': 'ungrounded',
  'midbrain': 'ungrounded',
  'band': 'ungrounded',
  'myoglobin': 'HGNC:6915',
  'midbody': 'ungrounded'}}

In [35]:
# Hand the modified MB model to adeft_indra's `model_to_s3`.
# NOTE(review): presumably this overwrites the published model in the S3
# bucket that `adeft.download` reads from - an external, non-reversible side
# effect; confirm before re-running this cell.
model_to_s3(MB_disamb)

In [36]:
!python -m adeft.download --update

100% [......................................................] 1181008 / 1181008