In [1]:
from indra.sources import trips
from indra.sources import reach
import pandas as pd
from indra.assemblers import PybelAssembler
from pybel.canonicalize import edge_to_bel

INFO: indra/elsevier - No Elsevier institution key found in environment variable ELSEVIER_INST_KEY.
ERROR: indra/reach - Could not import jnius, offline reading cannot be used.


# Data Acquisition

In [2]:
training_url = 'https://wiki.openbel.org/download/attachments/11108491/Training.sentence?version=2&modificationDate=1426865542000&api=v2'

# Tab-separated download; no `names` are given, so the column labels come from the file's first row.
training_df = pd.read_csv(training_url, delimiter='\t')
training_df.head()

Unnamed: 0,Sentence-ID,PMID,Sentence
0,SEN:10000006,7557387,Induction of C/EBP beta DNA-binding activity i...
1,SEN:10000010,7988462,Pulse-chase biosynthetic labeling studies show...
2,SEN:10000018,8856503,We have identified glucocorticoids as physiolo...
3,SEN:10000020,9112333,interleukin 1 receptor antagonist (IL-1ra) is ...
4,SEN:10000022,9291476,"Treatment with RU486, a progesterone receptor ..."


In [3]:
test_url = 'https://wiki.openbel.org/download/attachments/11108491/Test.sentence?version=1&modificationDate=1434282678000&api=v2'

# Column labels are supplied explicitly via `names`, so every row of the file
# (including the first) is read as data.
test_df = pd.read_csv(
    test_url,
    delimiter='\t',
    names=('Sentence-ID', 'PMID', 'Sentence'),
)
test_df.head()

Unnamed: 0,Sentence-ID,PMID,Sentence
0,SEN:10003274,18032669,Alcohol and heat stimulate the translocation o...
1,SEN:10003350,11267935,"TGF-beta increased the expression of PAI-1, ju..."
2,SEN:10003358,10688433,Dexamethasone decreased ICAM-3 and increased L...
3,SEN:10003390,8428935,We conclude that ethanol exposure enhances exp...
4,SEN:10003462,12421982,"Following i.v. infusion of LPS into mice, up-r..."


In [4]:
evaluation_url = 'https://wiki.openbel.org/download/attachments/19169286/BELTask1_2017.testset.sentence?version=1&modificationDate=1500897598000&api=v2'

# Tab-separated download; column labels come from the file's first row.
# NOTE(review): in the recorded output the id column is labelled 'Sentence ID'
# (with a space), whereas the training and test frames use 'Sentence-ID'.
evaluation_df = pd.read_csv(evaluation_url, delimiter='\t')
evaluation_df.head()

Unnamed: 0,Sentence ID,PMID,Sentence
0,SEN:201710001,25377781,Activation of c-Src by JNK2 was accompanied by...
1,SEN:201710002,23656735,"Additionally, siRNA-induced knockdown of p38 k..."
2,SEN:201710003,23656735,"Additionally, the siRNA-induced knockdown of p..."
3,SEN:201710004,23656735,"Additionally, the siRNA knockdown of ATF-2 als..."
4,SEN:201710005,24732359,After 72 h of S100A4-knockdown in HLC-1 and LK...


# Example Conversion to BEL with INDRA

In [5]:
# Take the training row labelled 1, unpack its three fields, and display the sentence text.
sentence_id, pmid, sentence = tuple(training_df.loc[1])
sentence

'Pulse-chase biosynthetic labeling studies showed that AtT-20 cells expressed much less RESP18 than the endogenous prohormone, POMC, but that glucocorticoid treatment lowered POMC and raised RESP18 biosynthetic rates so that they were nearly equimolar.'

## Using TRIPS

The following example runs an extraction on the example sentence with the [TRIPS processor](http://indra.readthedocs.io/en/latest/modules/sources/trips/index.html#indra.sources.trips.trips_api.process_text).

In [6]:
%%time
# Run the TRIPS reader on the example sentence; %%time reports how long the call takes.
trips_result = trips.process_text(sentence)

CPU times: user 22.8 ms, sys: 7.38 ms, total: 30.2 ms
Wall time: 1min 53s


In [7]:
# Number of statements the TRIPS result holds for the example sentence.
len(trips_result.statements)

0

In [8]:
# Wrap the TRIPS statements in a PyBEL assembler carrying the graph's name and version.
trips_assembly = PybelAssembler(trips_result.statements, name='TRIPS Test', version='0.0.1')
# Constructing the assembler does not assemble anything: make_model() is the step that
# converts the statements into BEL edges on `trips_assembly.model`. Without it the
# model stays empty regardless of how many statements were extracted.
# The trailing semicolon keeps the returned graph from being echoed as cell output.
trips_assembly.make_model();

In [9]:
# Print every edge of the assembled TRIPS graph as a BEL statement.
# keys=True / data=True are required: by default a multigraph's edges() yields only
# (u, v) pairs, so unpacking four values would raise ValueError as soon as the
# graph contains an edge.
for u, v, _key, data in trips_assembly.model.edges(keys=True, data=True):
    print(edge_to_bel(trips_assembly.model, u, v, data))

## Using REACH

The following example runs an extraction on the example sentence with the [REACH processor](http://indra.readthedocs.io/en/latest/modules/sources/reach/index.html#indra.sources.reach.reach_api.process_text).

In [10]:
%%time
# Run the REACH reader on the example sentence; %%time reports how long the call takes.
reach_result = reach.process_text(sentence)

CPU times: user 6.07 ms, sys: 2.27 ms, total: 8.34 ms
Wall time: 1.48 s


In [11]:
# Number of statements the REACH result holds for the example sentence.
len(reach_result.statements)

0

In [12]:
# Wrap the REACH statements in a PyBEL assembler carrying the graph's name and version.
reach_assembly = PybelAssembler(reach_result.statements, name='REACH Test', version='0.0.1')
# Constructing the assembler does not assemble anything: make_model() is the step that
# converts the statements into BEL edges on `reach_assembly.model`. Without it the
# model stays empty regardless of how many statements were extracted.
# The trailing semicolon keeps the returned graph from being echoed as cell output.
reach_assembly.make_model();

In [13]:
# Print every edge of the assembled REACH graph as a BEL statement.
# keys=True / data=True are required: by default a multigraph's edges() yields only
# (u, v) pairs, so unpacking four values would raise ValueError as soon as the
# graph contains an edge.
for u, v, _key, data in reach_assembly.model.edges(keys=True, data=True):
    print(edge_to_bel(reach_assembly.model, u, v, data))