In [None]:
!pip install orkg==0.18.0

In [None]:
import os
import pandas as pd
from orkg import ORKG, OID

Create a connection to ORKG (incubating)

In [None]:
# Client handle for the ORKG incubating instance; the cells below reuse `orkg`.
orkg = ORKG(
    host="https://incubating.orkg.org",
)

Read the data of the comparison https://incubating.orkg.org/comparison/R44930

In [None]:
# Fetch comparison R44930 through the client's compare_dataframe helper.
df1 = orkg.contributions.compare_dataframe(
    comparison_id="R44930",
)

In [None]:
# Preview the first 11 entries of the comparison.
# NOTE(review): assumes df1 is a pandas DataFrame — confirm against the ORKG client.
df1.head(n=11)

Now complete the following tasks

In [None]:
# Compute the mean of 'Has value'

# Plot the 'Has value'

Next, read the data of the comparison https://incubating.orkg.org/comparison/R41466 as data frame `df2` and compute the mean value. Then read the microbe-scope CSV data and create a scatter plot of basic reproduction number and case fatality rate for all infectious diseases included in the microbe-scope, together with the mean values for COVID-19 computed here.

Let's create some new scientific knowledge using the template https://incubating.orkg.org/template/R40006, which supports describing basic reproduction number estimates. We first load the template specification into the environment.

In [None]:
# Short alias for the templates client, then materialize template R40006
# through it so that later cells can reach the template via `tp`.
tp = orkg.templates
tp.materialize_template("R40006")

In [None]:
# Ensure the output directory for the serialized contribution exists.
# exist_ok=True makes the cell idempotent on re-run and avoids the
# check-then-create race of a separate os.path.exists() test.
os.makedirs("data", exist_ok=True)

We now have a Python-native API that we can use to obtain documentation and create new data programmatically.

In [None]:
# Show the docstring attached to the materialized template entry point.
estimate_doc = tp.basic_reproduction_number_estimate.__doc__
print(estimate_doc)

In [None]:
# Build the nested template instances one at a time (same order in which the
# original nested call evaluated them), then assemble and serialize the estimate.

# Period covered by the estimate.
observation_period = tp.time_interval(
    has_beginning="2020-01-03",
    has_end="2020-03-01",
)

# Place the estimate refers to, linked to an external entity URI.
study_location = tp.location(
    label="Kuopio",
    same_as="http://www.wikidata.org/entity/Q162279",
)

# 95% confidence bounds attached to the estimated value.
confidence_bounds = tp.confidence_interval_95(
    lower_confidence_limit="2.5",
    upper_confidence_limit="3.7",
)

# The estimated value together with its confidence interval.
r0_value = tp.basic_reproduction_number_estimate_value_specification(
    has_value="3.1",
    confidence_interval_95=confidence_bounds,
)

# Top-level contribution tying the pieces together.
estimate = tp.basic_reproduction_number_estimate(
    label="COVID-19 basic reproduction number estimation",
    time_period=observation_period,
    location=study_location,
    basic_reproduction_number=r0_value,
)

# Write the contribution as JSON-LD into the directory harvested later on.
estimate.serialize_to_file("data/article.contribution.json", format="json-ld")

Finally, we harvest the new data in ORKG

In [None]:
# Bibliographic metadata of the paper the harvested contribution belongs to.
# NOTE(review): the DOI is passed as a full https://doi.org/ URL — confirm the
# harvester accepts this form rather than a bare DOI.
paper_metadata = {
    "research_field": "Epidemiology",
    "title": "Estimating COVID-19 basic reproduction number",
    "authors": ["Jane Doe", "John Doe"],
    "publication_year": "2023",
    "published_in": "Epidemiology",
    "doi": "https://doi.org/10.1000/xyz.12345",
}

# Harvest everything found in the "data" directory; the response is kept in `r`
# because the next cell reads the created paper id from it.
r = orkg.harvesters.directory_harvest(directory="data", **paper_metadata)

In [None]:
# Pull the id out of the harvest response and print a link to the paper page.
harvested_paper_id = r.content["id"]
print("Check the harvested data in ORKG at: https://incubating.orkg.org/paper/{}".format(harvested_paper_id))