In [1]:
import pickle
import pandas as pd
import yaml as yaml
#from rdkit import Chem
from tqdm.notebook import tqdm
from openff.evaluator import unit
from openff.evaluator.datasets import PropertyPhase, PhysicalProperty
from openff.evaluator.datasets.thermoml import ThermoMLDataSet
from openff.evaluator.datasets.thermoml import thermoml_property, register_thermoml_property

# Read a ThermoML file and display it as a pandas DataFrame
The ThermoML file includes the simulated bulk diffusion and density.

In [2]:
@thermoml_property("Self diffusion coefficient, m2/s", supported_phases=PropertyPhase.Liquid)
class Diffusion(PhysicalProperty):
    """Physical property describing a self-diffusion coefficient.

    The class is decorated with ``thermoml_property`` for the ThermoML
    property string "Self diffusion coefficient, m2/s" and the liquid phase.
    """

    @classmethod
    def default_unit(cls):
        """Return the default unit of this property (square metre per second)."""
        square_meter = unit.meter**2
        return square_meter / unit.second

In [3]:
# Build a data set object from the ThermoML XML file.
dataset = ThermoMLDataSet.from_file("test_file.xml")
# Last expression of the cell, so the notebook renders the resulting table.
dataset.to_pandas()

Unnamed: 0,Id,Temperature (K),Pressure (kPa),Phase,N Components,Component 1,Role 1,Mole Fraction 1,Exact Amount 1,Diffusion Value (m ** 2 / s),Diffusion Uncertainty (m ** 2 / s),Source
0,3f0e52cc84d34344988173bd6cbf566b,293.15,101.0,Liquid,1,O,Solvent,1.0,,1.7e-09,0.175,10.1021/je700717w
1,0d21aa4ddbbd4135bf8cb52514ea1e44,298.15,101.0,Liquid,1,O,Solvent,1.0,,2.05e-09,0.21,10.1021/je700717w
2,217e73c58b74458ab51063481d12abcc,303.15,101.0,Liquid,1,O,Solvent,1.0,,2.3e-09,0.235,10.1021/je700717w
3,02579f2430fe4097a67840c0629bb5d5,313.15,101.0,Liquid,1,O,Solvent,1.0,,2.99e-09,0.305,10.1021/je700717w
4,f4781a2ee4e342dcaf3852b0ec381a24,323.15,101.0,Liquid,1,O,Solvent,1.0,,4.02e-09,0.405,10.1021/je700717w
5,9913b3d9583f4af1aa1503ab7f827bba,333.15,101.0,Liquid,1,O,Solvent,1.0,,4.9e-09,0.495,10.1021/je700717w
6,b7f3709b03b1426c9af0f194d220f370,343.15,101.0,Liquid,1,O,Solvent,1.0,,5.79e-09,0.585,10.1021/je700717w
7,274149744a034eca9de2a8ff0f802108,353.15,101.0,Liquid,1,O,Solvent,1.0,,7.09e-09,0.715,10.1021/je700717w
8,229487a95d89428295fd99321e743571,363.15,101.0,Liquid,1,O,Solvent,1.0,,8.23e-09,0.825,10.1021/je700717w
9,86a85e7fae1e4926b78b7cb453a275c9,368.15,101.0,Liquid,1,O,Solvent,1.0,,8.87e-09,0.89,10.1021/je700717w


# Read the YAML files with the experimental data
The following cells read the YAML files with the experimental data and display the data as pandas DataFrames.

In [4]:
# Load the experimental reference data from the two YAML files.
# The encoding is passed explicitly: without it, open() decodes with the
# platform's locale encoding, which can garble non-ASCII text (for example in
# the reference strings) on systems whose default is not UTF-8.
# safe_load is used so that only plain Python objects are built from the files.
with open("exp_data_density.yml", "r", encoding="utf-8") as file:
    data_exp_dens = yaml.safe_load(file)

with open("exp_data_diffusion.yml", "r", encoding="utf-8") as file:
    data_exp_diff = yaml.safe_load(file)

In [5]:
# Print a caption, then render the data loaded from exp_data_density.yml as a table.
# NOTE(review): the caption says "density", but the recorded output of this
# cell lists diffusion columns — confirm the contents of exp_data_density.yml.
print("Experimental mean density")
display(pd.DataFrame(data_exp_dens))

Experimental mean density


Unnamed: 0,Comment,Diffusion (10^-9 m^2s^-1),Molecule,Number of Data,References,Standard deviation (10^-9 m^2s^-1),Temperature (K)
0,Experimental Data,1.9325,methanol,4.0,"[Partington, J. R.; Hudson, R. F.; Bagnall, Na...",0.075622,288
1,Interpolated,2.176,methanol,5.0,"[Siddharth Agrawal, Mahmoud Elmehlawy, and Mic...",0.075987,295
2,Experimental Data,2.290154,methanol,13.0,"Dortmund Data Bank. www.ddbst.com, 2018",0.09548,298
3,Experimental Data,0.8095,ethanol,4.0,"[Partington, J. R.; Hudson, R. F.; Bagnall, K....",0.037957,288
4,Experimental Data,0.997,ethanol,1.0,"[P.S. Tofts, D. Lloyd, C.A. Clark, G.J. Barker...",0.0,293
5,Interpolated,0.967371,ethanol,7.0,"[Siddharth Agrawal, Mahmoud Elmehlawy, and Mic...",0.039235,295
6,Experimental Data,1.052143,ethanol,7.0,"[Robert L. Hurle, Allan J. Easteal and Law...",0.05277,298
7,Experimental Data,0.504,1-propanol,1.0,"[Partington, J. R.; Hudson, R. F.; Bagnall, Na...",0.0,288
8,Experimental Data,0.536,1-propanol,1.0,"[P.S. Tofts, D. Lloyd, C.A. Clark, G.J. Barker...",0.0,293
9,Interpolated,0.5737,1-propanol,2.0,"[Siddharth Agrawal, Mahmoud Elmehlawy, and Mic...",0.0013,295


In [6]:
# Print a caption, then render the data loaded from exp_data_diffusion.yml as a table.
print("Experimental diffusion")
display(pd.DataFrame(data_exp_diff))

Experimental diffusion


Unnamed: 0,Molecule,Temperature (K),Diffusion (10^-9 m^2s^-1),Standard deviation (10^-9 m^2s^-1),Number of Data,Comment,References
0,methanol,288,1.9325,0.075622,4.0,Experimental Data,"[Partington, J. R.; Hudson, R. F.; Bagnall, Na..."
1,methanol,295,2.176,0.075987,5.0,Interpolated,"[Siddharth Agrawal, Mahmoud Elmehlawy, and Mic..."
2,methanol,298,2.290154,0.09548,13.0,Experimental Data,"Dortmund Data Bank. www.ddbst.com, 2018"
3,ethanol,288,0.8095,0.037957,4.0,Experimental Data,"[Partington, J. R.; Hudson, R. F.; Bagnall, K...."
4,ethanol,293,0.997,0.0,1.0,Experimental Data,"[P.S. Tofts, D. Lloyd, C.A. Clark, G.J. Barker..."
5,ethanol,295,0.967371,0.039235,7.0,Interpolated,"[Siddharth Agrawal, Mahmoud Elmehlawy, and Mic..."
6,ethanol,298,1.052143,0.05277,7.0,Experimental Data,"[Robert L. Hurle, Allan J. Easteal and Law..."
7,1-propanol,288,0.504,0.0,1.0,Experimental Data,"[Partington, J. R.; Hudson, R. F.; Bagnall, Na..."
8,1-propanol,293,0.536,0.0,1.0,Experimental Data,"[P.S. Tofts, D. Lloyd, C.A. Clark, G.J. Barker..."
9,1-propanol,295,0.5737,0.0013,2.0,Interpolated,"[Siddharth Agrawal, Mahmoud Elmehlawy, and Mic..."
