This notebook demonstrates how to use the code in 'from_Citrine.py' to retrieve data from various datasets collected by Citrine Informatics at http://citrination.com/ and output it in the form of a Pandas dataframe. In this example, we run several queries against the Citrine API to retrieve data contained within its databases.

In [1]:
from matminer.data_retrieval.from_Citrine import CitrineDataRetrieval

In [2]:
# Citrine API key passed to CitrineDataRetrieval.
# Either replace None with your own key, or leave it as None if the key is
# already available in the 'CITRINE_KEY' environment variable.
# Avoid committing a real key with the notebook.
api_key = None

Create an adapter to the Citrine database

In [3]:
# Build the retrieval object using the key configured in `api_key`;
# every query in this notebook goes through `c`.
c = CitrineDataRetrieval(api_key)

Retrieve data from the Citrine database that is contributed by "AFLOWLIB" for all samples with a chemical formula of "Si"

In [4]:
# Query for contributor 'aflow' and formula 'Si'; the returned value is the cell's output.
# NOTE(review): the saved output of this cell is
# "ValueError: Index contains duplicate entries, cannot reshape" rather than a
# dataframe -- presumably duplicate records break a reshape inside get_dataframe.
# TODO confirm the cause and either narrow the query or fix the retrieval code.
c.get_dataframe(contributor='aflow', formula='Si')

  0%|          | 0/46 [00:00<?, ?it/s]

ValueError: Index contains duplicate entries, cannot reshape

Rows with the same 'sample' number refer to the same sample, but with different measurements/properties. Each of these properties is listed as its own column of the dataframe.

In [5]:
# Query for contributor 'Citrine', term 'NIST' and formula 'al2o3'
# (`term` is presumably a free-text search term -- TODO confirm against the library docs).
# The call is left as the bare last expression so the dataframe is displayed as the cell output.
c.get_dataframe(contributor='Citrine', term='NIST', formula='al2o3')



Unnamed: 0_level_0,data_set_id,license,material.chemicalFormula,material.condition,reference,Log of formation reaction rate constant,Relative standard enthalpy,Specific heat capacity,Standard Gibbs free energy of formation,Standard enthalpy of formation,Standard entropy,adsorped NH3,measurement.condition,measurement.dataType,measurement.reference,property.units
sample,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1
1,20,,Al2O3,"[{u'scalar': [{u'value': u'Alpha'}], u'name': ...",,11.686,350.019,144.474,-671.139,-2244.729,327.841,,"[{u'units': u'K', u'scalar': [{u'value': u'0'}...",Experimental,"[{u'url': u'http://kinetics.nist.gov/janaf', u...","{u'Specific heat capacity': u'J/K$\cdot$mol', ..."
2,20,,Al2O3,[{u'scalar': [{u'value': u'Crystalline and liq...,,3.365,687.839,192.464,-257.664,-2009.609,443.912,,"[{u'units': u'K', u'scalar': [{u'value': u'0'}...",Experimental,"[{u'url': u'http://kinetics.nist.gov/janaf', u...",
3,20,,Al2O3,"[{u'scalar': [{u'value': u'Gamma'}], u'name': ...",,11.822,366.469,151.264,-678.952,-2209.45,342.205,,"[{u'units': u'K', u'scalar': [{u'value': u'298...",Experimental,"[{u'url': u'http://kinetics.nist.gov/janaf', u...",
4,20,,Al2O3,"[{u'scalar': [{u'value': u'Delta'}], u'name': ...",,11.759,360.519,148.808,-675.384,-2225.023,335.824,,"[{u'units': u'K', u'scalar': [{u'value': u'298...",Experimental,"[{u'url': u'http://kinetics.nist.gov/janaf', u...",
5,20,,Al2O3,"[{u'scalar': [{u'value': u'Kappa'}], u'name': ...",,11.773,357.719,147.652,-676.141,-2223.639,336.538,,"[{u'units': u'K', u'scalar': [{u'value': u'298...",Experimental,"[{u'url': u'http://kinetics.nist.gov/janaf', u...",
6,20,,Al2O3,"[{u'scalar': [{u'value': u'Liquid'}], u'name':...",,3.365,632.714,192.464,-257.664,-2009.61,443.912,,"[{u'units': u'K', u'scalar': [{u'value': u'298...",Experimental,"[{u'url': u'http://kinetics.nist.gov/janaf', u...",
7,1823,[NIST_SRD-205],Alumina 1593,,"[{u'URL': u'http://adsorbents.nist.gov', u'edi...",,,,,,,2.16707,"[{u'units': u'K', u'scalar': [{u'value': u'298...",,,
8,1823,[NIST_SRD-205],Alumina 1597,,"[{u'URL': u'http://adsorbents.nist.gov', u'edi...",,,,,,,2.7068,"[{u'units': u'K', u'scalar': [{u'value': u'298...",,,
9,1823,[NIST_SRD-205],Alumina VPO2,,"[{u'URL': u'http://adsorbents.nist.gov', u'edi...",,,,,,,2.60815,"[{u'units': u'K', u'scalar': [{u'value': u'298...",,,
10,1823,[NIST_SRD-205],Alumina 1593,,"[{u'URL': u'http://adsorbents.nist.gov', u'edi...",,,,,,,2.1714,"[{u'units': u'K', u'scalar': [{u'value': u'298...",,,


In [6]:
# Query for contributor 'Gaultois' and formula 'pbte'.
# The call is left as the bare last expression so the dataframe is displayed as the cell output.
c.get_dataframe(contributor='Gaultois', formula='pbte')



Unnamed: 0_level_0,data_set_id,material.chemicalFormula,material.condition,Electrical conductivity,Electrical resistivity,Power factor,Seebeck coefficient,Thermal conductivity,Thermoelectric figure of merit (zT),measurement.condition,measurement.dataType,measurement.reference,property.units
sample,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1
1,1822,Na0.02Pb0.98Te,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",2713.0,0.000368595,0.0010557,62.38,3.99643,0.079250912,"[{u'units': u'K', u'scalar': [{u'value': u'300...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...","{u'Seebeck coefficient': u'$\mu$V/K', u'Electr..."
2,1822,Na0.02Pb0.98Te,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",583.98,0.0017124,0.0026459,212.86,1.39286,1.329723145,"[{u'units': u'K', u'scalar': [{u'value': u'700...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
3,1822,Pb0.98TeNa0.02,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",444.0,0.002252252,0.0024729,236.0,1.44,1.20211,"[{u'units': u'K', u'scalar': [{u'value': u'700...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
4,1822,Pb0.98TeNa0.02,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",2399.0,0.00041684,0.00098263,64.0,4.29,0.0687154,"[{u'units': u'K', u'scalar': [{u'value': u'300...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
5,1822,Tl0.02Pb0.98Te,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",417.72,0.00239394,0.00077455,136.17,2.16832,0.107163649,"[{u'units': u'K', u'scalar': [{u'value': u'300...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
6,1822,Tl0.02Pb0.98Te,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",186.44,0.00536364,0.0020016,327.66,1.0099,1.387416646,"[{u'units': u'K', u'scalar': [{u'value': u'700...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
7,1822,Tl0.01Pb0.99Te,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",364.64,0.00274242,0.00071879,140.4,1.9421,0.111032448,"[{u'units': u'K', u'scalar': [{u'value': u'300...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
8,1822,Tl0.02Pb0.98Te,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",343.75,0.00290909,0.00131,195.21,1.65594,0.316428584,"[{u'units': u'K', u'scalar': [{u'value': u'400...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
9,1822,Na0.02Pb0.98Te,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",1756.2,0.000569421,0.0019362,105.0,2.675,0.289521835,"[{u'units': u'K', u'scalar': [{u'value': u'400...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
10,1822,Pb0.98TeNa0.02,"[{u'scalar': [{u'value': u'Polycrystalline'}],...",1736.0,0.000576037,0.0019139,105.0,3.18,0.240747,"[{u'units': u'K', u'scalar': [{u'value': u'400...",Experimental,"[{u'citation': u'10.1021/cm400893e', u'referen...",
