In [1]:
import sys
import re
import pandas as pd
sys.path.append("../automaterialsdata/")

from chemdataextractor_parsers import NumericalProperty, OPVPropertyParser
from chemdataextractor_parsers import OPVMaterials, OPVMaterialsParser
from chemdataextractor_parsers import sentence_preprocessing

from chemdataextractor import Document
from chemdataextractor.model import Compound,ListType, ModelType
from chemdataextractor.doc import Paragraph, Sentence

# Expose the OPV record types as list-valued fields on Compound; extracted
# records are serialized under the 'opv_materials' / 'opv_property' keys.
Compound.opv_materials = ListType(ModelType(OPVMaterials))
Compound.opv_property = ListType(ModelType(NumericalProperty))

# Register the OPV parsers on both Sentence and Paragraph.
# The isinstance guard keeps this cell idempotent: re-running it in a live
# kernel would otherwise append another copy of each parser to the class-level
# `parsers` lists (presumably yielding duplicated records -- TODO confirm).
# On a fresh kernel the append order is the same as before:
# materials -> Sentence, materials -> Paragraph, property -> Sentence,
# property -> Paragraph.
for _parser_cls in (OPVMaterialsParser, OPVPropertyParser):
    for _element_cls in (Sentence, Paragraph):
        if not any(isinstance(_p, _parser_cls) for _p in _element_cls.parsers):
            _element_cls.parsers.append(_parser_cls())

In [2]:
# Raw sentences (including PDF-extraction artefacts such as ligatures, fused
# words and garbled symbols) used to exercise the OPV parsers.
# One string per entry: every line must end with a comma, otherwise Python
# silently concatenates adjacent literals into a single example.
Test_examples = [
    "FIG. 3. Color online The I-V curves of the optimized pBTTT:PC71BM cell in the dark and under calibrated 1 sun illumination PCE=2.34%, Jsc=9.37 mA/cm2, Voc=0.525 V, FF=0.48.",
    " This cell had a Jsc of 9.37 mA/cm2, a Voc of 0.525 V, and a FF of 0.48 for an overall PCE of 2.3%",
    "The most efficient devices, obtained using 1,8diiodooctane, had an average power-conversion efficiency of 5.1% under 100 mW/cm2, with short-circuit current Jsc ) 15.7 mA/cm2, fill factor FF ) 0.53, and open-circuit voltage Voc ) 0.61 V, i.e., an∼10% higher efficiency than that obtained with the use of 1,8-octanedithiol",
    "J–V curves, a signiﬁcant increase in Voc is clearly observed from PBDTTT–E to PBDTTT–CF. A Voc as high as 0.76 V was observed indevicesbasedonPBDTTT–CF",
    ".CombinedwithitshighJsc andﬁll factor (FF), a high PCE of 7.38+0.4% (a 5% device variation), measured in more than 75 devices, was achieved in the PBDTTT– CF system, the highest measured PCE being 7.73%.",
    "In the recent work26, higher values of Voc are observed when ﬂuorine, an atom of high electron afﬁnity, is introduced to the thieno[3,4-b]thiophene unit, a PCE of 6.1% having been demonstrated26",
    " Figure 2a shows the typical I-V curve under illumination of AM 1.5G (100 mW/ cm2) of the devices with Voc 0.68V, Jsc 12.7 mA/cm2, and FF 55%. ",
    "The average power conversion efﬁciency (PCE) of 100 devices reached 4.7 %, and for the best device, a PCE of 5.1% was observed.",
    "showed the thickness dependence of photovoltaic performance (Supplementary Figs 3 and 4 and Supplementary Tables 3 and 4). Notably, the PCE reached 10.1% (JSC =19.4 mAcm–2, VOC =0.708 V, FF=73.4%), with an average of 9.77%, for the inverted PC71BM cell with an active layer thickness of ∼290 nm, which is one of the highest PCEs observed in a single-junction cell",
    "It is interesting to note that PCEs close to 10% were also observed for the inverted PC61BM cell with a thickness of 280 nm (PCE=9.80% (average 9.55%), JSC =18.2 mA cm–2, VOC =0.729 V, FF=73.9%)",
    "The enhanced performance of DBFI-EDOT devices is largely a result of the enhanced Voc  (0.93 V) compared to the PC 71B M cells (0.67 V).",
    "the best performance seen in nonfullerene polymer solar cells to date. For comparison the reference optimized PC 71B M:PSEHTT photodiodes, gave the best PCE of 5.62% with an average PCE of 5.52% ± 0.09%",
    " Therefore, to the best of our knowledge, in demonstrating high PCEs of B9% with a high VOC of B1V, smallEloss and a small energy offset at the same time, PNOz4T is regarded as quite a unique narrow bandgap polymer.",
    "A PCE of about 7.4% has been achieved from... ",
    "The fill factor, at the same time, increases to 69%",
    "...Voc has increased to 0.75 V as expected...",
    "When illuminated with simulated solar light (AM1.5 Global, light intensity about 100 W m22), the PCz : PDI (1 : 4) cell displayed an Isc of 0.26 mA cm22,aVoc of 0.71 V, an FF of 0.37, and an efficiency of 0.63%, which to the best of our knowledge is the highest efficiency yet reported for a polymerbased solar cell not incorporating PCBM.",
    "The PCDTBT/PC70BM solar cells reproducibly yield JSC¼10.6 mA cm22, VOC¼0.88 V, FF¼0.66 and h e¼6.1%.",
    "FF values of 59.23 and 50.52",
    # Fix: the comma after the next entry was missing, which merged it with the one below.
    "When illuminated with simulated solar light (AM1.5 Global, light intensity about 100 W m22), the PCz : PDI (1 : 4) cell displayed an Isc of 0.26 mA cm22,a Voc of 0.71 V, an FF of 0.37, and an efficiency of 0.63%, which to the best of our knowledge is the highest efficiency yet reported for a polymerbased solar cell not incorporating PCBM. ",
    "The optimized cells had PDPP3T:[70]PCBM in a 1:2 weight ratio and provided Voc ) 0.65 V, Jsc ) 11.8 mA/cm2, and FF ) 0.60, resulting in an η value of 4.7%",
    "The devices prepared using chlorobenzene as solvent show higher performance with g = 2.5%, Jsc = 6.8 mA/cm2, Voc = 0.79 Volt, and FF = 47%. The devices prepared by using ODCB as solvent demonstrate the best performance with η = 3.2%,",
    "Figure 4 shows the J-V curves of an optimized device measured under AM 1.5G irradiation 100 mA/cm2 and dark conditions; its efﬁciency parameters are as follow: Voc=0.77 V, Jsc=9.10 mA/cm2, FF =0.55, and PCE=3.80%.",
    "The highest PCE of PSCs based on the PDTP-DTDPP(Bu):PC70BM system reached 2.71%, which was lower than the4-5%oftheP3HT:PCBMdevices.Thiscouldbemainly attributed to the lower VOC (∼0.4 V).",
    "The device exhibits a Voc of 0.56 V and a ﬁll factor of 63.3%, which yields an impressive PCE of 5.30%",
    "The champion result reached 6.58%, with a Voc of 0.70 V, a Jsc of 14.7 mA/cm2, and an FF of 0.64, which is the highest value so far for polymer solar cells.",
    "blend ratio of 1:3 exhibited a high short-circuit current of 10.87 mA/cm2 and a power conversion efficiency of 2.27%",
]

In [3]:
# Run every example through the registered parsers and dump what was extracted.
for sentence in Test_examples:
    # Wrap the raw string in a CDE Sentence and pass it through the project's
    # sentence_preprocessing helper; the result exposes .text and .records.
    s = sentence_preprocessing(Sentence(sentence))
    # Text as seen after preprocessing, so it can be compared with the raw input.
    print(s.text)
    # Serialized records, followed by two blank lines to separate the examples.
    print(s.records.serialize(), end='\n\n\n')

FIG. 3. Color online The I-V curves of the optimized pBTTT:PC71BM cell in the dark and under calibrated 1 sun illumination PCE=2.34%, Jsc=9.37 mA/cm2, Voc=0.525 V, FF=0.48.
[{'opv_materials': [{'name': 'pBTTT:PC71BM'}]}, {'opv_property': [{'name': 'PCE', 'value': '2.34', 'unit': '%'}]}, {'opv_property': [{'name': 'Jsc', 'value': '9.37', 'unit': 'mA/cm2'}]}, {'opv_property': [{'name': 'Voc', 'value': '0.525', 'unit': 'V'}]}, {'opv_property': [{'name': 'FF', 'value': '0.48'}]}]


 This cell had a Jsc of 9.37 mA/cm2, a Voc of 0.525 V, and a FF of 0.48 for an overall PCE of 2.3%
[{'opv_property': [{'name': 'Jsc', 'value': '9.37', 'unit': 'mA/cm2'}]}, {'opv_property': [{'name': 'Voc', 'value': '0.525', 'unit': 'V'}]}, {'opv_property': [{'name': 'FF', 'value': '0.48'}]}, {'opv_property': [{'name': 'PCE', 'value': '2.3', 'unit': '%'}]}]


The most efficient devices, obtained using 1,8diiodooctane, had an average power-conversion efficiency of 5.1% under 100 mW/cm2, with short-circuit cur