Use this notebook to find papers of interest, in order to verify the scope of the search terms. Keyword results are investigated for both the whole corpus and the software-packages subset.
<hr>
Initial setup

In [2]:
# Enable IPython's autoreload extension in mode 2, so imported modules are
# re-imported before each cell runs and local edits are picked up without a kernel restart.
%reload_ext autoreload
%autoreload 2

In [3]:
import wosis
import pandas as pd
import metaknowledge as mk

# Helper functions for plotting
import wosis.analysis.plotting as wos_plot

# Analysis and search functions
from wosis.analysis import (preview_matches, search_records, keyword_matches, 
                            find_pubs_by_authors, preview_matches_by_keyword, get_unique_kw_titles,
                            remove_by_journals, remove_by_title)

# Plotting libraries
import matplotlib.pyplot as plt
import seaborn as sns

# Global seaborn styling for every figure drawn after this cell:
# 'darkgrid' axes style, 'paper' context with font elements scaled by 2.0.
sns.set_style('darkgrid')
sns.set_context('paper', font_scale=2.0)



In [4]:
# Build a metaknowledge RecordCollection from the corpus file (path is relative
# to the notebook's working directory), then convert it to a DataFrame so that
# individual records can be looked up by column value (e.g. DOI) below.
RC = mk.RecordCollection("tmp/rest_requested_corpora.txt")
corpora_df = wosis.rc_to_df(RC)

In [5]:
# Load settings from config.yml (relative path).
# NOTE(review): wos_config is not referenced by any cell visible in this notebook — confirm it is still needed.
wos_config = wosis.load_config('config.yml')

In [43]:
# Select records from the full corpus that match software-related terms.
# NOTE(review): threshold=95.0 is presumably a match-score cutoff — confirm against the wosis documentation.
software_packages = wosis.keyword_matches(RC, ['software', 'toolkit', 'toolbox'], threshold=95.0)

In [44]:
# Collapse the keyword matches into one record collection (combine_recs presumably
# merges the per-keyword result sets — TODO confirm), then tabulate it so the
# software subset can be queried by DOI alongside corpora_df.
software_rc = software_packages.combine_recs()
software_df = wosis.rc_to_df(software_rc)

<hr>
Finding papers of interest by DOI

In [12]:
# DAKOTA: is the record with this DOI present in the full corpus?
corpora_df[corpora_df['DOI'].eq('10.2172/991842')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI


In [5]:
# PSUADE: is the record with this DOI present in the full corpus?
corpora_df[corpora_df['DOI'].eq('10.1016/j.envsoft.2013.09.031')]

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
3322,WOS:000329561100024,2014,A comprehensive evaluation of various sensitiv...,RAINFALL-RUNOFF MODELS|IMPROVED CALIBRATION|CO...,sensitivity analysis sa is a commonly used app...,"Gan, Yanjun|Duan, Qingyun|Gong, Wei|Tong, Char...",ENVIRONMENTAL MODELLING & SOFTWARE,uncertainty quantification|sensitivity analysi...,10.1016/j.envsoft.2013.09.031


In [41]:
# PSUADE DOI, checked against the software/toolkit/toolbox keyword subset.
software_df[software_df['DOI'].eq('10.1016/j.envsoft.2013.09.031')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
27,WOS:000329561100024,2014,A comprehensive evaluation of various sensitiv...,RAINFALL-RUNOFF MODELS IMPROVED CALIBRATION CO...,Sensitivity analysis (SA) is a commonly used a...,Elsevier Ltd. All rights reserved.,"Gan, YJ|Duan, QY|Gong, W|Tong, C|Sun, YW|Chu, ...",ENVIRONMENTAL MODELLING & SOFTWARE,uncertainty quantification sensitivity analysi...,10.1016/j.envsoft.2013.09.031


In [6]:
# SALib: look up by DOI in the full corpus (the paper may be too recent to be included?).
corpora_df[corpora_df['DOI'].eq('10.21105/joss.00097')]

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI


In [7]:
# UQLab: is the record with this DOI present in the full corpus?
corpora_df[corpora_df['DOI'].eq('10.1061/9780784413609.257')]

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI


In [8]:
# SAFE: is the record with this DOI present in the full corpus?
corpora_df[corpora_df['DOI'].eq('10.1016/j.envsoft.2015.04.009')]

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
12346,WOS:000356741300007,2015,A Matlab toolbox for Global Sensitivity Analysis,IDENTIFICATION|UNCERTAINTIES|MODELS,global sensitivity analysis gsa is increasingl...,"Pianosi, Francesca|Sarrazin, Fanny|Wagener, Th...",ENVIRONMENTAL MODELLING & SOFTWARE,global sensitivity analysis|matlab|octave|open...,10.1016/j.envsoft.2015.04.009


In [45]:
# SAFE DOI, checked against the software/toolkit/toolbox keyword subset.
software_df[software_df['DOI'].eq('10.1016/j.envsoft.2015.04.009')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
83,WOS:000356741300007,2015,A Matlab toolbox for Global Sensitivity Analysis,IDENTIFICATION UNCERTAINTIES MODELS,Global Sensitivity Analysis (GSA) is increasin...,Published by Elsevier Ltd.,"Pianosi, F|Sarrazin, F|Wagener, T",ENVIRONMENTAL MODELLING & SOFTWARE,global sensitivity analysis matlab octave open...,10.1016/j.envsoft.2015.04.009


In [9]:
# VARS-TOOL: the tool paper itself is too recent, so look up a preceding (2016)
# paper instead — DOI ending in 17559, full corpus.
corpora_df[corpora_df['DOI'].eq('10.1002/2015WR017559')]

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
189,WOS:000373117800026,2016,"A new framework for comprehensive, robust, and...",MODELS,based on the theoretical framework for sensiti...,"Razavi, Saman|Gupta, Hoshin V.",WATER RESOURCES RESEARCH,,10.1002/2015WR017559


In [24]:
# VARS-TOOL preceding paper (DOI ending in 17559), checked against the software keyword subset.
software_df[software_df['DOI'].eq('10.1002/2015WR017559')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI


In [10]:
# VARS-TOOL: the tool paper itself is too recent, so look up a preceding (2016)
# paper instead — DOI ending in 17558, full corpus.
corpora_df[corpora_df['DOI'].eq('10.1002/2015WR017558')]

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
5206,WOS:000373117800025,2016,"A new framework for comprehensive, robust, and...",MODELS,computer simulation models are continually gro...,"Razavi, Saman|Gupta, Hoshin V.",WATER RESOURCES RESEARCH,,10.1002/2015WR017558


In [25]:
# VARS-TOOL preceding paper (DOI ending in 17558), checked against the software keyword subset.
software_df[software_df['DOI'].eq('10.1002/2015WR017558')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI


In [17]:
# GUI-HDMR: is the record with this DOI present in the full corpus?
corpora_df[corpora_df['DOI'].eq('10.1016/j.envsoft.2008.12.002')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
5937,WOS:000265341800001,2009,GUI-HDMR - A software tool for global sensitiv...,STREET CANYON MODEL ENVIRONMENTAL-MODELS RS-HD...,The high dimensional model representation (HDM...,Elsevier Ltd. All rights reserved.,"Ziehn, T|Tomlin, AS",ENVIRONMENTAL MODELLING & SOFTWARE,global sensitivity analysis high dimensional m...,10.1016/j.envsoft.2008.12.002


In [26]:
# GUI-HDMR DOI, checked against the software/toolkit/toolbox keyword subset.
software_df[software_df['DOI'].eq('10.1016/j.envsoft.2008.12.002')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
55,WOS:000265341800001,2009,GUI-HDMR - A software tool for global sensitiv...,STREET CANYON MODEL ENVIRONMENTAL-MODELS RS-HD...,The high dimensional model representation (HDM...,Elsevier Ltd. All rights reserved.,"Ziehn, T|Tomlin, AS",ENVIRONMENTAL MODELLING & SOFTWARE,global sensitivity analysis high dimensional m...,10.1016/j.envsoft.2008.12.002


In [18]:
# Jefferson et al. active subspaces paper: look up by DOI in the full corpus.
corpora_df[corpora_df['DOI'].eq('10.1016/j.cageo.2015.07.001')]

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
12426,WOS:000361400900014,2015,Active subspaces for sensitivity analysis and ...,COMMON LAND MODEL|SURFACE PARAMETERS|ENERGY FL...,integrated hydrologic models coupled to land s...,"Jefferson, Jennifer L.|Gilbert, James M.|Const...",COMPUTERS & GEOSCIENCES,active subspaces|dimension reduction|energy fl...,10.1016/j.cageo.2015.07.001


In [27]:
# Jefferson et al. active subspaces DOI, checked against the software keyword subset.
software_df[software_df['DOI'].eq('10.1016/j.cageo.2015.07.001')]

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI


<hr>
Finding papers which mention papers/packages of interest in keywords

In [28]:
# SimLab: search the full corpus (RC) for records matching "simlab".
# NOTE(review): threshold=95.0 is presumably a match-score cutoff — confirm against the wosis documentation.
simlab_rc = wosis.search_records(RC, ["simlab"], threshold=95.0)
simlab_df = wosis.rc_to_df(simlab_rc)

# Preview the first few matching records.
simlab_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
0,WOS:000238960100008,2006,Variance-based sensitivity analysis of the pro...,STABILITY MODEL UNSATURATED SOILS UNCERTAINTY ...,Analysis of the sensitivity of predictions of ...,Elsevier Ltd. All rights reserved.,"Hamm, NAS|Hall, JW|Anderson, MG",COMPUTERS & GEOSCIENCES,site investigation slope stability analysis st...,10.1016/j.cageo.2005.10.007
1,WOS:000279410600016,2010,Sensitivity analysis in fuzzy systems: Integra...,REAL-TIME PCR SOLAR-RADIATION MODEL QUANTIFICA...,This work addresses the sensitivity analysis o...,Elsevier Ltd. All rights reserved.,"Foscarini, F|Bellocchi, G|Confalonieri, R|Savi...",ENVIRONMENTAL MODELLING & SOFTWARE,dana-flsa fuzzy logic genetically modified org...,10.1016/j.envsoft.2010.03.024
2,WOS:000408861800155,2017,Improving Thermal Comfort of Low-Income Housin...,TROPICAL HUMID REGION BUILDINGS STANDARDS ADAP...,"In Thailand, the delivery of adequate low-inco...",,"Bhikhoo, N|Hashemi, A|Cruickshank, H",SUSTAINABILITY,thermal comfort low income housing thailand tr...,10.3390/su9081440


In [29]:
# SimLab again, this time restricted to the software keyword subset (software_rc).
# NOTE: this rebinds simlab_rc / simlab_df, so the full-corpus results from the
# preceding search are no longer available under these names.
simlab_rc = wosis.search_records(software_rc, ["simlab"], threshold=95.0)
simlab_df = wosis.rc_to_df(simlab_rc)

# Preview the first few matching records.
simlab_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
0,WOS:000238960100008,2006,Variance-based sensitivity analysis of the pro...,STABILITY MODEL UNSATURATED SOILS UNCERTAINTY ...,Analysis of the sensitivity of predictions of ...,Elsevier Ltd. All rights reserved.,"Hamm, NAS|Hall, JW|Anderson, MG",COMPUTERS & GEOSCIENCES,site investigation slope stability analysis st...,10.1016/j.cageo.2005.10.007
1,WOS:000408861800155,2017,Improving Thermal Comfort of Low-Income Housin...,TROPICAL HUMID REGION BUILDINGS STANDARDS ADAP...,"In Thailand, the delivery of adequate low-inco...",,"Bhikhoo, N|Hashemi, A|Cruickshank, H",SUSTAINABILITY,thermal comfort low income housing thailand tr...,10.3390/su9081440


In [31]:
# DAKOTA: search the full corpus (RC) for records matching "DAKOTA".
# NOTE(review): the previewed hits (e.g. the Devils Lake and US Midwest croplands
# papers) look like place-name matches rather than the DAKOTA toolkit — verify
# before treating these as software mentions.
DAKOTA_rc = wosis.search_records(RC, ["DAKOTA"], threshold=95.0)
DAKOTA_df = wosis.rc_to_df(DAKOTA_rc)

# Preview the first few matching records.
DAKOTA_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
0,WOS:000258519700024,2008,Bayesian dynamic modelling for nonstationary h...,NORTH-ATLANTIC OSCILLATION ATMOSPHERIC CIRCULA...,"Forecasting of hydrologic time series, with th...","Copyright (C) 2008 John Wiley & Sons, Ltd.","Kumar, DN|Maity, R",HYDROLOGICAL PROCESSES,bayesian dynamic models nonstationarity foreca...,10.1002/hyp.6951
1,WOS:000418736000022,2017,A Lagging Model for Describing Drawdown Induce...,SENSITIVITY-ANALYSIS WELLBORE STORAGE LA CHALE...,This study proposes a generalized Darcy's law ...,,"Lin, YC|Yeh, HD",WATER RESOURCES RESEARCH,,10.1002/2017WR021115
2,WOS:000286782400011,2011,Devils lake emergency outlet diversion conflict,DECISION-SUPPORT-SYSTEM FRESH-WATER RESOURCES ...,The Devils Lake Emergency Outlet Diversion con...,Elsevier Ltd. All rights reserved.,"Ma, J|Hipel, KW|De, ML",JOURNAL OF ENVIRONMENTAL MANAGEMENT,graph model for conflict resolution transbound...,10.1016/j.jenvman.2010.08.027
3,WOS:000170209200019,2001,Net primary production of US Midwest croplands...,IRRIGATED WINTER-WHEAT GENETIC-IMPROVEMENT AGR...,"We studied crop harvested yield, as recorded i...",,"Prince, SD|Haskett, J|Steininger, M|Strand, H|...",ECOLOGICAL APPLICATIONS,agricultural statistics crop harvested yield h...,10.1890/1051-0761(2001)011[1194:NPPOUS]2.0.CO;2
4,WOS:000377473400008,2016,Cost comparison of syngas production from natu...,GTL,Underground coal gasification (UCG) is a promi...,,"Pei, P|Korom, SF|Ling, KG|Nasah, J",MITIGATION AND ADAPTATION STRATEGIES FOR GLOBA...,syngas underground coal gasification cost comp...,10.1007/s11027-014-9588-x


In [32]:
# DAKOTA again, restricted to the software keyword subset (software_rc).
# NOTE: this rebinds DAKOTA_rc / DAKOTA_df, replacing the full-corpus results.
DAKOTA_rc = wosis.search_records(software_rc, ["DAKOTA"], threshold=95.0)
DAKOTA_df = wosis.rc_to_df(DAKOTA_rc)

# Preview the first few matching records.
DAKOTA_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
0,WOS:000374807600014,2016,Towards uncertainty quantification and paramet...,EQUIFINALITY,Component-based modeling frameworks make it ea...,Elsevier Ltd. All rights reserved.,"Peckham, SD|Kelbert, A|Hill, MC|Hutton, EWH",COMPUTERS & GEOSCIENCES,model uncertainty modeling frameworks componen...,10.1016/j.cageo.2016.03.005


In [33]:
# Sandia: search the full corpus (RC) for records matching "sandia".
sandia_rc = wosis.search_records(RC, ["sandia"], threshold=95.0)
sandia_df = wosis.rc_to_df(sandia_rc)

# Preview the first few matching records.
sandia_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
0,WOS:000256856000013,2008,Formulation of the static frame problem,,This report describes a static framework valid...,(C) 2007 Elsevier B.V. All rights reserved.,"Babuska, I|Nobile, F|Tempone, R",COMPUTER METHODS IN APPLIED MECHANICS AND ENGI...,model validation uncertainty quantification fa...,10.1016/j.cma.2007.12.010
1,WOS:000243852300003,2007,Control of downward migration of dense nonaque...,ENHANCED AQUIFER REMEDIATION HETEROGENEOUS AQU...,[] Sand tank experiments have been used to stu...,,"Jin, MQ|Hirasaki, GJ|Jackson, RE|Kostarelos, K...",WATER RESOURCES RESEARCH,,10.1029/2006WR004858
2,WOS:000301715700008,2012,A reduced mechanism for biodiesel surrogates w...,CHEMICAL KINETIC MECHANISMS PRINCIPAL COMPONEN...,Biodiesel is a promising alternative fuel for ...,,"Luo, ZY|Plomer, M|Lu, TF|Som, S|Longman, DE",COMBUSTION THEORY AND MODELLING,mechanism reduction biodiesel auto-ignition lo...,10.1080/13647830.2011.631034
3,WOS:000343415200006,2013,UNCERTAINTY IN THE DEVELOPMENT AND USE OF EQUA...,,In this paper we present the results from a se...,,"Weirs, VG|Fabian, N|Potter, K|McNamara, L|Otah...",INTERNATIONAL JOURNAL FOR UNCERTAINTY QUANTIFI...,materials uncertainty quantification represent...,10.1615/Int.J.UncertaintyQuantification.201200...
4,WOS:000256856000015,2008,A systematic approach to model validation base...,,This work describes a solution to the validati...,(C) 2007 Elsevier B.V. All rights reserved.,"Babuska, I|Nobile, F|Tempone, R",COMPUTER METHODS IN APPLIED MECHANICS AND ENGI...,model validation uncertainty quantification ba...,10.1016/j.cma.2007.08.031


In [34]:
# Sandia again, restricted to the software keyword subset (software_rc).
# NOTE: this rebinds sandia_rc / sandia_df, replacing the full-corpus results.
sandia_rc = wosis.search_records(software_rc, ["sandia"], threshold=95.0)
sandia_df = wosis.rc_to_df(sandia_rc)

# Preview the first few matching records.
sandia_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
0,WOS:000343415200006,2013,UNCERTAINTY IN THE DEVELOPMENT AND USE OF EQUA...,,In this paper we present the results from a se...,,"Weirs, VG|Fabian, N|Potter, K|McNamara, L|Otah...",INTERNATIONAL JOURNAL FOR UNCERTAINTY QUANTIFI...,materials uncertainty quantification represent...,10.1615/Int.J.UncertaintyQuantification.201200...


In [35]:
# UQLab: search the full corpus (RC) for records matching "uqlab".
uqlab_rc = wosis.search_records(RC, ["uqlab"], threshold=95.0)
uqlab_df = wosis.rc_to_df(uqlab_rc)

# Preview the first few matching records (an empty table means no hits).
uqlab_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI


In [36]:
# SALib: search the full corpus (RC) for records matching "salib".
salib_rc = wosis.search_records(RC, ["salib"], threshold=95.0)
salib_df = wosis.rc_to_df(salib_rc)

# Preview the first few matching records (an empty table means no hits).
salib_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI


In [37]:
# MADS: search the full corpus (RC) using the terms "mads" and "julia".
# NOTE(review): both terms are short and generic; the preview includes a paper with
# an author named Madsen, so some hits may be incidental — verify each match manually.
mads_rc = wosis.search_records(RC, ["mads", "julia"], threshold=95.0)
mads_df = wosis.rc_to_df(mads_rc)

# Preview the first few matching records.
mads_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
0,WOS:000334856200002,2014,Analytical solutions for anomalous dispersion ...,HIGHLY HETEROGENEOUS FORMATIONS NON-FICKIAN TR...,Groundwater flow and transport often occur in ...,Published by Elsevier Ltd.,"O'Malley, D|Vesselinov, VV",ADVANCES IN WATER RESOURCES,anomalous dispersion stochastic transport anal...,10.1016/j.advwatres.2014.02.006
1,WOS:000404370900030,2017,High performance in power generation by pressu...,NATURAL SALINITY GRADIENTS HOLLOW-FIBER MEMBRA...,Pressure-retarded osmosis (PRO) is a renewable...,,"Sharifan, H|Madsen, HT|Morse, A",DESALINATION AND WATER TREATMENT,urmia lake pressure-retarded osmosis renewable...,10.5004/dwt.2017.20555
2,WOS:000250330700010,2007,Using a Bayesian belief network to predict sui...,NORTHWEST FOREST PLAN WATERING-POINTS CONSERVA...,Wildlife managers are often required to make i...,Elsevier Ltd. All rights reserved.,"Smith, CS|Howes, AL|Price, B|McAlpine, CA",BIOLOGICAL CONSERVATION,expert knowledge uncertainty wildlife manageme...,10.1016/j.biocon.2007.06.025


In [38]:
# MADS again, restricted to the software keyword subset (software_rc).
# NOTE: this rebinds mads_rc / mads_df, replacing the full-corpus results.
mads_rc = wosis.search_records(software_rc, ["mads", "julia"], threshold=95.0)
mads_df = wosis.rc_to_df(mads_rc)

# Preview the first few matching records (an empty table means no hits).
mads_df.head()

Unnamed: 0,id,year,title,keywords,abstract,copyright,AU,SO,DE,DOI
