Initial setup

In [1]:
# Reload the autoreload extension and set mode 2 so that edits to imported
# modules are picked up without restarting the kernel.
%reload_ext autoreload
%autoreload 2

In [2]:
import wosis
import pandas as pd
import metaknowledge as mk

# Helper functions for plotting
import wosis.analysis.plotting as wos_plot

# Analysis and search functions
from wosis.analysis import (preview_matches, search_records, keyword_matches, 
                            find_pubs_by_authors, preview_matches_by_keyword, get_unique_kw_titles,
                            remove_by_journals, remove_by_title)

# Plotting libraries
import matplotlib.pyplot as plt
import seaborn as sns

# Cosmetic plot settings: seaborn 'darkgrid' style with the 'paper' context
# and fonts scaled by 2.0 so labels stay readable.
sns.set_style('darkgrid')
sns.set_context('paper', font_scale=2.0)



In [3]:
# Load the record collection stored at tmp/<query_id>.txt
query_id = "756d39801152fe5f5f4ad3a3df9b6a30"
RC = mk.RecordCollection("tmp/{}.txt".format(query_id))

# Convert the collection to a DataFrame and drop publications without a DOI;
# the dropped rows are kept in `removed_pubs`.
corpora_df, removed_pubs = wosis.constrain.remove_empty_DOIs(wosis.rc_to_df(RC))

# Build a new metaknowledge collection from the ids of the retained records
filtered_corpora = wosis.extract_recs(corpora_df['id'], RC, name='Filtered Corpora')

Removing 1799 records with no DOIs


<hr>
Finding papers of interest by DOI

In [4]:
# DAKOTA: look the reference up by DOI (an empty frame means it is not in the corpus)
corpora_df[corpora_df['DOI'] == '10.2172/991842']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI


In [5]:
# PSUADE: look the reference up by DOI
corpora_df[corpora_df['DOI'] == '10.1016/j.envsoft.2013.09.031']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
3322,WOS:000329561100024,2014,A comprehensive evaluation of various sensitiv...,RAINFALL-RUNOFF MODELS|IMPROVED CALIBRATION|CO...,sensitivity analysis sa is a commonly used app...,"Gan, Yanjun|Duan, Qingyun|Gong, Wei|Tong, Char...",ENVIRONMENTAL MODELLING & SOFTWARE,uncertainty quantification|sensitivity analysi...,10.1016/j.envsoft.2013.09.031


In [6]:
# SALib: look the reference up by DOI (possibly too recent to be in the corpus?)
corpora_df[corpora_df['DOI'] == '10.21105/joss.00097']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI


In [7]:
# UQLab: look the reference up by DOI (an empty frame means it is not in the corpus)
corpora_df[corpora_df['DOI'] == '10.1061/9780784413609.257']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI


In [8]:
# SAFE: look the reference up by DOI
corpora_df[corpora_df['DOI'] == '10.1016/j.envsoft.2015.04.009']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
12346,WOS:000356741300007,2015,A Matlab toolbox for Global Sensitivity Analysis,IDENTIFICATION|UNCERTAINTIES|MODELS,global sensitivity analysis gsa is increasingl...,"Pianosi, Francesca|Sarrazin, Fanny|Wagener, Th...",ENVIRONMENTAL MODELLING & SOFTWARE,global sensitivity analysis|matlab|octave|open...,10.1016/j.envsoft.2015.04.009


In [9]:
# VARS-TOOL: too recent, so look up a preceding (2016) paper by DOI instead
corpora_df[corpora_df['DOI'] == '10.1002/2015WR017559']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
189,WOS:000373117800026,2016,"A new framework for comprehensive, robust, and...",MODELS,based on the theoretical framework for sensiti...,"Razavi, Saman|Gupta, Hoshin V.",WATER RESOURCES RESEARCH,,10.1002/2015WR017559


In [10]:
# VARS-TOOL: too recent, so look up a preceding (2016) paper by DOI instead
corpora_df[corpora_df['DOI'] == '10.1002/2015WR017558']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
5206,WOS:000373117800025,2016,"A new framework for comprehensive, robust, and...",MODELS,computer simulation models are continually gro...,"Razavi, Saman|Gupta, Hoshin V.",WATER RESOURCES RESEARCH,,10.1002/2015WR017558


In [11]:
# GUI-HDMR: look the reference up by DOI
corpora_df[corpora_df['DOI'] == '10.1016/j.envsoft.2008.12.002']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
4206,WOS:000265341800001,2009,GUI-HDMR - A software tool for global sensitiv...,STREET CANYON MODEL|ENVIRONMENTAL-MODELS|RS-HD...,the high dimensional model representation hdmr...,"Ziehn, T.|Tomlin, A. S.",ENVIRONMENTAL MODELLING & SOFTWARE,global sensitivity analysis|high dimensional m...,10.1016/j.envsoft.2008.12.002


In [18]:
# Jefferson active subspaces paper: look it up by DOI
corpora_df[corpora_df['DOI'] == '10.1016/j.cageo.2015.07.001']

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
12426,WOS:000361400900014,2015,Active subspaces for sensitivity analysis and ...,COMMON LAND MODEL|SURFACE PARAMETERS|ENERGY FL...,integrated hydrologic models coupled to land s...,"Jefferson, Jennifer L.|Gilbert, James M.|Const...",COMPUTERS & GEOSCIENCES,active subspaces|dimension reduction|energy fl...,10.1016/j.cageo.2015.07.001


<hr>
Finding papers that mention the papers/packages of interest in their keywords

In [12]:
# SimLab: search the DOI-filtered collection for records matching "simlab"
simlab_rc = wosis.search_records(
    filtered_corpora,
    ["simlab"],
    threshold=95.0,
)

# Tabulate the matches and preview the first rows
simlab_df = wosis.rc_to_df(simlab_rc)

simlab_df.head()

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
0,WOS:000388157900001,2016,Implementing a composite indicator approach fo...,INDEX|SUSTAINABILITY|PERFORMANCE|MANAGEMENT|TU...,successful implementation of the european urba...,"Sabia, Gianpaolo|De Gisi, Sabino|Farina, Roberto",ECOLOGICAL INDICATORS,composite indicator|municipal wwtps|prioritiza...,10.1016/j.ecolind.2016.06.053
1,WOS:000279410600016,2010,Sensitivity analysis in fuzzy systems: Integra...,REAL-TIME PCR|SOLAR-RADIATION|MODEL|QUANTIFICA...,this work addresses the sensitivity analysis o...,"Foscarini, F.|Bellocchi, G.|Confalonieri, R.|S...",ENVIRONMENTAL MODELLING & SOFTWARE,dana-flsa|fuzzy logic|genetically modified org...,10.1016/j.envsoft.2010.03.024
2,WOS:000238960100008,2006,Variance-based sensitivity analysis of the pro...,STABILITY MODEL|UNSATURATED SOILS|UNCERTAINTY|...,analysis of the sensitivity of predictions of ...,"Hamm, N. A. S.|Hall, J. W.|Anderson, M. G.",COMPUTERS & GEOSCIENCES,site investigation|slope stability analysis|st...,10.1016/j.cageo.2005.10.007
3,WOS:000408861800155,2017,Improving Thermal Comfort of Low-Income Housin...,TROPICAL HUMID REGION|BUILDINGS|STANDARDS|ADAP...,in thailand the delivery of adequate lowincome...,"Bhikhoo, Nafisa|Hashemi, Arman|Cruickshank, He...",SUSTAINABILITY,thermal comfort|low income housing|thailand|tr...,10.3390/su9081440
4,WOS:000274350400010,2010,Sensitivity analysis of the rice model WARM in...,FLOODED RICE|YIELD|SIMULATE|WATER,sensitivity analysis studies how the variation...,"Confalonieri, Roberto|Bellocchi, Gianni|Tarant...",ENVIRONMENTAL MODELLING & SOFTWARE,aboveground biomass|morris method|simlab|simul...,10.1016/j.envsoft.2009.10.005


In [13]:
# DAKOTA: search the DOI-filtered collection for records matching "DAKOTA"
# NOTE(review): the previewed hits (e.g. switchgrass biomass, embankment dam
# breach) do not look related to the DAKOTA toolkit - possibly matches on the
# place name; verify before relying on this result set.
DAKOTA_rc = wosis.search_records(
    filtered_corpora,
    ["DAKOTA"],
    threshold=95.0,
)

# Tabulate the matches and preview the first rows
DAKOTA_df = wosis.rc_to_df(DAKOTA_rc)

DAKOTA_df.head()

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
0,WOS:000207576300010,2008,Switchgrass Biomass Simulation at Diverse Site...,,the agricultural land management alternatives ...,"Kiniry, J. R.|Schmer, M. R.|Vogel, K. P.|Mitch...",BIOENERGY RESEARCH,biofuel|degree days|leaf area index,10.1007/s12155-008-9024-8
1,WOS:000220980100002,2004,Uncertainty of predictions of embankment dam b...,OUTFLOW,risk assessment studies considering the failur...,"Wahl, TL",JOURNAL OF HYDRAULIC ENGINEERING-ASCE,dam failure|uncertainty analysis|peak flow|ero...,10.1061/(ASCE)0733-9429(2004)130:5(389)
2,WOS:000377473400008,2016,Cost comparison of syngas production from natu...,GTL,underground coal gasification ucg is a promisi...,"Pei, Peng|Korom, Scott F.|Ling, Kegang|Nasah, ...",MITIGATION AND ADAPTATION STRATEGIES FOR GLOBA...,syngas|underground coal gasification|cost comp...,10.1007/s11027-014-9588-x
3,WOS:000374807600014,2016,Towards uncertainty quantification and paramet...,EQUIFINALITY,componentbased modeling frameworks make it eas...,"Peckham, Scott D.|Kelbert, Anna|Hill, Mary C.|...",COMPUTERS & GEOSCIENCES,model uncertainty|modeling frameworks|componen...,10.1016/j.cageo.2016.03.005
4,WOS:000258519700024,2008,Bayesian dynamic modelling for nonstationary h...,NORTH-ATLANTIC OSCILLATION|ATMOSPHERIC CIRCULA...,forecasting of hydrologic time series with the...,"Kumar, D. Nagesh|Maity, Rajib",HYDROLOGICAL PROCESSES,bayesian dynamic models|nonstationarity|foreca...,10.1002/hyp.6951


In [20]:
# Sandia: search the DOI-filtered collection for records matching "sandia"
sandia_rc = wosis.search_records(filtered_corpora, ["sandia"], threshold=95.0)

# Convert the collection created just above. The earlier code passed
# `Sandia_rc` (capital S), a name not assigned in the cells shown here, so
# the cell raised NameError on a fresh kernel (Restart & Run All).
sandia_df = wosis.rc_to_df(sandia_rc)

sandia_df.head()

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
0,WOS:000256856000010,2008,Multivariate significance testing and model ca...,COMPUTATIONAL MODELS|COMPUTER-MODELS|VALIDATIO...,the importance of modeling and simulation in t...,"McFarland, John|Mahadevan, Sankaran",COMPUTER METHODS IN APPLIED MECHANICS AND ENGI...,model validation|multivariate statistics|signi...,10.1016/j.cma.2007.05.030
1,WOS:000257094800005,2008,Analytical risk-based model of gaseous and liq...,SENSITIVITY-ANALYSIS|SOIL|DIFFUSION,an analytical model of gaseous and liquidphase...,"Ho, Clifford K.",ENVIRONMENTAL MODELLING & SOFTWARE,radon|landfill|multiphase|transport|radium|pro...,10.1016/j.envsoft.2008.01.002
2,WOS:000343415200006,2013,UNCERTAINTY IN THE DEVELOPMENT AND USE OF EQUA...,,in this paper we present the results from a se...,"Weirs, V. Gregory|Fabian, Nathan|Potter, Krist...",INTERNATIONAL JOURNAL FOR UNCERTAINTY QUANTIFI...,materials|uncertainty quantification|represent...,10.1615/Int.J.UncertaintyQuantification.201200...
3,WOS:000256856000013,2008,Formulation of the static frame problem,,this report describes a static framework valid...,"Babuska, I.|Nobile, F.|Tempone, R.",COMPUTER METHODS IN APPLIED MECHANICS AND ENGI...,model validation|uncertainty quantification|fa...,10.1016/j.cma.2007.12.010
4,WOS:000243852300003,2007,Control of downward migration of dense nonaque...,ENHANCED AQUIFER REMEDIATION|HETEROGENEOUS AQU...,sand tank experiments have been used to study...,"Jin, Minquan|Hirasaki, George J.|Jackson, Rich...",WATER RESOURCES RESEARCH,,10.1029/2006WR004858


In [21]:
# Write the Sandia matches to 'sandia_papers.csv' (relative path), omitting the index column
sandia_df.to_csv('sandia_papers.csv', index=False)

In [15]:
# UQLab: search the DOI-filtered collection for records matching "uqlab"
uqlab_rc = wosis.search_records(
    filtered_corpora,
    ["uqlab"],
    threshold=95.0,
)

# Tabulate the matches and preview the first rows (empty frame if nothing matched)
uqlab_df = wosis.rc_to_df(uqlab_rc)

uqlab_df.head()

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI


In [16]:
# SALib: search the DOI-filtered collection for records matching "salib"
salib_rc = wosis.search_records(
    filtered_corpora,
    ["salib"],
    threshold=95.0,
)

# Tabulate the matches and preview the first rows (empty frame if nothing matched)
salib_df = wosis.rc_to_df(salib_rc)

salib_df.head()

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI


In [17]:
# MADS: search the DOI-filtered collection for records matching "mads"
# NOTE(review): one previewed hit lists an author named "Madsen" - possibly a
# partial-word match rather than a reference to the MADS package; verify.
mads_rc = wosis.search_records(
    filtered_corpora,
    ["mads"],
    threshold=95.0,
)

# Tabulate the matches and preview the first rows
mads_df = wosis.rc_to_df(mads_rc)

mads_df.head()

Unnamed: 0,id,year,title,keywords,abstract,AU,SO,DE,DOI
0,WOS:000404370900030,2017,High performance in power generation by pressu...,NATURAL SALINITY GRADIENTS|HOLLOW-FIBER MEMBRA...,pressureretarded osmosis pro is a renewable en...,"Sharifan, Hamidreza|Madsen, Henrik T.|Morse, A...",DESALINATION AND WATER TREATMENT,urmia lake|pressure-retarded osmosis|renewable...,10.5004/dwt.2017.20555
1,WOS:000334856200002,2014,Analytical solutions for anomalous dispersion ...,HIGHLY HETEROGENEOUS FORMATIONS|NON-FICKIAN TR...,groundwater flow and transport often occur in ...,"O'Malley, D.|Vesselinov, V. V.",ADVANCES IN WATER RESOURCES,anomalous dispersion|stochastic transport|anal...,10.1016/j.advwatres.2014.02.006


<hr>
Finding papers by author: need less specific search criteria