The goal of petroOne is to ...
You can install petroOne from github with:
# install.packages("devtools")
devtools::install_github("f0nzie/petroOne")
library(petroOne)
my_url <- make_search_url(query = "neural network", how = "any")
my_url
#> [1] "https://www.onepetro.org/search?q=neural+network&peer_reviewed=&published_between=&from_year=&to_year="
get_papers_count(my_url)
#> [1] 3314
# 3284
# 3314
We can send a query where we specify the starting years and the end year. Use the parameters as in the example below.
library(petroOne)
# neural network papers from 1990 to 2000. Exact phrase
my_url <- make_search_url(query = "neural network",
from_year = 1990,
to_year = 1999,
how = "all")
get_papers_count(my_url)
#> [1] 415
# 415
# 510
onepetro_page_to_dataframe(my_url)
#> # A tibble: 10 x 6
#> title_data
#> <chr>
#> 1 Deconvolution Using Neural Networks
#> 2 Neural Network Stacking Velocity Picking
#> 3 Drill-Bit Diagnosis With Neural Networks
#> 4 Seismic Principal Components Analysis Using Neural Networks
#> 5 Neural Networks And Paper Seismic Interpretation
#> 6 First Break Picking Using Neural Networks
#> 7 Artificial Intelligence I Neural Networks In Geophysics
#> 8 Inversion of Seismic Waveforms Using Neural Networks
#> 9 Neural Networks In the Petroleum Industry
#> 10 Reservoir Characterization Using Feedforward Neural Networks
#> # ... with 5 more variables: paper_id <chr>, source <chr>, type <chr>,
#> # year <chr>, author1_data <chr>
We can also get paper by the type of document. In this example we are requesting only "conference-paper" type.
# specify document type = "conference-paper", rows = 1000
my_url <- make_search_url(query = "neural network",
how = "all",
dc_type = "conference-paper",
rows = 1000)
get_papers_count(my_url)
#> [1] 2687
# 2661
# 2687
onepetro_page_to_dataframe(my_url)
#> # A tibble: 1,000 x 6
#> title_data
#> <chr>
#> 1 Deconvolution Using Neural Networks
#> 2 Neural Networks And AVO
#> 3 Neural Network Stacking Velocity Picking
#> 4 Predicting Wax Formation Using Artificial Neural Network
#> 5 Seismic Principal Components Analysis Using Neural Networks
#> 6 Neural Networks And Paper Seismic Interpretation
#> 7 Dynamic Neural Network Calibration of Quartz Transducers
#> 8 Estimation of Welding Distortion Using Neural Network
#> 9 Minimum-variance Deconvolution Using Artificial Neural Networks
#> 10 First Break Picking Using Neural Networks
#> # ... with 990 more rows, and 5 more variables: paper_id <chr>,
#> # source <chr>, type <chr>, year <chr>, author1_data <chr>
In this other example we are requesting for "journal-paper" type of papers.
# specify document type = "journal-paper", rows = 1000
my_url <- make_search_url(query = "neural network",
how = "all",
dc_type = "journal-paper",
rows = 1000)
get_papers_count(my_url)
#> [1] 304
# 303
# 304
onepetro_page_to_dataframe(my_url)
#> # A tibble: 304 x 6
#> title_data
#> <chr>
#> 1 Artificial Neural Networks Identify Restimulation Candidates
#> 2 Drill-Bit Diagnosis With Neural Networks
#> 3 Implicit Approximation of Neural Network and Applications
#> 4 Application of Artificial Neural Network to Pump Card Diagnosis
#> 5 Application of Artificial Neural Networks to Downhole Fluid Analysis
#> 6 Pseudodensity Log Generation by Use of Artificial Neural Networks
#> 7 Neural Network Approach Predicts U.S. Natural Gas Production
#> 8 An Artificial Neural Network Based Relative Permeability Predictor
#> 9 Neural Networks for Predictive Control of Drilling Dynamics
#> 10 Characterize Submarine Channel Reservoirs: A Neural- Network-Based Approach
#> # ... with 294 more rows, and 5 more variables: paper_id <chr>,
#> # source <chr>, type <chr>, year <chr>, author1_data <chr>
First, we need to find what is the total number of papers for a particular query. In this search we want all papers that have exact words "neural network".
my_url <- make_search_url(query = "neural network",
how = "all")
get_papers_count(my_url)
#> [1] 3025
# 3025 @ 200171009 total number of papers
In this example we investigate the type of papers available for a given search. In this case, we want exact match of "neural network" words.
result <- read_onepetro(my_url)
summary_by_doctype(result)
#> # A tibble: 6 x 2
#> name value
#> <chr> <dbl>
#> 1 Conference paper 2687
#> 2 General 4
#> 3 Journal paper 304
#> 4 Media 2
#> 5 Other 5
#> 6 Presentation 23
We see that most numerous papers are from conferences. We will proceed to gran the paper titles of those.
Here is a nother example of summaries. In this case, we want papers that contain the exact words "well test".
library(petroOne)
my_url <- make_search_url(query = "well test",
how = "all")
result <- read_onepetro(my_url)
summary_by_doctype(result)
#> # A tibble: 7 x 2
#> name value
#> <chr> <dbl>
#> 1 Chapter 8
#> 2 Conference paper 9298
#> 3 General 193
#> 4 Journal paper 2529
#> 5 Media 5
#> 6 Other 8
#> 7 Presentation 25
summary_by_publisher(result)
#> # A tibble: 20 x 2
#> name value
#> <chr> <dbl>
#> 1 American Petroleum Institute 42
#> 2 American Rock Mechanics Association 64
#> 3 BHR Group 10
#> 4 Carbon Management Technology Conference 1
#> 5 International Petroleum Technology Conference 364
#> 6 International Society for Rock Mechanics 39
#> 7 International Society of Offshore and Polar Engineers 15
#> 8 NACE International 45
#> 9 National Energy Technology Laboratory 8
#> 10 Offshore Mediterranean Conference 44
#> 11 Offshore Technology Conference 506
#> 12 Oil Industry Journal 14
#> 13 Petroleum Society of Canada 396
#> 14 Pipeline Simulation Interest Group 2
#> 15 Society of Exploration Geophysicists 75
#> 16 Society of Petroleum Engineers 10078
#> 17 Society of Petrophysicists and Well-Log Analysts 209
#> 18 Society of Underwater Technology 12
#> 19 Unconventional Resources Technology Conference 60
#> 20 World Petroleum Congress 77
summary_by_dates(result)
#> # A tibble: 76 x 2
#> name value
#> <chr> <dbl>
#> 1 Since 2017 347
#> 2 Since 2016 913
#> 3 Since 2015 1462
#> 4 Since 2014 2019
#> 5 Since 2013 2530
#> 6 Since 2012 3044
#> 7 Since 2011 3497
#> 8 Since 2010 4023
#> 9 Since 2009 4454
#> 10 Since 2008 4865
#> # ... with 66 more rows
summary_by_publications(result)
#> # A tibble: 575 x 2
#> name value
#> <chr> <dbl>
#> 1 10th North American Conference on Multiphase Technology 1
#> 2 10th World Petroleum Congress 1
#> 3 11th ISRM Congress 1
#> 4 11th World Petroleum Congress 4
#> 5 12th ISRM Congress 1
#> 6 12th International Conference on Multiphase Production Technology 2
#> 7 12th World Petroleum Congress 3
#> 8 13th ISRM International Congress of Rock Mechanics 1
#> 9 13th International Conference on Multiphase Production Technology 1
#> 10 13th World Petroleum Congress 3
#> # ... with 565 more rows
In this other example, we want papers that containg the word "well" or "test".
library(petroOne)
my_url <- make_search_url(query = "well test",
how = "any")
result <- read_onepetro(my_url)
summary_by_doctype(result)
#> # A tibble: 8 x 2
#> name value
#> <chr> <dbl>
#> 1 Chapter 60
#> 2 Conference paper 86778
#> 3 General 932
#> 4 Journal paper 15825
#> 5 Media 9
#> 6 Other 21
#> 7 Presentation 265
#> 8 Standard 95
summary_by_publisher(result)
#> # A tibble: 22 x 2
#> name value
#> <chr> <dbl>
#> 1 American Petroleum Institute 676
#> 2 American Rock Mechanics Association 3851
#> 3 American Society of Safety Engineers 1098
#> 4 BHR Group 221
#> 5 Carbon Management Technology Conference 82
#> 6 International Petroleum Technology Conference 1774
#> 7 International Society for Rock Mechanics 3975
#> 8 International Society of Offshore and Polar Engineers 7408
#> 9 NACE International 7708
#> 10 National Energy Technology Laboratory 21
#> # ... with 12 more rows
summary_by_dates(result)
#> # A tibble: 103 x 2
#> name value
#> <chr> <dbl>
#> 1 Since 2017 3542
#> 2 Since 2016 8690
#> 3 Since 2015 14264
#> 4 Since 2014 19543
#> 5 Since 2013 24213
#> 6 Since 2012 28710
#> 7 Since 2011 32778
#> 8 Since 2010 36993
#> 9 Since 2009 40482
#> 10 Since 2008 43857
#> # ... with 93 more rows
summary_by_publications(result)
#> # A tibble: 823 x 2
#> name value
#> <chr> <dbl>
#> 1 10th ISRM Congress 109
#> 2 10th North American Conference on Multiphase Technology 20
#> 3 10th World Petroleum Congress 82
#> 4 11th ISRM Congress 123
#> 5 11th World Petroleum Congress 74
#> 6 12th ISRM Congress 196
#> 7 12th International Conference on Multiphase Production Technology 31
#> 8 12th World Petroleum Congress 54
#> 9 13th ISRM International Congress of Rock Mechanics 228
#> 10 13th International Conference on Multiphase Production Technology 25
#> # ... with 813 more rows