In [3]:
import requests
import json
import re
import bs4
import time
import numpy as np
import pandas as pd

import sys
from os.path import exists
import signal

import CONFIG

In [4]:
def getBSFromURL(url):
    """Fetch ``url`` and return its body parsed as a BeautifulSoup document.

    The request is sent with ``CONFIG.HEADER`` and a 10-second timeout.

    Raises:
        requests.exceptions.RequestException: re-raised after a short
            diagnostic is printed ("Timeout" for read timeouts,
            "Connection Error" for every other request failure).
    """
    try:
        r = requests.get(url, headers = CONFIG.HEADER, timeout = 10)
        return getBS(r.text)

    # ReadTimeout is a subclass of RequestException, so it must be handled
    # first; listed second it would never be reached.
    except requests.ReadTimeout:
        print("Timeout")
        raise
    except requests.exceptions.RequestException:
        print("Connection Error")
        raise

def getBS(html):
    """Parse an HTML string with the ``html.parser`` backend and return the soup."""
    return bs4.BeautifulSoup(html, 'html.parser')

## Get all Issues from selected decades

We scrape all the information of articles first from the main page of JSTOR.

By default, as on https://www.jstor.org/journal/amereconrevi, only the decade titles are listed at first. Clicking on a decade makes a request to the JSTOR backend to get the full list of the issues within that decade. 

The requests are of the form `https://www.jstor.org/journal/amereconrevi/decade/` + `ID`, where the `ID` is stored in the `data-filter` attribute of the element with class `expand-arrow`.

This returns a json object which contains the HTML element to append in the `ul` element, but we can simply turn them into `soup` objects and extract the link to the issues as well as the issue name, which are the `href` and the `text` of the `"a"` selector, respectively.

In [7]:
# politeness delay between requests, to avoid getting banned
def ImNotRobot(t = 5):
    """Sleep for a random duration drawn uniformly from [t, t + 5) seconds.

    The chosen duration is printed before sleeping.
    """
    shortest, longest = t, t+5
    sleepTime = np.random.uniform(shortest, longest)
    print(f"sleeping {sleepTime} seconds")
    time.sleep(sleepTime)

# tell whether the list-of-issues file already exists
def file(path_to_file):
    """Return True when ``path_to_file`` exists on disk, False otherwise."""
    already_there = exists(path_to_file)
    return already_there


# get the urls that return the list of issues within each requested decade
def getURLinDecade(journal_url, decade_list):
    """Return one "issues in this decade" URL per requested decade.

    The journal landing page is fetched and every ``.expand-arrow`` element
    is inspected: those whose ``data-decade`` attribute (as an int) is in
    ``decade_list`` are kept, and their ``data-filter`` attribute is appended
    to ``{journal_url}/decade/``.
    """
    landing_page = getBSFromURL(journal_url)
    decade_arrows = landing_page.select(".expand-arrow")

    wanted_arrows = [
        arrow for arrow in decade_arrows
        if int(arrow['data-decade']) in decade_list
    ]

    return [f"{journal_url}/decade/{arrow['data-filter']}" for arrow in wanted_arrows]

# go over the urls and get the url for all issues

def handleIssueText(t):
    """Return the text before the first 'pp.' with surrounding whitespace removed."""
    label, _sep, _pages = t.partition('pp.')
    return label.strip()
    

    
def getAllIssuesInDecade(url):
    """Return the issues listed behind a decade URL.

    The response body is decoded as JSON and its first element is parsed as
    an HTML fragment; every ``<a>`` in that fragment becomes one record.

    Returns:
        list[dict]: one ``{'name': ..., 'url': ...}`` dict per link, where
        ``name`` is the link text cleaned by ``handleIssueText`` and ``url``
        is the link's ``href``.
    """
    print ("processing " + url)
    # Same 10-second timeout as getBSFromURL, so a stalled connection cannot
    # hang the notebook indefinitely.
    issue_request = requests.get(url, headers = CONFIG.HEADER, timeout = 10)

    issue_html = json.loads(issue_request.text)[0]
    soup = getBS(issue_html)

    return [
        {
            'name':handleIssueText(issue.text),
            'url':issue['href']
        }
        for issue in soup.select("a")
    ]



In [8]:
all_journal_file_name = CONFIG.JOURNAL_NAME + '_all_issue.csv'

# The issue list is built only once: an existing file is treated as a cache
# and left untouched.
if not exists(all_journal_file_name):
    journal_url = CONFIG.URL
    URLinDecade = getURLinDecade(journal_url, CONFIG.SCRAPE_DECADES)

    allIssues = []
    for u in URLinDecade:
        ImNotRobot()
        allIssues += getAllIssuesInDecade(u)

    all_issues_df = pd.json_normalize(allIssues)
    # 'scraped' is set to 1 later, once an issue's articles have been saved.
    all_issues_df['scraped'] = 0
    # newline='' lets the csv writer control line endings itself, as pandas
    # asks for when it is handed an open file object.
    with open(all_journal_file_name, 'w', newline='') as fout:
        all_issues_df.to_csv(fout, header=True, index=False)
        

## Handling allIssues

We want to create a csv file, or xlsx file, that has the following column names


In [87]:
# Fixed leading columns of the article table, in output order.
colNames = [
    "Source URL", "Title",
    "Long Volume", "Issue Vol.", "Issue No.", "Month", "Year",
    "Abstract",
]
# + Author List

I stored the results for the issues in another file

In [6]:
def getArticles(url):
    """Fetch an issue page and return its title plus its author elements.

    Returns:
        tuple: ``(issue_name, articlesWithAuthor)`` - the stripped text of
        the first ``div.issue`` element and the list of every ``div.contrib``
        element on the page.

    Raises:
        Blocked.BlockedError: when the page has no ``div.issue`` element.
    """
    issueBS = getBSFromURL(url)

    issue_headers = issueBS.select('div.issue')
    if len(issue_headers) == 0:
        # imported lazily: only needed on this failure path
        import Blocked
        raise Blocked.BlockedError("You might be blocked")

    return issue_headers[0].text.strip(), issueBS.select('div.contrib')

def parseIssue(t):
    """Split an issue label into volume, number, month and year.

    Two layouts are recognised:

    * ``Vol. 77, No. 4, Jul., 2009`` - month and year are separate comma fields
    * ``Vol. 87, No. 4, July 2019``  - month and year share the third field

    In the second layout the year is the last whitespace-separated token of
    the date field, so a multi-token month such as ``Sep. - Nov. 1975`` keeps
    the whole range as the month, and repeated spaces are tolerated.

    Returns:
        tuple: ``(t, vol, no, month, year)``; ``t`` is the unmodified label
        and the other items are stripped strings.

    Raises:
        ValueError: if the label has fewer than three comma-separated fields,
            or the date field of the second layout has no separate year.
    """
    separated = [part.strip() for part in t.split(',')]
    if len(separated) < 3:
        raise ValueError(f"Unrecognised issue label: {t!r}")

    vol, no = separated[0], separated[1]

    ## Vol. 77, No. 4, Jul., 2009
    if len(separated) == 4:
        month, year = separated[2], separated[3]

    ##  Vol. 87, No. 4, July 2019
    else:
        # rsplit on any whitespace, once, from the right: the year is the
        # final token, whatever the month part looks like
        date = separated[2].rsplit(None, 1)
        if len(date) != 2:
            raise ValueError(f"Cannot find month and year in issue label: {t!r}")
        month, year = date
    return t, vol, no, month, year

def parseAuthor(a):
    """Split a raw author string into individual names.

    Names are separated on "and" (optionally preceded by a comma, so the
    serial-comma form "A, B, and C" works) and on commas, except a comma that
    is directly followed by "Jr.", which is kept as part of the name.

    Returns:
        list: the raw string ``a`` followed by the stripped names, padded
        with ``None`` up to 30 name slots. More than 30 names are not
        truncated, so such a row is longer than the others.
    """
    authors = re.split(r',?\s+and\s+|,(?!\s*Jr\.)\s*', a)
    split_authors = [e.strip() for e in authors]

    # pad so that every row has the same number of author columns
    split_authors += [None]*(30-len(split_authors))
    return [a]+ split_authors

In [11]:
# Reload the issue list and keep only the issues that still need scraping,
# so an interrupted run can be resumed by re-running this cell.
with open(all_journal_file_name) as f:
    all_issues_df = pd.read_csv(f)
needed_issues = all_issues_df[all_issues_df['scraped'] ==0 ]
display(needed_issues)

all_articles_file_name = CONFIG.JOURNAL_NAME + "_orig.csv"


counter = 1
for index, issue in needed_issues.iterrows():
    url = CONFIG.DOMAIN_URL + issue['url']
    try:
        issue_name, articlesWithAuthor = getArticles(url)
        print(f"Processing : {counter}/{len(needed_issues)} \t {issue_name} ...")

        full_vol, vol, no, month, year = parseIssue(issue_name)

        tempArticles = []
        for article in articlesWithAuthor:
            # `article` is the author element; the title link is looked up
            # in its parent element
            article_element = article.parent
            article_link = article_element.find('a')
            article_title = article_link.text.strip()
            article_url = CONFIG.DOMAIN_URL + article_link['href']
            article_authors = parseAuthor( article.text.strip() )

            tempArticles.append([
                article_url,
                article_title,
                full_vol, vol, no, month, year,
                ''   # abstract placeholder
            ] +
            article_authors)
            print("Article Name  :  " + article_title)

        ## save the articles first: if this write fails the issue stays
        ## unscraped and is retried on the next run instead of being lost
        with open(all_articles_file_name, 'a', newline='') as article_f:
            tempDF = pd.DataFrame(tempArticles)
            tempDF.to_csv(article_f,
                                header=False,
                                index=False)

        ## only now mark the issue as done and persist the progress
        all_issues_df.loc[index, 'scraped'] = 1
        with open(all_journal_file_name, 'w', newline='') as issue_f:
            all_issues_df.to_csv(issue_f,
                                 header=True,
                                 index=False)

        print("="*30)
        # take a long break every 50 issues, on top of the usual short one
        if counter % 50 == 0 :
            ImNotRobot(120)
        counter += 1
        ImNotRobot()

    except Exception as e:
        # stop at the first failure, but keep the traceback visible instead
        # of exiting with a success status
        print(f"Stopped at {url}: {e}")
        raise

Unnamed: 0,name,url,scraped
115,"No. 5 Sep., 2000",/stable/10.2307/i353369,0
116,"No. 4 Jul., 2000",/stable/10.2307/i353368,0
117,"No. 3 May, 2000",/stable/10.2307/i353367,0
118,"No. 2 Mar., 2000",/stable/10.2307/i353366,0
119,"No. 1 Jan., 2000",/stable/10.2307/i353365,0
...,...,...,...
373,"No. 1 Jan., 1951",/stable/10.2307/i332597,0
374,"No. 4 Oct., 1950",/stable/10.2307/i332596,0
375,"No. 3 Jul., 1950",/stable/10.2307/i332530,0
376,"No. 2 Apr., 1950",/stable/10.2307/i332592,0


Processing : 1/263 	 Vol. 68, No. 5, Sep., 2000 ...
Article Name  :  Capital-Skill Complementarity and Inequality: A Macroeconomic Analysis
Article Name  :  GMM with Weak Identification
Article Name  :  A Reality Check for Data Snooping
Article Name  :  A Simple Adaptive Procedure Leading to Correlated Equilibrium
Article Name  :  Sticky Price Models of the Business Cycle: Can the Contract Multiplier Solve the Persistence Problem?
Article Name  :  A Noncooperative Model of Network Formation
Article Name  :  Genericity and Markovian Behavior in Stochastic Games
Article Name  :  Nonstationary Binary Choice
Article Name  :  Risk Aversion and Expected-Utility Theory: A Calibration Theorem
sleeping 8.630801361618389 seconds
Processing : 2/263 	 Vol. 68, No. 4, Jul., 2000 ...
Article Name  :  Efficiency, Equilibrium, and Asset Pricing with Risk of Default
Article Name  :  Competing Mechanisms in a Common Value Environment
Article Name  :  Panel Data Discrete Choice Models with Lagged Depende

Processing : 12/263 	 Vol. 66, No. 6, Nov., 1998 ...
Article Name  :  Efficient Intra-Household Allocations: A General Characterization and Empirical Tests
Article Name  :  The Noah's Ark Problem
Article Name  :  New Tools for Understanding Spurious Regressions
Article Name  :  Bootstrap Methods for Median Regression Models
Article Name  :  Efficiency and Voluntary Implementation in Markets with Repeated Pairwise Bargaining
Article Name  :  Inference on Structural Parameters in Instrumental Variables Regression with Weak Instruments
Article Name  :  Impartiality: Definition and Representation
Article Name  :  Strict Single Crossing and the Strict Spence-Mirrlees Condition: A Comment on Monotone Comparative Statics
sleeping 5.575605531546453 seconds
Processing : 13/263 	 Vol. 66, No. 5, Sep., 1998 ...
Article Name  :  Characterizing Selection Bias Using Experimental Data
Article Name  :  Short Run and Long Run Causality in Time Series: Theory
Article Name  :  Autoregressive Conditional 

Processing : 22/263 	 Vol. 65, No. 2, Mar., 1997 ...
Article Name  :  Edgeworth's Conjecture with Infinitely many Commodities: L^1
Article Name  :  Prediction, Optimization, and Learning in Repeated Games
Article Name  :  Price Formation in Single Call Markets
Article Name  :  Conditioning and Aggregation of Preferences
Article Name  :  On "Reputation" Refinements with Heterogeneous Beliefs
Article Name  :  The Evolution of Walrasian Behavior
Article Name  :  Report on the Activities of the Australasian Standing Committee of the Econometric Society
sleeping 6.536633133337477 seconds
Processing : 23/263 	 Vol. 65, No. 1, Jan., 1997 ...
Article Name  :  Preferences Over Solutions to the Bargaining Problem
Article Name  :  Rational Asset Pricing Bubbles
Article Name  :  Bayesian Vector Autoregressions with Stochastic Volatility
Article Name  :  A Divisible Search Model of Fiat Money
Article Name  :  Inference Concerning the Number of Factors in a Multivariate Nonparametric Relationship
Ar

Processing : 32/263 	 Vol. 63, No. 4, Jul., 1995 ...
Article Name  :  Ragnar Frisch, Editor of Econometrica 1933-1954
Article Name  :  Back to the Future: Generating Moment Implications for Continuous-Time Markov Processes
Article Name  :  Individual Income, Incomplete Information, and Aggregate Consumption
Article Name  :  Automobile Prices in Market Equilibrium
Article Name  :  Product Differentiation and Oligopoly in International Markets: The Case of the U.S. Automobile Industry
Article Name  :  Econometrics of First-Price Auctions
Article Name  :  Nonlinear Dynamics and Chaos in Optimal Growth: An Example
sleeping 6.381657811614255 seconds
Processing : 33/263 	 Vol. 63, No. 3, May, 1995 ...
Article Name  :  The Existence of Subgame-Perfect Equilibrium in Continuous Games with Almost Perfect Information: A Case for Public Randomization
Article Name  :  Perfect Equilibria in a Negotiation Model
Article Name  :  Renegotiation of Sales Contracts
Article Name  :  Optimal Procurement Me

Processing : 42/263 	 Vol. 61, No. 6, Nov., 1993 ...
Article Name  :  Innovation, Imitation, and Intellectual Property Rights
Article Name  :  Mechanism Design by Competing Sellers
Article Name  :  Bargaining with Deadlines and Imperfect Player Control
Article Name  :  Dynamic Procedures and Incentives in Public Good Economies
Article Name  :  t or 1 - t. That is the Trade-Off
Article Name  :  Vector Autoregressions and Causality
Article Name  :  Engel Functions, Panel Data, and Latent Variables
Article Name  :  Commitment Value of Contracts Under Renegotiation Constraints
sleeping 6.29444026107072 seconds
Processing : 43/263 	 Vol. 61, No. 5, Sep., 1993 ...
Article Name  :  Global Games and Equilibrium Selection
Article Name  :  Rational Learning Leads to Nash Equilibrium
Article Name  :  Learning, Local Interaction, and Coordination
Article Name  :  Indeterminacy of Equilibria in a Hyperinflationary World: Experimental Evidence
Article Name  :  The Organization of Decentralized Infor

Processing : 52/263 	 Vol. 60, No. 2, Mar., 1992 ...
Article Name  :  Nonparametric and Distribution-Free Estimation of the Binary Threshold Crossing and The Binary Choice Models
Article Name  :  The Cusum Test with Ols Residuals
Article Name  :  Household Composition, Labor Markets, and Labor Demand: Testing for Separation in Agricultural Household Models
Article Name  :  A Model of Growth Through Creative Destruction
Article Name  :  Stochastic Differential Utility
Article Name  :  Correlated Information and Mecanism Design
Article Name  :  Integration Versus Trend Stationary in Time Series
Article Name  :  Money and Interest in a Cash-in-Advance Economy: A Corrigendum
Article Name  :  Money and Interest in a Cash-in-Advance Economy: A Reply
Article Name  :  Report of the President
sleeping 9.641547706216867 seconds
Processing : 53/263 	 Vol. 60, No. 1, Jan., 1992 ...
Article Name  :  The Principal-Agent Relationship with an Informed Principal, II: Common Values
Article Name  :  Impl

Processing : 59/263 	 Vol. 59, No. 1, Jan., 1991 ...
Article Name  :  Aggregation and Social Choice: A Mean Voter Theorem
Article Name  :  Aggregation and Imperfect Competition: On the Existence of Equilibrium
Article Name  :  Lexicographic Probabilities and Choice Under Uncertainty
Article Name  :  Lexicographic Probabilities and Equilibrium Refinements
Article Name  :  The Optimality of Boiteux-Ramsey Pricing
Article Name  :  Monotonic Preferences and Core Equivalence
Article Name  :  Mixture Symmetry and Quadratic Utility
Article Name  :  Segmented or Competitive Labor Markets
Article Name  :  Job Exit Behavior of Older Men
Article Name  :  A Continuous Time Approximation to the Unstable First-Order Autoregressive Process: The Case Without an Intercept
Article Name  :  Solution to a Problem of Stochastic Process Switching
Article Name  :  Stochastic Process Switching: Some Simple Solutions
Article Name  :  Report of the Secretary
Article Name  :  Report of the Treasurer
Article Name

Processing : 67/263 	 Vol. 57, No. 5, Sep., 1989 ...
Article Name  :  A Method of Simulated Moments for Estimation of Discrete Response Models Without Numerical Integration
Article Name  :  Simulation and the Asymptotics of Optimization Estimators
Article Name  :  Power in Econometric Applications
Article Name  :  Seminonparametric Estimation of Conditionally Constrained Heterogeneous Processes: Asset Pricing Applications
Article Name  :  A Test of the Efficiency of a Given Portfolio
Article Name  :  Expectation and Variation in Multi-Period Decisions
Article Name  :  Extensive Form Games in Continuous Time: Pure Strategies
Article Name  :  Occupational Choice under Uncertainty When Experience Is a Determinant of Earnings
Article Name  :  Sampling Performance of Some Joint One-Sided Preliminary Test Estimators under Squared Error Loss
Article Name  :  Job Matching, Coalition Formation, and Gross Substitutes
sleeping 9.561697800010528 seconds
Processing : 68/263 	 Vol. 57, No. 4, Jul., 

Processing : 76/263 	 Vol. 56, No. 2, Mar., 1988 ...
Article Name  :  Efficiency Wages and the Inter-Industry Wage Structure
Article Name  :  Road Damage Externalities and Road User Charges
Article Name  :  An Econometric Analysis of Fluctuations in Aggregate Labor Supply and Demand
Article Name  :  Intertemporal Preferences and Labor Supply
Article Name  :  The Second Welfare Theorem with Nonconvex Preferences
Article Name  :  On the Theory of Infinitely Repeated Games with Discounting
Article Name  :  Finite Rationality and Interpersonal Complexity in Repeated Games
Article Name  :  Optimal Time-Consistent Fiscal Policy with Finite Lifetimes
Article Name  :  Conditions for Identification in Nonparametric and Parametric Models
Article Name  :  Managerial Task Assignment and Promotions
Article Name  :  Analytic Derivatives for Estimation of Discrete-Time, Linear-Quadratic, Dynamic, Optimization Models
Article Name  :  A General Approach to the Arbitrage Pricing Theory (APT)
Article Nam

Processing : 83/263 	 Vol. 55, No. 1, Jan., 1987 ...
Article Name  :  Correlated Equilibrium as an Expression of Bayesian Rationality
Article Name  :  Macroeconomic Planning and Disequilibrium: Estimates for Poland, 1955-1980
Article Name  :  Flexible Functional Forms and Global Curvature Conditions
Article Name  :  Posterior Implementability in a Two-Person Decision Problem
Article Name  :  The Dual Theory of Choice under Risk
Article Name  :  An Intertemporal General Equilibrium Asset Pricing Model: The Case of Diffusion Information
Article Name  :  Proper Risk Aversion
Article Name  :  Distributions of Preferences and the "Law of Demand"
Article Name  :  Intransitive Indifference and Revealed Preference
Article Name  :  Monetary Uncertainty and Investment in an Optimizing, Rational Expectations Model with Income Taxes and Government Debt
Article Name  :  Report of the Secretary
Article Name  :  Report of the Treasurer
Article Name  :  Report of the Editors
Article Name  :  Econometr

Processing : 90/263 	 Vol. 53, No. 6, Nov., 1985 ...
Article Name  :  The Econometrics of Nonlinear Budget Sets
Article Name  :  Strong Core Theorems with Nonconvex Preferences
Article Name  :  An Axiomatization of Harsanyi's Nontransferable Utility Solution
Article Name  :  Continuous Auctions and Insider Trading
Article Name  :  Implementing Arrow-Debreu Equilibria by Continuous Trading of Few Long-Lived Securities
Article Name  :  The First-Order Approach to Principal-Agent Problems
Article Name  :  General Equilibrium when Some Firms Follow Special Pricing Rules
Article Name  :  The Variability of Aggregate Demand with (S, s) Inventory Policies
Article Name  :  Conditions for the Existence of a Balance Growth Solution for the Leontief Dynamic Input-Output Model
Article Name  :  The Global Properties of the Minflex Laurent, Generalized Leontief, and Translog Flexible Functional Forms
Article Name  :  Poverty Measurement: A Decomposition of the Normalization Axiom
Article Name  :  No

Processing : 97/263 	 Vol. 52, No. 5, Sep., 1984 ...
Article Name  :  The Costs of Substitution
Article Name  :  Bertrand Equilibrium with Capacity Constraints and Restricted Mobility
Article Name  :  Payoffs in Nonatomic Economies: An Axiomatic Approach
Article Name  :  Effectivity Functions and Acceptable Game Forms
Article Name  :  Implementing Efficient Egalitarian Equivalent Allocations
Article Name  :  Nonmyopic Strategic Behavior in the MDP Planning Procedure
Article Name  :  Investment in Human and Nonhuman Capital, Transfers Among Siblings, and the Role of Government
Article Name  :  The Returns to Schooling: A Selectivity Bias Approach with a Continuous Choice Variable
Article Name  :  Specification Tests for the Multinomial Logit Model
Article Name  :  Testing for Unit Roots: 2
Article Name  :  Approximation to the Finite Sample Distribution for Nonstable First Order Stochastic Difference Equations
Article Name  :  Model Selection when There is "Minimal" Prior Information
Ar

Processing : 104/263 	 Vol. 51, No. 4, Jul., 1983 ...
Article Name  :  Regularity and Index Theory for Economies with Smooth Production Technologies
Article Name  :  On the Informational Size of Message Spaces for Efficient Resource Allocation Processes
Article Name  :  Large Indivisibles: An Analysis with Respect to Price Equilibrium and Fairness
Article Name  :  Equilibrium Price Dispersion
Article Name  :  Price Responsiveness and Market Conditions
Article Name  :  Equilibrium Limit Pricing: The Effects of Private Information and Stochastic Demand
Article Name  :  On the "Law of Demand"
Article Name  :  On State Dependent Preferences and Subjective Probabilities
Article Name  :  Collective Probabilistic Judgements
Article Name  :  Endogenous Formation of Coalitions
Article Name  :  A Generalization of the Quasilinear Mean with Applications to the Measurement of Income Inequality and Decision Theory Resolving the Allais Paradox
Article Name  :  The Influence of Classification and Obs

Processing : 110/263 	 Vol. 50, No. 4, Jul., 1982 ...
Article Name  :  Inflation, Tax Rules and Investment: Some Econometric Evidence
Article Name  :  Sequential Equilibria
Article Name  :  The Determination of Marginal Cost Prices under a Set of Axioms
Article Name  :  Regulating a Monopolist with Unknown Costs
Article Name  :  Acyclic Collective Choice Rules
Article Name  :  The Nonparametric Approach to Demand Analysis
Article Name  :  On the Transversality Condition in Infinite Horizon Optimal Problems
Article Name  :  Autoregressive Conditional Heteroscedasticity with Estimates of the Variance of United Kingdom Inflation
Article Name  :  Evaluation of the Distribution Function of the Limited Information Maximum Likelihood Estimator
Article Name  :  Large Sample Properties of Generalized Method of Moments Estimators
Article Name  :  An Investigation of the Robustness of the Tobit Estimator to Non-Normality
Article Name  :  Note on Estimating Linear Trend when Residuals are Autocorr

Processing : 116/263 	 Vol. 49, No. 4, Jul., 1981 ...
Article Name  :  The Classical Theorem on Existence of Competitive Equilibrium
Article Name  :  Intergenerational Transfers and the Distribution of Earnings
Article Name  :  Equity Oriented Fiscal Programs
Article Name  :  Utilitarianism, Egalitarianism, and the Timing Effect in Social Choice Problems
Article Name  :  k-Monotone Social Decision Functions and the Veto
Article Name  :  Risk Aversion with Random Initial Wealth
Article Name  :  Rational Expectations, Information Acquisition, and Competitive Bidding
Article Name  :  Fixed Costs and Labor Supply
Article Name  :  Individual Effects in a Nonlinear Model: Explicit Treatment of Heterogeneity in the Empirical Job-Search Model
Article Name  :  A Disaggregate Model of the Demand for Intercity Freight Transportation
Article Name  :  Stochastic Properties of Fast vs. Slow Growing Economies
Article Name  :  Exact Density Functions and Approximate Critical Regions for Likelihood Rat

Processing : 122/263 	 Vol. 48, No. 5, Jul., 1980 ...
Article Name  :  Manual for Econometrica Authors
Article Name  :  Sufficient Linear Structures: Econometric Applications
Article Name  :  Approximating a Truncated Normal Regression with the Method of Moments
Article Name  :  Some Approximations to the Distribution of Econometric Criteria which are Asymptotically Distributed as Chi-Squared
Article Name  :  Inferential Procedures in Stable Distributions for Class Frequency Data on Incomes
Article Name  :  Advertising and Aggregate Consumption: An Analysis of Causality
Article Name  :  Deterministic Models for Production of Services with Stochastic Technology
Article Name  :  Industry Structure and Cost-Reducing Investment
Article Name  :  An Index Theorem for General Equilibrium Models with Production
Article Name  :  Regeneration, Public Goods, and Economic Growth
Article Name  :  Equity Among Generations
Article Name  :  Nash Equilibria and Pareto Optimal Income Redistribution
Arti

Processing : 127/263 	 Vol. 47, No. 6, Nov., 1979 ...
Article Name  :  The Impossibility of Bayesian Group Decision Making with Separate Aggregation of Beliefs and Values
Article Name  :  Dominance Solvable Voting Schemes
Article Name  :  Sequences of Games with Varying Opponents
Article Name  :  Synopses in the Theory of Choice
Article Name  :  On Multivariate Risk Aversion
Article Name  :  Expectations and Money in a Dynamic Exchange Model
Article Name  :  The Ergodic Behavior of Stochastic Processes of Economic Equilibria
Article Name  :  Capital Accumulation on the Transition Path in a Monetary Optimizing Model
Article Name  :  The Estimation of Partial Adjustment Models with Rational Expectations
Article Name  :  Expectational Consistency, Informational Lags, and the Formulation of Expectations in Continuous Time Models
Article Name  :  Investors' Portfolio Behavior under Alternative Models of Long-Term Interest Rate Expectations: Unitary, Rational, or Autoregressive
Article Name 

Processing : 132/263 	 Vol. 47, No. 1, Jan., 1979 ...
Article Name  :  The Empirical Foundations of the Phillips Curve: Evidence from Canadian Wage Contract Data
Article Name  :  The Optimal Exploitation of Renewable Resource Stocks: Problems of Irreversible Investment
Article Name  :  A Procedure for Generating Pareto-Efficient Egalitarian-Equivalent Allocations
Article Name  :  Incentive Compatibility and the Bargaining Problem
Article Name  :  On Interpersonal Comparability and Social Welfare Orderings
Article Name  :  Dynamic Choice Theory and Dynamic Programming
Article Name  :  Lead-Lag Relations, Exogeneity and Prediction of Economic Time Series
Article Name  :  Efficiency of Least-Squares Estimation of Linear Trend when Residuals Are Autocorrelated
Article Name  :  Maximum Likelihood Estimation of Stochastic Linear Difference Equations with Autoregressive Moving Average Errors
Article Name  :  Sample Selection Bias as a Specification Error
Article Name  :  Evaluation of the Dis

Processing : 138/263 	 Vol. 46, No. 1, Jan., 1978 ...
Article Name  :  Bayesian Estimates of Equation System Parameters: An Application of Integration by Monte Carlo
Article Name  :  Approximating the Exact Finite Sample Distribution of a Spectral Estimator
Article Name  :  Regression Quantiles
Article Name  :  A Maximum Likelihood Procedure for Regression with Autocorrelated Errors
Article Name  :  Testing for Autocorrelation with Missing Observations
Article Name  :  On the Pooling of Time Series and Cross Section Data
Article Name  :  The Bilinear Complementarity Problem and Competitive Equilibria of Piecewise Linear Economic Models
Article Name  :  Wage and Price Controls in a Dynamic Macro Model
Article Name  :  Approximate Efficiency of Non-Walrasian Nash Equilibria
Article Name  :  Induced Preferences on Trades when Preferences May Be Intransitive and Incomplete
Article Name  :  A Note on the Characterization of Mechanisms for the Revelation of Preferences
Article Name  :  Consi

Processing : 143/263 	 Vol. 45, No. 4, May, 1977 ...
Article Name  :  Optimal Allocation of Public Goods: A Solution to the "Free Rider" Problem
Article Name  :  Necessary and Sufficient Conditions for a Pareto Optimum in Convex Programming
Article Name  :  Economic Environments for which there are Pareto Satisfactory Mechanisms
Article Name  :  A Two-Person Exchange Model
Article Name  :  Maximin Paths of Heterogeneous Capital Accumulation and the Instability of Paradoxical Steady States
Article Name  :  Social Decision Functions and the Veto
Article Name  :  On Preferences, Beliefs, and Manipulation within Voting Situations
Article Name  :  The Existence of Choice Functions
Article Name  :  A Matrix Measure of Multivariate Local Risk Aversion
Article Name  :  Linear Quadratic Control Theory for Models with Long Lags
Article Name  :  Social Experimentation, Truncated Distributions, and Efficient Estimation
Article Name  :  Some Properties of a Modification of the Limited Information E

Processing : 148/263 	 Vol. 44, No. 5, Sep., 1976 ...
Article Name  :  Turnpike Theory
Article Name  :  Optimal Growth in a Putty-Clay Model
Article Name  :  The Specification of Adaptive Expectations in Continuous Time Dynamic Economic Models
Article Name  :  A Non-Tâtonnement Model with Production and Consumption
Article Name  :  Limit Pricing, Uncertain Entry, and the Entry Lag
Article Name  :  Input-Output Analysis with Scale-Dependent Coefficients
Article Name  :  A Function for Size Distribution of Incomes
Article Name  :  The Demand Theory of the Weak Axiom of Revealed Preference
Article Name  :  Community Preferences and the Representative Consumer
Article Name  :  Irrelevant Alternatives and Social Welfare
Article Name  :  Self-Dual Preferences
Article Name  :  Representable Choice Functions
Article Name  :  Bayesian Limited Information Analysis of the Simultaneous Equations Model
Article Name  :  Testing for Serial Correlation in Dynamic Simultaneous Equation Models
Article N

Processing : 153/263 	 Vol. 43, No. 5/6, Sep. - Nov., 1975 ...
Article Name  :  Policy Related Voting and Electoral Equilibrium
Article Name  :  Degrees of Cardinality and Aggregate Partial Orderings
Article Name  :  The Continuity of Majority Rule Equilibrium
Article Name  :  Bounded One-Way Expected Utility
Article Name  :  A Disaggregate Analysis of Consumer Choice under Uncertainty
Article Name  :  An Adaptive Learning Rule for Multiperiod Decision Problems
Article Name  :  The Graph of the Walras Correspondence
Article Name  :  Personal Attributes, Job Performance, and Probability of Promotion
Article Name  :  Note on a Large-Sample Result in Specification Analysis
Article Name  :  Estimation and Hypothesis Testing in Singular Equation Systems with Autoregressive Disturbances
Article Name  :  The Power of the Durbin-Watson Test
Article Name  :  Semiorders and Choice Functions
Article Name  :  Semiorders and the Theory of Choice: A Correction
Article Name  :  Existence of a Continu

Processing : 160/263 	 Vol. 42, No. 4, Jul., 1974 ...
Article Name  :  Marx in the Light of Modern Economic Theory
Article Name  :  Some Remarks on the Core of a "Large" Economy
Article Name  :  The Topology of Pareto-Optimal Regions with Public Goods
Article Name  :  The Capacity of the Smithies Model to Explain the Growth Trend by Endogenous Forces
Article Name  :  Shadow Prices, Market Wages, and Labor Supply
Article Name  :  Impossibility Theorems without the Social Completeness Axiom
Article Name  :  Equilibrium and Stability
Article Name  :  An Experimental Study of Structural Estimators and Test Statistics Associated with Dynamical Econometric Models
Article Name  :  Identifiability in Linear Models
Article Name  :  Asymptotic Minimum-MSE Prediction in the Cobb-Douglas Model with a Multiplicative Disturbance Term
Article Name  :  The Exact Mean of the Two-Stage Least Squares Estimator of the Structural Parameters in an Equation Having Three Endogenous Variables
Article Name  :  

Processing : 166/263 	 Vol. 41, No. 4, Jul., 1973 ...
Article Name  :  Manipulation of Voting Schemes: A General Result
Article Name  :  Transitive Binary Social Choices and Intraprofile Conditions
Article Name  :  Incentives in Teams
Article Name  :  An Econometric Analysis of Fertility in Sweden, 1870-1965
Article Name  :  Choice of Response Functional Form in Designing Subsidy Experiments
Article Name  :  Generalized Costs of Adjustment and Dynamic Factor Demand Theory
Article Name  :  Neo-Classical Technology Sets and Properties of Production Possibility Sets
Article Name  :  Distributions of Estimates of Coefficients of a Single Equation in a Simultaneous System and Their Asymptotic Expansions
Article Name  :  Approximations to the Distribution Functions of Theil's k-Class Estimators
Article Name  :  Generalized Least Squares with an Estimated Autocovariance Matrix
Article Name  :  Alternative Tests of Independence between Stochastic Regressors and Disturbances
Article Name  :  Li

Processing : 172/263 	 Vol. 40, No. 4, Jul., 1972 ...
Article Name  :  Smooth Preferences
Article Name  :  Testing for Fourth Order Autocorrelation in Quarterly Regression Equations
Article Name  :  Fair Net Trades
Article Name  :  The Existence of Moments of the Ordinary Least Squares and Two-Stage Least Squares Estimators
Article Name  :  Finite-Sample Properties of the k-Class Estimators
Article Name  :  A Cost-Inclusive Simultaneous Equation Model of Birth Rates
Article Name  :  Weaker Criteria and Tests for Linear Restrictions in Regression
Article Name  :  Operational Techniques and Tables for Making Weak MSE Tests for Restrictions in Regressions
Article Name  :  A General Formulation of the Lechatelier-Samuelson Principle
Article Name  :  Regression with Non-Gaussian Stable Disturbances: Some Sampling Results
Article Name  :  The Factor-Price Equalization Theorem
Article Name  :  The S-Branch Utility Tree: A Generalization of the Linear Expenditure System
Article Name  :  An Eco

Processing : 175/263 	 Vol. 40, No. 1, Jan., 1972 ...
Article Name  :  Econometrics and Decision Theory
Article Name  :  Information Lost in Aggregation: A Bayesian Approach
Article Name  :  Tatonnement Stability: An Econometric Approach
Article Name  :  Timing of Innovations Under Rivalry
Article Name  :  A Direct Proof of Arrow's Theorem
Article Name  :  Stochastic Implications of Orbital Asymptotic Stability of a Nonlinear Trade Cycle Model
Article Name  :  More Stochastic Properties of the Klein-Goldberger Model
Article Name  :  Upper Hemi-Continuity of the Equilibrium-Set Correspondence for Pure Exchange Economies
Article Name  :  Population and Optimal Growth
Article Name  :  Indices Prospectifs Quantitatifs et Procedures Decentralisees d'Elaboration des Plans
Article Name  :  Social Preference Orderings and Majority Rule
Article Name  :  A Study of the Production Structure of the Indian Economy: An International Comparison
Article Name  :  A Mean Demand Function and Individual D

KeyboardInterrupt: 

## Filter Unwanted Articles

Some articles containing words like 
* Report on
* Report of
* annual report
don't have abstracts, and I exclude them

Also, there are 'Book Reviews', for which the author field has the form 'Review by: ...'; these are excluded as well.

In [64]:
# The articles file has no header row: column 1 is the article title and
# column 8 is the raw author string.
arts = pd.read_csv(all_articles_file_name, header = None)
print(len(arts))
exclude_words = ['Report of','Report on', 'Annual Reports','Criticism Invited']
# na=False: a row with an empty title / author cell counts as "no match"
# instead of putting NaN into the boolean mask
dont_need = (arts[1].str.contains('|'.join(exclude_words),regex=True, case=False, na=False) |
            arts[8].str.contains('Review by:', na=False))
print("Articles to exclude : "+ str(dont_need.sum()))

articles_remain = arts[~dont_need]

## save the rows we don't need into another file
arts[dont_need].to_csv('ECA_skipped.csv',index = False, header = False)

5713
Articles to exclude : 1110


We add the column name and create a new file with it

In [93]:
# Every column after the 8 fixed ones gets a numbered "Author N" label.
# NOTE(review): parseAuthor puts the raw, unsplit author string first, so
# "Author 1" may label that raw string rather than the first name - confirm.
total_column_number = articles_remain.shape[1]
print(total_column_number)

col_name_with_author = list(colNames)
col_name_with_author.extend(f"Author {n}" for n in range(1, total_column_number - 7))

38


In [None]:
# articles_remain.columns = col_name_with_author
# articles_remain['scraped'] = [0]*len(articles_remain)
# articles_remain.to_csv(f'{CONFIG.JOURNAL_NAME}.csv', index = False)