In [1]:
#Problem Identification
##Given factors that include the legal issue and the identity of the Supreme Court Justice, this project will model and predict how each Justice will vote on future legal issues. The Justice's vote is the target variable. This model may guide law firms and public policy groups in making litigation decisions.

In [2]:
#Import pandas, matplotlib.pyplot, seaborn, and os
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import os



In [3]:
# Load the SCDB justice-centered / legal-provision CSV; the path is relative,
# so the file must sit in the notebook's working directory.
df = pd.read_csv(
    'SCDB_2021_01_justiceCentered_LegalProvision.csv',
)


In [4]:

# Print a summary of the freshly loaded frame: index range, column names,
# non-null counts, and dtypes.
df.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 122088 entries, 0 to 122087
Data columns (total 61 columns):
 #   Column                    Non-Null Count   Dtype  
---  ------                    --------------   -----  
 0   caseId                    122088 non-null  object 
 1   docketId                  122088 non-null  object 
 2   caseIssuesId              122088 non-null  object 
 3   voteId                    122088 non-null  object 
 4   dateDecision              122088 non-null  object 
 5   decisionType              122088 non-null  int64  
 6   usCite                    117561 non-null  object 
 7   sctCite                   122088 non-null  object 
 8   ledCite                   122072 non-null  object 
 9   lexisCite                 122088 non-null  object 
 10  term                      122088 non-null  int64  
 11  naturalCourt              122088 non-null  int64  
 12  chief                     122088 non-null  object 
 13  docket                    121809 non-null  o

In [5]:
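#This step selects the columns that are relevant to the analysis and limits the rows to those recorded for Justice Roberts (justiceName == 'JGRoberts'). Note that this keeps only Roberts' own rows, not the rows of every justice who sat on the Roberts Court.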

In [6]:
# Names of the 25 columns kept for the analysis. The order of this list is the
# column order of the frame produced when df is indexed with it.
cols_to_subset = [
    'caseId', 'sctCite', 'caseName', 'chief',
    'issue', 'issueArea', 'decisionDirection', 'authorityDecision1',
    'lawType', 'lawSupp', 'lawMinor',
    'decisionType', 'caseDisposition', 'caseDispositionUnusual',
    'partyWinning', 'precedentAlteration',
    'splitVote', 'majVotes', 'minVotes',
    'justice', 'justiceName',
    'vote', 'opinion', 'direction', 'majority',
]

In [7]:
# Narrow df to the columns named in cols_to_subset, in that order.
df = df.loc[:, cols_to_subset]

In [8]:
# Restrict df to the rows whose justiceName is exactly 'JGRoberts'.
df = df.loc[df['justiceName'].eq('JGRoberts')]

In [9]:

# Re-check the frame after the column subset and the justiceName filter:
# row count, retained columns, non-null counts, and dtypes.
df.info()

<class 'pandas.core.frame.DataFrame'>
Int64Index: 1527 entries, 108450 to 122079
Data columns (total 25 columns):
 #   Column                  Non-Null Count  Dtype  
---  ------                  --------------  -----  
 0   caseId                  1527 non-null   object 
 1   sctCite                 1527 non-null   object 
 2   caseName                1527 non-null   object 
 3   chief                   1527 non-null   object 
 4   issue                   1523 non-null   float64
 5   issueArea               1523 non-null   float64
 6   decisionDirection       1522 non-null   float64
 7   authorityDecision1      1501 non-null   float64
 8   lawType                 1492 non-null   float64
 9   lawSupp                 1492 non-null   float64
 10  lawMinor                409 non-null    object 
 11  decisionType            1527 non-null   int64  
 12  caseDisposition         1519 non-null   float64
 13  caseDispositionUnusual  1527 non-null   float64
 14  partyWinning            1526 non-

In [10]:
# Show the column labels currently held by df.
df.columns

Index(['caseId', 'sctCite', 'caseName', 'chief', 'issue', 'issueArea',
       'decisionDirection', 'authorityDecision1', 'lawType', 'lawSupp',
       'lawMinor', 'decisionType', 'caseDisposition', 'caseDispositionUnusual',
       'partyWinning', 'precedentAlteration', 'splitVote', 'majVotes',
       'minVotes', 'justice', 'justiceName', 'vote', 'opinion', 'direction',
       'majority'],
      dtype='object')

In [11]:
# Preview the last ten rows of the filtered frame.
df.iloc[-10:]

Unnamed: 0,caseId,sctCite,caseName,chief,issue,issueArea,decisionDirection,authorityDecision1,lawType,lawSupp,...,precedentAlteration,splitVote,majVotes,minVotes,justice,justiceName,vote,opinion,direction,majority
121998,2020-066,141 S. Ct. 1858,TERRY v. UNITED STATES,Roberts,10510.0,1.0,1.0,4.0,6.0,600.0,...,0.0,1,9,0,111,JGRoberts,1.0,1.0,1.0,2.0
122007,2020-067,141 S. Ct. 2090,GREER v. UNITED STATES,Roberts,10040.0,1.0,1.0,4.0,4.0,401.0,...,0.0,1,9,0,111,JGRoberts,1.0,1.0,1.0,2.0
122016,2020-067,141 S. Ct. 2090,UNITED STATES v. GARY,Roberts,10040.0,1.0,1.0,4.0,4.0,401.0,...,0.0,1,8,1,111,JGRoberts,1.0,1.0,1.0,2.0
122025,2020-068,141 S. Ct. 2244,PENNEAST PIPELINE CO. v. NEW JERSEY,Roberts,40070.0,4.0,2.0,1.0,2.0,211.0,...,0.0,1,5,4,111,JGRoberts,1.0,2.0,2.0,2.0
122034,2020-068,141 S. Ct. 2244,PENNEAST PIPELINE CO. v. NEW JERSEY,Roberts,80310.0,8.0,2.0,4.0,3.0,355.0,...,0.0,1,5,4,111,JGRoberts,1.0,2.0,2.0,2.0
122043,2020-070,141 S. Ct. 1145,"MAYS, WARDEN v. HINES",Roberts,10020.0,1.0,1.0,4.0,3.0,341.0,...,0.0,1,8,1,111,JGRoberts,1.0,1.0,1.0,2.0
122052,2020-071,141 S. Ct. 1467,ALASKA v. WRIGHT,Roberts,10020.0,1.0,1.0,4.0,3.0,341.0,...,0.0,1,9,0,111,JGRoberts,1.0,1.0,1.0,2.0
122061,2020-072,141 S. Ct. 2405,DUNN v. REEVES,Roberts,10020.0,1.0,1.0,3.0,3.0,341.0,...,0.0,1,6,3,111,JGRoberts,1.0,1.0,1.0,2.0
122070,2020-073,141 S. Ct. 2226,PAKDEL v. CITY AND COUNTY OF SAN FRANCISCO,Roberts,40070.0,4.0,1.0,2.0,2.0,211.0,...,0.0,1,9,0,111,JGRoberts,1.0,1.0,1.0,2.0
122079,2020-074,141 S. Ct. 2239,LOMBARDO v. ST. LOUIS,Roberts,40040.0,4.0,2.0,3.0,2.0,207.0,...,0.0,1,6,3,111,JGRoberts,1.0,1.0,2.0,2.0


In [13]:
# Display df's dimensions as a (rows, columns) tuple.
df.shape

(1527, 25)