In [1]:
import re
import requests
import numpy as np
import pandas as pd
from bs4 import BeautifulSoup

In [2]:
# Matches a single line-feed character; substituted with '' to flatten scraped titles.
remove_n = re.compile(r'\n')
# Non-greedy match of anything shaped like an HTML tag (<...>); substituted with ''
# to strip markup from stringified paragraphs. '.' does not match a newline here,
# so a tag that spans several lines is left untouched.
html_element = re.compile(r'<.*?>')

**Single Case**

In [9]:
# URL of the one blog post used to prototype the extraction logic.
link = "https://primelegal.in/2022/02/27/in-a-motor-accident-the-tribunal-must-consider-compensation-on-account-of-loss-of-future-prospect-in-gauhati-high-court/"

In [10]:
# Download the single post and parse it. The timeout stops a stalled connection from
# hanging the cell, and raise_for_status() surfaces HTTP errors instead of silently
# parsing an error page as if it were the post.
data = requests.get(link, timeout=30)
data.raise_for_status()
soup = BeautifulSoup(data.content, 'html.parser')

In [11]:
# Pair the post heading with its content block(s) and build one record per pair.
# find_all(..., limit=1) returns a list holding at most the first heading; handing the
# bare Tag returned by find() to zip() would iterate over the heading's child nodes
# instead of over headings.
headings = soup.find_all('h2', class_='entry-title', limit=1)
bodies = soup.find_all('div', class_='entry-content')

parser = []
for title, content in zip(headings, bodies):
    anchor = content.find('a')
    parser.append({
        # All text inside the heading, with line feeds removed.
        'Title': remove_n.sub('', title.get_text()),
        # Strip tags from every paragraph except the last two, then join with spaces.
        'Case Summary': ' '.join(
            html_element.sub('', str(paragraph))
            for paragraph in content.find_all('p')[:-2]
        ),
        # href of the first anchor in the content block; None when there is no anchor.
        'Judgement Link': anchor.get('href') if anchor is not None else None,
    })

In [12]:
# Turn the parsed records into a frame and pin the column order explicitly
# (a missing column raises KeyError).
column_order = ['Title', 'Case Summary', 'Judgement Link']
df = pd.DataFrame(parser).loc[:, column_order]
df.head()

Unnamed: 0,Title,Case Summary,Judgement Link
0,"In A Motor Accident, The Tribunal Must Conside...",The learned Tribunal denied a claim for compen...,https://primelegal.in/2022/02/27/in-a-motor-ac...


### **All Cases**

`Pages 1-500`

In [15]:
# One listing URL per paginated blog-archive page, for page numbers 1 through 731.
all_links = [
    f"https://primelegal.in/category/blog/page/{page}/"
    for page in range(1, 732)
]
len(all_links)

731

In [14]:
# Parallel lists: the n-th entries of titles/links/summaries describe the same article.
titles, links, summaries = [], [], []

REQUEST_TIMEOUT = 30  # seconds; keeps one stalled connection from hanging the whole crawl


def _extract_or_nan(getter, page_no, case_no):
    """Return ``getter()``; if expected markup is missing, log where and return NaN.

    Only AttributeError is handled: that is what the chained BeautifulSoup lookups
    raise when a ``find`` call returned None and the next attribute is accessed.

    Args:
        getter: zero-argument callable performing the lookup.
        page_no: position of the listing page in ``all_links`` (used in the log line).
        case_no: position of the article on that page (used in the log line).
    """
    try:
        return getter()
    except AttributeError as e:
        print(f"{e} --> Page no. {page_no} and case no. {case_no}")
        # np.nan rather than np.NaN: the capitalised alias was removed in NumPy 2.0.
        return np.nan


# page_no is the 0-based position in all_links, not the page number in the URL.
for page_no, page_url in enumerate(all_links):
    try:
        data = requests.get(page_url, timeout=REQUEST_TIMEOUT)
        data.raise_for_status()
    except requests.RequestException as e:
        # Best effort: one unreachable page must not discard everything collected so far.
        print(f"{e} --> Page no. {page_no} skipped")
        continue

    soup = BeautifulSoup(data.content, 'html.parser')
    print(f"Page {page_no}")

    listing = soup.find('div', class_='site-content')
    if listing is None:
        print(f"No 'site-content' container --> Page no. {page_no} skipped")
        continue

    for case_no, article in enumerate(listing.find_all('article')):
        content = article.find('div', class_="entry-content")

        # Each getter is called immediately, so closing over the loop variables is safe.
        title = _extract_or_nan(
            lambda: article.find('h2', class_="entry-title").find('a').string,
            page_no, case_no,
        )
        # Strip tags from every paragraph except the last two, then join with spaces.
        summary = _extract_or_nan(
            lambda: ' '.join(
                html_element.sub('', str(paragraph))
                for paragraph in content.find_all('p')[:-2]
            ),
            page_no, case_no,
        )
        # href of the first anchor inside the article's content block.
        link = _extract_or_nan(
            lambda: content.find('a').attrs.get('href'),
            page_no, case_no,
        )

        titles.append(title)
        links.append(link)
        summaries.append(summary)

Page 0
'NoneType' object has no attribute 'attrs' --> Page no. 0 and case no. 3
Page 1
Page 2
Page 3
Page 4
Page 5
Page 6
Page 7
Page 8
Page 9
Page 10
Page 11
Page 12
Page 13
Page 14
Page 15
Page 16
Page 17
Page 18
Page 19
Page 20
'NoneType' object has no attribute 'attrs' --> Page no. 20 and case no. 1
Page 21
Page 22
Page 23
Page 24
Page 25
Page 26
Page 27
Page 28
Page 29
Page 30
Page 31
Page 32
Page 33
'NoneType' object has no attribute 'attrs' --> Page no. 33 and case no. 0
'NoneType' object has no attribute 'attrs' --> Page no. 33 and case no. 3
'NoneType' object has no attribute 'attrs' --> Page no. 33 and case no. 4
Page 34
Page 35
Page 36
'NoneType' object has no attribute 'attrs' --> Page no. 36 and case no. 4
Page 37
Page 38
Page 39
Page 40
Page 41
Page 42
Page 43
Page 44
Page 45
Page 46
Page 47
Page 48
Page 49
Page 50
Page 51
Page 52
Page 53
Page 54
'NoneType' object has no attribute 'attrs' --> Page no. 54 and case no. 1
Page 55
Page 56
Page 57
Page 58
Page 59
Page 60
Page 

In [18]:
# Assemble the scraped lists into a frame; zip pairs the n-th title/summary/link and
# stops at the shortest list.
# NOTE(review): the `Final_df1` cell further down is built from these same three
# globals, so the two frames differ only if the scraping cell was re-run with a
# different page range in between -- confirm before relying on Restart & Run All.
Final_df = pd.DataFrame(list(zip(titles, summaries, links)), columns =['titles', 'summaries','links'])

In [20]:
# Display Final_df as the cell output.
Final_df

Unnamed: 0,titles,summaries,links
0,If it is summoned by the Court then respondent...,Court has validly served the respondent to be ...,https://primelegal.in/2022/03/21/if-it-is-summ...
1,Petitioner accused in illicit sale of the Indi...,Petitioner who was accused to be engaged in il...,https://primelegal.in/2022/03/21/petitioner-ac...
2,The Court can take judicial notice of public h...,Section 57 of the Evidence Act deals with fact...,https://primelegal.in/2022/03/21/the-court-can...
3,The quantity of contraband recovered from the ...,Conspiracy is always hatched in secrecy and it...,https://primelegal.in/?attachment_id=28615
4,Petitioner had been granted permission for use...,Petitioner had been granted permission for use...,https://primelegal.in/2022/03/20/petitioner-ha...
...,...,...,...
2491,"Under S.438 Cr.P.C., the Court while granting ...",While addressing an appeal against the order o...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Na...
2492,"For an Offence under S.304B IPC, it is pertine...",When an accused is booked under section 304B I...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Gu...
2493,The recovery of compound interest would not co...,It is also a norm of the banking industry to c...,https://primelegal.in/wp-content/uploads/2021/...
2494,The practice of forum shopping by litigant sho...,"The withdrawal of the proceedings, even if wit...",https://primelegal.in/wp-content/uploads/2021/...


`Pages 500-718`

In [16]:
# Assemble the scraped lists into a second frame; zip pairs the n-th
# title/summary/link and stops at the shortest list.
# NOTE(review): this reads the same `titles`/`summaries`/`links` globals as the
# `Final_df` cell, so it only holds different rows if the scraping cell was re-run
# with another page range first -- confirm before relying on Restart & Run All.
Final_df1 = pd.DataFrame(list(zip(titles, summaries, links)), columns =['titles', 'summaries','links'])

In [17]:
# Display Final_df1 as the cell output.
Final_df1

Unnamed: 0,titles,summaries,links
0,The second complaint would not be maintainable...,Law does not prohibit filing or entertaining s...,https://primelegal.in/wp-content/uploads/2021/...
1,Three conditions must be fulfilled for an indi...,The first is the status of the person in the r...,https://www.mhc.tn.gov.in/judis/index.php/case...
2,Consent of a child below 18 years to indulge i...,If the victim of sexual assault is a child and...,https://www.mhc.tn.gov.in/judis/index.php/case...
3,RBI inflicted the 10cr penalty on HDFC Bank Li...,It was all started when two U.S. based law fir...,
4,“Soon before” Under S.304-B IPC does not mean ...,On a criminal appeal regarding bail for dowry ...,https://main.sci.gov.in/supremecourt/2009/7085...
...,...,...,...
1155,Disclosure of Personal Information is exempted...,The Hon’ble High Court of Delhi in Dr. RS Gupt...,https://primelegal.in/wp-content/uploads/2020/...
1156,Investor Protection Laws are not applicable to...,The Hon’ble High court of Orissa in Mahasweta ...,https://primelegal.in/wp-content/uploads/2020/...
1157,[AGR Dues] Timeframe to clear AGR dues by tele...,The Hon’ble Supreme Court of India Union of In...,https://primelegal.in/wp-content/uploads/2020/...
1158,There is no Automatic Apprehension of bias whe...,The Hon’ble Supreme Court of India in Mukesh S...,https://primelegal.in/wp-content/uploads/2020/...


In [22]:
# Stack the two batches row-wise. Each frame keeps its own index labels here, so
# labels repeat across the two halves until the index is reset.
DF = pd.concat([Final_df, Final_df1])
DF

Unnamed: 0,titles,summaries,links
0,If it is summoned by the Court then respondent...,Court has validly served the respondent to be ...,https://primelegal.in/2022/03/21/if-it-is-summ...
1,Petitioner accused in illicit sale of the Indi...,Petitioner who was accused to be engaged in il...,https://primelegal.in/2022/03/21/petitioner-ac...
2,The Court can take judicial notice of public h...,Section 57 of the Evidence Act deals with fact...,https://primelegal.in/2022/03/21/the-court-can...
3,The quantity of contraband recovered from the ...,Conspiracy is always hatched in secrecy and it...,https://primelegal.in/?attachment_id=28615
4,Petitioner had been granted permission for use...,Petitioner had been granted permission for use...,https://primelegal.in/2022/03/20/petitioner-ha...
...,...,...,...
1155,Disclosure of Personal Information is exempted...,The Hon’ble High Court of Delhi in Dr. RS Gupt...,https://primelegal.in/wp-content/uploads/2020/...
1156,Investor Protection Laws are not applicable to...,The Hon’ble High court of Orissa in Mahasweta ...,https://primelegal.in/wp-content/uploads/2020/...
1157,[AGR Dues] Timeframe to clear AGR dues by tele...,The Hon’ble Supreme Court of India Union of In...,https://primelegal.in/wp-content/uploads/2020/...
1158,There is no Automatic Apprehension of bias whe...,The Hon’ble Supreme Court of India in Mukesh S...,https://primelegal.in/wp-content/uploads/2020/...


In [23]:
# Renumber rows 0..n-1 in place; drop=True discards the old labels instead of
# keeping them as a new column.
DF.reset_index(inplace=True, drop=True)

In [24]:
# Display DF as the cell output.
DF

Unnamed: 0,titles,summaries,links
0,If it is summoned by the Court then respondent...,Court has validly served the respondent to be ...,https://primelegal.in/2022/03/21/if-it-is-summ...
1,Petitioner accused in illicit sale of the Indi...,Petitioner who was accused to be engaged in il...,https://primelegal.in/2022/03/21/petitioner-ac...
2,The Court can take judicial notice of public h...,Section 57 of the Evidence Act deals with fact...,https://primelegal.in/2022/03/21/the-court-can...
3,The quantity of contraband recovered from the ...,Conspiracy is always hatched in secrecy and it...,https://primelegal.in/?attachment_id=28615
4,Petitioner had been granted permission for use...,Petitioner had been granted permission for use...,https://primelegal.in/2022/03/20/petitioner-ha...
...,...,...,...
3651,Disclosure of Personal Information is exempted...,The Hon’ble High Court of Delhi in Dr. RS Gupt...,https://primelegal.in/wp-content/uploads/2020/...
3652,Investor Protection Laws are not applicable to...,The Hon’ble High court of Orissa in Mahasweta ...,https://primelegal.in/wp-content/uploads/2020/...
3653,[AGR Dues] Timeframe to clear AGR dues by tele...,The Hon’ble Supreme Court of India Union of In...,https://primelegal.in/wp-content/uploads/2020/...
3654,There is no Automatic Apprehension of bias whe...,The Hon’ble Supreme Court of India in Mukesh S...,https://primelegal.in/wp-content/uploads/2020/...


In [25]:
# Shape of the subset of rows with a missing value in at least one column
# (any(axis=1) reduces across the columns of each row).
DF[DF.isna().any(axis=1)].shape

(33, 3)

In [26]:
# Show the rows that have a missing value in at least one column.
DF[DF.isna().any(axis=1)]

Unnamed: 0,titles,summaries,links
104,The Discharge Application is the remedy that i...,If the allegations which have been made agains...,
114,Interest of home buyers prevails over banks in...,The Supreme Court upheld the decision of the R...,
157,,,
235,Liberty must be given to Approach Concerned Au...,"Wherein grievances have arisen, it is necessar...",
276,Both constitutional and statutory obligation o...,The statutory and constitutional obligation of...,
283,Appeal against Section 138 of Negotiable Instr...,CriminalJudgement Reviewed by sugam Anand Mish...,
756,To issue order or direction thereby directing ...,To issue order or direction thereby directing ...,
893,A writ of Habeus Corpus denied in the matters ...,The writ of Habeus corpus is provided in the c...,
1133,Emergence of no fresh grounds or events after ...,A person suffering from a mental disorder or m...,
1176,Right of indigent Muslim Woman for maintenance...,Getting married another time and having childr...,


In [27]:
# Remove, in place, every row that has at least one missing value. Index labels of
# the surviving rows are not renumbered by this call.
DF.dropna(inplace=True)

In [29]:
# Sanity check: select any rows that still contain a missing value.
DF[DF.isna().any(axis=1)]

Unnamed: 0,titles,summaries,links


In [30]:
# Display DF as the cell output.
DF

Unnamed: 0,titles,summaries,links
0,If it is summoned by the Court then respondent...,Court has validly served the respondent to be ...,https://primelegal.in/2022/03/21/if-it-is-summ...
1,Petitioner accused in illicit sale of the Indi...,Petitioner who was accused to be engaged in il...,https://primelegal.in/2022/03/21/petitioner-ac...
2,The Court can take judicial notice of public h...,Section 57 of the Evidence Act deals with fact...,https://primelegal.in/2022/03/21/the-court-can...
3,The quantity of contraband recovered from the ...,Conspiracy is always hatched in secrecy and it...,https://primelegal.in/?attachment_id=28615
4,Petitioner had been granted permission for use...,Petitioner had been granted permission for use...,https://primelegal.in/2022/03/20/petitioner-ha...
...,...,...,...
3651,Disclosure of Personal Information is exempted...,The Hon’ble High Court of Delhi in Dr. RS Gupt...,https://primelegal.in/wp-content/uploads/2020/...
3652,Investor Protection Laws are not applicable to...,The Hon’ble High court of Orissa in Mahasweta ...,https://primelegal.in/wp-content/uploads/2020/...
3653,[AGR Dues] Timeframe to clear AGR dues by tele...,The Hon’ble Supreme Court of India Union of In...,https://primelegal.in/wp-content/uploads/2020/...
3654,There is no Automatic Apprehension of bias whe...,The Hon’ble Supreme Court of India in Mukesh S...,https://primelegal.in/wp-content/uploads/2020/...


In [31]:
# Renumber rows 0..n-1 in place so that labels and positions coincide again;
# drop=True discards the old labels instead of keeping them as a new column.
DF.reset_index(inplace=True, drop=True)

In [32]:
# Display DF as the cell output.
DF

Unnamed: 0,titles,summaries,links
0,If it is summoned by the Court then respondent...,Court has validly served the respondent to be ...,https://primelegal.in/2022/03/21/if-it-is-summ...
1,Petitioner accused in illicit sale of the Indi...,Petitioner who was accused to be engaged in il...,https://primelegal.in/2022/03/21/petitioner-ac...
2,The Court can take judicial notice of public h...,Section 57 of the Evidence Act deals with fact...,https://primelegal.in/2022/03/21/the-court-can...
3,The quantity of contraband recovered from the ...,Conspiracy is always hatched in secrecy and it...,https://primelegal.in/?attachment_id=28615
4,Petitioner had been granted permission for use...,Petitioner had been granted permission for use...,https://primelegal.in/2022/03/20/petitioner-ha...
...,...,...,...
3618,Disclosure of Personal Information is exempted...,The Hon’ble High Court of Delhi in Dr. RS Gupt...,https://primelegal.in/wp-content/uploads/2020/...
3619,Investor Protection Laws are not applicable to...,The Hon’ble High court of Orissa in Mahasweta ...,https://primelegal.in/wp-content/uploads/2020/...
3620,[AGR Dues] Timeframe to clear AGR dues by tele...,The Hon’ble Supreme Court of India Union of In...,https://primelegal.in/wp-content/uploads/2020/...
3621,There is no Automatic Apprehension of bias whe...,The Hon’ble Supreme Court of India in Mukesh S...,https://primelegal.in/wp-content/uploads/2020/...


In [41]:
# Collect the positions of rows whose link points at a file on the author's local
# disk rather than at a reachable URL. The positions come from enumerate, so they
# are 0-based row positions, not index labels.
templist = []
for i, link in enumerate(DF['links']):
    if 'file:///C:/Users/SIVA1964/' in link:
        print(i, link)
        templist.append(i)

2373 file:///C:/Users/SIVA1964/Desktop/8th%20sem/C.%20Krishniah%20Chetty%20&%20Sons%20Private%20Limited%20vs.%20Deepali%20Company%20Private.pdf
2395 file:///C:/Users/SIVA1964/Desktop/8th%20sem/Abhishek%20Kumar%20Singh%20vs.%20G.%20Pattanaik%20&%20Ors..pdf
2473 file:///C:/Users/SIVA1964/Desktop/8th%20sem/Nathu%20Singh%20vs.%20State%20of%20Uttar%20Pradesh.pdf
2474 file:///C:/Users/SIVA1964/Desktop/8th%20sem/Gurmeet%20Singh%20vs.%20State%20of%20Punjab.pdf
2482 file:///C:/Users/SIVA1964/Desktop/8th%20sem/Vinod%20Kumar%20vs.%20State%20of%20Himachal%20Pradesh.pdf
2494 file:///C:/Users/SIVA1964/Desktop/8th%20sem/Davinder%20Kumar%20vs.%20State%20of%20H.P.%20and%20others.pdf
2502 file:///C:/Users/SIVA1964/Desktop/8th%20sem/Lekh%20Ram%20@Suneel%20Kumar%20vs.%20State%20of%20Himachal%20Pradesh.pdf
2510 file:///C:/Users/SIVA1964/Desktop/8th%20sem/Shri%20Jaishi%20Ram%20vs.%20Shri%20Manohar%20Lal%20&%20others.pdf
2518 file:///C:/Users/SIVA1964/Desktop/8th%20sem/sangita%20sharma%20vs%20Rohit%20kalia.p

In [42]:
# Display the collected row positions.
templist

[2373, 2395, 2473, 2474, 2482, 2494, 2502, 2510, 2518, 2524, 2534]

In [43]:
# Positional lookup (iloc) of the rows listed in templist, to inspect them.
DF.iloc[templist]

Unnamed: 0,titles,summaries,links
2373,Order XXIX Rule 1 Code of Civil procedure does...,Order XXIX Rule 1 Code of Civil procedure does...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/C....
2395,Contempt action ought to proceed only when wil...,"While hearing a contempt petition, the Apex Co...",file:///C:/Users/SIVA1964/Desktop/8th%20sem/Ab...
2473,"Under S.438 Cr.P.C., the Court while granting ...",While addressing an appeal against the order o...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Na...
2474,"For an Offence under S.304B IPC, it is pertine...",When an accused is booked under section 304B I...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Gu...
2482,Eligibility of a candidate to be construed in ...,While rendering judgment regarding a writ peti...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Vi...
2494,Notification issued by the government to be ac...,While hearing a case on the purchase of Dry Kh...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Da...
2502,Consent immaterial under POCSO Act when compla...,While hearing a bail application for offences ...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Le...
2510,Appellant Court may dispense with service of n...,Order 41 Rule 14 CPC provides that Appellate C...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Sh...
2518,Parties can approach the Family Court for enac...,While hearing a custodial dispute between pare...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/sa...
2524,Government Largesse cannot be distributed in a...,While hearing writ petitions on the procedure ...,file:///C:/Users/SIVA1964/Desktop/8th%20sem/Pr...


In [45]:
# templist holds row positions (from enumerate), while drop() works on index labels.
# Translate positions to labels first so the right rows are removed even when the
# index is not a fresh 0..n-1 range, then renumber the remaining rows.
DF.drop(index=DF.index[templist], inplace=True)
DF.reset_index(inplace=True, drop=True)

In [46]:
# Display DF as the cell output.
DF

Unnamed: 0,titles,summaries,links
0,If it is summoned by the Court then respondent...,Court has validly served the respondent to be ...,https://primelegal.in/2022/03/21/if-it-is-summ...
1,Petitioner accused in illicit sale of the Indi...,Petitioner who was accused to be engaged in il...,https://primelegal.in/2022/03/21/petitioner-ac...
2,The Court can take judicial notice of public h...,Section 57 of the Evidence Act deals with fact...,https://primelegal.in/2022/03/21/the-court-can...
3,The quantity of contraband recovered from the ...,Conspiracy is always hatched in secrecy and it...,https://primelegal.in/?attachment_id=28615
4,Petitioner had been granted permission for use...,Petitioner had been granted permission for use...,https://primelegal.in/2022/03/20/petitioner-ha...
...,...,...,...
3607,Disclosure of Personal Information is exempted...,The Hon’ble High Court of Delhi in Dr. RS Gupt...,https://primelegal.in/wp-content/uploads/2020/...
3608,Investor Protection Laws are not applicable to...,The Hon’ble High court of Orissa in Mahasweta ...,https://primelegal.in/wp-content/uploads/2020/...
3609,[AGR Dues] Timeframe to clear AGR dues by tele...,The Hon’ble Supreme Court of India Union of In...,https://primelegal.in/wp-content/uploads/2020/...
3610,There is no Automatic Apprehension of bias whe...,The Hon’ble Supreme Court of India in Mukesh S...,https://primelegal.in/wp-content/uploads/2020/...


In [49]:
# Per-column count of missing values.
DF.isna().sum()

titles       0
summaries    0
links        0
dtype: int64

In [50]:
# (rows, columns) of the frame.
DF.shape

(3612, 3)

In [51]:
# Write the frame to primelegal.csv (path relative to the working directory), with a
# header row and without the index column.
DF.to_csv('primelegal.csv', header=True, index=False)