# Scraping data and making datasets 

### Import 

In [1]:
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import urllib.request as urllib2
from bs4 import BeautifulSoup

## Getting data from web pages
Our aim is to build a song lyrics dataset for some most popular hindi songs. 

### Details of the page 

In [10]:
song_list_url = 'https://www.azlyrics.com/a/arijitsingh.html'
song_list_page = urllib2.urlopen(song_list_url)
song_list = BeautifulSoup(song_list_page, 'html.parser')

### Writing out responses 

In [25]:
print('SONG LIST PAGE TYPE:-\n', type(song_list_page), sep='')
print('\nSONG LIST TYPE:-\n', type(song_list), sep='')
print('\nSONG LIST PAGE:-\n', song_list_page, sep='')
print('\nSONG LIST:-\n', song_list, sep='')

SONG LIST PAGE TYPE:-
<class 'http.client.HTTPResponse'>

SONG LIST TYPE:-
<class 'bs4.BeautifulSoup'>

SONG LIST PAGE:-
<http.client.HTTPResponse object at 0x7f0a2c0db320>

SONG LIST:-
<!DOCTYPE html>

<html lang="en">
<head>
<meta charset="utf-8"/>
<meta content="IE=edge" http-equiv="X-UA-Compatible"/>
<meta content="width=device-width, initial-scale=1" name="viewport"/>
<!-- The above 3 meta tags *must* come first in the head; any other head content must come *after* these tags -->
<meta content='Arijit Singh lyrics - 132 song lyrics sorted by album, including "Ae Dil Hai Mushkil", "Laal Ishq", "Samjhawan".' name="description"/>
<meta content="Arijit Singh, Arijit Singh lyrics, discography, albums, songs" name="keywords"/>
<meta content="noarchive" name="robots"/>
<title>Arijit Singh Lyrics</title>
<link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.4/css/bootstrap.min.css" rel="stylesheet"/>
<link href="//www.azlyrics.com/bsaz.css" rel="stylesheet"/>
<!-- HTML5 shim and Respo

### Playing with the library 

In [58]:
# traverse the parsed tree datastructure
print('title tag: ', song_list.title)
print('a tag: ', song_list.a)

# all tags are of type bs4.element.tag
print('\ntitle tag type: ', type(song_list.title))
print('a tag type: ', type(song_list.a))

# access parent element of datastructure which of the same type tag
print('\ntitle tag\'s parent name: ', song_list.title.parent.name)
print('a tag\'s parent name: ', song_list.a.parent.name)

# access properties of parents
print('\ntitle tag\'s parent type: ', type(song_list.title.parent))
print('a tag\'s parent type: ', type(song_list.a.parent))

# access properties of element tag
print('\ntitle tag name:  ', song_list.title.name)
print('a tag name:  ', song_list.a.name)

# accessing attributes of tags
print('\na tag class: ', song_list.a['class'])
print('a tag find all attributes: ', song_list.a.attrs)
print('a tag find all attributes type: ', type(song_list.a.attrs))

# find (returns a single item) and find all (for multiple: returns a list)
print('\nfind all \'a\' tags: ', song_list.find_all('a'))
print('find by attribute: ', song_list.find_all(target='_blank'))

# getting only text out of an element (it can be nested)
print('\nGet only text from an element:-\n', song_list.find('small').get_text(), sep='')

title tag:  <title>Arijit Singh Lyrics</title>
a tag:  <a class="navbar-brand" href="//www.azlyrics.com"><img alt="AZLyrics.com" class="pull-left" src="//www.azlyrics.com/az_logo_tr.png" style="max-height:40px; margin-top:-10px;"/></a>

title tag type:  <class 'bs4.element.Tag'>
a tag type:  <class 'bs4.element.Tag'>

title tag's parent name:  head
a tag's parent name:  div

title tag's parent type:  <class 'bs4.element.Tag'>
a tag's parent type:  <class 'bs4.element.Tag'>

title tag name:   title
a tag name:   a

a tag class:  ['navbar-brand']
a tag find all attributes:  {'class': ['navbar-brand'], 'href': '//www.azlyrics.com'}
a tag find all attributes type:  <class 'dict'>

find all 'a' tags:  [<a class="navbar-brand" href="//www.azlyrics.com"><img alt="AZLyrics.com" class="pull-left" src="//www.azlyrics.com/az_logo_tr.png" style="max-height:40px; margin-top:-10px;"/></a>, <a class="btn btn-menu" href="//www.azlyrics.com/a.html">A</a>, <a class="btn btn-menu" href="//www.azlyrics.co

### Getting list of songs from the page 

In [91]:
# get song list a
counter = 0
a_list = song_list.find_all('a')
song_href_a = []
song_name_a = []
song_refer_a = []
for anchor in a_list:
    if 'target' in anchor.attrs and anchor['target']== '_blank':
        print('Song:- ', anchor.string, '\nHref:- ', anchor.attrs['href'])
        print('Sibling:- ', anchor.next_sibling.string)
        song_name_a.append(anchor.string)
        song_href_a.append(anchor.attrs['href'])
        song_refer_a.append(anchor.next_sibling.string)
        counter = counter+1
print('Total songs: ', counter)

Song:-  Aa Jao Na 
Href:-  https://www.azlyrics.com/lyrics/bollywood/aajaona.html
Sibling:-  [from "Veere Di Wedding" soundtrack]
Song:-  Aaj Phir 
Href:-  ../lyrics/arijitsingh/aajphir.html
Sibling:-  [from "Hate Story 2" soundtrack]
Song:-  Aaj Se Teri 
Href:-  ../lyrics/arijitsingh/aajseteri.html
Sibling:-  [from "Padman" soundtrack]
Song:-  Aasan Nahin Yahan 
Href:-  ../lyrics/arijitsingh/aasannahinyahan.html
Sibling:-  [from "Aashiqui 2" soundtrack]
Song:-  Ab Raat 
Href:-  ../lyrics/arijitsingh/abraat.html
Sibling:-  [from "Dobaara" soundtrack]
Song:-  Ae Dil Hai Mushkil 
Href:-  ../lyrics/arijitsingh/aedilhaimushkil.html
Sibling:-  [from "Ae Dil Hai Mushkil" soundtrack]
Song:-  Ae Watan 
Href:-  https://www.azlyrics.com/lyrics/bollywood/aewatan.html
Sibling:-  [from "Raazi" soundtrack]
Song:-  Alizeh 
Href:-  ../lyrics/arijitsingh/alizeh.html
Sibling:-  [from "Ae Dil Hai Mushkil" soundtrack]
Song:-  Alvida 
Href:-  ../lyrics/arijitsingh/alvida.html
Sibling:-  [from "Rangoon" sou

### Store data to disk 

In [103]:
d = {'name': song_name_a, 'from': song_refer_a, 'href': song_href_a}
df = pd.DataFrame(data = d)
df.head()

Unnamed: 0,name,from,href
0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",https://www.azlyrics.com/lyrics/bollywood/aaja...
1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",../lyrics/arijitsingh/aajphir.html
2,Aaj Se Teri,"[from ""Padman"" soundtrack]",../lyrics/arijitsingh/aajseteri.html
3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",../lyrics/arijitsingh/aasannahinyahan.html
4,Ab Raat,"[from ""Dobaara"" soundtrack]",../lyrics/arijitsingh/abraat.html


In [105]:
df.to_csv('arijit_songs.csv')

### Getting list of all the songs and storing it onto disk  

In [110]:
# preprocessing urls
start = df['href'][1].find('/lyrics')
end = len(df['href'][1])

In [111]:
df['href'][1][start:end]

'/lyrics/arijitsingh/aajphir.html'

In [114]:
type(df['href'])

pandas.core.series.Series

In [6]:
def to_lyrics_path(x):
    start = x.find('/lyrics')
    end = len(x)
    return x[start:end]

In [7]:
df['href'] = df['href'].apply(to_lyrics_path)    

In [118]:
df[0:10]

Unnamed: 0,name,from,href
0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",/lyrics/bollywood/aajaona.html
1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",/lyrics/arijitsingh/aajphir.html
2,Aaj Se Teri,"[from ""Padman"" soundtrack]",/lyrics/arijitsingh/aajseteri.html
3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",/lyrics/arijitsingh/aasannahinyahan.html
4,Ab Raat,"[from ""Dobaara"" soundtrack]",/lyrics/arijitsingh/abraat.html
5,Ae Dil Hai Mushkil,"[from ""Ae Dil Hai Mushkil"" soundtrack]",/lyrics/arijitsingh/aedilhaimushkil.html
6,Ae Watan,"[from ""Raazi"" soundtrack]",/lyrics/bollywood/aewatan.html
7,Alizeh,"[from ""Ae Dil Hai Mushkil"" soundtrack]",/lyrics/arijitsingh/alizeh.html
8,Alvida,"[from ""Rangoon"" soundtrack]",/lyrics/arijitsingh/alvida.html
9,Baatein Ye Kabhi Na,"[from ""Khamoshiyan"" soundtrack]",/lyrics/arijitsingh/baateinyekabhina.html


### Get lyrics of the songs 

In [119]:
df['lyrics'] = ''

In [120]:
df[0:5]

Unnamed: 0,name,from,href,lyrics
0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",/lyrics/bollywood/aajaona.html,
1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",/lyrics/arijitsingh/aajphir.html,
2,Aaj Se Teri,"[from ""Padman"" soundtrack]",/lyrics/arijitsingh/aajseteri.html,
3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",/lyrics/arijitsingh/aasannahinyahan.html,
4,Ab Raat,"[from ""Dobaara"" soundtrack]",/lyrics/arijitsingh/abraat.html,


In [5]:
import time
df = pd.read_csv('arijit_songs.csv')
df.head()

Unnamed: 0.1,Unnamed: 0,name,from,href
0,0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",https://www.azlyrics.com/lyrics/bollywood/aaja...
1,1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",../lyrics/arijitsingh/aajphir.html
2,2,Aaj Se Teri,"[from ""Padman"" soundtrack]",../lyrics/arijitsingh/aajseteri.html
3,3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",../lyrics/arijitsingh/aasannahinyahan.html
4,4,Ab Raat,"[from ""Dobaara"" soundtrack]",../lyrics/arijitsingh/abraat.html


In [8]:
# trial run for two rows
host = 'https://www.azlyrics.com'
row1 = df[35:36]['href'].item()
row2 = df[86:87]['href'].item()
url1 = host+row1
print(url1)
url2 = host+row2
print(url2)
lyrics_page_response1 = urllib2.urlopen(url1)
lyrics_page_response2 = urllib2.urlopen(url2)
lyrics_page_bs1 = BeautifulSoup(lyrics_page_response1, 'html.parser')
lyrics_page_bs2 = BeautifulSoup(lyrics_page_response2, 'html.parser')
print(lyrics_page_bs1)
print(lyrics_page_bs2)

https://www.azlyrics.com/lyrics/arijitsingh/gulonmeinrangbhare.html
https://www.azlyrics.com/lyrics/arijitsingh/phirleayadilreprise.html
<!DOCTYPE html>

<html lang="en">
<head>
<meta charset="utf-8"/>
<meta content="IE=edge" http-equiv="X-UA-Compatible"/>
<meta content="width=device-width, initial-scale=1" name="viewport"/>
<meta content='Lyrics to "Gulon Mein Rang Bhare" song by Arijit Singh: Bada hai dard ka rishta Bada hai dard ka rishta Dard ka rishta o.. o.. o.. mm.. Bada hai dard ka ri...' name="description"/>
<meta content="Gulon Mein Rang Bhare lyrics, Arijit Singh Gulon Mein Rang Bhare lyrics, Arijit Singh lyrics" name="keywords"/>
<meta content="noarchive" name="robots"/>
<meta content="//www.azlyrics.com/az_logo_tr.png" property="og:image"/>
<title>Arijit Singh Lyrics - Gulon Mein Rang Bhare</title>
<link href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.4/css/bootstrap.min.css" rel="stylesheet"/>
<link href="//www.azlyrics.com/bsaz.css" rel="stylesheet"/>
<!-- HTML5 shim

In [9]:
from bs4 import Comment

In [None]:
host = 'https://www.azlyrics.com'
for idx, row in df.iterrows():
    lyrics_url = host + row['href']
    print('Lyrics URL: ', lyrics_url)
    lyrics_page = 

In [10]:
comments = lyrics_page_bs1.find_all(string=lambda text:isinstance(text,Comment))

In [15]:
comments[12].parent

<div>
<!-- Usage of azlyrics.com content by any third-party lyrics provider is prohibited by our licensing agreement. Sorry about that. -->
Bada hai dard ka rishta<br/>
Bada hai dard ka rishta<br/>
Dard ka rishta o.. o.. o.. mm..<br/>
<br/>
Bada hai dard ka rishta<br/>
Bada hai dard ka rishta<br/>
Bada hai dard ka rishta<br/>
Yeh dil ghareeb sahi<br/>
Tumhaare naam pe aayenge<br/>
Gham gusaar chale hmm..<br/>
<br/>
Gulon mein rang bhare<br/>
Baad-e-naubahaar chale<br/>
Gulon mein rang bhare<br/>
Baad-e-naubahaar chale<br/>
<br/>
Chale bhi aao ke gulshan ka karobaar chale<br/>
Chale bhi aao ke gulshan ka karobaar chale<br/>
Gulon mein rang bhare<br/>
Baad-e-naubahaar chale<br/>
Gulon mein rang bhare<br/>
Baad-e-naubahaar chale<br/>
<br/>
Hmm..<br/>
Qafas udaas hai yaaron sabaa se kuch to kaho<br/>
Qafas udaas hai yaaron sabaa se kuch to kaho<br/>
Kahin to bahr-e-Khuda aaj zikar-e-yaar chale<br/>
Chale bhi aao ke gulshan ka kaarobaar chale<br/>
Gulon mein rang bhare<br/>
Baad-e-naubahaar

In [16]:
comments2 = lyrics_page_bs2.find_all(string=lambda text:isinstance(text,Comment))

In [53]:
comments2[12].string.strip().find('Usage')

0

In [28]:
comments2[12].parent.text

'\n\r\nPhir le aaya dil majboor kya keeje\nRaas na aaya rehna door kya keeje\nDil keh raha use maqammal kar bhi aao\nWo jo adhoori si baat baaki hai\nWo jo adhoori si yaad baaki hai\nWo jo adhoori si yaad baaki hai\n\nKarte hain hum aaj qabool kya keeje\nHo gayi thi jo humse bhool kya keeje\nDil keh raha use mayassar kar bhi aao\nWo jo dabi si aas baaki hai\nWo jo dabi si aanch baaki hai\nWo jo dabi si aanch baaki hai\nWo jo dabi si aanch baaki hai\n\nKismat ko hai yeh manzoor kya keeje\nMilte rahe hum baadastoor kya keeje\nKismat ko hai yeh manzoor kya keeje\nMilte rahe hum baadastoor kya keeje\nDil keh raha hai use musalsal kar bhi aao\nWo jo ruki si raah baaki hai\nWo jo ruki si chaah baaki hai\nWo jo ruki si chaah baaki hai\nWo jo ruki si chaah baaki hai\n'

In [29]:
df.head()

Unnamed: 0.1,Unnamed: 0,name,from,href
0,0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",/lyrics/bollywood/aajaona.html
1,1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",/lyrics/arijitsingh/aajphir.html
2,2,Aaj Se Teri,"[from ""Padman"" soundtrack]",/lyrics/arijitsingh/aajseteri.html
3,3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",/lyrics/arijitsingh/aasannahinyahan.html
4,4,Ab Raat,"[from ""Dobaara"" soundtrack]",/lyrics/arijitsingh/abraat.html


In [36]:
df.to_csv('arijit_singh.csv')

In [37]:
df.to_csv('arijit_singh_songs.csv', index=False)

In [38]:
df['lyrics'] = ''

In [39]:
df

Unnamed: 0,name,from,href,lyrics
0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",/lyrics/bollywood/aajaona.html,
1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",/lyrics/arijitsingh/aajphir.html,
2,Aaj Se Teri,"[from ""Padman"" soundtrack]",/lyrics/arijitsingh/aajseteri.html,
3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",/lyrics/arijitsingh/aasannahinyahan.html,
4,Ab Raat,"[from ""Dobaara"" soundtrack]",/lyrics/arijitsingh/abraat.html,
5,Ae Dil Hai Mushkil,"[from ""Ae Dil Hai Mushkil"" soundtrack]",/lyrics/arijitsingh/aedilhaimushkil.html,
6,Ae Watan,"[from ""Raazi"" soundtrack]",/lyrics/bollywood/aewatan.html,
7,Alizeh,"[from ""Ae Dil Hai Mushkil"" soundtrack]",/lyrics/arijitsingh/alizeh.html,
8,Alvida,"[from ""Rangoon"" soundtrack]",/lyrics/arijitsingh/alvida.html,
9,Baatein Ye Kabhi Na,"[from ""Khamoshiyan"" soundtrack]",/lyrics/arijitsingh/baateinyekabhina.html,


In [40]:
df.loc[35]['href']

'/lyrics/arijitsingh/gulonmeinrangbhare.html'

In [41]:
req = urllib2.Request('https://www.azlyrics.com/lyrics/arijitsingh/gulonmeinrangbhare.html', 
                headers={'User-Agent': 'Mozilla/5.0 (X11; U; Linux i686) Gecko/20071127 Firefox/2.0.0.11'})
html = urllib2.urlopen(req).read()

b'<!DOCTYPE html>\r\n<html lang="en">\r\n<head>\r\n<meta charset="utf-8">\r\n<meta http-equiv="X-UA-Compatible" content="IE=edge">\r\n<meta name="viewport" content="width=device-width, initial-scale=1">\r\n<meta name="description" content="Lyrics to &quot;Gulon Mein Rang Bhare&quot; song by Arijit Singh: Bada hai dard ka rishta Bada hai dard ka rishta Dard ka rishta o.. o.. o.. mm.. Bada hai dard ka ri..."> \r\n<meta name="keywords" content="Gulon Mein Rang Bhare lyrics, Arijit Singh Gulon Mein Rang Bhare lyrics, Arijit Singh lyrics">\r\n<meta name="robots" content="noarchive">\r\n<meta property="og:image" content="//www.azlyrics.com/az_logo_tr.png">\r\n<title>Arijit Singh Lyrics - Gulon Mein Rang Bhare</title>\r\n\r\n<link rel="stylesheet" href="https://maxcdn.bootstrapcdn.com/bootstrap/3.3.4/css/bootstrap.min.css">\r\n<link rel="stylesheet" href="//www.azlyrics.com/bsaz.css">\r\n\r\n<!-- HTML5 shim and Respond.js for IE8 support of HTML5 elements and media queries -->\r\n<!--[if lt I

In [57]:
def if_start_lyrics_comment(comment):
    if comment.string.strip().find('Usage') != -1:
        return True
    return False

In [63]:
import random

In [64]:
host = 'https://www.azlyrics.com'
for idx, row in df[66:].iterrows():
    lyrics_url = host + row['href']
    print('Lyrics URL: ', lyrics_url)
    
    req = urllib2.Request(lyrics_url, 
                headers={'User-Agent': 'Mozilla/5.0 (X11; U; Linux i686) Gecko/20071127 Firefox/2.0.0.11'})
    time.sleep(random.randint(7, 20))
    lyrics_page = urllib2.urlopen(req).read()
    
    soup = BeautifulSoup(lyrics_page, 'html.parser')
    comments = soup.find_all(string = lambda x: isinstance(x,Comment))
    
    usage_comment = list(filter(if_start_lyrics_comment, comments))[0]
    lyrics.append(usage_comment.parent.text)


Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/mainteriyaadonmein.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/mainesochakechuraloon.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/manwalaage.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/manzarlounge.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/mastmagan.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/maulare.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/meet.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/mehram.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/meraishq.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/meritanhaiyonmein.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/milnehaimujhseaayi.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/murshida.html
Lyrics URL:  https://www.azlyrics.com/lyrics/arijitsingh/muskurane.html
Lyrics URL:  https://www.azlyrics.

In [65]:
len(lyrics)

132

In [66]:
lyrics

['\n\r\nTum thhe yahin\nPhir bhi tum gum thhe\nAur main laapata\nAb jo mile ho toh phir\nSaath hi mein reh jaao na [x2]\n\nThode thode se poore\nAur thode adhoore\nYe waade rahe kya pataa\nPoore honge kayi khwab\nReh jaayenge kuch adhoore\nAbhi kya pataa?\n\nAa jao na…\nAa jao na…\nAa jao itna bhi kya sochna\nAa jaao na\nAa jaao na\nAa jaao itna bhi kya sochna\n\nThoda sahi ik doosre mein\nAa reh le kahin\nAa jee bhi le\nKab? kyun? kahaan? kaise?\nSoche nahin…\n\nAa chal waadon ke bhatke huve\nJugnuon ko dikha dein sahi raasta\nAa chal sotey sitaaron ko haule se\nSehla ke roshan karein aasmaan\n\nAa jao na…\nAa jao na…\nAa jao itna bhi kya sochna\nAa jaao na\nAa jaao na\nAa jaao itna bhi kya sochna…\n\nHahmmm…\n\nShaamein keyi hongi thehri hui\nBaatein keyi hongi roothi hui\nChhoti si zidd hogi\nLambi si raatein\nPhir bhi pyaar reh jaayega\nRehta hamesha toh kuch bhi nahin\nPhir bhi naa jaane kyun mujhko yaqeen\nSab beetne par bhi\nSab chhutne par bhi\nYeh pyaar reh jaayega\n\nTum thhe

In [68]:
df.drop(columns='lyrics', inplace=True)

In [69]:
df.head()

Unnamed: 0,name,from,href
0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",/lyrics/bollywood/aajaona.html
1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",/lyrics/arijitsingh/aajphir.html
2,Aaj Se Teri,"[from ""Padman"" soundtrack]",/lyrics/arijitsingh/aajseteri.html
3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",/lyrics/arijitsingh/aasannahinyahan.html
4,Ab Raat,"[from ""Dobaara"" soundtrack]",/lyrics/arijitsingh/abraat.html


In [70]:
df['lyrics'] = pd.Series(lyrics).values

In [71]:
df.head()

Unnamed: 0,name,from,href,lyrics
0,Aa Jao Na,"[from ""Veere Di Wedding"" soundtrack]",/lyrics/bollywood/aajaona.html,\n\r\nTum thhe yahin\nPhir bhi tum gum thhe\nA...
1,Aaj Phir,"[from ""Hate Story 2"" soundtrack]",/lyrics/arijitsingh/aajphir.html,\n\r\nAaj phir tumpe pyar aaya hai\nAaj phir t...
2,Aaj Se Teri,"[from ""Padman"" soundtrack]",/lyrics/arijitsingh/aajseteri.html,\n\r\nAaj se teri saari galiyan meri ho gayi\n...
3,Aasan Nahin Yahan,"[from ""Aashiqui 2"" soundtrack]",/lyrics/arijitsingh/aasannahinyahan.html,\n\r\nWo o o o...\n\nAasaan nahi yahaan aashiq...
4,Ab Raat,"[from ""Dobaara"" soundtrack]",/lyrics/arijitsingh/abraat.html,\n\r\nChaand ki aankhein bhaari si hain\nRaat ...


In [72]:
df.to_csv('arijit_songs_with_lyrics.csv', index=False)