In [1]:
import pandas as pd
import numpy as np
import json
import re
import nltk

In [2]:
with open("lyrics.json", "r") as file:
  data = json.load(file)

In [3]:
df = pd.DataFrame(data.items(), columns = ["SongName", "Lyrics"] )

In [4]:
df["Lyrics"] = df["Lyrics"].apply(lambda x: str(x).split("Contributor")[-1])

Cleaning


In [5]:
nltk.download('punkt')
nltk.download('stopwords')


[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt.zip.
[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Unzipping corpora/stopwords.zip.


True

In [6]:
from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize
from sklearn.metrics.pairwise import cosine_similarity

stop_words = set(stopwords.words('english'))

In [7]:


df["Tokens"] = df["Lyrics"].apply(lambda x: x.lower())
df["Tokens"] = df["Tokens"].apply(lambda x: re.sub(r'[^a-zA-Z\s]', '', x))
df["Tokens"] = df["Tokens"].apply(lambda x: word_tokenize(x))


In [8]:
def stopwordremover(listOfWords):
  noStopWords = []
  for word in listOfWords:
    if word not in stop_words:
      noStopWords.append(word)
  return noStopWords

In [9]:
# df["Tokens"] = df["Tokens"].apply(lambda x: stopwordremover(x))

In [10]:
df["Tokens"] = df["Tokens"].apply(lambda x: " ".join(x))

In [11]:
df = df[df["Tokens"] != "none"]

Vectoriser

TFIDF

In [12]:
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.feature_extraction.text import CountVectorizer

In [13]:
df = df[~df["Tokens"].isna()]

In [14]:
vectorizer = TfidfVectorizer()
X = vectorizer.fit_transform([ "Nobody claimed it was simple"] + list(df["Tokens"]))

In [15]:
cosine_similarities = cosine_similarity(X[0:1], X[1:]).flatten()

In [16]:

most_similar_indices = cosine_similarities.argsort()[::-1]

# Print the most similar documents
print("Most relevant documents to the query:")
for idx in most_similar_indices[:20]:
    print(f"Document {idx + 1}: {df.iloc[idx]['SongName']}")

Most relevant documents to the query:
Document 527: If I Can't Have You - Yvonne Elliman
Document 1018: Ain't Nobody - Chaka Khan
Document 785: The Scientist - Coldplay
Document 899: Technologic - Daft Punk
Document 1555: ABC - The Jackson 5
Document 155: Can't Nobody Hold Me Down (feat. Mase) - Diddy, Mase
Document 1525: This Is How We Do It - Montell Jordan
Document 668: Somewhere Only We Know - Lily Allen
Document 1508: The Logical Song - Remastered 2010 - Supertramp
Document 903: Animal - Mark Ronson Remix - Miike Snow, Mark Ronson
Document 766: Son Of A Preacher Man - Dusty Springfield
Document 1379: In My Place - Coldplay
Document 4: The One and Only - Chesney Hawkes
Document 816: Your Song - Billy Paul
Document 1345: Your Love Is a Lie - Simple Plan
Document 1114: Happy Together - Simple Plan
Document 48: Don't Go Breaking My Heart - Elton John, Kiki Dee
Document 1639: Acceptable In the 80's - Calvin Harris
Document 1306: Somewhere Only We Know - Keane
Document 1189: Iron Man - 

Developing queries

In [None]:
# format = {
#    "Song Name" : [
#         "Original Query",
#         "New Query"
#     ]
#  }

queries = {
    "Destroy Everything You Touch - Ladytron": [
        "Destroy everything you touch, today",
        "Destroy all you contact, now"
    ],
    "Wanted Dead Or Alive - Bon Jovi": [
        "Wanted dead or alive",
        "Wanted deceased or lively"
    ],
    "Millennium - Robbie Williams": [
        "We got stars directing our fate",
        "Celestial bodies guiding our destiny"
    ],
    "Advertising Space - Robbie Williams": [
        "There's no more audience",
        "No spectators remain"
    ],
    "Duality - Slipknot": [
        "I push my fingers into my eyes",
        "I press my digits into my eyes"
    ],
    "Are You Gonna Be My Girl - Jet": [
        "So one, two, three, take my hand and come with me",
        "Hence, one, two, three, clutch my hand and join me"
    ],
    "Raise Your Glass - P!nk": [
        "So raise your glass if you are wrong",
        "Therefore, raise your cup if you're incorrect"
    ],
    "Mad World - Gary Jules, Michael Andrews": [
        "All around me are familiar faces",
        "In my vicinity are recognized countenances"
    ],
    "California Dream - The Mamas & The Papas": [
        "All the leaves are brown and the sky is gray",
        "Every leaf is brown and the sky is grey"
    ],
    "You're No Good - Linda Ronstadt": [
        "Feelin' better now that we're through",
        "Sensing improved as we've parted"
    ],
    "Sorry, Blame It On Me - Akon": [
        "I'm sorry for the times that I left you home",
        "Apologies for instances when I abandoned you at home"
    ],
    "Waterloo - ABBA": [
        "My, my, at Waterloo Napoleon did surrender",
        "My, my, at Waterloo Napoleon capitulated"
    ],
    "Faces - Original Extended Version - Clio": [
        "Just go on, on and on",
        "Simply continue, on and on"
    ],
    "Clocks - Coldplay": [
        "Lights go out and I can't be saved",
        "Lamps extinguish and I can't be rescued"
    ],
    "Kickstart My Heart - Mötley Crüe": [
        "When we started this band, all we needed",
        "At the commencement of this ensemble, all we required"
    ],
    "Jungle Boogie - Kool & The Gang": [
        "Get down, get down",
        "Descend, descend"
    ],
    "MMMBop - Single Version - Hanson": [
        "MMMBop, ba duba dop",
        "MMMBop, ba duba dop"
    ],
    "Stupidisco - Junior Jack": [
        "I'm gonna show you my heaven",
        "I'll exhibit my paradise to you"
    ],
    "I'm Coming Out - Diana Ross": [
        "I'm coming out",
        "I am emerging"
    ],
    "Heaven Is A Place On Earth - Belinda Carlisle": [
        "Ooh, baby, do you know what that's worth?",
        "Oh, darling, comprehend its value?"
    ],
    "Bubbly - Colbie Caillat": [
        "It starts in my toes and I crinkle my nose",
        "It commences in my toes and I wrinkle my nose"
    ],
    "You're The One That I Want - From “Grease” - John Travolta, Olivia Newton-John": [
        "You're the one that I want",
        "You're the one I desire"
    ],
    "Not Over Yet '99 (feat. Grace) - Radio Edit - Planet Perfecto, Grace": [
        "Not over yet",
        "Not concluded yet"
    ],
    "Heartbreaker - Pat Benatar": [
        "Your love is like a tidal wave",
        "Your affection resembles an immense wave"
    ],
    "Everything I Own - Bread": [
        "You sheltered me from harm, kept me warm",
        "You shielded me from harm, kept me cozy"
    ],
    "Relax - Frankie Goes To Hollywood": [
        "Relax, don't do it",
        "Unwind, refrain from it"
    ],
    "Thriller - Michael Jackson": [
        "'Cause this is thriller, thriller night",
        "'Cause this is frightening, frightening night"
    ],
    "Conga - Gloria Estefan": [
        "Come on, shake your body, baby, do the conga",
        "Proceed, sway your physique, darling, perform the conga"
    ],
    "Janie's Got A Gun - Single Version - Aerosmith": [
        "Janie's got a gun",
        "Janie possesses a firearm"
    ],
    "Land Of Confusion - Remastered 2007 - Genesis": [
        "This is the world we live in",
        "This is the realm we reside in"
    ],
    "Criminal - Fiona Apple": [
        "I've been a bad, bad girl",
        "I've been a naughty, naughty girl"
    ],
    "Elevation - U2": [
        "Elevation",
        "Heightening"
    ],
    "A Day in the Life (Club Mix) - Black Riot": [
        "Come on, shake your body and do the conga",
        "Let's proceed, sway your physique and perform the conga"
    ],
    "Get It Together - The Go! Team": [
        "Get it together",
        "Unify"
    ],
    "I Don't Want to Miss a Thing - From \"Armageddon\" Soundtrack - Aerosmith": [
        "I don't want to miss a thing",
        "I don't wish to overlook anything"
    ],
    "Shimmy Shimmy Ya - Ol' Dirty Bastard": [
        "Shimmy shimmy ya, shimmy yam, shimmy yay",
        "Shimmy shimmy ya, shimmy yam, shimmy yay"
    ],
    "The Look - Roxette": [
        "She's got the look",
        "She possesses the appearance"
    ],
    "Walk On the Wild Side - Lou Reed": [
        "And the colored girls go",
        "And the vibrant ladies proceed"
    ],
    "Wuthering Heights - Kate Bush": [
        "Heathcliff, it's me, I'm Cathy, I've come home",
        "Heathcliff, it's me, I'm Cathy, I've returned"
    ],
    "Empire State Of Mind [Jay-Z + Alicia Keys] - JAY-Z": [
        "In New York, concrete jungle where dreams are made of",
        "In New York, urban setting where dreams are fashioned"
    ],
    "Superstar - Navigators": [
        "Superstar",
        "Celebrity"
    ],
    "Walkin' On Sunshine (Re-Recorded Version) - Katrina": [
        "I'm walking on sunshine, whoa",
        "I tread on sunshine, whoa"
    ],
    "Wiggle It - Radio Version - 2 In A Room": [
        "Just move your body and wiggle it",
        "Simply shift your physique and wiggle it"
    ],
    "Don't Let It Bring You Down - Annie Lennox": [
        "Don't let it bring you down",
        "Don't allow it to depress you"
    ],
    "The Boys Are Back In Town - Thin Lizzy": [
        "Guess who just got back today",
        "Guess who recently returned today"
    ],
    "The End of the World - Skeeter Davis": [
        "Why does the sun go on shining?",
        "Why does the sun continue to shine?"
    ],
        "Can't Take My Eyes Off You - Andy Williams": [
        "You're just too good to be true",
        "You're simply too genuine to be unreal"
    ],
    "If I Could Turn Back Time - Cher": [
        "If I could turn back time",
        "If I could reverse time"
    ],
    "Can't Help Falling in Love - Elvis Presley": [
        "Wise men say only fools rush in",
        "Sensible individuals suggest only fools hasten"
    ],
    "Bad Boys (Theme From Cops) - Original Version - Inner Circle": [
        "Bad boys, bad boys, whatcha gonna do?",
        "Delinquent individuals, delinquent individuals, what will you do?"
    ],
    "(What A) Wonderful World - Sam Cooke": [
        "Don't know much about history",
        "Not knowledgeable about history"
    ],
    "How to Save a Life - The Fray": [
        "Step one, you say, 'We need to talk'",
        "Initial step, you mention, 'We must converse'"
    ],
    "En apa som liknar dig - Darin": [
        "Det är något med din blick",
        "There's something about your gaze"
    ],
    "Crash into Me - Dave Matthews Band": [
        "You've got your ball, you've got your chain",
        "You possess your ball, you possess your chain"
    ],
    "I Just Called To Say I Love You - Stevie Wonder": [
        "I just called to say I love you",
        "I simply phoned to express my love"
    ],
    "Alive And Kicking - Simple Minds": [
        "You turn me on, you lift me up",
        "You excite me, you elevate me"
    ],
    "Free Fallin' - Tom Petty": [
        "She's a good girl, loves her mama",
        "She's a decent girl, adores her mother"
    ],
    "(I'm Gonna Be) 500 Miles - MxPx": [
        "When I wake up, well, I know I'm gonna be",
        "Upon awakening, I'm aware I'm going to be"
    ],
    "Boom, Boom, Boom, Boom!! - Generation 90": [
        "Boom, boom, boom, boom!! I want you in my room",
        "Bang, bang, bang, bang!! I desire your presence in my chamber"
    ],
    "Geronimo's Cadillac - Modern Talking": [
        "Geronimo's Cadillac, it's making all girls turn mad",
        "Geronimo's car, it's driving all girls crazy"
    ],
    "Grey Day - Madness": [
        "Hey you, don't watch that, watch this",
        "Hey you, don't observe that, observe this"
    ],
    "Superhero - Daze": [
        "Like a superhero, like an astronaut",
        "Similar to a superhero, akin to an astronaut"
    ],
    "Light My Fire - The Doors": [
        "You know that it would be untrue",
        "You're aware that it would be false"
    ],
    "Mr. Brightside - The Killers": [
        "Coming out of my cage and I've been doing just fine",
        "Emerging from my enclosure and I've been doing well"
    ],
    "I Fought the Law - The Clash": [
        "Breaking rocks in the hot sun",
        "Smashing rocks in the scorching sun"
    ],
    "Kayleigh - 2017 Remaster - Marillion": [
        "Do you remember, chalk hearts melting on a playground wall?",
        "Do you recall, chalk hearts dissolving on a schoolyard wall?"
    ],
    "Da Ya Think I'm Sexy? - Rod Stewart": [
        "She sits alone, waiting for suggestions",
        "She sits by herself, anticipating proposals"
    ],
    "Action Radius - Junkie XL": [
        "Control, control, control, control, control",
        "Regulate, regulate, regulate, regulate, regulate"
    ],
    "I've Been Thinking About You - Londonbeat": [
        "We must have been stone crazy",
        "We possibly were completely insane"
    ],
    "Step Up - Darin": [
        "Don't look back, keep your head held high",
        "Don't gaze rearward, maintain your elevated head"
    ],
    "Venus - the feelers": [
        "Goddess on the mountain top",
        "Deity atop the mountain"
    ],
    "Come and Get Your Love (Rerecorded Version) - Redbone": [
        "Hail, hail",
        "Greetings, greetings"
    ],
    "A Thousand Miles - Single Version - Vanessa Carlton": [
        "Making my way downtown, walking fast, faces pass and I'm home-bound",
        "Journeying through downtown, pacing quickly, faces glide past and I'm headed home"
    ],
    "Iron Man - Black Sabbath": [
        "I am Iron Man",
        "I embody Iron Man"
    ],
    "Walking in Memphis - Marc Cohn": [
        "Put on my blue suede shoes",
        "Wear my blue suede shoes"
    ],
    "You Make My Dreams (Come True) - Daryl Hall & John Oates": [
        "What I want, you've got",
        "What I desire, you possess"
    ],
    "So Sick - Ne-Yo": [
        "Gotta change my answering machine",
        "Need to modify my voicemail"
    ],
    "The Safety Dance - Men Without Hats": [
        "We can dance if we want to",
        "We're able to dance if we desire"
    ],
    "If U Seek Amy - Britney Spears": [
        "Lalalalala, oh baby baby",
        "Lalala, oh darling darling"
    ],
    "That's So Raven (Theme Song) - Raven-Symoné": [
        "Future I can see",
        "Future ahead of me"
    ],
    "Whenever, Wherever - Shakira": [
        "Lucky that my breasts are small and humble",
        "Fortunate that my chest is petite and modest"
    ],
    "High and Dry - Radiohead": [
        "Two jumps in a week, I bet you think that's pretty clever",
        "A couple of leaps in a week, you probably consider that smart"
    ],
    "Going Up The Country - Canned Heat": [
        "I'm going up the country, babe, don't you wanna go?",
        "I'm heading to the countryside, darling, wouldn't you like to come?"
    ],
    "Thank You - Dido": [
        "And I want to thank you",
        "And I desire to express gratitude"
    ],
    "Moonshadow - Yusuf / Cat Stevens": [
        "I'm being followed by a moonshadow, moon shadow, moonshadow",
        "I'm trailed by a moonlight shadow, moon shadow, moonshadow"
    ],
    "Get Ready - Rap Version Edit - 2 Unlimited": [
        "Y'all ready for this?",
        "Are all of you prepared for this?"
    ],
    "Ain't No Grave - Johnny Cash": [
        "Ain't no grave can hold my body down",
        "No tomb can confine my body"
    ],
    "No Rain - Blind Melon": [
        "I just want some one to say to me",
        "I simply wish someone would tell me"
    ],
    "It Ends Tonight - The All-American Rejects": [
        "Your subtleties, they strangle me",
        "Your nuances, they suffocate me"
    ],
    "Seaside - The Kooks": [
        "Do you want to go to the seaside?",
        "Would you like to visit the beach?"
    ],
    "Fly Away - Lenny Kravitz": [
        "I want to get away, I want to fly away",
        "I wish to escape, I wish to soar away"
    ],
    "Slave To The Music - Twenty 4 Seven": [
        "I'm a slave to the music, take your chance tonight",
        "I'm captivated by the music, seize your opportunity tonight"
    ],
    "Johnny, I Hardly Knew Ya - Dropkick Murphys": [
        "With drums and guns and guns and drums",
        "With percussion and firearms and firearms and percussion"
    ],
    "Barracuda - Heart": [
        "So this ain't the end, I saw you again",
        "So this isn't the finale, I witnessed you again"
    ],
    "Meet Me Halfway - Black Eyed Peas": [
        "Can you meet me halfway?",
        "Are you capable of meeting me midway?"
    ],
    "You Can Call Me Al - PMC All-Stars": [
        "A man walks down the street, he says why am I soft in the middle now?",
        "A gentleman strolls down the road, wondering why he's now soft in the middle?"
    ],
    "My Heart Will Go On - Love Theme from \"Titanic\" - Céline Dion": [
        "Near, far, wherever you are",
        "Close, distant, wherever you might be"
    ],
    "Everybody (Backstreet's Back) - Radio Edit - Backstreet Boys": [
        "Everybody, rock your body",
        "Everyone, move your body"
    ],
    "In the End - Linkin Park": [
        "I tried so hard and got so far",
        "I endeavored intensely and reached a distance"
    ],
    "Move on Up - Single Edit - Curtis Mayfield": [
        "Hush now child, and don't you cry",
        "Quiet now, child, and refrain from weeping"
    ],
    "Coco Jamboo - Radio Version - Mr. President": [
        "Put me up, put me down",
        "Lift me up, lower me down"
    ],
    "Ridin' - Chamillionaire, Krayzie Bone": [
        "They see me rollin', they hatin'",
        "They witness me rolling, they disapprove"
    ],
    "Freedom! '90 - George Michael": [
        "I won't let you down",
        "I will not disappoint you"
    ],
    "If I Didn't Have You - Billy Crystal, John Goodman": [
        "If I were a rich man",
        "If I were wealthy"
    ],
    "Every Breath You Take - The Police": [
        "Every breath you take, every move you make",
        "Each breath you take, every action you perform"
    ],
    "What's In It For Me - Amy Diamond": [
        "I saw you at the station",
        "I spotted you at the station"
    ],
    "Running In Your Veins - Renegade Five": [
        "Close your eyes and take a step forward",
        "Shut your eyes and proceed ahead"
    ],
    "The Ride - Basic Element": [
        "Come and join me, let's take the ride",
        "Join me and let's embark on the journey"
    ],
    "I Love You Always Forever - Donna Lewis": [
        "Feels like I'm standing in a timeless dream",
        "Seems like I'm in an eternal dream"
    ],
    "Do You Love Me - Amanda Jenssen": [
        "You really like my limousine",
        "You truly admire my limousine"
    ],
    "Just Like Heaven - The Cure": [
        "Show me how you do that trick",
        "Show to me how you perform that illusion"
    ],
    "Never Gonna Give You Up - Rick Astley": [
        "Never gonna let you down",
        "Never going to disappoint you"
    ],
    "Beggin' - Madcon": [
        "Put your loving hand out, baby",
        "Extend your affectionate hand, darling"
    ],
    "My Name Is - Eminem": [
        "Hi! My name is",
        "Hello! I am called"
    ],
    "Walkin' On The Sun - Smash Mouth": [
        "It ain't no joke, I'd like to buy the world a toke",
        "It's no laughing matter, I wish to purchase the world a puff"
    ],
    "Zou Bisou Bisou - Gillian Hills": [
        "Zou bisou bisou, mon dieu qu'ils sont doux",
        "Zou bisou bisou, my God, they're sweet"
    ],
    "Queen Of Hearts - Juice Newton": [
        "Midnight, and I'm a-waiting on the twelve-oh-five",
        "Midnight, and I'm anticipating the twelve-oh-five"
    ],
    "Saturday Night - Radio Mix - Whigfield": [
        "Dee dee na na na, dee dee na na na",
        "Dee dee na na na, dee dee na na na"
    ],
    "Escape (The Pina Colada Song) - Rupert Holmes": [
        "If you like piña coladas",
        "If you enjoy piña coladas"
    ],
    "Owner of a Lonely Heart - Yes": [
        "Owner of a lonely heart",
        "Possessor of a solitary heart"
    ],
    "True - Single Edit - Spandau Ballet": [
        "So true, funny how it seems",
        "So factual, interesting in what it appears"
    ],
    "Warning Sign - Coldplay": [
        "A warning sign, I missed the good part, then I realized",
        "An alerting indication, I overlooked the pleasant section, then I understood"
    ],
    "Behind Blue Eyes - Limp Bizkit": [
        "No one knows what it's like to be the bad man",
        "Nobody comprehends the experience of being the villain"
    ],
    "Never Be The Same Again - Melanie C, Lisa \"Left Eye\" Lopes": [
        "Never be the same again",
        "Never remain unchanged again"
    ],
    "Leave (Get Out) - Radio Edit - JoJo": [
        "Get out, right now",
        "Depart, immediately"
    ],
    "Go Your Own Way - 2004 Remaster - Fleetwood Mac": [
        "Loving you isn't the right thing to do",
        "Adoring you is not the appropriate choice"
    ],
    "Too Little, Too Late - JoJo": [
        "It's just too little too late",
        "It's simply insufficient, too delayed"
    ],
    "Broken Wings - Mr. Mister": [
        "Take these broken wings",
        "Accept these fractured wings"
    ],
    "Mister Know It All - Main Flow": [
        "You think you know it all",
        "You believe you comprehend everything"
    ],
    "Itchycoo Park - 2012 Remaster - Small Faces": [
        "Over bridge of sighs",
        "Across the bridge of sighs"
    ],
    "Free - La Cream": [
        "I want to be free",
        "I desire liberation"
    ],
    "I'm So Excited - The Pointer Sisters": [
        "I'm so excited, and I just can't hide it",
        "I'm extremely thrilled, and I simply can't conceal it"
    ],
    "We Are The People - Empire of the Sun": [
        "We are the people that rule the world",
        "We are the individuals who govern the world"
    ],
    "Maniac - Michael Sembello": [
        "Just a steel town girl on a Saturday night",
        "Simply a girl from an industrial city on a Saturday evening"
    ],
    "One More Time - Daft Punk": [
        "One more time",
        "Once more"
    ],
    "Bailamos - From \"Wild Wild West\" - Enrique Iglesias": [
        "Bailamos, let the rhythm take you over",
        "Bailamos, allow the rhythm to engulf you"
    ],
    "Talking to the Moon - Bruno Mars": [
        "I'm feeling like I'm famous, the talk of the town",
        "I feel as if I'm renowned, the subject of discussion"
    ],
    "Sweet Tides - Thievery Corporation": [
        "Listen to the sweet tides, it's going to take you away",
        "Observe the pleasant currents, it will transport you"
    ],
    "Venus - Bananarama": [
        "I'm your Venus, I'm your fire, your desire",
        "I am your Venus, I'm your flame, your longing"
    ],
     "If It Makes You Happy - Sheryl Crow": [
        "If it makes you happy",
        "If it brings you joy"
    ],
    "Tonight (I'm Fuckin' You) - Enrique Iglesias, Ludacris, DJ Frank E": [
        "I wanna do it to you tonight",
        "I desire to engage in it with you tonight"
    ],
    "Nothing Compares 2 U - Sinéad O'Connor": [
        "Nothing compares, nothing compares to you",
        "There's no comparison, nothing is alike to you"
    ],
    "Blue Christmas - Elvis Presley": [
        "I'll have a blue Christmas without you",
        "I'll experience a melancholic Christmas in your absence"
    ],
    "Re-Education (Through Labor) - Rise Against": [
        "To the sound of a heartbeat pounding away",
        "To the rhythm of a pulsating heartbeat"
    ],
    "Miss Alissa - Eagles Of Death Metal": [
        "Miss Alissa, she's the queen of the swing",
        "Miss Alissa, she reigns over the swing"
    ],
    "Behind These Hazel Eyes - Kelly Clarkson": [
        "Here I am, once again",
        "At this moment, once more"
    ],
    "Don't Let Go (Love) - En Vogue": [
        "What's it gonna be 'cuz I can't pretend",
        "What will it be because I can't feign"
    ],
    "Rock Me Amadeus - Falco": [
        "Amadeus, Amadeus",
        "Amadeus, Amadeus"
    ],
    "Good Day - Nappy Roots": [
        "I gotta say it was a good day",
        "I must admit it was a pleasant day"
    ],
    "YMCA - Original Version 1978 - Village People": [
        "Young man, there's no need to feel down",
        "Young man, there's no reason to be distressed"
    ],
    "Back for Good - Radio Mix - Take That": [
        "I guess now it's time for me to give up",
        "I suppose it's time for me to surrender now"
    ],
    "Hotel California - 2013 Remaster - Eagles": [
        "On a dark desert highway, cool wind in my hair",
        "On a dim desert road, a refreshing breeze in my hair"
    ],
    "Put Your Records On - Corinne Bailey Rae": [
        "Girl, put your records on, tell me your favorite song",
        "Girl, play your records, share your preferred song with me"
    ],
    "Move on Up - Single Edit - Curtis Mayfield": [
        "Hush now child, and don't you cry",
        "Quiet now, child, and refrain from weeping"
    ],
    "Coco Jamboo - Radio Version - Mr. President": [
        "Put me up, put me down",
        "Lift me up, lower me down"
    ],
    "Ridin' - Chamillionaire, Krayzie Bone": [
        "They see me rollin', they hatin'",
        "They witness me rolling, they disapprove"
    ],
    "Freedom! '90 - George Michael": [
        "I won't let you down",
        "I will not disappoint you"
    ],
    "If I Didn't Have You - Billy Crystal, John Goodman": [
        "If I were a rich man",
        "If I were wealthy"
    ],
    "Every Breath You Take - The Police": [
        "Every breath you take, every move you make",
        "Each breath you take, every action you perform"
    ],
    "What's In It For Me - Amy Diamond": [
        "Oh-oh-oh, what's in it for me?",
        "Oh-oh-oh, what benefits me?"
    ],
    "Running In Your Veins - Renegade Five": [
        "I'm running in your veins",
        "I course through your veins"
    ],
    "The Ride - Basic Element": [
        "On the ride",
        "During the journey"
    ],
    "I Love You Always Forever - Donna Lewis": [
        "I love you always forever",
        "I adore you eternally always"
    ],
    "Do You Love Me - Amanda Jenssen": [
        "Do you love me?",
        "Do you have affection for me?"
    ],
    "Just Like Heaven - The Cure": [
        "Show me, show me, show me how you do that trick",
        "Demonstrate, demonstrate, demonstrate how you perform that feat"
    ],
    "Never Gonna Give You Up - Rick Astley": [
        "Never gonna give you up",
        "Never intending to abandon you"
    ],
    "Beggin' - Madcon": [
        "Put your loving hand out, baby",
        "Extend your affectionate hand, darling"
    ],
    "My Name Is - Eminem": [
        "Hi! My name is",
        "Greetings! I am called"
    ],
    "Walkin' On The Sun - Smash Mouth": [
        "So don't delay, act now, supplies are running out",
        "Therefore, don't hesitate, take action immediately, stocks are depleting"
    ],
    "Zou Bisou Bisou - Gillian Hills": [
        "Zou bisou bisou",
        "Zou bisou bisou"
    ],
    "Queen Of Hearts - Juice Newton": [
        "Playing with the queen of hearts",
        "Engaging with the queen of hearts"
    ],
    "Saturday Night - Radio Mix - Whigfield": [
        "Saturday night, I feel the air is getting hot",
        "Saturday night, I sense the atmosphere heating up"
    ],
    "(Theme From) Midnight Express - Giorgio Moroder": [
        "If you can't sleep at night",
        "If you are unable to rest at night"
    ],
    "Ecuador - Sash!": [
        "Ecuador",
        "Ecuador"
    ],
    "Everywhere - 2017 Remaster - Fleetwood Mac": [
        "Can you hear me calling out your name?",
        "Can you perceive me beckoning your name?"
    ],
    "Memories (feat. Kid Cudi) - David Guetta, Kid Cudi": [
        "All the crazy shit I did tonight",
        "All the insane things I did tonight"
    ],
    "Summer Wine - Single Edit - Ville Valo, Natalia Avelon": [
        "Strawberries, cherries and an angel's kiss in spring",
        "Strawberries, cherries, and a celestial kiss in spring"
    ],
    "La Tortura (feat. Alejandro Sanz) - Shakira, Alejandro Sanz": [
        "Amarrao' aquí como estás",
        "Tied up here as you are"
    ],
    "Here I Go Again 87 - 2007 Remastered Version - Whitesnake": [
        "Here I go again on my own",
        "Once again, I journey alone"
    ],
    "Holding Out for a Hero - From 'Footloose' Soundtrack - Bonnie Tyler": [
        "I need a hero",
        "I require a champion"
    ],
    "The Scientist - Coldplay": [
        "Nobody said it was easy",
        "No one claimed it was simple"
    ],
    "Kernkraft 400 - DJ Gius Mix, Radio Edit - Zombie Nation": [
        "Do, do, do, do, do",
        "Do, do, do, do, do"
    ],
    "I Don't Want to Be - Gavin DeGraw": [
        "I don't want to be anything other than what I've been trying to be lately",
        "I don't wish to be anything except what I've been endeavoring to be recently"
    ],
    "She Drives Me Crazy - Fine Young Cannibals": [
        "She drives me crazy",
        "She exasperates me"
    ],
    "Everlasting Love - Love Affair": [
        "Hearts gone astray",
        "Hearts led astray"
    ],
    "Breathe (feat. Sean Paul) - Rap Version - Blu Cantrell, Sean Paul": [
        "So go on and take a bow",
        "Therefore, proceed and acknowledge"
    ],
    "Viva Las Vegas - Elvis Presley": [
        "Bright light city gonna set my soul, gonna set my soul on fire",
        "Radiant urban center will ignite my soul, will set my soul on fire"
    ],
    "Feel the Beat - Darude": [
        "Feel the beat",
        "Sense the rhythm"
    ],
    "Tell It to My Heart - Taylor Dayne": [
        "Tell it to my heart",
        "Express it to my heart"
    ],
    "Angel Of The Morning - Juice Newton": [
        "Just call me angel of the morning",
        "Just refer to me as angel of the morning"
    ],
    "Blurry - Puddle Of Mudd": [
        "Everything's so blurry",
        "Everything's so unclear"
    ],
    "Hello - Lionel Richie": [
        "Hello, is it me you're looking for?",
        "Greetings, are you searching for me?"
    ],
    "Shadows - Evoid": [
        "Walking through the shadows",
        "Strolling through the shadows"
    ],
    "What's Up? - 4 Non Blondes": [
        "And I say hey, hey, hey, hey",
        "And I exclaim hey, hey, hey, hey"
    ],
    "Ain't No Rest For The Wicked - Original Version - Cage The Elephant": [
        "Ain't no rest for the wicked",
        "No respite for the evil"
    ],
    "Whatta Man - Salt-N-Pepa, En Vogue": [
        "I wanna take a minute or two, and give much respect due",
        "I wish to take a moment or two, and show much deserved respect"
    ],
    "Chasing Cars - Snow Patrol": [
        "If I lay here",
        "If I recline here"
    ],
    "Lemon Tree - Fools Garden": [
        "I'm sitting here in the boring room",
        "I'm seated here in the mundane chamber"
    ],
    "What Is Love - 7\" Mix - Haddaway": [
        "What is love?",
        "What defines love?"
    ],
    "Dance Wiv Me - Dizzee Rascal, Calvin Harris, Chrom3": [
        "Do the dance, do the dance",
        "Execute the dance, execute the dance"
    ],
    "(I Can't Help) Falling In Love With You - UB40": [
        "Wise men say, only fools rush in",
        "Sensible individuals suggest, only foolish rush hastily"
    ],
    "Escape (The Pina Colada Song) - Rupert Holmes": [
        "I was tired of my lady",
        "I was weary of my lady"
    ],
    "Owner of a Lonely Heart - Yes": [
        "Move yourself",
        "Stir yourself"
    ],
    "True - Single Edit - Spandau Ballet": [
        "So true, funny how it seems",
        "So true, interesting how it appears"
    ],
    "Warning Sign - Coldplay": [
        "A warning sign",
        "An alerting indication"
    ],
    "Behind Blue Eyes - Limp Bizkit": [
        "No one knows what it's like",
        "Nobody comprehends how it feels"
    ],
    "Never Be The Same Again - Melanie C, Lisa \"Left Eye\" Lopes": [
        "Come on",
        "Proceed"
    ],
    "Leave (Get Out) - Radio Edit - JoJo": [
        "Get out right now",
        "Leave immediately"
    ],
    "Go Your Own Way - 2004 Remaster - Fleetwood Mac": [
        "You can go your own way",
        "You are free to choose your path"
    ],
    "Too Little, Too Late - JoJo": [
        "It's just too little too late",
        "It's simply inadequate, too belated"
    ],
    "Broken Wings - Mr. Mister": [
        "Take these broken wings",
        "Receive these fractured wings"
    ],
    "Mister Know It All - Main Flow": [
        "Mr. Know It All",
        "Mr. Professes Everything"
    ],
    "Itchycoo Park - 2012 Remaster - Small Faces": [
        "It's all too beautiful",
        "It's all exceedingly exquisite"
    ],
    "Free - La Cream": [
        "Everybody's free",
        "Everyone is liberated"
    ],
    "I'm So Excited - The Pointer Sisters": [
        "I'm so excited",
        "I'm exceedingly thrilled"
    ],
    "We Are The People - Empire of the Sun": [
        "We can remember swimming in December",
        "We recall swimming in December"
    ],
    "Maniac - Michael Sembello": [
        "She's a maniac",
        "She's a lunatic"
    ],
    "One More Time - Daft Punk": [
        "One more time",
        "Once again"
    ],
    "Talking to the Moon - Bruno Mars": [
        "I'm talking to the moon",
        "I'm conversing with the moon"
    ],
    "Sweet Tides - Thievery Corporation": [
        "It's love again",
        "It's love once more"
    ],
    "Venus - Bananarama": [
        "Goddess on the mountain top",
        "Divinity atop the mountain"
    ],
    "If It Makes You Happy - Sheryl Crow": [
        "If it makes you happy",
        "If it brings you joy"
    ],
    "Tonight (I'm Fuckin' You) - Enrique Iglesias, Ludacris, DJ Frank E": [
        "I know you want me",
        "I'm aware you desire me"
    ],
    "Nothing Compares 2 U - Sinéad O'Connor": [
        "It's been seven hours and fifteen days",
        "It has been seven hours and fifteen days"
    ],
    "Blue Christmas - Elvis Presley": [
        "I'll have a blue Christmas without you",
        "I'll experience a melancholic Christmas without you"
    ],
    "Re-Education (Through Labor) - Rise Against": [
        "To the sound of a heartbeat pounding away",
        "To the rhythm of a heartbeat pounding relentlessly"
    ],
    "Miss Alissa - Eagles Of Death Metal": [
        "Miss Alissa, she's the queen of the pack",
        "Miss Alissa, she reigns over the pack"
    ],
    "Behind These Hazel Eyes - Kelly Clarkson": [
        "Here I am, once again",
        "Here I stand, once more"
    ],
    "Don't Let Go (Love) - En Vogue": [
        "What's it gonna be?",
        "What will it be?"
    ],
    "Good Day - Nappy Roots": [
        "Good day",
        "Great day"
    ],
    "YMCA - Original Version 1978 - Village People": [
        "Young man, there's no need to feel down",
        "Young man, you needn't feel dejected"
    ],
    "Back for Good - Radio Mix - Take That": [
        "I guess now it's time for me to give up",
        "I suppose now it's time for me to relinquish"
    ],
    "Hotel California - 2013 Remaster - Eagles": [
        "On a dark desert highway",
        "On a dim desert highway"
    ],
    "Put Your Records On - Corinne Bailey Rae": [
        "Three little birds sat on my window",
        "Three little birds perched on my window"
    ],
        "Wanted Dead Or Alive - Bon Jovi": [
        "It's all the same, only the names will change",
        "Everything's identical, solely the identities alter"
    ],
    "Duality - Slipknot": [
        "I push my fingers into my eyes",
        "I thrust my digits into my eyes"
    ],
    "Mad World - Gary Jules, Michael Andrews": [
        "All around me are familiar faces",
        "Surrounding me are recognizable visages"
    ],
    "The Look - Roxette": [
        "Walking like a man, hitting like a hammer",
        "Strolling like a gentleman, striking like a mallet"
    ],
    "I Ran (So Far Away) - A Flock Of Seagulls": [
        "I walk along the avenue",
        "I stroll along the thoroughfare"
    ],
    "A Little Less Conversation - JXL Radio Edit Remix - Elvis Presley, JXL": [
        "A little less conversation, a little more action",
        "A tad fewer discussions, a bit more activity"
    ],
    "Push The Feeling On - Mk Dub Revisited Edit - Nightcrawlers, MK": [
        "Push the feeling on",
        "Propel the sensation forward"
    ],
    "If I Could Turn Back Time - Cher": [
        "If I could turn back time",
        "If I could reverse time"
    ],
    "Every Breath You Take - The Police": [
        "Every breath you take",
        "Each inhalation you make"
    ]
}


Measuring Results

In [None]:
def mostSimilar(query):
  vectorizer = TfidfVectorizer()
  X = vectorizer.fit_transform([query] + list(df["Tokens"]))
  cosine_similarities = cosine_similarity(X[0:1], X[1:]).flatten()
  most_similar_indices = cosine_similarities.argsort()[::-1]
  return most_similar_indices

In [None]:
def rank(mostSimilarIndex, songname):
  Rank = 1
  for i in df.iloc[mostSimilarIndex].SongName:
    if i == songname:
      return Rank
    else:
      Rank += 1



In [None]:
j = 0
rankOrignal = 0
rankModified = 0
for i in queries:
  songname = i
  modifiedQuery = queries[i][1]
  originalQuery = queries[i][0]

  modifiedQueryIndex = mostSimilar(modifiedQuery)
  originalQueryIndex = mostSimilar(originalQuery)
  try:
    rankOrignal += 1  / rank(originalQueryIndex, songname)
    rankModified += 1 / rank(modifiedQueryIndex, songname)
  except:
    continue

  print( songname, rank(originalQueryIndex, songname), rank(modifiedQueryIndex, songname))

  j += 1

print(rankModified  *( 1 / j), rankOrignal * (1/  j))





Destroy Everything You Touch - Ladytron 1 245
Wanted Dead Or Alive - Bon Jovi 169 908
Summertime - DJ Jazzy Jeff & The Fresh Prince 1 82
Millennium - Robbie Williams 1 24
Advertising Space - Robbie Williams 192 75
Booyaka 619 (Rey Mysterio) - WWE, P.O.D. 1 383
Duality - Slipknot 2 23
Are You Gonna Be My Girl - Jet 1 9
Raise Your Glass - P!nk 1 3
Rockstar - Nickelback 1 358
Mad World - Gary Jules, Michael Andrews 5 66
California Dream - The Mamas & The Papas 319 339
You're No Good - Linda Ronstadt 368 1525
Sorry, Blame It On Me - Akon 1 54
Waterloo - ABBA 1 1
Faces - Original Extended Version - Clio 215 167
Clocks - Coldplay 5 290
Kickstart My Heart - Mötley Crüe 94 1056
Jungle Boogie - Kool & The Gang 3 250
MMMBop - Single Version - Hanson 10 10
Stupidisco - Junior Jack 1599 1619
I'm Coming Out - Diana Ross 1 84
Heaven Is A Place On Earth - Belinda Carlisle 7 1511
Bubbly - Colbie Caillat 1 1
You're The One That I Want - From “Grease” - John Travolta, Olivia Newton-John 2 9
Not Over Yet

In [None]:
print(rankModified  *( 1 / j), rankOrignal * (1/  j))

0.20323051901585926 0.47832525998985465
