Read from a local copy of the ClaimReview Database

In [2]:
# Local dump of fact checks; later cells treat every line as one record.
fc_path = "fact_checks_20180502.txt"

# Decode explicitly instead of relying on the platform default encoding: the
# claims contain non-ASCII characters (curly quotes, accented letters).
# NOTE(review): assumes the dump is UTF-8 encoded - confirm.
with open(fc_path, encoding="utf-8") as f:
    fc_raw = f.readlines()

In [3]:
# Report how many lines were read from the dump (one line is counted as one claim).
print("No. of Claims:", len(fc_raw))

No. of Claims: 8902


Functions to normalise the text

In [5]:
import re
import json
import nltk
from nltk.corpus import stopwords
from nltk.stem import WordNetLemmatizer
from nltk.corpus import wordnet

# Single shared lemmatizer instance, used by lemmatize_sentence().
lemmatizer = WordNetLemmatizer()

def strip_html(data):
    """Return ``data`` with every ``<...>`` tag-like span removed.

    The match is non-greedy, so each ``<`` is paired with the nearest
    following ``>``. ``.`` does not match a newline, so a span that is
    broken across lines is left in place.
    """
    return re.sub(r'<.*?>', '', data)

def clean_text(data):
    """Lower-case ``data``, keep only letters, and drop English stopwords.

    Punctuation and any whitespace (spaces, newlines, tabs) act as word
    separators; digits and underscores are deleted in place.

    Returns the remaining words joined by single spaces (an empty string
    when nothing is left).
    """
    # Load the stopword list once per call rather than once per token, and
    # use a set so each membership test is O(1).
    stop_words = set(stopwords.words("english"))

    # Punctuation becomes a space so that e.g. "gun-free" yields two words.
    text = re.sub(r'[^\w\s]', ' ', data.lower())

    kept = []
    for char in text:
        if char.isalpha():
            kept.append(char)
        elif char.isspace():
            # Newlines and tabs separate words too; deleting them would fuse
            # the neighbouring words together.
            kept.append(" ")
        # Anything else (digits, underscores) is dropped.

    # split() with no argument collapses whitespace runs of any length, so
    # no empty tokens or doubled spaces can reach the output.
    words = "".join(kept).split()
    return " ".join(word for word in words if word not in stop_words)

def nltk2wn_tag(nltk_tag):
    """Map a POS tag string to the matching ``wordnet`` constant.

    Tags starting with ``J``, ``V``, ``N`` or ``R`` map to ``wordnet.ADJ``,
    ``wordnet.VERB``, ``wordnet.NOUN`` and ``wordnet.ADV`` respectively;
    any other tag yields ``None``.
    """
    prefix_to_attr = (
        ('J', 'ADJ'),
        ('V', 'VERB'),
        ('N', 'NOUN'),
        ('R', 'ADV'),
    )
    for prefix, attr in prefix_to_attr:
        if nltk_tag.startswith(prefix):
            # Resolve the constant only on a match, as the original branches did.
            return getattr(wordnet, attr)
    return None
    
def lemmatize_sentence(sentence):
    """Tokenize and POS-tag ``sentence``, then lemmatize each token.

    Tokens whose tag has no WordNet equivalent (``nltk2wn_tag`` returns
    ``None``) are passed through unchanged. Returns the resulting tokens
    joined by single spaces.
    """
    tokens = nltk.word_tokenize(sentence)
    lemmas = []
    for token, pos in nltk.pos_tag(tokens):
        wn_pos = nltk2wn_tag(pos)
        lemmas.append(
            token if wn_pos is None else lemmatizer.lemmatize(token, wn_pos)
        )
    return " ".join(lemmas)

def norm_text(data):
    """Normalise ``data``: strip tags, clean the text, then lemmatize it.

    Applies ``strip_html``, ``clean_text`` and ``lemmatize_sentence`` in
    that order and returns the final string.
    """
    return lemmatize_sentence(clean_text(strip_html(data)))

In [17]:
# Print each claim followed by its ranked key phrases.
# NOTE(review): `r` is not defined in any cell visible here - presumably a
# rake_nltk `Rake()` instance created in an earlier cell; confirm.
for line in fc_raw:
    # Remove the line terminator and the JSON-LD <script> wrapper, if present,
    # so that only the JSON payload remains.
    payload = line.strip("\n")
    payload = payload.replace("</script>", "").replace('<script type="application/ld+json">', "")
    if not payload.strip():
        # Skip blank lines instead of letting json.loads() fail on them.
        continue
    fc = json.loads(payload)
    claim = fc["claimReviewed"]
#     date_published = fc["datePublished"]
    review_url = fc["url"]

    print("Claim:", claim)
    r.extract_keywords_from_text(claim)
    # The original also called r.get_ranked_phrases() here and discarded the
    # result; only the scored variant below is actually used.
    print(r.get_ranked_phrases_with_scores())
    print("")
    print("")

Claim: Actor Dwayne Johnson died filming a stunt for <I>Fast & Furious</I> 7.
[(25.0, 'actor dwayne johnson died filming'), (4.0, 'furious </'), (1.0, 'stunt'), (1.0, 'fast'), (1.0, '7')]


Claim: A "Muslim migrant" beats up a boy on crutches in a video posted to a site in the Netherlands.
[(4.0, 'video posted'), (4.0, 'muslim migrant'), (1.0, 'site'), (1.0, 'netherlands'), (1.0, 'crutches'), (1.0, 'boy'), (1.0, 'beats')]


Claim: Barack Obama said he would replace the U.S. national anthem with the song 'I'd Like to Teach the World to Sing.'
[(9.0, 'barack obama said'), (4.0, 'would replace'), (4.0, "sing .'"), (4.0, 'national anthem'), (1.0, 'world'), (1.0, 'u'), (1.0, 'teach'), (1.0, 'song'), (1.0, 'like')]


Claim: Meg White is replacing Rush's drummer Neil Peart.
[(9.0, 'drummer neil peart'), (4.0, 'replacing rush'), (4.0, 'meg white')]


Claim: About 1.1 million people legally enter the U.S. each year as permanent residents -- "65 percent of that is some kind of chain migration; 2

Claim: The Clintons were forced to return an estimated $200,000 in furniture, china and art they "stole" from the White House.
[(4.0, 'white house'), (1.0, 'stole'), (1.0, 'return'), (1.0, 'furniture'), (1.0, 'forced'), (1.0, 'estimated'), (1.0, 'clintons'), (1.0, 'china'), (1.0, 'art'), (1.0, '200'), (1.0, '000')]


Claim: Ted Cruz blamed God for his failed presidential campaign on Twitter.
[(16.0, 'ted cruz blamed god'), (9.0, 'failed presidential campaign'), (1.0, 'twitter')]


Claim: “According to the National Academy of Sciences, our current immigration system costs America’s taxpayers many billions of dollars a year.”
[(36.0, 'current immigration system costs america ’'), (9.0, 'taxpayers many billions'), (4.0, '“ according'), (4.0, 'year .”'), (4.0, 'national academy'), (1.0, 'sciences'), (1.0, 'dollars')]


Claim: A bust of Abraham Lincoln was vandalized in Chicago in protest of confederate statues.
[(4.0, 'confederate statues'), (4.0, 'abraham lincoln'), (1.0, 'vandalized'), (

Claim: President Donald Trump’s deal with Democratic leaders “basically freezes last year’s funding in place, which is a cut of $52 billion” in the defense budget.
[(62.0, 'democratic leaders “ basically freezes last year ’'), (18.0, 'president donald trump ’'), (9.0, '52 billion ”'), (4.0, 'defense budget'), (1.0, 'place'), (1.0, 'funding'), (1.0, 'deal'), (1.0, 'cut')]


Claim: "Alabama state police arrest 3 poll workers in Birmingham."
[(49.0, 'alabama state police arrest 3 poll workers'), (4.0, 'birmingham ."')]


Claim: "There’s no data that says a gun-free zone has saved lives."
[(9.0, 'saved lives ."'), (4.0, 'free zone'), (1.0, '’'), (1.0, 'says'), (1.0, 'gun'), (1.0, 'data')]


Claim: Queen Elizabeth said that she would "take America back" if Donald Trump gets elected president.
[(25.0, 'donald trump gets elected president'), (9.0, 'take america back'), (9.0, 'queen elizabeth said'), (1.0, 'would')]


Claim: A video shows a hunter getting attacked by a lion while posing with a

Claim: President Trump violated protocol by not standing or saluting during the playing of "Retreat" during an interview with Sean Hannity.
[(16.0, 'president trump violated protocol'), (4.0, 'sean hannity'), (1.0, 'standing'), (1.0, 'saluting'), (1.0, 'retreat'), (1.0, 'playing'), (1.0, 'interview')]


Claim: Yoko Ono confirmed that she had an affair with Hillary Clinton in the 1970s.
[(9.0, 'yoko ono confirmed'), (4.0, 'hillary clinton'), (1.0, 'affair'), (1.0, '1970s')]


Claim: About three-quarters of (Syrian refugees) are women and children. A full third of them are kids under 12 years old.
[(9.0, '12 years old'), (4.0, 'syrian refugees'), (4.0, 'full third'), (1.0, 'women'), (1.0, 'three'), (1.0, 'quarters'), (1.0, 'kids'), (1.0, 'children')]


Claim: A photograph shows a group of children in South Africa giving a meerkat a bath.
[(9.0, 'south africa giving'), (4.0, 'photograph shows'), (1.0, 'meerkat'), (1.0, 'group'), (1.0, 'children'), (1.0, 'bath')]


Claim: The name of the C

Claim: "Seven years later, (Scott Walker) has not hit his first campaign promise of creating 250,000 jobs."
[(9.0, 'seven years later'), (9.0, 'first campaign promise'), (9.0, '000 jobs ."'), (4.0, 'scott walker'), (4.0, 'creating 250'), (1.0, 'hit')]


Claim: "Not a single Democrat opposed Neil Gorsuch's confirmation in 2006."
[(25.0, 'single democrat opposed neil gorsuch'), (4.0, '2006 ."'), (1.0, 'confirmation')]


Claim: "In America, radical speech is not a crime."
[(4.0, 'radical speech'), (4.0, 'crime ."'), (1.0, 'america')]


Claim: Ads on Craigslist sought to recruit paid protesters to swarm Donald Trump rallies.
[(16.0, 'swarm donald trump rallies'), (9.0, 'recruit paid protesters'), (4.0, 'craigslist sought'), (1.0, 'ads')]


Claim: A photograph shows boxer Muhammad Ali with musician Michael Jackson.
[(25.0, 'photograph shows boxer muhammad ali'), (9.0, 'musician michael jackson')]


Claim: “Compliance with the terms of the Paris accord and the onerous energy restrictions it 

Claim: Republicans in Alabama filed a bill which (if passed) would prohibit people who owned cars from receiving food stamps.
[(9.0, 'would prohibit people'), (9.0, 'receiving food stamps'), (4.0, 'owned cars'), (4.0, 'alabama filed'), (1.0, 'republicans'), (1.0, 'passed'), (1.0, 'bill')]


Claim: “George W. Bush made the agreement about when American troops would leave Iraq, not Barack Obama."
[(25.0, 'american troops would leave iraq'), (9.0, '“ george w'), (9.0, 'barack obama ."'), (4.0, 'bush made'), (1.0, 'agreement')]


Claim: Donald Trump was pictured at a cross burning with the KKK.
[(4.0, 'donald trump'), (4.0, 'cross burning'), (1.0, 'pictured'), (1.0, 'kkk')]


Claim: Says Russ Feingold "voted to raise taxes on Social Security benefits for seniors, he even tried to give Social Security benefits to illegal immigrants."
[(14.5, 'give social security benefits'), (10.5, 'social security benefits'), (9.0, 'says russ feingold'), (9.0, 'illegal immigrants ."'), (4.0, 'raise taxes')

Claim: A photograph shows a small boy who was handcuffed at Dulles Airport due to temporary immigration restrictions implemented in January 2017.
[(16.0, 'temporary immigration restrictions implemented'), (9.0, 'dulles airport due'), (4.0, 'small boy'), (4.0, 'photograph shows'), (4.0, 'january 2017'), (1.0, 'handcuffed')]


Claim: Comedian Jeff Foxworthy slammed Hillary Clinton and was attacked by liberals.
[(36.0, 'comedian jeff foxworthy slammed hillary clinton'), (1.0, 'liberals'), (1.0, 'attacked')]


Claim: A list shows documents that several prominent news media executives have ties to the Obama administration.
[(25.0, 'several prominent news media executives'), (9.0, 'list shows documents'), (4.0, 'obama administration'), (1.0, 'ties')]


Claim: “It’s a debt-inducing, make-rich-people-richer tax bill that in the long run is not going to be helpful to the vast majority of people in my state that are sitting around the kitchen table trying to figure out how [to] come out even at 



Claim: The modern image of Jesus is modeled on Cesare Borgia, a gangster's son.
[(4.0, 'modern image'), (4.0, 'cesare borgia'), (1.0, 'son'), (1.0, 'modeled'), (1.0, 'jesus'), (1.0, 'gangster')]


Claim: Aerosmith once decided to play their set list in reverse, then opened  a concert with their encore and mistakenly walked off the stage.
[(4.0, 'set list'), (4.0, 'mistakenly walked'), (1.0, 'stage'), (1.0, 'reverse'), (1.0, 'play'), (1.0, 'opened'), (1.0, 'encore'), (1.0, 'decided'), (1.0, 'concert'), (1.0, 'aerosmith')]


Claim: "We are now, very proudly, an exporter of energy to the world."
[(4.0, 'world ."'), (1.0, 'proudly'), (1.0, 'exporter'), (1.0, 'energy')]


Claim: "I am taking action to affirm and improve the state’s commitment to privacy and equality. To that end, today I have signed an executive order with the goal of achieving that fine balance.”
[(9.0, 'fine balance .”'), (4.0, 'taking action'), (4.0, 'state ’'), (4.0, 'executive order'), (1.0, 'today'), (1.0, 'signed')



Claim: Photographs shows a man eating a dead baby served at a Taiwan restaurant.
[(9.0, 'dead baby served'), (4.0, 'taiwan restaurant'), (4.0, 'photographs shows'), (4.0, 'man eating')]


Claim: A photograph shows President Donald Trump reaching out to rescue a Harvey flooding victim.
[(36.0, 'photograph shows president donald trump reaching'), (9.0, 'harvey flooding victim'), (1.0, 'rescue')]


Claim: A mounted policeman's horse had its leg broken by protesters during anti-Trump demonstrations.
[(4.0, 'trump demonstrations'), (4.0, 'mounted policeman'), (4.0, 'leg broken'), (1.0, 'protesters'), (1.0, 'horse'), (1.0, 'anti')]


Claim: A list of coincidences connecting the number 108 to the Chicago Cubs world series victory in 2016 is accurate.
[(25.0, 'chicago cubs world series victory'), (4.0, 'number 108'), (4.0, 'coincidences connecting'), (1.0, 'list'), (1.0, 'accurate'), (1.0, '2016')]


Claim: The House voted to allow horses in the U.S. to be slaughtered for food.
[(4.0, 'house


Claim: During the Iowa caucuses, delegates are sometimes awarded through coin tosses, and Hillary Clinton won six coin tosses in the 2016 caucuses (awarding her a narrow victory).
[(9.0, 'narrow victory ).'), (8.0, 'six coin tosses'), (5.0, 'coin tosses'), (4.0, 'sometimes awarded'), (4.0, 'iowa caucuses'), (4.0, 'hillary clinton'), (4.0, '2016 caucuses'), (1.0, 'delegates'), (1.0, 'awarding')]


Claim: A Syrian refugee receives close to $400,000 in benefits a year from the German government in order to take care of his wives and children.
[(16.0, 'syrian refugee receives close'), (4.0, 'take care'), (4.0, 'german government'), (1.0, 'year'), (1.0, 'wives'), (1.0, 'order'), (1.0, 'children'), (1.0, 'benefits'), (1.0, '400'), (1.0, '000')]


Claim: Eleven states are implementing motorcycle curfews with stiff penalties for violators.
[(9.0, 'implementing motorcycle curfews'), (4.0, 'stiff penalties'), (4.0, 'eleven states'), (1.0, 'violators')]


Claim: Scammers place phone calls to hot

[(9.0, 'effective july 2016'), (4.0, 'electronic cigarettes'), (1.0, 'juice'), (1.0, 'fda'), (1.0, 'e'), (1.0, 'banned')]


Claim: Six anti-Trump protesters were killed by a truck in the course of demonstrating on a freeway.
[(4.0, 'trump protesters'), (4.0, 'six anti'), (1.0, 'truck'), (1.0, 'killed'), (1.0, 'freeway'), (1.0, 'demonstrating'), (1.0, 'course')]


Claim: A meme shows the American flag displayed on the White House in 2017, and a rainbow display in 2016.
[(9.0, 'american flag displayed'), (4.0, 'white house'), (4.0, 'rainbow display'), (4.0, 'meme shows'), (1.0, '2017'), (1.0, '2016')]


Claim: "In the mid 1990s, in our state, (Florida was) No. 1 in violent crime in America. ... The only concern I had was for the citizens of Florida, who were subjected to a violent crime every three minutes and 45 seconds."
[(22.0, 'violent crime every three minutes'), (9.0, '45 seconds ."'), (7.0, 'violent crime'), (4.0, 'mid 1990s'), (1.0, 'subjected'), (1.0, 'state'), (1.0, 'florida'),

[(9.0, 'dollar spending bill'), (4.0, 'reinvestment act'), (4.0, 'president obama'), (4.0, 'fancy name'), (4.0, 'crumbling roads'), (4.0, 'bridges ,"'), (4.0, 'american recovery'), (4.0, 'absolutely nothing'), (1.0, 'trillion'), (1.0, 'supposed'), (1.0, 'show'), (1.0, 'fix'), (1.0, 'arra'), (1.0, 'almost'), (1.0, '."')]


Claim: "Hatchimal" bath bombs are giving children chemical burns.
[(16.0, 'giving children chemical burns'), (4.0, 'bath bombs'), (1.0, 'hatchimal')]


Claim: Wendy's restaurants replaced workers with machines at thousands of locations because of a hike in the minimum wage.
[(9.0, 'restaurants replaced workers'), (4.0, 'minimum wage'), (1.0, 'wendy'), (1.0, 'thousands'), (1.0, 'machines'), (1.0, 'locations'), (1.0, 'hike')]


Claim: Ted Nugent called Colin Kaepernick a "chimp" when discussing the President's support for the athlete's protest.
[(25.0, 'ted nugent called colin kaepernick'), (1.0, 'support'), (1.0, 'protest'), (1.0, 'president'), (1.0, 'discussing'), (1.

Claim: Adolf Hitler was a “leftist” who stated that Nazis “are socialists [and] mortal enemies of the present capitalist economic system.”
[(25.0, 'present capitalist economic system .”'), (8.5, '“ leftist ”'), (4.5, 'nazis “'), (4.0, 'mortal enemies'), (4.0, 'adolf hitler'), (1.0, 'stated'), (1.0, 'socialists')]


Claim: "California is once again the sixth-largest economy in the world. If you add the GDP’s of Washington and Oregon, California would surpass the United Kingdom to become the fifth-largest economy in the world."
[(8.0, 'california would surpass'), (4.0, 'united kingdom'), (4.0, 'largest economy'), (4.0, 'gdp ’'), (3.5, 'world ."'), (2.0, 'california'), (1.5, 'world'), (1.0, 'washington'), (1.0, 'sixth'), (1.0, 'oregon'), (1.0, 'fifth'), (1.0, 'become'), (1.0, 'add')]


Claim: Says Ann Kirkpatrick “votes with her party nearly 90 percent of the time.”
[(25.0, 'says ann kirkpatrick “ votes'), (16.0, 'party nearly 90 percent'), (4.0, 'time .”')]


Claim: A kitten died after i

Claim: A DNA test confirmed that actor Bryshere Y. Gray is the biological son of rap mogu Jay-Z.
[(9.0, 'rap mogu jay'), (9.0, 'dna test confirmed'), (4.0, 'biological son'), (4.0, 'actor bryshere'), (1.0, 'z'), (1.0, 'gray')]


Claim: "You will learn more about Donald Trump by going down to the Federal Election Commission" to see the financial disclosure form than by looking at tax returns.
[(9.0, 'financial disclosure form'), (9.0, 'federal election commission'), (4.0, 'tax returns'), (4.0, 'donald trump'), (1.0, 'see'), (1.0, 'looking'), (1.0, 'learn'), (1.0, 'going')]


Claim: Life expectancy in the United States is now lower because of Obamacare.
[(4.0, 'united states'), (4.0, 'life expectancy'), (1.0, 'obamacare'), (1.0, 'lower')]


Claim: The accused school shooter in Florida is a Dreamer, a DACA recipient, or undocumented.
[(9.0, 'accused school shooter'), (4.0, 'daca recipient'), (1.0, 'undocumented'), (1.0, 'florida'), (1.0, 'dreamer')]


Claim: Says Hillary Clinton's Iran nu

Claim: Says that compared to direct sales by manufacturers, consumers "save avg of $500 per car sold through franchised dealer model."
[(16.0, 'franchised dealer model ."'), (16.0, '500 per car sold'), (4.0, 'save avg'), (4.0, 'direct sales'), (1.0, 'says'), (1.0, 'manufacturers'), (1.0, 'consumers'), (1.0, 'compared')]


Claim: "House GOP rules package bars CBO from counting spikes in deficit spending spurred by an ACA repeal."
[(36.0, 'house gop rules package bars cbo'), (9.0, 'deficit spending spurred'), (9.0, 'aca repeal ."'), (4.0, 'counting spikes')]


Claim: "Numerous foreign-born individuals have been convicted or implicated in terrorism-related crimes since September 11, 2001."
[(25.0, 'related crimes since september 11'), (4.0, 'numerous foreign'), (4.0, 'born individuals'), (4.0, '2001 ."'), (1.0, 'terrorism'), (1.0, 'implicated'), (1.0, 'convicted')]


Claim: The 2017 Perseid Meteor shower will be the brightest meteor shower in recorded human history.
[(15.0, '2017 perseid 


Claim: Fox News Channel CEO Roger Ailes said that 'the truth is whatever people will believe.'
[(49.0, 'fox news channel ceo roger ailes said'), (4.0, 'whatever people'), (4.0, "believe .'"), (1.0, 'truth')]


Claim: Says he did not discuss sanctions with Russian ambassador to U.S.
[(4.0, 'russian ambassador'), (4.0, 'discuss sanctions'), (1.0, 'u'), (1.0, 'says')]


Claim: California’s marijuana legalization initiative, Prop. 64 "allows marijuana smoking ads in prime time, on programs with millions of children and teenage viewers."
[(15.5, 'allows marijuana smoking ads'), (9.5, 'marijuana legalization initiative'), (9.0, 'teenage viewers ."'), (4.0, 'prime time'), (4.0, 'california ’'), (1.0, 'prop'), (1.0, 'programs'), (1.0, 'millions'), (1.0, 'children'), (1.0, '64')]


Claim: A photograph shows a threatening letter from a "neighborhood town watch" that was widely circulated to Muslims in the United States.
[(9.0, 'neighborhood town watch'), (4.0, 'widely circulated'), (4.0, 'unite


Claim: Women absorb and retain DNA from every man they have had sex with.
[(4.0, 'women absorb'), (4.0, 'retain dna'), (4.0, 'every man'), (1.0, 'sex')]


Claim: Dick Smith penned an email to customers denigrating the Muslim religion.
[(9.0, 'dick smith penned'), (4.0, 'muslim religion'), (4.0, 'customers denigrating'), (1.0, 'email')]


Claim: A new study published by Oxford University researchers proved that women with big butts are smarter and healthier.
[(16.0, 'oxford university researchers proved'), (9.0, 'new study published'), (4.0, 'big butts'), (1.0, 'women'), (1.0, 'smarter'), (1.0, 'healthier')]


Claim: Two photographs of the earth taken by NASA in 1978 and 2012 document the dramatic effects of deforestation in North America.
[(4.0, 'two photographs'), (4.0, 'north america'), (4.0, 'earth taken'), (4.0, 'dramatic effects'), (4.0, '2012 document'), (1.0, 'nasa'), (1.0, 'deforestation'), (1.0, '1978')]


Claim: “Only half of the murders in the city of St. Louis get solved.”


Claim: Melania Trump suggested her husband could "make peace with the blacks" by increasing their food stamp payments.
[(9.0, 'melania trump suggested'), (9.0, 'food stamp payments'), (4.0, 'make peace'), (4.0, 'husband could'), (1.0, 'increasing'), (1.0, 'blacks')]


Claim: A photograph shows a sleepy cheetah at a greyhound race.
[(4.0, 'sleepy cheetah'), (4.0, 'photograph shows'), (4.0, 'greyhound race')]


Claim: Says Hillary Clinton "is the one that labeled African-American youth as ‘superpredators.’"
[(9.0, '‘ superpredators .’"'), (9.0, 'says hillary clinton'), (4.0, 'labeled african'), (4.0, 'american youth'), (1.0, 'one')]


Claim: In September 2017, the makers of Reese's Peanut Butter Cups announced they were discontinuing the candy and withdrawing it from circulation.
[(16.0, 'peanut butter cups announced'), (4.0, 'september 2017'), (1.0, 'withdrawing'), (1.0, 'reese'), (1.0, 'makers'), (1.0, 'discontinuing'), (1.0, 'circulation'), (1.0, 'candy')]


Claim: Smithfield Foods w


Claim: "This will be the last time — April — that you’re going to (fill out) that old-fashioned, big, lots of pages, complicated tax form. Because next April you’re going to, in many cases, (file) one page, one card. It’s going to be very, very different. Very, very different."
[(23.5, 'last time — april —'), (9.0, 'complicated tax form'), (5.5, 'next april'), (4.0, 'one page'), (4.0, 'one card'), (4.0, 'many cases'), (3.5, 'different ."'), (1.5, 'different'), (1.0, '’'), (1.0, 'pages'), (1.0, 'old'), (1.0, 'lots'), (1.0, 'going'), (1.0, 'fill'), (1.0, 'file'), (1.0, 'fashioned'), (1.0, 'big')]


Claim: Preacher Joel Osteen was "horrified" at recently learning that Jesus was crucified.
[(9.0, 'preacher joel osteen'), (4.0, 'recently learning'), (1.0, 'jesus'), (1.0, 'horrified'), (1.0, 'crucified')]


Claim: The "Fire Fairy Challenge" has tricked multiple children into harming themselves.
[(9.0, 'tricked multiple children'), (9.0, 'fire fairy challenge'), (1.0, 'harming')]


Claim: "S

Claim: A photograph shows a donut with "Muslim writing" on it.
[(4.0, 'photograph shows'), (4.0, 'muslim writing'), (1.0, 'donut')]


Claim: Denzel Washington criticized Meryl Streep for making a political speech during the 2017 Golden Globes award ceremony.
[(25.0, 'denzel washington criticized meryl streep'), (25.0, '2017 golden globes award ceremony'), (4.0, 'political speech'), (1.0, 'making')]


Claim: "When Donald Trump spoke in Phoenix, he looked the audience in the eye and he said ‘no, we're building a wall and we're deporting everybody.’ He said, quote, ‘they will all be gone. They will all be gone.’ This is one of the ones where you can go to the tape on it and see what Donald Trump has said."
[(8.5, 'deporting everybody .’'), (8.0, 'donald trump spoke'), (5.0, 'donald trump'), (4.0, 'gone .’'), (3.666666666666667, 'said ."'), (3.166666666666667, 'said ‘'), (1.6666666666666667, 'said'), (1.5, '‘'), (1.5, 'gone'), (1.0, 'wall'), (1.0, 'tape'), (1.0, 'see'), (1.0, 'quote'), (1.

Claim: Crabs swarmed onto a Florida road after Hurricane Irma.
[(9.0, 'crabs swarmed onto'), (4.0, 'hurricane irma'), (4.0, 'florida road')]


Claim: "The U.S. government has certified that at least 700,000 Americans have lost their jobs due to changing trade flows resulting from NAFTA."
[(16.0, 'changing trade flows resulting'), (4.0, 'nafta ."'), (4.0, 'least 700'), (4.0, 'jobs due'), (4.0, '000 americans'), (1.0, 'u'), (1.0, 'lost'), (1.0, 'government'), (1.0, 'certified')]


Claim: While Mayor Rick Kriseman said he would dip into reserves this year because of Hurricane Irma, he "went into the emergency reserves before Irma ever hit."
[(16.0, 'mayor rick kriseman said'), (15.0, 'irma ever hit ."'), (5.0, 'hurricane irma'), (4.0, 'would dip'), (3.5, 'emergency reserves'), (1.5, 'reserves'), (1.0, 'year'), (1.0, 'went')]


Claim: Did Donald Trump inherit an economic mess?
[(9.0, 'donald trump inherit'), (4.0, 'economic mess')]




Claim: Norway announced that it was changing its name 


Claim: In a leaked e-mail, Hillary Clinton said "we must destroy Syria for Israel."
[(9.0, 'must destroy syria'), (9.0, 'hillary clinton said'), (4.0, 'leaked e'), (4.0, 'israel ."'), (1.0, 'mail')]


Claim: "It’s possible that non-citizen voters were responsible for Obama’s 2008 victory in North Carolina."
[(9.0, 'north carolina ."'), (4.0, 'citizen voters'), (4.0, '2008 victory'), (3.5, 'obama ’'), (1.5, '’'), (1.0, 'responsible'), (1.0, 'possible'), (1.0, 'non')]


Claim: Residents of Flint, Michigan, are legally prohibited from selling their homes and moving away due to the ongoing water crisis.
[(9.0, 'ongoing water crisis'), (9.0, 'moving away due'), (4.0, 'legally prohibited'), (1.0, 'selling'), (1.0, 'residents'), (1.0, 'michigan'), (1.0, 'homes'), (1.0, 'flint')]


Claim: Say Gretchen Carlson said, "The 2nd Amendment Was Written Before Guns Were Invented."
[(16.0, 'say gretchen carlson said'), (4.0, 'invented ."'), (4.0, '2nd amendment'), (1.0, 'written'), (1.0, 'guns')]


Cl

Claim: Mandalay Bay security guard Jesus Campos was an "accomplice" to Las Vegas Strip mass shooter Stephen Paddock.
[(49.0, 'las vegas strip mass shooter stephen paddock'), (36.0, 'mandalay bay security guard jesus campos'), (1.0, 'accomplice')]


Claim: In May 2017, Pinnacle Foods announced the "largest recall in recent times" of several Aunt Jemima products due to possible Listeria contamination.
[(25.0, 'several aunt jemima products due'), (9.0, 'possible listeria contamination'), (9.0, 'pinnacle foods announced'), (4.0, 'recent times'), (4.0, 'may 2017'), (4.0, 'largest recall')]


Claim: A photograph show Ivanka Trump with Vladimir Putin and Wendi Murdoch.
[(16.0, 'photograph show ivanka trump'), (4.0, 'wendi murdoch'), (4.0, 'vladimir putin')]


Claim: Members of antifa groups attacked an elderly woman and Malia Obama was arrested in connection with the incident.
[(9.0, 'antifa groups attacked'), (4.0, 'malia obama'), (4.0, 'elderly woman'), (1.0, 'members'), (1.0, 'incident'), 

Claim: Philando Castile was wanted for armed robbery when he was killed by police officers.
[(4.0, 'police officers'), (4.0, 'philando castile'), (4.0, 'armed robbery'), (1.0, 'wanted'), (1.0, 'killed')]


Claim: Says both Donald Trump and Hillary Clinton say Planned Parenthood is "terrific and that it should keep taxpayer funding."
[(25.0, 'hillary clinton say planned parenthood'), (16.0, 'keep taxpayer funding ."'), (4.0, 'donald trump'), (1.0, 'terrific'), (1.0, 'says')]


Claim: Clint Eastwood was found dead in Brentwood, California, in May or June 2017.
[(4.0, 'june 2017'), (4.0, 'found dead'), (4.0, 'clint eastwood'), (1.0, 'may'), (1.0, 'california'), (1.0, 'brentwood')]


Claim: A video shows a shopper being struck by an inflatable raft inside a department store.
[(9.0, 'inflatable raft inside'), (4.0, 'video shows'), (4.0, 'department store'), (1.0, 'struck'), (1.0, 'shopper')]


Claim: In September 2017, authorities in Houston, Texas warned residents to use gas masks as they 

Claim: A chyron on a network news channel contained a vulgar insult against Senate Majority Leader Mitch McConnell.
[(25.0, 'senate majority leader mitch mcconnell'), (16.0, 'network news channel contained'), (4.0, 'vulgar insult'), (1.0, 'chyron')]


Claim: Republican Rep. Todd Rokita of Indiana voted “against Trump’s border wall.”
[(9.0, 'indiana voted “'), (9.0, 'border wall .”'), (4.0, 'trump ’'), (4.0, 'todd rokita'), (4.0, 'republican rep')]


Claim: “I’ve got five years of experience as a national security staffer in the U.S. Congress. I held top secret security clearance.”
[(34.5, 'held top secret security clearance .”'), (10.5, 'national security staffer'), (9.0, 'got five years'), (1.0, '“'), (1.0, '’'), (1.0, 'u'), (1.0, 'experience'), (1.0, 'congress')]


Claim: Says Sen. Dianne Feinstein said "if she had 51 votes in the Senate for 'Mr. and Ms. America, turn in all of your guns,' they would do it."
[(9.0, 'dianne feinstein said'), (4.0, 'says sen'), (4.0, "guns ,'"), (4.0, 

Claim: "This administration and this Congress have been systematically cutting funding to border security since the Democrats took control."
[(16.0, 'democrats took control ."'), (9.0, 'systematically cutting funding'), (9.0, 'border security since'), (1.0, 'congress'), (1.0, 'administration')]


Claim: An "abortionist" strangled an infant following a failed saline abortion, while other clinicians failed to intervene.
[(8.5, 'failed saline abortion'), (4.5, 'clinicians failed'), (4.0, 'infant following'), (1.0, 'strangled'), (1.0, 'intervene'), (1.0, 'abortionist')]


Claim: “First of all, 72 individuals, according to the Center for Immigration Studies, have been implicated in terroristic activity in the United States who hail from those seven nations, point one.”
[(9.0, 'point one .”'), (4.0, '“ first'), (4.0, 'united states'), (4.0, 'terroristic activity'), (4.0, 'seven nations'), (4.0, 'immigration studies'), (4.0, '72 individuals'), (1.0, 'implicated'), (1.0, 'hail'), (1.0, 'center

Claim: Thomas Crapper invented the flush toilet.
[(9.0, 'thomas crapper invented'), (4.0, 'flush toilet')]


Claim: “Donald Trump wants to eliminate overtime pay for people. . . . He nominates someone to head the Labor Department who wants to gut overtime pay.”
[(15.0, 'gut overtime pay .”'), (14.5, '“ donald trump wants'), (10.0, 'eliminate overtime pay'), (4.0, 'nominates someone'), (4.0, 'labor department'), (2.5, 'wants'), (1.0, 'people'), (1.0, 'head')]


Claim: Wisconsin governor Scott Walker said that Labor Day should be replaced with Patriots Day.
[(25.0, 'wisconsin governor scott walker said'), (4.0, 'patriots day'), (4.0, 'labor day'), (1.0, 'replaced')]


Claim: Says Hillary Clinton once "wanted a wall" on the Mexican border.
[(9.0, 'says hillary clinton'), (4.0, 'mexican border'), (1.0, 'wanted'), (1.0, 'wall')]


Claim: Donald Trump referred to Canadians as "snow Mexicans" in a 22 February 2016 tweet.
[(16.0, '22 february 2016 tweet'), (9.0, 'donald trump referred'), (4.0,


Claim: California wine contains dangerous levels of arsenic.
[(25.0, 'california wine contains dangerous levels'), (1.0, 'arsenic')]


Claim: Musicians Robert Plant and Cher plan to wed at Westminster Abbey in July 2016.
[(9.0, 'musicians robert plant'), (4.0, 'westminster abbey'), (4.0, 'july 2016'), (4.0, 'cher plan'), (1.0, 'wed')]


Claim: Hillary Clinton made fun of hurricane Irma victims and called them "Florida hillbillies."
[(16.0, 'hillary clinton made fun'), (9.0, 'hurricane irma victims'), (9.0, 'florida hillbillies ."'), (1.0, 'called')]


Claim: Sears sold 'Free Palestine' shirts on its web site.
[(4.0, 'web site'), (4.0, 'sears sold'), (4.0, 'free palestine'), (1.0, 'shirts')]


Claim: President Trump “signed an executive order allowing our veterans to get 100% medical bills paid at hospitals other than a V.A. hospital.”
[(16.0, 'president trump “ signed'), (9.0, 'medical bills paid'), (9.0, 'executive order allowing'), (4.0, 'hospital .”'), (4.0, 'get 100'), (1.0, 'vete

Claim: A photograph shows President Donald Trump in a diaper.
[(25.0, 'photograph shows president donald trump'), (1.0, 'diaper')]


Claim: Keanu Reeves gave an envelope of cash to a stranger in order to help pay for a kidney transplant.
[(9.0, 'keanu reeves gave'), (4.0, 'kidney transplant'), (4.0, 'help pay'), (1.0, 'stranger'), (1.0, 'order'), (1.0, 'envelope'), (1.0, 'cash')]


Claim: A home pregnancy test can detect testicular cancer.
[(9.0, 'home pregnancy test'), (9.0, 'detect testicular cancer')]


Claim: Singer Beyoncé Knowles was killed in a car crash.
[(9.0, 'singer beyoncé knowles'), (4.0, 'car crash'), (1.0, 'killed')]


Claim: "Although we were able to beat back Trump’s effort to repeal the Affordable Care Act, 3 million fewer Americans have health insurance today than before Trump took office."
[(16.0, 'trump took office ."'), (16.0, 'beat back trump ’'), (16.0, '3 million fewer americans'), (9.0, 'health insurance today'), (9.0, 'affordable care act'), (1.0, 'repeal'), 



Claim: Birth control pioneer Margaret Sanger "believed that people like me should be eliminated."
[(25.0, 'birth control pioneer margaret sanger'), (4.0, 'people like'), (4.0, 'eliminated ."'), (1.0, 'believed')]


Claim: California’s prisons budget in 1970 "was about 3 percent of the general fund. Now, it’s 8.9 percent, about $12 billion."
[(9.0, '12 billion ."'), (4.0, 'prisons budget'), (4.0, 'general fund'), (4.0, '9 percent'), (4.0, '3 percent'), (3.5, 'california ’'), (1.5, '’'), (1.0, '8'), (1.0, '1970')]


Claim: Michele Bachmann said that Christopher Columbus was the first person to set foot on the North American continent.
[(9.0, 'north american continent'), (9.0, 'michele bachmann said'), (4.0, 'set foot'), (4.0, 'first person'), (4.0, 'christopher columbus')]


Claim: At the 2018 World Economic Forum in Davos, Switzerland, President Trump told billionaire George Soros to "go to hell."
[(36.0, 'president trump told billionaire george soros'), (16.0, '2018 world economic fo


Claim: Burger King has introduced a new "adult meal" for Valentine's Day that includes a sex toy.
[(4.0, 'sex toy'), (4.0, 'burger king'), (4.0, 'adult meal'), (1.0, 'valentine'), (1.0, 'new'), (1.0, 'introduced'), (1.0, 'includes'), (1.0, 'day')]


Claim: "70 million Americans have a criminal record — that’s one in three adults."
[(9.0, 'three adults ."'), (9.0, 'criminal record —'), (9.0, '70 million americans'), (1.0, '’'), (1.0, 'one')]


Claim: Former California state senator Leland Yee, a gun control advocate, was arrested for gun trafficking.
[(36.0, 'former california state senator leland yee'), (8.5, 'gun control advocate'), (4.5, 'gun trafficking'), (1.0, 'arrested')]


Claim: Of the six U.S.-based Nobel science laureates in 2017, all were immigrants; every U.S.-based laureate in 2016 was also born outside the country.
[(23.0, '.- based nobel science laureates'), (11.0, '.- based laureate'), (9.0, 'also born outside'), (4.0, 'six u'), (4.0, 'every u'), (1.0, 'immigrants'), (

Claim: Penn State's Joe Paterno said "when you get into the end zone, act like you've been there before."
[(9.0, 'joe paterno said'), (4.0, 'penn state'), (4.0, 'end zone'), (4.0, 'act like'), (1.0, 'get'), (1.0, '."')]


Claim: "400 bills have my name on them either as a sponsor or a co-sponsor. You don’t get that done unless you work with folks on the other side."
[(4.0, 'side ."'), (4.0, 'done unless'), (4.0, '400 bills'), (1.0, '’'), (1.0, 'work'), (1.0, 'sponsor'), (1.0, 'name'), (1.0, 'get'), (1.0, 'folks'), (1.0, 'either'), (1.0, 'co')]


Claim: Parking lot carjackers are placing flyers or $100 bills on the windows of automobiles, then taking the cars when drivers step out of their vehicles to remove them.
[(9.0, 'parking lot carjackers'), (4.0, 'placing flyers'), (4.0, 'drivers step'), (4.0, '100 bills'), (1.0, 'windows'), (1.0, 'vehicles'), (1.0, 'taking'), (1.0, 'remove'), (1.0, 'cars'), (1.0, 'automobiles')]


Claim: The United Nations will kill all Americans who refuse to t

Claim: "Under Pat McCrory, (North Carolina) has fallen to 41st in teacher pay."
[(9.0, 'teacher pay ."'), (4.0, 'pat mccrory'), (4.0, 'north carolina'), (1.0, 'fallen'), (1.0, '41st')]


Claim: The Fyre Festival was oversold and rapidly descended into chaos, leaving attendees stranded due to its last-minute cancellation.
[(16.0, 'leaving attendees stranded due'), (4.0, 'rapidly descended'), (4.0, 'minute cancellation'), (4.0, 'fyre festival'), (1.0, 'oversold'), (1.0, 'last'), (1.0, 'chaos')]


Claim: “The story that came out tonight as reported is false.”
[(4.0, 'false .”'), (1.0, '“'), (1.0, 'tonight'), (1.0, 'story'), (1.0, 'reported'), (1.0, 'came')]


Claim: In July 2017, it was announced that Finnish researchers would begin human trials of a Type 1 diabetes vaccine in 2018.
[(36.0, 'finnish researchers would begin human trials'), (16.0, 'type 1 diabetes vaccine'), (4.0, 'july 2017'), (1.0, 'announced'), (1.0, '2018')]


Claim: The Republicans "still want to privatize (Social Secu

Claim: Secretary of State John Kerry "funneled" taxpayer money into his daughter's global charity.
[(9.0, 'state john kerry'), (4.0, 'taxpayer money'), (4.0, 'global charity'), (1.0, 'secretary'), (1.0, 'funneled'), (1.0, 'daughter')]


Claim: Says White House adviser Steve Bannon said, "Nobody can blame you for beating your wife if it’s out of love."
[(49.0, 'says white house adviser steve bannon said'), (4.0, 'love ."'), (1.0, '’'), (1.0, 'wife'), (1.0, 'nobody'), (1.0, 'blame'), (1.0, 'beating')]


Claim: Betsy DeVos said that a 40 percent approval rating meant that President Trump had the support of more than half the country.
[(25.0, '40 percent approval rating meant'), (9.0, 'betsy devos said'), (4.0, 'president trump'), (1.0, 'support'), (1.0, 'half'), (1.0, 'country')]


Claim: "This is my exact words. ‘I love all the people of our country’ …. They (the media say), ‘Is he a racist?’ "
[(14.5, 'media say ), ‘'), (9.0, 'country ’ ….'), (4.0, 'racist ?’'), (4.0, 'exact words'), (2

Claim: “We’ve done more against ISIS in nine months than the previous administration has done during its whole administration — by far, by far.”
[(8.5, 'whole administration —'), (4.5, 'previous administration'), (4.0, 'nine months'), (3.5, 'far .”'), (1.5, 'far'), (1.0, '“'), (1.0, '’'), (1.0, 'isis'), (1.0, 'done')]


Claim: "Our economy is so much stronger than when (Barack Obama and Joe Biden) took office. Nearly 15 million new private-sector jobs."
[(25.0, 'nearly 15 million new private'), (9.0, 'sector jobs ."'), (4.0, 'took office'), (4.0, 'much stronger'), (4.0, 'joe biden'), (4.0, 'barack obama'), (1.0, 'economy')]


Claim: Mars, Incorporated released a "Pods" product shortly after the Tide Pod Challenge went viral in 2018.
[(25.0, 'tide pod challenge went viral'), (4.0, 'product shortly'), (4.0, 'incorporated released'), (1.0, 'pods'), (1.0, 'mars'), (1.0, '2018')]


Claim: Former Haitian official Klaus Oberwein died in a suspicious suicide days before he was scheduled to tes



Claim: "Right now we are at 90 percent health insurance covered. That's the highest we've ever been in our country."
[(25.0, '90 percent health insurance covered'), (4.0, 'country ."'), (1.0, 'right'), (1.0, 'highest'), (1.0, 'ever')]


Claim: Eighteen U.S. states still have laws banning oral sex.
[(16.0, 'laws banning oral sex'), (4.0, 'states still'), (4.0, 'eighteen u')]


Claim: There is verifiable evidence that a large earthquake will strike the Indian Ocean and cause a deadly tsunami before the end of 2017.
[(4.0, 'verifiable evidence'), (4.0, 'large earthquake'), (4.0, 'indian ocean'), (4.0, 'deadly tsunami'), (1.0, 'strike'), (1.0, 'end'), (1.0, 'cause'), (1.0, '2017')]


Claim: "What does Trumpcare do? Yank tax credits away from veterans unlike any other American."
[(16.0, 'yank tax credits away'), (4.0, 'veterans unlike'), (4.0, 'american ."'), (1.0, 'trumpcare')]


Claim: President Donald Trump decided to ban schools in an effort to curb school shootings.
[(16.0, 'presiden

Claim: Miami-Dade County announced plans to create "texting lanes" on its highways.
[(16.0, 'dade county announced plans'), (4.0, 'texting lanes'), (1.0, 'miami'), (1.0, 'highways'), (1.0, 'create')]


Claim: Federal agents raided a mosque near Dearborn, MIchigan and arrested several ISIS combatants planning suicide attacks.
[(49.0, 'arrested several isis combatants planning suicide attacks'), (9.0, 'mosque near dearborn'), (9.0, 'federal agents raided'), (1.0, 'michigan')]


Claim: Queen Elizabeth is so upset at public comments made by royal bride-to-be Meghan Markle that she has suspended or threatened to suspend Prince Harry's wedding.
[(9.0, 'suspend prince harry'), (9.0, 'public comments made'), (4.0, 'royal bride'), (4.0, 'queen elizabeth'), (4.0, 'meghan markle'), (1.0, 'wedding'), (1.0, 'upset'), (1.0, 'threatened'), (1.0, 'suspended')]


Claim: false
[(1.0, 'false')]


Claim: Says "$3 trillion in offshore money... is coming back into the economy" because of the GOP tax bills.


In [14]:
from rake_nltk import Rake

# RAKE keyword extractor built with its defaults: NLTK's English stopword
# list plus all punctuation characters.
r = Rake()

# Run the extraction over a single piece of text (one sample claim).
# For input that is already a list of sentence strings, the counterpart
# call is r.extract_keywords_from_sentences(list_of_sentences).
r.extract_keywords_from_text(
    "In August 2018, adhesive replicas of President Donald Trump's recently-destroyed star were placed on the Walk of Fame on Hollywood Boulevard."
)

# Show the keyword phrases ranked highest to lowest: first the bare
# phrases, then, on the next line, the same ranking with scores.
print(
    r.get_ranked_phrases(),
    r.get_ranked_phrases_with_scores(),
    sep="\n",
)

['president donald trump', 'hollywood boulevard', 'destroyed star', 'august 2018', 'adhesive replicas', 'walk', 'recently', 'placed', 'fame']
[(9.0, 'president donald trump'), (4.0, 'hollywood boulevard'), (4.0, 'destroyed star'), (4.0, 'august 2018'), (4.0, 'adhesive replicas'), (1.0, 'walk'), (1.0, 'recently'), (1.0, 'placed'), (1.0, 'fame')]
