In [1]:
from pyspark.sql.functions import udf, col, lower, regexp_replace, concat_ws, trim
from pyspark.ml.feature import Tokenizer, StopWordsRemover
from pyspark.sql.types import ArrayType, StringType, IntegerType

# Where the raw news articles live (every CSV file in the folder) and their format.
file_location = "dbfs:///FileStore/tables/all-news/*.csv"
file_type = "csv"

# CSV reader settings: no schema inference (columns stay strings), the first
# row of each file is the header, and fields are comma-separated.
infer_schema = "false"
first_row_is_header = "true"
delimiter = ","

# Read the files, keep only the three columns used downstream and discard any
# row in which one of them is null.
# NOTE(review): no multiLine/quote/escape options are set; if article bodies
# contain embedded newlines or doubled quotes, rows may be split or mis-parsed
# -- confirm against the raw files.
df_file = (
    spark.read.format(file_type)
    .option("inferSchema", infer_schema)
    .option("header", first_row_is_header)
    .option("sep", delimiter)
    .load(file_location)
    .select('id', 'title', 'content')
    .na.drop()
)

# Text normalisation, applied identically to the 'title' and 'content' columns.

# Pass 1: replace every character that is neither an ASCII letter nor
# whitespace (punctuation, digits, ...) with a space, then lower-case.
df_cleaned = df_file.select(
    'id',
    *(
        lower(regexp_replace(name, "[^a-zA-Z\\s]", " ")).alias(name)
        for name in ('title', 'content')
    )
)

# Pass 2: replace stand-alone single-character words (together with an
# optional adjacent printable ASCII character on either side) with a space.
df_cleaned = df_cleaned.select(
    'id',
    *(
        regexp_replace(name, "[!-~]?\\b[\\w]\\b[!-~]?", " ").alias(name)
        for name in ('title', 'content')
    )
)

# Pass 3: trim both ends and collapse each run of spaces into a single space.
df_cleaned = df_cleaned.select(
    'id',
    *(
        regexp_replace(trim(col(name)), " +", " ").alias(name)
        for name in ('title', 'content')
    )
)

# Tokenize title: turn the cleaned title string into an array of word tokens
title_tokenizer = Tokenizer(inputCol='title', outputCol='tokenized_title')
df_tokenized_title = title_tokenizer.transform(df_cleaned).select('id', 'tokenized_title', 'content')

# Remove stopwords from title (no custom list is passed, so the remover's default list is used)
stopwords_title_remover = StopWordsRemover(inputCol='tokenized_title', outputCol='cleaned_title')
df_title_removed_stopwords = stopwords_title_remover.transform(df_tokenized_title).select('id', 'cleaned_title', 'content')


# Drop tokens whose length is 0 or 1, i.e. keep only words longer than one character
def _keep_long_tokens(tokens):
    """Return the tokens of ``tokens`` that are longer than one character.

    Args:
        tokens: list of strings (one row's token array), or None when the
            array column is null for that row.

    Returns:
        A new list with every token of length <= 1 removed, in the original
        order; None when ``tokens`` is None, so a null row stays null instead
        of raising a TypeError inside the UDF.
    """
    if tokens is None:
        return None
    return [token for token in tokens if len(token) > 1]


# Shared by the title and the content pipelines.
filter_length_udf = udf(_keep_long_tokens, ArrayType(StringType()))
df_final_title = df_title_removed_stopwords.withColumn('cleaned_title', filter_length_udf(col('cleaned_title')))

# Split the cleaned article body into word tokens; only the token array is
# carried forward, next to the id and the already-processed title.
content_tokenizer = Tokenizer(outputCol='tokenized_content', inputCol='content')
df_tokenized_content = (
    content_tokenizer
    .transform(df_final_title)
    .select('id', 'cleaned_title', 'tokenized_content')
)

# Strip stop words from the body tokens (the remover's default list is used,
# since no custom list is passed).
stopwords_remover = StopWordsRemover(outputCol='cleaned_content', inputCol='tokenized_content')
df_removed_stopwords = (
    stopwords_remover
    .transform(df_tokenized_content)
    .select('id', 'cleaned_title', 'cleaned_content')
)

# Apply the same token-length filter that was used for the title.
df_final = df_removed_stopwords.withColumn(
    'cleaned_content',
    filter_length_udf(df_removed_stopwords['cleaned_content'])
)

# Final shape: integer id plus the two token arrays joined back into
# space-separated strings, exposed under the names 'title' and 'content'.
# NOTE(review): an id that is not a valid integer becomes null in this cast,
# which happens after the earlier null-drop -- confirm whether such rows
# should be filtered out.
df_final = df_final.select(
    col('id').cast(IntegerType()).alias('id'),
    concat_ws(" ", 'cleaned_title').alias('title'),
    concat_ws(" ", 'cleaned_content').alias('content')
)

display(df_final)

id,title,content
17283,house republicans fret winning health care suit new york times,washington congressional republicans new fear comes health care lawsuit obama administration might win incoming trump administration choose longer defend executive branch suit challenges administration authority spend billions dollars health insurance subsidies americans handing house republicans big victory issues sudden loss disputed subsidies conceivably cause health care program implode leaving millions people without access health insurance republicans prepared replacement lead chaos insurance market spur political backlash republicans gain full control government stave outcome republicans find awkward position appropriating huge sums temporarily prop obama health care law angering conservative voters demanding end law years another twist donald trump administration worried preserving executive branch prerogatives choose fight republican allies house central questions dispute eager avoid ugly political pileup republicans capitol hill trump transition team gaming handle lawsuit election put limbo least late february united states court appeals district columbia circuit yet ready divulge strategy given pending litigation involves obama administration congress inappropriate comment said phillip blando spokesman trump transition effort upon taking office trump administration evaluate case related aspects affordable care act potentially decision judge rosemary collyer ruled house republicans standing sue executive branch spending dispute obama administration distributing health insurance subsidies violation constitution without approval congress justice department confident judge collyer decision reversed quickly appealed subsidies remained place appeal successfully seeking temporary halt proceedings mr trump won house republicans last month told court transition team currently discussing potential options resolution matter take effect inauguration jan suspension case house lawyers said provide 
future administration time consider whether continue prosecuting otherwise resolve appeal republican leadership officials house acknowledge possibility cascading effects payments totaled estimated billion suddenly stopped insurers receive subsidies exchange paying costs deductibles eligible consumers race drop coverage since losing money loss subsidies destabilize entire program cause lack confidence leads insurers seek quick exit well anticipating trump administration might inclined mount vigorous fight house republicans given dim view health care law team lawyers month sought intervene case behalf two participants health care program request lawyers predicted deal house republicans new administration dismiss settle case produce devastating consequences individuals receive reductions well nation health insurance health care systems generally matter happens house republicans say want prevail two overarching concepts congressional power purse right congress sue executive branch violates constitution regarding spending power house republicans contend congress never appropriated money subsidies required constitution suit initially championed john boehner house speaker time later house committee reports republicans asserted administration desperate funding required treasury department provide despite widespread internal skepticism spending proper white house said spending permanent part law passed annual appropriation required even though administration initially sought one important house republicans judge collyer found congress standing sue white house issue ruling many legal experts said flawed want precedent set restore congressional leverage executive branch spending power standing trump administration may come pressure advocates presidential authority fight house matter shared views health care since precedents broad repercussions complicated set dynamics illustrating quick legal victory house trump era might come costs republicans never anticipated took obama 
white house
17284,rift officers residents killings persist south bronx new york times,bullet shells get counted blood dries votive candles burn people peer windows see crime scenes gone cold band yellow police tape blowing breeze south bronx across harlem river manhattan shorthand urban dysfunction still suffers violence levels long ago slashed many parts new york city yet city efforts fight remain splintered underfunded burdened scandal th precinct southern tip bronx poor minority neighborhoods across country people long hounded infractions crying protection grievous injury death september four every five shootings precinct year unsolved city precincts th highest murder rate fewest detectives per violent crime reflecting disparities staffing hit hardest neighborhoods outside manhattan according new york times analysis police department data investigators precinct saddled twice number cases department recommends even bosses called police headquarters answer sharpest crime rise city year across bronx investigative resources squeezed highest rate city five boroughs thinnest detective staffing nine precinct detective squads violent crime city borough robbery squad smaller manhattan even though bronx cases year homicide squad one detective every four murders compared one detective roughly every two murders upper manhattan one detective per murder lower manhattan lobbies family apartments outside methadone clinics art studios people take note inequity hear police commanders explain lack resources place floodlight dangerous block post officers corner watch witnesses cower behind doors fearful gunman crew confident police department ability protect though people see lot rarely testify south bronx many predominantly black hispanic neighborhoods like united states contract police community tatters people stories crime reports ignored calls went unanswered hours others tell call help ending caller arrest minor charge leading hours fetid holding cell paradox policing th precinct 
neighborhoods historically prime targets aggressive tactics like designed ward disorder precinct detectives less time anywhere else city answer blood spilled violent crimes gola white beside daughter shot killed playground summer four years son gunned housing project ticked public safety resources said scant bronx neighborhoods like security cameras lights locks investigating police officers nothing said comes families said authorities really care much feel times documenting murders logged year th precinct one handful neighborhoods deadly violence remains problem era crime new york city homicides precinct year nine strain detectives go unsolved half year look take law hands hundreds conversations grieving relatives friends witnesses police officers social forces flare murder place like th precinct become clearer merciless gang codes mental illness drugs long memories feuds simmered officers view reasons murders never solved also emerge paralyzing fear retribution victims carrying secrets graves relentless casework forces detectives move hopes break come later frustrations build sides detectives phones rarely ring tips officers grow embittered witnesses cooperate meantime victim friends conduct investigations talk grabbing stash gun wheel well mother apartment find suspect chasm police community gangs gun violence flourish parents try protect families drug crews threats officers work overcome residue years mistrust understaffing communities still go racing one call next streets around st mary park scene two fatal shootings logged th precinct year unsolved james fernandez heard talk murders door apartment east th street betances houses lived end long hallway strewn hypodermic needles empty dope bags discarded hennessy bottles young men spoke subset bloods gang made drug market slinging marijuana cocaine regulars flashing firearms blowing smoke fernandez apartment mr fernandez asked young men move answered busting car kind crime anachronism much new york still rattles 
th precinct even though murders fallen year major felony crimes per resident residential district city also one poorest communities country many young men find way underground markets mr fernandez one shrink threats growing lower east side rode bicycle around customers drug dealers worked collected payments backpack leaving life got tech maintenance job three years ago moved betances houses wife daughter two choices get help drug crew call police help risk labeled snitch call old lower east side bosses muscle risk violence chose police walked local substation police service area asked protection daughter using inhaler relieve coughs marijuana smoke mr fernandez wife got terrible headaches lot killers going kill sergeant police report quoted telling mr fernandez august second report filed day said warned going shoot window mr fernandez told police teenagers names appear reports went home said one friends seen walk substation tried intimidate filing another report three days later propped bike door said open door say something body slam mr fernandez wife maria fernandez wrote slips paper used document hallway ruckus inadequate police response boys made comments easy target slap opened door made drug sale threatened beat fernandez family ones snitching notes say another complaint substation days first brought relief week later feeling desperate ms fernandez tried calling first substation one boys blew weed smoke door made threat attack police never came wrote notes tried th precinct station house next officers desk left standing public waiting area said making fear seen officers put worse danger months later said came door announced front teenagers complaint drug activity mr fernandez started work said police failed wired camera peephole record drugs guns footage hark back new york still much present precinct residents around morning sgt michael lopuzzo walks tall wooden doors th precinct station house cases land metal desk dead bodies known cause strip club brawls 
shooting victims hobbling hospital bring resistance every turn reminding earlier era city campaign haven got one single phone call putting right direction said sergeant lopuzzo head precinct detective squad one day summer worked answer email inquiry murder victim aunt killer caught people understand often detectives feel effects people turning police witnesses shout away doors neighbors know refuse talk people shot wounded bronx early september third victims refused cooperate period th precinct squad detectives closed three nonfatal shootings robbery cases part resistance stems preventive policing tactics like hallmark style former mayor michael bloomberg police commissioner raymond kelly near height strategy th precinct stops city stops officers used force frisks stops year people done nothing criminal precinct also one areas department flooded newest officers roll calls pressured generate numbers write tickets make arrests choice give summons young man playing park dark even officers done growing neighborhood need bring something today justify existence officer argenis rosado joined precinct said interview station house re small area day day re hammering community course community eventually going turn pressure warped way officers residents saw rookies ignore someone might drinking outside sitting stoop cops came time probably viewed community differently said hector espada veteran precinct wanted way somehow give someone summons feel like guys still civil conversation morale wilted aged station house alexander avenue mott haven officers felt pressure downgrade crime complaints make appear less serious several said interviews overlooked crime reports immigrants seen unlikely complain watched supervisors badger victims repeating stories hopes drop complaints practice downgrading complaints resulted disciplining officers precinct last year one string scandals left officers feeling overscrutinized problems also existed elsewhere four commanders precinct sent packing 
five years one officers found ticket fixing forgiving parking tickets friends another recorded giving guidance stop frisk black boys men ages officers fled commands others became reluctant take assignments proactive policing units like put situations street whenever walked doors precinct seemed like black cloud said russell lewis th like heaviness walked wanted hours minutes go home didn want get caught anything precinct covers two square miles dozen housing projects mean overflows people methadone clinics draw addicts around city lofts southern edge precinct presage wave gentrification even police department hired officers neighborhood policing counterterrorism officers th precinct said still rush calls shift number unchanged new police commissioner james neill said handling similar south bronx precinct years ago several dozen calls time waiting response residents know want police domestic problem helps hint weapon last year precinct drew number civilian complaints officer misconduct city lawsuits stemming police actions precinct trying improve morale new commanding officer deputy inspector brian hennessy cadre department calls neighborhood coordination officers patrol since last january part citywide effort mr neill mayor bill de blasio bring back beat cop unencumbered chasing every last call listen people concerns help investigations precinct made among gun arrests city officers said discretion resolve encounters without summons arrest one corner near school courtlandt avenue east st street long spawned complaints gunfire fights inspector hennessy officers painted graffiti swept drug paraphernalia summer people said first answer complaints years inspector acknowledged residue policing lingers perception really sticks said workload th precinct startling reveals gap detective squads equipped answer violent crime manhattan compared bronx brooklyn queens three precinct detectives carrying cases year many others loads high even though department advises violent 
precincts assigned homicide typically four days investigate dealing cases quieter precincts give detectives month little distraction investigate murder detectives th precinct handled average violent felonies year murders rapes felony assaults robberies contrast detective precinct southern end staten island carries nine cases detective precinct patrolling union square gramercy park handles detective precinct washington heights handles citywide median last year th violent crime cases per detective bronx whole precinct detective carried average violent felonies year compared manhattan brooklyn queens staten island rape cases robbery patterns later sent specialized units precinct detectives extensive initial work interview victims write reports process evidence precincts much manhattan whiter wealthier south bronx often property felonies like stolen laptops credit cards police say complex even accounting crimes th precinct heaviest caseloads overall crime per detective city michael palladino head detectives endowment association former bronx officer said staffing disparities affected department efforts build trust communities like south bronx witnesses make calculation said cooperate detectives much work won even get chance protect ll late retaliation comes sergeant lopuzzo turned prestigious post stay th precinct said squad worked tirelessly handle cases people every squad wanted detectives staffing needs counterterrorism units task forces created new deployment challenges across department fight army army wish said details police department assigns officers closely held constantly flux public minimal information personnel allocated presented times analysis confidential staffing data department chief detectives robert boyce vowed send detectives th precinct said department reassess deployment broadly troubled precincts said recent decision bring gang narcotics vice detectives command made easier shift personnel chief boyce said burdens detectives went beyond felony 
crimes include cases noted support precinct squads got centralized units focusing robberies gangs grand larcenies example major crime keeps pounding th precinct rates tenth percent lower even citywide crime dropped third period precinct detective squad shrank eight investigators years according staffing data obtained city council freedom information law request squad covering union square gramercy park crime dropped third period grew investigators th precinct given additional detective four investigators summer already missing three detectives illness reasons retired detectives skeptical community relations alone drive crime city last busiest precincts rather say police department dedicating resources providing sort robust investigative response seems standard manhattan crime manhattan solved said howard landesberg th precinct detective late outer boroughs like forgotten retired detectives said understaffing made harder solve crimes bronx brooklyn queens higher prevalence gang drug killings already saddled investigators cases people inclined cooperate detectives closed percent homicides manhattan percent staten island year compared percent bronx percent queens percent brooklyn last year homicides detectives cleared percent manhattan percent bronx percent queens percent staten island percent brooklyn culture police department worry manhattan said joseph giacalone former sergeant bronx cold case squad part money added de blasio came talked tale two cities done complete opposite said business usual bronx struggles extend prosecutions last five years prosecutors bronx declined prosecute violent felony cases anywhere else city rate conviction bronx routinely lowest city well ticked year surpass brooklyn rate november bronx prosecutors work streamline cases cases become even difficult win problem th precinct allowed defense lawyers attack credibility officers implicated said patrice shaughnessy spokeswoman bronx district attorney office district attorney darcel clark 
elected said statement judge bronx heard jurors impartial trust police tide mistrust sergeant lopuzzo detectives work hours straight fresh cases buy chinese takeout money murder suspect carry surveillance videos home hopes personal computers may enhance better squad computer buy urn homeless mother murdered son ashes box months killing seem like people glittering city paying attention th precinct homicide victims newly fatherless children go back school without therapist help victims families wander confused courthouse nearly miss appearance newspapers largely ignore killings people criminal pasts pushing priority lists chiefs police headquarters stuffy squad room detectives th precinct grapple inheritance government neglect meet mothers believe sons might never murdered city guidance counselor listened pleas help stay enrolled city housing worker fixed locks lights building detectives work alongside vicious system streets punishing police cooperators young men scan court paperwork prison looking names people turned one murder victim precinct year cast crew avoided arrested gang takedown believed cooperating longtime th precinct detective jeff meenagh said witness homicide case going testify went back neighborhood told anyone testified get deserve allies sergeant lopuzzo makes friendly long helped clear woman son robbery charge locating surveillance video proved robber mother started calling tips code name gun car example always refused testify cut ties year sergeant lopuzzo arrested son stabbing two people shooting new york city owns east th street buildings side james fernandez betances houses said reality ground different drug boss ran block october mr fernandez increasingly afraid fed mr fernandez wife went far give officers keys building door get whenever wanted showed videos offered access camera see happening hallway couple officers said needed supervisor permission others answered young men making threats officers occasionally stopped outside building 
causing young men scatter come inside mr fernandez said menacing worsened mr fernandez daughter harassed arrived home school grew distressed parents start seeing therapist mr fernandez made several complaints office borough president ruben diaz jr visited victim advocate district attorney office oct sent online note police commissioner office went proper channels help note said precincts failed us except officers helped us hands tied one else turn months video multiple crimes taking place extreme danger th psa won anything wrote referring local substation please need speak one authority local substation commander deputy inspector jerry sullivan bronx narcotics unit alerted complaints mr fernandez said never heard relied street instincts protect family made pleas man thought employing dealers hallway activity quieted briefly returned young men rented room woman apartment upstairs mr fernandez approached different man learned boss operation man agreed ask dealers calm even hired drug customer sweep hallway mr fernandez said two weeks later dealing harassment resumed went old lower east side bosses hired men trail wife daughter way building make sure made safely school times sat outside betances houses also bought two bulletproof vests find one small enough daughter faith city new york faith police faith politicians mr fernandez said thing know sure god re situation left defend family paying close attention happening hallway mr fernandez said learned details two recent homicides th precinct investigating calls help going nowhere said decided put greater risk talking tell police learned bending backward nobody even anything said going help ain going help last january new neighborhood coordination officer working residents betances houses ended arrests housing command inspector sullivan said chief boyce said silos gang narcotics detectives used work made responding complaints difficult recent restructuring remove obstacles one live like mr fernandez lived people dealing 
drugs outside apartment said mr fernandez complaints spur arrests two men hallway caught separately year shootings one mr fernandez named police report charged summer hitting officer metal folding chair firing three gunshots crowd court papers say held rikers island attempted murder charge late mr fernandez may moved family away
17285,tyrus wong bambi artist thwarted racial bias dies new york times,walt disney bambi opened critics praised spare haunting visual style vastly different anything disney done know film striking appearance created chinese immigrant artist took inspiration landscape paintings song dynasty extent contribution bambi remains mark film animation widely known decades like film title character artist tyrus wong weathered irrevocable separation mother hope making life america incarceration isolation rigorous interrogation still child years followed endured poverty discrimination chronic lack recognition work disney also fine art finding acclaim mr wong died friday hollywood studio artist painter printmaker calligrapher illustrator later years maker fantastical kites one celebrated artists th century marginalization long subject passed much career unknown general public artistic recognition mr wong find noteworthy fact among chinese immigrant men generation professional prospects largely limited menial jobs like houseboy laundryman trained painter mr wong leading figure modernist movement flourished california first second world wars work included group shows art institute chicago also featured picasso matisse paul klee staff artist hollywood studios drew storyboards made vibrant paintings detailed architectural illustrations helped director envision scene shot years work informed look animated pictures disney films warner brothers studios among sands iwo jima rebel without cause wild bunch dozens films worked bambi mr wong belatedly renowned truly involved every phase production john canemaker animator historian animation new york university said interview obituary march created art direction really never seen animation mr wong subject water paper paint sky major retrospective disney family museum san francisco museum windows overlook san francisco bay contemplate angel island nine decades earlier lone sought gain admission country adamantly want wong gen yeo name 
sometimes romanized wong gaing yoo born oct farming village guangdong province young child already exhibited love drawing encouraged father seeking better economic prospects gen yeo father embarked united states leaving mother sister behind gen yeo never see mother obliged travel false identities state affairs known among chinese immigrants paper son hope circumventing chinese exclusion act signed law president chester arthur act drastically curtailed number chinese people allowed enter country among earliest united states laws impose severe restrictions immigration unforeseen loophole opened form san francisco earthquake fire huge number municipal documents including birth immigration records destroyed many newly arrived chinese capitalized loss maintaining born san francisco fire united states citizens entitled bring relatives case gen yeo father paper sons posing relatives attuned deception united states immigration officials put chinese arrivals formidable inquisition ensure claimed questions came like gunfire direction village face many windows house house rice bin wide well deep trees village lakes shops name sponsoring relative interrogated separately answers match new arrival major mistake series smaller ones mean deportation stand chance passing aspirants memorized rigorous dossiers known coaching papers ensuing interrogation hard enough adults gen yeo undergo alone dec month sea wongs landed angel island immigration station elder mr wong traveling merchant named look get son look tai yow angel island considered ellis island west coast lisa see author gold mountain nonfiction chronicle family said interview however continued goal really different ellis island supposed welcoming angel island opened specifically keep chinese mr wong father previously lived united states look get able clear immigration quickly new arrival gen yeo detained island nearly month child among immigrants held scared half death cried mr wong recalled tyrus documentary directed pamela 
tom premiered every day miserable miserable hated place jan presence interpreter stenographer young gen yeo posing look tai yow interrogated three inspectors father already questioned gen yeo well prepared answered without error sacramento joined father schoolteacher americanized tai yow tyrus known tyrus wong ever soon afterward father son separated elder mr wong moved los angeles seek work reasons lost time take son tyrus lived sacramento boardinghouse attending elementary school two years later possibly tyrus traveled los angeles join father found work gambling den lived boardinghouse sandwiched butcher shop brothel school tyrus worked houseboy two pasadena families earning cents day first art teacher father trained nightly calligraphy dip brush water trace ghostly characters newspaper afford ink drawing paper tyrus junior high teacher noting drawing talent arranged summer scholarship otis art institute los angeles account indifferent student public school tyrus found calling institute otis college art design scholarship ended declined return junior high father scraped together tuition small fortune let stay otis youngest student studied least five years simultaneously working school janitor graduating long afterward father died leaving young mr wong entirely mr wong artist works progress administration creating paintings libraries public spaces friends including artist benji okubo founded oriental artists group los angeles organized exhibitions members work level exposure asian artists time mr wong newly married needing steady work joined disney creating thousands intermediate drawings bring animated sequences life asians novelty hollywood studios mr wong made keenly aware fact first disney later warner brothers one flung racial epithet another assumed sight worked company cafeteria affront job painstaking repetitive mr wong quickly work animation terrible use talents landscape artist painter mr canemaker said reprieve came late mr wong learned disney adapting 
bambi life woods novel austrian writer felix salten fawn whose mother killed hunter trying animate book disney reached impasse studio enjoyed great success animated film snow white seven dwarfs baroque production every detail backgrounds every petal every flower every leaf every tree meticulously represented attempt use similar style bambi found ornate backgrounds camouflaged deer forest creatures narrative centered mr wong spied chance said gee outdoor scenery recalled video interview years afterward adding said gee landscape painter invoking exquisite landscape paintings song dynasty rendered watercolors pastels series nature scenes moody lyrical atmospheric lush spare backgrounds subtly suggested stroke two brush walt disney went crazy said mr canemaker wrote mr wong book animation begins art lives disney inspirational sketch artists said love indefinite quality mysterious quality forest mr wong unofficially promoted rank inspirational sketch artist mr canemaker explained designer person went questions color lay something even influenced music special effects look drawings inspired people mr wong spent two years painting illustrations inform every aspect bambi throughout finished film lent brooding quality stark landscapes misty desaturated palette figures often seen silhouette influence unmistakable wake bitter employees strike year disney fired mr wong though chosen strike felt studio good mr canemaker said let go amid lingering climate resentments bambi mr wong name appears quite far credits mere background artist mr wong joined warner brothers working lent occasion studios retirement indignities endured confined studios trying buy house wife former ruth kim told property inquired sold month go back sign still mr wong recalled tyrus japanese attack pearl harbor december mr wong like many took wearing lapel button proclaiming heritage lest angry american beat street war permanently dispersed fledgling oriental artists group mr wong friend mr okubo sent tens 
thousands internment camp world war ii hadn happened think artists even artists name today ms see said little movement barely started split apart war mr wong became united states citizen also designed christmas cards hallmark painted elegant designs dinnerware sought collectors longtime resident sunland calif became retirement renowned kitemaker designing building hand coloring astonishing airworthy creations butterflies swallows whole flocks owls centipedes feet long streaked southern california sky like paint blue canvas last years ruth wong life ill dementia mr wong forsook work care death slowly began making art formal recognition influence bambi mr wong named disney legend honor whose previous recipients include fred macmurray julie andrews annette funicello bestowed walt disney company outstanding contributions retrospective work curated part ms see inaugural exhibition chinese american museum los angeles disney family museum retrospective water paper paint sky traveled museum chinese america lower manhattan mr wong death home sunland confirmed filmmaker ms tom survivors include three daughters kay fong wong kim wong two grandchildren daughters small mr wong encouraged make art father encouraged yet let coloring books reason simple want children constrained said lines laid others
17286,among deaths heavy toll pop music new york times,death may great equalizer isn necessarily evenhanded fields endeavor suffered mortal losses consider muhammad ali arnold palmer sports hollywood deaths carrie fisher debbie reynolds pop music world hands bleakest year start david bowie whose stage persona androgynous glam rocker dance pop star electronic experimentalist music year days old news came died cancer hinted time short lyrics final album released two days death otherwise gone great lengths hide illness public wish privacy ensured death appear come blue came another shock three months later prince accidentally overdosed painkiller collapsed elevator sprawling home studio near minneapolis death came indications one including prince rogers nelson seen coming energetic onstage ever holding otherwise healthy regimen successfully defied age sixth decade death leonard cohen hand rd year undoubtedly see coming shoulder went hesitate say merry way ever wise troubadour playing sellout crowds shrugging inevitable knowing dark finally overtake saying essentially another song hadn delivered enough jolts system closed year yet another death george michael sensation whose aura dimmed later years went bed never woke christmas pop music figures fell year many voices still embedded nicked vinyl grooves old records lot people bear throw roster included paul kantner jefferson airplane keith emerson greg lake emerson lake palmer glenn frey eagles maurice white earth wind fire leon russell piano pounder delta blues wail mountain man mass hair died merle haggard rugged country poet common man outlaw joined bluegrass legend ralph stanley guitar virtuoso practically glued elvis swiveling hips early days scotty moore george martin whose genius creative influence sounds john paul george ringo extension entire rock era hailed fifth beatle music stars fill arenas idols another stripe mighty athletes left scene figure among towering ali called greatest sports figure th century 
boxer combined power grace brains way ring never seen great athlete matters war race religion coursed life publicly turbulent way people hated refused drafted vietnam war decision cost heavyweight title people admired even loved principled stands high spirits lightning mind winking yes rhyming motormouth illness closed little contain certainly mere ropes around ring palmer transformational golf first media star gentleman game never quite began gathering army rolling greenswards leading charge shirt coming untucked cigarette dangling lips club weapon pressed attack entire generation postwar guys took game arnie women athletically blessed magnetically cool telegenically handsome somehow one said gordie howe mr hockey son saskatchewan prairie tore national hockey league hung skates died ralph branca trolley car conductor son living reminder one crushing mistake fastball bobby thomson decided national league pennant sometimes never lived pat summitt coach elevated women basketball led tennessee teams eight championships won games college coach defeat alzheimer disease dying within months national basketball association lost two giants different eras clyde lovelette olympic college champion transformed game one first truly big men hardwood heir nate thurmond defensive stalwart battled russell wilt kareem paint hall fame career even older baseball ranks monte irvin died people still around remember watching play particularly prime star negro circuit barred major leagues made hall fame anyway new york giant became major league baseball first black executive died fans pondered question hung many athletic career shackled discrimination different question entirely different sphere arose stunning news justice antonin scalia died hunting trip texas thick one consequential supreme court careers modern times left void conservative jurisprudence urgently vacancy bench yet filled raising still questions may await country exits public stage returned us past nancy reagan death 
evoked white house glamour west coast conservatism took residence banks potomac john glenn us thinking burst national pride soaring outer space deaths tom hayden daniel berrigan avatars defiance harked back student rebellions vietnam war roiling home front phyllis schlafly obituaries windows roots right wing ascension american politics death janet reno first woman serve attorney general recalled clinton years eight firestorm waco tex international tug war cuban boy named eli gonz lez bitter senate battle impeachment shores fidel castro death summoned memories cuban revolution nuclear brinkmanship enduring enmity strongman superpower miles away name boutros egyptian diplomat led united nations led replayed nightmares genocide rwanda bosnia death shimon peres removed last link founding israel conjured decades growing military power fitful strivings peace elie wiesel new york tireless struggle compel world never forget made us confront gas chambers auschwitz writers even fiction world poorer without literary voices harper lee umberto eco pat conroy jim harrison anita brookner alvin toffler gloria naylor william trevor mention playwrights peter shaffer dario fo edward albee dead treasured spun viewing pleasure none lustily ms fisher princess leia star wars tales day later capping year startling deaths ms reynolds singing acting leading lady earlier era died throes mother grief devotees harry potter movies saddened death alan rickman played deliciously dour professor severus snape blockbuster franchise whose career stage screen far richer many snape younger fans may known zsa zsa gabor celebrity contrast outshone modest acting career gene wilder garry shandling died year perfected brand hilariously neurotic comedy fit culture time abe vigoda godfather movies barney miller actually die actually done years ago wildly uninformed people spread word side camera directors whose vision came us parts jacques rivette french new wave auteur meditations life art abbas kiarostami 
iranian master searching examinations ordinary lives andrzej wajda rival ingmar bergman akira kurosawa critics eyes haunting tales poland boot first nazis communists long roster television stars generation two ago passed images younger selves frozen time noel neill adventures superman alan young mister ed robert vaughn man william schallert patty duke father daughter patty duke show dan haggerty life times grizzly adams florence henderson brady bunch alan thicke growing pains garry marshall creative force practically owned prime time happy days mork mindy laverne shirley died broadway lights dimmed memory brian bedford tammy grimes anne jackson brilliant day architect zaha hadid left behind monuments fertile imagination shaken acolytes around world street photographer bill cunningham found fashion statements every corner suddenly missing making manhattan overnight less idiosyncratic less interesting place smiling skinny man pedaling bicycle among honking cabs blue french worker jacket camera slung around neck picture split scene seemingly generation fellow photographers made art recording last half th century ruth gruber marc riboud louis stettner tv journalists morley safer gwen ifill tv commentator john mclaughlin tried make sense music precincts emptier without conductor revolutionary composer pierre boulez new music soprano phyllis curtin jazz artists mose allison bobby hutcherson gato barbieri rapper phife dawg malik taylor latin megastar juan gabriel silicon valley saw giant depart andrew grove led semiconductor revolution intel television industry lost executive grant tinker made nbc network watch prime time astrophysics smaller world women science said farewell pioneer champion vera rubin tens thousands people might choked death saved simple ingenious maneuver passing henry heimlich prompted sympathy even gratitude come think eliciting large silent thank live bad way anyone go brings us marion pritchard died inspired measures gratitude profound brave young 
dutch student gentile risked life save jews death camps early one instance shooting nazi stooge seize three little children hiding estimate saved people many still alive died weeks ago anyone guess know certain reasonably surmise good many still possession selfless gift matchless legacy lives
17287,kim jong un says north korea preparing test long range missile new york times,seoul south korea north korea leader kim said sunday country making final preparations conduct first test intercontinental ballistic missile bold statement less month inauguration donald trump although north korea conducted five nuclear tests last decade ballistic missile tests alone although habitually threatens attack united states nuclear weapons country never intercontinental ballistic missile icbm annual new year day speech broadcast north kctv sunday mr kim spoke proudly strides said country made nuclear weapons ballistic missile programs said north korea continue bolster weapons programs long united states remained hostile continued joint military exercises south korea reached final stage preparations intercontinental ballistic rocket said analysts region said mr kim might conduct another weapons test coming months taking advantage leadership changes united states south korea mr trump sworn jan south korea president park whose powers suspended parliamentary impeachment dec waiting constitutional court rule whether formally removed office reinstated north korea conducts test coming months test mr trump new administration despite years increasingly harsh sanctions north korea advancing toward mr kim professed goal arming isolated country ability deliver nuclear warhead united states mr kim speech sunday indicated north korea may rocket several times year complete icbm program said cheong senior research fellow sejong institute south korea first tests come even mr trump inauguration mr cheong said need take note fact first new year speech kim mentioned intercontinental ballistic missile said speech mr kim comment mr trump election doubt still runs deep north korea mastered technology needed build reliable icbm analysts region said north launchings rockets put satellites orbit recent years showed country cleared key technological hurdles north satellite launch february south 
korean defense officials said unha rocket used launch successfully reconfigured missile fly miles warhead pounds far enough reach united states north korea deployed rodong ballistic missiles reach south korea japan spotty record musudan ballistic missile range long enough reach american military bases pacific including guam north also claimed series successes testing various icbm technologies although claims verified often disputed officials analysts region said make nuclear warheads small enough fit onto ballistic missile also claimed success testing technology allows missile return earth atmosphere without breaking april north korea reported successful ground test engine intercontinental ballistic missile time mr kim said north tip intercontinental ballistic rockets powerful nuclear warheads keep cesspool evils earth including mainland within striking range sept north conducted fifth powerful nuclear test mr kim later attended another ground test new rocket engine exhorting government prepare another rocket launch soon possible november united nations security council imposed new sanctions north
17288,sick cold queen elizabeth misses new year service new york times,london queen elizabeth ii battling cold week missed new year day church service country estate sandringham buckingham palace said sunday week earlier queen missed christmas day church service first time since illness queen yet feel ready attend church still recuperating heavy cold palace said statement queen husband prince philip also ill well enough attend services church sandringham norfolk east coast england queen ascended throne became world monarch following death king bhumibol adulyadej thailand october also britain monarch last year surpassed queen victoria reign mother lived age
17289,taiwan president accuses china renewed intimidation new york times,beijing president tsai taiwan sharply criticized china leaders saturday saying resorted military economic threats order intimidate island step step beijing going back old path dividing coercing even threatening intimidating taiwan told journalists taipei capital news conference tensions taiwan china rivals since communist revolution intensified december ms tsai spoke phone american donald trump breaking longstanding diplomatic practice recent weeks china stepped military activities near taiwan sending sole aircraft carrier waters near island dispatching military planes region monday beijing announced tom pr ncipe island nation west coast africa one taiwan fewer two dozen remaining diplomatic allies switched allegiance mainland provoking outcry taiwan despite beijing recent actions said hurt feelings taiwanese people destabilized relations ms tsai vowed avoid confrontation bow pressure course revert old path confrontation said ms tsai faces delicate task registering discontent beijing also sending message taiwan exercise restraint united states sees taiwan one reliable allies asia sold billions dollars weapons island long sought avoid conflict two sides election mr trump complicate matters antagonized beijing series critical comments also questioned one china policy underpinned relations washington beijing decades criticized china military buildup disputed south china sea bonnie glaser asia expert center strategic international studies washington said ms tsai words might reassure american officials pursue rash policies face china show strength remains calm rational patient ms glaser wrote email still ms tsai whose democratic progressive party traditionally favored independence taiwan face serious challenges coming months many people taiwan nervous mr trump use island bargaining chip china ms tsai preference stability region may mesh mr trump bombastic style richard bush director center east 
asia policy studies brookings institution washington said ms tsai understood need maintain balance among relations china relations united states domestic politics ms tsai vision however may align well incoming trump administration apparent belief pressure china fronts obama administration said ms tsai also sought quell concerns planned stopovers houston san francisco visit central america scheduled january chinese ministry foreign affairs thursday called united states block ms tsai entering country warning visit embolden independence activists taiwan ms tsai described visit unofficial saying transit stop transit stop
17290,biggest loser bodies fought regain weight new york times,danny cahill stood slightly dazed blizzard confetti audience screamed family ran stage won season nbc reality television show biggest loser shedding weight anyone ever program astonishing pounds seven months got scale see evening dec weighed pounds dressed shorts lean athletic handsome model ve got life back declared mean feel like million bucks mr cahill left show stage hollywood flew directly new york start triumphal tour talk shows chatting jay leno regis philbin joy behar heard fans world elation knew bounds years since pounds crept back onto frame despite best efforts fact season contestants regained much weight lost arduously even heavier yet experiences bitter personal disappointment gift science study season contestants yielded surprising new discoveries physiology obesity help explain many people struggle unsuccessfully keep weight lose kevin hall scientist federal research center admits weakness reality tv idea follow biggest loser contestants six years victorious night project first measure happened people long six years lost large amounts weight intensive dieting exercise results researchers said stunning showed hard body fights back weight loss frightening amazing said dr hall expert metabolism national institute diabetes digestive kidney diseases part national institutes health blown away resting metabolism determines many calories person burns rest show began contestants though hugely overweight normal metabolisms size meaning burning normal number calories people weight ended metabolisms slowed radically bodies burning enough calories maintain thinner sizes researchers knew anyone deliberately loses weight even start normal weight even underweight slower metabolism diet ends surprised see biggest loser contestants slow metabolisms show ended shocked researchers happened next years went numbers scale climbed contestants metabolisms recover became even slower pounds kept piling bodies 
intensifying effort pull contestants back original weight mr cahill one worst regained pounds metabolism slowed much maintain current weight pounds eat calories day less typical man size anything turns fat struggles contestants went help explain hard make headway nation obesity problem afflicts third american adults despite spending billions dollars drugs dieting programs even motivated working biology experience shows body fight back years said dr michael schwartz obesity diabetes researcher professor medicine university washington new important key point tv lose enormous amounts weight go six years get away basic biological reality said dr schwartz involved study long initial weight body going try get back show doctor robert huizenga says expected contestants metabolic rates fall show hoping smaller drop questioned though whether measurements six years later accurate maintaining weight loss difficult said tells contestants exercise least nine hours week monitor diets keep weight unfortunately many contestants unable find afford adequate ongoing support exercise doctors psychologists sleep specialists trainers something need work hard change said email study findings published monday journal obesity part scientific push answer fundamental questions obesity researchers figuring fat makes many people develop diabetes medical conditions searching new ways block poison fat starting unravel reasons bariatric surgery allows people lose significant amounts weight dieting often fails looking afresh medical care obese people hope work eventually lead new therapies treat obesity chronic disease help keep weight control life people tried lose weight know hard keep weight many blame pounds come back obesity research consistently shown dieters mercy bodies muster hormones altered metabolic rate pull back old weights whether hundreds pounds extra many people trying keep always weight person body maintains without effort known weight change years may effect aging point weight 
easy maintain weight body fights defend finding way thwart mechanisms goal scientists striving first though trying understand greater detail dr david ludwig director new balance foundation obesity prevention center boston children hospital involved research said findings showed need new approaches weight control cautioned study limited small size lack control group obese people lose weight added findings made sense subset successful dieters said show return normal metabolism hope rest us still added shouldn interpreted mean doomed battle biology remain fat means need explore approaches scientists say weight maintenance treated issue separate weight loss challenge solved say progress truly made obesity lot basic research still need said dr margaret jackson directing project pfizer group testing drug animals least acts like leptin hormone controls hunger weight loss leptin levels fall people become hungry idea trick brains people lost weight become ravenous lack leptin many contestants kept enough weight improve health became physically active low weights strived keep eluded one erinn egbert caregiver mother versailles ky struggles mightily keep pounds metabolism burns fewer calories day expected someone size people understand treat like drug said ms egbert went pounds show weighs two treats turn binge period struggle six years season ended contestants went last fall three days testing researchers concerned contestants might try frantically lose weight coming shipped equipment measure physical activity weight visit information sent remotely contestants received metabolic results last week shocked reflection decided numbers explained lot friends drinking beer gaining massive amounts weight mr cahill said moment started drinking beer goes another pounds said right something wrong body sean algaier pastor charlotte feels cheated went pounds contestant show weight burning fewer calories day expected man size kind like hearing life sentence said slower metabolisms reason 
contestants regained weight though constantly battled hunger cravings binges investigators found least one reason plummeting levels leptin contestants started normal levels leptin season finale almost leptin made ravenous time weight returned leptin levels drifted half season began researchers found thus helping explain urges eat leptin one cluster hormones control hunger although dr hall colleagues measure rest another group researchers different project study funded australia national health medical research council dr joseph proietto university melbourne colleagues recruited overweight people agreed consume calories day eight nine weeks lost average nearly pounds next year pounds started coming back dr proietto colleagues looked leptin four hormones satiate people levels fell study subjects also looked hormone makes people want eat level rose surprising coordinated effect dr proietto said body puts multiple mechanisms place get back weight way maintain weight loss hungry time desperately need agents suppress hunger safe use mr cahill said weight problem began third grade got fat fatter starve eat whole cake frosting spoon afterward cower pantry kitchen feeling overwhelmed shame years insatiable urge eat kept overcoming weight climbed pounds used look think horrible monster subhuman said began sleeping recliner heavy sleep lying walking hurt stairs agony buying clothes waist humiliating remember sitting dressing room one day nothing fit looked traffic outside street thought run front car eventually seized biggest loser best chance lose enough weight live normal life tried three times finally selected show began contestants underwent medical tests sure endure rigorous schedule lay ahead rigorous sequestered biggest loser ranch contestants mr cahill exercised seven hours day burning calories according calorie tracker show gave took electrolyte tablets help replace salts lost sweating consuming many fewer calories eventually others sent home four months try keep 
losing weight mr cahill set goal deficit per day idea lose pound day quit job land surveyor routine went like wake run treadmill minutes breakfast typically one egg two egg whites half grapefruit piece sprouted grain toast run treadmill another minutes rest minutes bike ride nine miles gym work two half hours shower ride home eat lunch typically grilled skinless chicken breast cup broccoli spears asparagus rest hour drive gym another round exercise burned enough calories hit goal went back gym dinner work times found running around neighborhood dark indicator reset zero midnight day show finale mr cahill others dressed carefully hide rolls loose skin remained surprise horror lost weight wore compression undergarments hold mr cahill knew maintain finale weight pounds mentally physically exhausted barely moved two weeks publicity tour ended started new career giving motivational speeches biggest loser ever next four years managed keep weight pounds exercising two three hours day two years ago went back job surveyor pounds started coming back soon scale hit mr cahill started weighing measuring food stepped exercise got back pounds weight edged slow metabolism part problem food cravings opens bag chips thinking eat five bites black eat whole bag chips say dr lee kaplan obesity researcher harvard says brain sets number calories consume easy people miss much eat matters less fact bodies want hold calories dr michael rosenbaum obesity researcher columbia university collaborated dr hall previous studies said body systems regulating many calories consumed many burned tightly coupled people strenuously trying lose weight maintain significant weight loss still pounds insidiously creep eat million calories year burn except annoying calories result average annual weight gain one two pounds said small differences intake output average calories per day less one starburst candy cumulative consequences time devastating clear whether small imbalance resultant weight gain us 
experience age consequences changes lifestyle environment biology aging dr rosenbaum added effects small imbalances calories eaten calories burned pronounced people deliberately lose weight dr hall said yes signals regain weight wondered many extra calories people driven eat found way figure analyzed data clinical trial people took diabetes drug canagliflozin makes spill calories day urine took placebo drug known effect brain person realize calories spilled taking drug gradually lost weight every five pounds lost without realizing eating additional calories day extra calories dr hall said bigger driver weight regained slowing metabolism added people fought urge eat calories hungry unless continue fight constantly regain weight said mean modest weight loss hopeless experts say individuals respond differently diet manipulations diets example exercise drugs among interventions dr ludwig said simply cutting calories answer doubt exceptional individuals ignore primal biological signals maintain weight loss long term restricting calories said added people combination incessant hunger slowing metabolism recipe weight regain explaining individuals maintain weight loss months dr rosenbaum agreed difficulty keeping weight reflects biology pathological lack willpower affecting said mr cahill knows report dr hall group showing much metabolism slowed stopped blaming weight gain shame shoulders went said
17291,first mixtape romance new york times,hillary kerr founder digital media company los angeles tell song playing five years ago jukebox bar somewhat randomly met man became husband days version sung nico german made famous andy warhol velvet underground actually song playing met jonathan leahy december night bar silver lake district los angeles ms kerr remember exactly playing met moment jumping like tigger put answering usual questions mr leahy told music supervisor girls hbo show created starring lena dunham enough get ms kerr bouncing music changed life told mr leahy mr leahy quiet shy least doesn jump upon meeting people mesmerized main reaction said lot easier talk beautiful women bar re working hit show exchanged email addresses act politeness promise soundtrack went quiet almost year mr leahy ms kerr active social lives focused careers mr leahy grew laconia graduated college william mary williamsburg va landed los angeles later year music supervisor aperture music joined manish raval tom wolfe responsible music girls team also worked films including trainwreck television series new girl addition mr leahy music supervisor survivor remorse starz ms kerr grew la jolla section san diego graduated university southern california eventually made way new york took job assistant elle magazine moved back west coast los angeles fellow elle alum katherine power created company best known website wear casts eye celebrity culture fashion million monthly unique visitors ms kerr ms power also started wear clothing accessories line sold target nine months initial meeting mr leahy emailed ms kerr friend wanted get fashion industry ms kerr mr leahy friend met long boozy brunch began email text bit banter ms kerr said neither knew interest intention months later texted ask help score ticket see band lord huron mr leahy happens friend ben schneider band lead singer extra ticket one moments universe conspires make seem cooler actually mr leahy said ms kerr met show mr leahy ms 
kerr moved ambiguous mixtape era months emailed texted coy friends texts revolving around music example ms kerr visiting new york texted mr leahy request walking around soho music sent link love john newman club vibe romantic lyrics wanted read ms kerr said figured correctly turns new friend bit clueless guy didn spend much time thinking woman might react song shared another time emailed link fleetwood mac version need love bad listening ms kerr said called friend katie time continued referred supervisor knew crush said mean something mr leahy acknowledged might difficult person think sending ms kerr message song sort thought maybe much shared anyway man sent song bedbedbedbedbed vacationer remix deleted scenes friend phase ms kerr said ms kerr played game made mr leahy mix cd handwritten liner notes titled feynman diagrams mr leahy told text conversation thought idea feynman diagrams physicists map interactions subatomic particles romantic mix ms kerr included mazzy star song ve let bit easter egg actual feelings said around time ms kerr texted mr leahy photo drink menu bar roger room focused drink named song christmas card hooker minneapolis happens mr leahy favorite tom waits tune made rethink things bit said adding hillary kerr clearly trifled early mr leahy invited bleachers concert band lead singer jack antonoff ms dunham boyfriend ms dunham concert well meeting ms kerr said ve heard much ms kerr mr leahy shared first kiss night proposed polihale beach kauai hawaii jan dec friends relatives gathered palm springs calif colony palms hotel opened reputed mobster al wertheimer whose poolside guests included frank sinatra ronald reagan kirk douglas zsa zsa gabor ms kerr walked grassy aisle courtyard wearing structured lace reem acra dress strapless bustier full skirt four musicians played feeling instrumental song mr leahy wrote ms kerr minutes cocktail reception ms kerr best friends descended upon jen atkin celebrity hairstylist social media star started fussing 
flower sewn bride hair joey maalouf celebrity makeup artist creator service glam app whipped tube lip gloss reapplied bride pucker done makeup look went sickeningly stunning perfect said guests mingled drinks pool framed banquette tables lit strings bulbs sky turned pink stars appeared guests snapped photos shared hundreds thousands follow members illuminati imwithkerr letsgetleahyed looks like art directed eva chen head fashion partnerships instagram said took worked assistant elle ms kerr friends bride groom celebrated saw great match based passion also music leigh belz ray features news director instyle another former elle colleague made trip hillary loves music casual thing ms ray said used say ultimate fantasy become music director married one romantic first dance solomon burke need mr mrs leahy use maiden name professionally settled several hours serious dancing songs spun left hawaiian honeymoon mr leahy completed first important act husband pulled together many songs considered soundtrack romance made wife mixtape dec colony palms hotel palm springs calif flora bride groom married white birch trellis white birch state tree new hampshire mr leahy grew parents richard marie leahy reside structure wrapped white peonies sahara roses camellia greens readings mr leahy family roman catholic ms kerr parents john carole kerr spiritual religiously observant many guests artistic bent bride groom planned accordingly marshall goldsmith executive coach author lifelong family friend ms kerr officiated friends relatives stood read poems james kavanaugh mary oliver well passage supreme court ruling legalizing marriage little catholic priest little lesbian pulitzer prize winner little equal rights ms kerr explained ceremony
17292,calling angels enduring trials job new york times,angels everywhere mu iz family apartment bronx paintings angels wall ceramic angels flanking ancient vcr angels strumming lyres blowing little golden trumpets bathroom shelves jos zoraida mu iz children struggled deal series trials setbacks including cancer debilitating epilepsy deep depression near eviction sometimes seemed angels love forces holding things together zoraida early life puerto rico like something tropical dickens novel siblings mother built house hand hurricane ravaged home children father withdrew support zoraida grandfather father absent father destroyed house rage barely teenager met jos vietnam war veteran permission uncle judge married moved new york started new life built boilers worked construction using skills learned child clothing store mr mu iz began violent seizures eight day respond medication longer work stopped working take care still determined live something like normal life started family first child jos jr heart defect time six operations angels came first one painting gift cousin operated son told angel supposed die ms mu iz said figured angels taking care protecting family angels gifts friends relatives picked street like furniture mu izes overstuffed apartment complex westchester avenue bronx much restored ms mu iz many people throw away things buy said second son jesus became epileptic girl maria completed family mr mu iz felt like horrible stubborn toothache turned cancer lower jaw ms mu iz stayed room husband received radiation treatment willing take anything said never left alone never radiation work save mr mu iz life surgeons removed tongue lower jaw cut hole esophagus disfigured depressed unable speak consume nothing thicker milk needs care household mu iz children grew ve every craziness said jos jr suffered depression severe dropped college confined apartment every years time family held seemingly thread summer younger son jesus got job zaro bakery manhattan 
financial district family rent tied income rent tripled august month jesus school bills pay family paid funeral expenses jos sr mother died summer things began unravel fell behind rent utilities food often scarce family regularly skipped meals around time ms mu iz got touch catholic charities archdiocese new york one eight organizations supported new york times neediest cases fund covered back rent got warm coats blankets helped apply food stamps first time neediest cases fund family paid electric bill things looking ways jesus returning college track wants paramedic maria graduated december nursing program thinking father illness wants oncologist jos jr accepted new york film academy photography program jos sr continues battle cancer zoraida severely depressed keeps going asked gestured toward family sitting beside beneath painted angels give strength even times collapse said jos jr agreed use parents siblings motivation said re ms mu iz said


In [2]:
# Flatten every article Row into a plain (id, title, content) tuple so the
# later RDD stages can index fields by position.
articles_rdd = df_final.rdd.map(
  lambda row: tuple(row[field] for field in ('id', 'title', 'content'))
)
# Peek at the first five tuples.
print(articles_rdd.take(5))

In [3]:
# Inverted index

import itertools
import operator

def accumulate(l):
  """Sum the weights of ``(key, weight)`` pairs per key.

  Args:
    l: iterable of indexable items whose element 0 is a hashable key and
       whose element 1 is a number to add up.

  Yields:
    ``(key, total)`` tuples, one per distinct key, in first-seen order.

  Unlike ``itertools.groupby`` (which only merges *consecutive* equal keys),
  this works on unsorted input, so a key can never be emitted twice with
  partial totals.
  """
  totals = {}
  for item in l:
    key = item[0]
    totals[key] = totals.get(key, 0) + item[1]
  # dicts keep insertion order, so keys come out in the order first seen
  for key, total in totals.items():
    yield key, total


# Build word -> [(article id, occurrences), ...]:
#   1. emit (word, (id, 1)) for every space-separated token of title + content,
#   2. gather all postings of a word,
#   3. total them per article with accumulate() and order by descending count.
inverted_index_rdd = (
  articles_rdd
  .flatMap(lambda article: [
    (token, (article[0], 1))
    for token in (article[1] + " " + article[2]).split(" ")
  ])
  .groupByKey()
  .map(lambda entry: (
    entry[0],
    sorted(accumulate(list(entry[1])), key=lambda posting: -posting[1]),
  ))
  .cache()
)


inverted_index_rdd.take(5)

In [4]:
# Online

# Same three columns as df_file, with 'id' cast to an integer so it can be
# compared with the integer typed into the "search" widget.
new_df = df_file.select(
  df_file['id'].cast(IntegerType()).alias('id'),
  'title',
  'content',
)

# Driver-side {id: title} dictionary for the original (uncleaned) titles.
file_rdd = new_df.rdd.map(lambda row: (row['id'], row['title']))
file_map = file_rdd.collectAsMap()

In [5]:
# Create the two free-text input widgets: (widget name, placeholder text).
for widget_name, placeholder in (
  ("word", "Please enter word to search"),
  ("search", "Please enter id to search"),
):
  dbutils.widgets.text(widget_name, placeholder)

In [6]:
# Read the query word. The article text is lower-cased during cleaning (see the
# lower(...) calls in the first cell), so normalise the query the same way;
# otherwise a capitalised or space-padded entry could never match an index key.
toSearch = str(dbutils.widgets.get("word")).strip().lower()

# Keep only the index entry for that word and unwrap its posting list into
# individual (article id, occurrences) pairs.
final_result = inverted_index_rdd.filter(lambda x, toSearch=toSearch: x[0] == toSearch) \
                                 .flatMap(lambda result: result[1])

final_result_list = final_result.collect()
print(final_result_list)

In [7]:
def printing_result(results=None, titles=None, maximum=5):
  """Yield the top search hits together with their article titles.

  Args:
    results: iterable of ``(article id, occurrences)`` pairs; defaults to the
      notebook-level ``final_result_list``.
    titles: ``{article id: title}`` mapping; defaults to the notebook-level
      ``file_map``.
    maximum: maximum number of hits to yield (default 5).

  Yields:
    ``(occurrences, [(article id, title)])`` per hit; the list is empty when
    the id has no entry in ``titles``. Hits whose id is ``None`` are skipped
    and do not count towards ``maximum``.
  """
  if results is None:
    results = final_result_list
  if titles is None:
    titles = file_map

  emitted = 0
  for hit in results:
    if emitted >= maximum:
      break
    doc_id = hit[0]
    if doc_id is None:
      continue
    emitted += 1
    # Direct dictionary lookup instead of scanning every (id, title) pair.
    if doc_id in titles:
      yield hit[1], [(doc_id, titles[doc_id])]
    else:
      yield hit[1], []

# Materialise the generator so the hits are printed as one list.
print([*printing_result()])

In [8]:
from collections import defaultdict

def accumulate2(l):
  """Total the weights attached to each key.

  Args:
    l: iterable of ``(key, weight, ...)`` tuples; everything after the key is
       summed and added to that key's running total.

  Yields:
    ``(key, total)`` tuples, one per distinct key, in first-seen order.

  The weights are actually accumulated rather than computed and then
  discarded in favour of a plain item count. For the ``(word, 1)`` pairs this
  notebook passes in, the total equals the number of occurrences.
  """
  totals = {}
  for k, *v in l:
    totals[k] = totals.get(k, 0) + sum(v)
  for k, total in totals.items():
    yield k, total

# Build article id -> [(word, occurrences), ...]:
#   1. emit (id, (word, 1)) for every space-separated token of title + content,
#   2. gather all tokens of an article and drop the group whose id is None,
#   3. total them per word with accumulate2() and order by descending count.
news_rdd = (
  articles_rdd
  .flatMap(lambda article: [
    (article[0], (token, 1))
    for token in (article[1] + " " + article[2]).split(" ")
  ])
  .groupByKey()
  .filter(lambda grouped: grouped[0] is not None)
  .map(lambda grouped: (
    grouped[0],
    sorted(accumulate2(list(grouped[1])), key=lambda pair: -pair[1]),
  ))
  .cache()
)

news_rdd.count()

In [9]:
from functools import reduce

# Parse the requested article id. The widget holds free text (initially its
# placeholder), so anything that is not an integer is treated as "not found"
# instead of aborting the cell with a ValueError.
try:
  id_search = int(dbutils.widgets.get("search"))
except (TypeError, ValueError):
  id_search = None

# Word counts of the requested article: [] or [(id, [(word, count), ...])].
in_new_list = []
if id_search is not None and id_search in file_map:
  in_new_rdd = news_rdd.filter(lambda x, id_search=id_search: x[0] == id_search)
  in_new_list = in_new_rdd.collect()

if not in_new_list:
  # Unknown id, or an id that has a title but no entry in news_rdd.
  print("Not found")
else:
  new_title = file_map[id_search]

  # word -> count for the requested article. Empty-string tokens (produced by
  # split(" ") on repeated spaces) are ignored so they never count as a
  # shared "word".
  target_counts = {word: count for word, count in in_new_list[0][1] if word != ""}

  def news_similarity2(rdd_other_news):
    """Score one other article against the requested article.

    Args:
      rdd_other_news: ``(article id, [(word, count), ...])`` element of news_rdd.

    Returns:
      ``[article id, similarity, words]`` where ``words`` is the number of
      distinct words both articles contain and ``similarity`` is the sum, over
      those shared words, of the word's count in both articles. Both are 0
      when nothing is shared.
    """
    similarity = 0
    shared_words = 0
    for word, count in rdd_other_news[1]:
      # "" is never a key of target_counts, so empty tokens are skipped here too.
      if word in target_counts:
        similarity += target_counts[word] + count
        shared_words += 1
    return [rdd_other_news[0], similarity, shared_words]

  # Score every other article and order by descending similarity.
  other_news = news_rdd.filter(lambda x, id_search=id_search: x[0] != id_search)
  sim_news = other_news.map(news_similarity2) \
                          .sortBy(lambda x: -x[1])

  sim_news_df = sim_news.toDF(["id","similarity","words"])
  display(sim_news_df)

id,similarity,words
,58485,231
36274.0,1035,110
51752.0,995,82
18600.0,995,82
25704.0,991,109
24476.0,982,84
75718.0,954,112
24673.0,937,120
75386.0,921,113
75323.0,915,110


In [10]:
# Ids of the five highest-scoring articles, printed next to the requested
# article's id and title.
aux = sim_news.take(5)
news_result_final = [scored[0] for scored in aux]
print(id_search, new_title, news_result_final)