In [1]:
import pandas as pd

In [2]:
# Load the genre-modified Goodreads export and discard the 'Unnamed: 0' column
# (presumably an index column written by an earlier to_csv -- TODO confirm).
gr_data = pd.read_csv('gr_data_genre_modified.csv').drop(columns=['Unnamed: 0'])

# Quick sanity check: first two rows plus the (rows, columns) shape
display(gr_data.head(2), gr_data.shape)

Unnamed: 0,title,series,author,rating,description,language,isbn,genres,characters,bookFormat,...,publishDate,firstPublishDate,awards,numRatings,ratingsByStars,likedPercent,setting,bbeScore,bbeVotes,price
0,The Hunger Games,The Hunger Games #1,Suzanne Collins,4.33,WINNING MEANS FAME AND FORTUNE.LOSING MEANS CE...,English,9780440000000.0,"['Fantasy', 'Science Fiction', 'Dystopia', 'Yo...","['Katniss Everdeen', 'Peeta Mellark', 'Cato (H...",Hardcover,...,09/14/08,,['Locus Award Nominee for Best Young Adult Boo...,6376780,"['3444695', '1921313', '745221', '171994', '93...",96.0,"['District 12, Panem', 'Capitol, Panem', 'Pane...",2993816,30516,5.09
1,Harry Potter and the Order of the Phoenix,Harry Potter #5,"J.K. Rowling, Mary GrandPré (Illustrator)",4.5,There is a door at the end of a silent corrido...,English,9780440000000.0,"['Fantasy', 'Science Fiction', 'Magic', 'Young...","['Sirius Black', 'Draco Malfoy', 'Ron Weasley'...",Paperback,...,09/28/04,06/21/03,['Bram Stoker Award for Works for Young Reader...,2507623,"['1593642', '637516', '222366', '39573', '14526']",98.0,['Hogwarts School of Witchcraft and Wizardry (...,2632233,26923,7.38


(52478, 23)

#### List of unique genres

In [3]:
# Collect every distinct, cleaned genre label in first-seen order.
genres_list = []
# Companion set used only for duplicate checks: membership in a set is O(1),
# whereas `genre not in genres_list` rescans the whole list for every genre of every book.
seen_genres = set()

# NOTE(review): splitting on ',' also splits labels that contain a comma themselves
# (e.g. "Gastronomy, Food and Nutrition"), and .title() changes the original casing
# (e.g. "10th Century" -> "10Th Century"), so some names collected here will not match
# the raw labels in gr_data['genres']. Left unchanged because later cells depend on
# the resulting column names.
for genres_row in gr_data['genres']:
    # Each value is the string form of a list, e.g. "['Fantasy', 'Magic']":
    # remove the square brackets and single quotes
    genres_row = genres_row.replace('[','').replace(']','').replace("'",'')

    # Split the row into individual genres
    genres = genres_row.split(',')

    for genre in genres:
        # Trim surrounding whitespace and normalise to title case
        genre = genre.strip().title()

        # Skip empty fragments and labels that were already collected
        if not genre or genre in seen_genres:
            continue
        # Skip labels containing non-ASCII characters
        if any(ord(c) > 127 for c in genre):
            continue

        seen_genres.add(genre)
        genres_list.append(genre)

# Print the final number of unique genres
print("Length of uniques genres after cleaning: from 980 to",len(genres_list))
print("")
#print(genres_list)

Length of uniques genres after cleaning: from 980 to 617



### New genre dataframe

In [4]:
# New dataframe with columns named with unique genres of genres_list.
# It starts with zero rows; rows are created later by label-based assignment
# (genres_data.loc[i, genre] = 1) while iterating over gr_data.
genres_data = pd.DataFrame(columns=genres_list)
genres_data

Unnamed: 0,Fantasy,Science Fiction,Dystopia,Young Adult,Fiction,Action,Adventure,Romance,Magic,Children,...,Low Fantasy,Christian Contemporary Fiction,Battle Of Britain,Aircraft,Go,Civil War History,Racing,Led Zeppelin,10Th Century,Spanish History


In [57]:
#genres_data.columns

In [58]:
#genres_data.shape

### Filling genre dataframe

`ast` is a built-in Python module for working with abstract syntax trees (ASTs). Here, `ast.literal_eval()` is used to safely evaluate a string containing a Python literal structure, such as a list or dictionary, and return the corresponding Python object. It converts each string representation of a list of genres into an actual list that the code below can iterate over.

In [9]:
import ast

# One-hot encode the genres of every book into genres_data; the row label is the
# book's row number in gr_data.
# NOTE(review): in the empty-genres branch, `genres_data['Unknown'] = 1` assigns 1 to the
# whole 'Unknown' column and does not create row i, so books without genres get no row
# in genres_data. Later cells compensate for this, so the behaviour is kept as is.
for i in range(len(gr_data['genres'])):

    # Parse the stored string (e.g. "['Fantasy', 'Magic']") into a real Python list
    genre_list = ast.literal_eval(gr_data['genres'][i])

    if len(genre_list) > 0:
        for genre in genre_list:
            # First occurrence of this exact label: add a column initialised to 0
            if genre not in genres_data.columns:
                genres_data[genre] = 0

            # Flag the genre for the current book
            genres_data.loc[i, genre] = 1
    else:
        # Book has no genres: set the 'Unknown' column to 1 (column-wide assignment)
        genres_data['Unknown'] = 1

    # Progress indicator, rewritten on the same line thanks to the carriage return
    print(f"Processed row {i+1}", end="\r")


Processed row 52478

In [10]:
genres_data.shape

(47855, 638)

In [11]:
genres_data.head()

Unnamed: 0,Fantasy,Science Fiction,Dystopia,Young Adult,Fiction,Action,Adventure,Romance,Magic,Children,...,1st Grade,TV and Series,NSFW,Mills and Boon,Maps and Cartography,Gender and Sexuality,11th Century,漫画,Veganism and Vegetarianism,10th Century
0,1.0,1.0,1.0,1.0,1,1.0,1.0,1.0,,,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,1.0,1.0,,1.0,1,,1.0,,1.0,1.0,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,,,,1.0,1,,,,,,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,,,,,1,,,1.0,,,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,1.0,1.0,,1.0,1,,,1.0,,,...,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [12]:
# Persist the one-hot genre dataframe. The index is written explicitly because it holds
# the gr_data row number of each book and is read back later as the 'Unnamed: 0' column.
genres_data.to_csv('genres_df_transposed.csv', index=True)

### Loading new genre dataframe

In [146]:
genres_df2 = pd.read_csv('genres_df_transposed.csv')

In [147]:
display(genres_df2.head(), genres_df2.shape)

Unnamed: 0.1,Unnamed: 0,Fantasy,Science Fiction,Dystopia,Young Adult,Fiction,Action,Adventure,Romance,Magic,Children,Audiobook,School,Classics,Historical Fiction,Novels,Literature,Historical,Historical Romance,Adult,Urban Fantasy,Paranormal,Paranormal Romance,Vampires,Holocaust,War,Politics,Christian Fiction,Christianity,Epic Fantasy,Civil War,Love,Drama,Coming Of Age,Contemporary,Comedy,Humor,Poetry,Picture Books,Short Stories,Gothic,Mystery,Thriller,Suspense,Crime,Mystery Thriller,Asian Countries,Asia,Horror,European Literature,European Countries,Plays,Esoterica,Philosophy,Self Help,Inspirational,Mental Health,North American Countries,Angels,Chick Lit,Animals,Chapter Books,Magical Realism,Time Travel,Iberoamerican Literature,Fairy Tales,Greek Mythology,Mythology,Dragons,Epic,Monsters,Gastronomy,Food And Nutrition,Feminism,Unfinished,Music And Musicians,Medieval,Apocalyptic,Detective,Victorian,Mental Illness,Psychology,Family,African American Literature,New York,Religion,Ireland,Nonfiction,History,Memoires And Biographies,Eastern Religions And Faith,Africa,Steampunk,Economics,Contemporary Romance,Womens,Lgtbi And Queer,Young Adult Fantasy,Travel,Young Adult Contemporary,Storytime,Mathematics,Counting,True Crime,Cats,Westerns,Superheroes,Graphic Novel And Comics,World War I,Theatre,Australia,Christmas,Holiday,Science,Arthurian,Banned Books,Pirates,Erotica,Prehistoric,Witches,Retellings,Asian Literature,Tudor Period,Media Tie In,Dinosaurs,Religion Studies,Werewolves,Portugal,Southern,Southern Gothic,Journalism,Race,Speculative Fiction,Survival,College,Tragedy,African Countries,Ancient History,Abuse,Guides And Travel,The United States Of America,Reference,Space,Military Fiction,Anthologies,Childrens Classics,Essays,Cyberpunk,Fae,African Literature,Legal Thriller,Physics,Death,Music,Islam,Ghosts,Regency,Germany,Collections,Judaism,True Story,Aliens,Law,Biology,Evolution,Anthropology,Political Science,Futuristic,French Revolution,Alternate History,American 
History,Christian Romance,Robots,Ancient,Dark,Fairies,Folklore,Zombies,Education,Demons,Mountaineering,Sports,Medical,Medicine,Theory,Academic,Unicorns,Business,Leadership,New Age,Personal Development,Horse Racing,American Civil War,Espionage,Social Justice And Activism,Astronomy,American Revolution,Presidents,Gender,Greece,Nobel Prize,Noir,Native Americans,Writing,Love Story,Sociology,Business And Finance,Social Science,Health,Disability,Halloween,Communication,Relationships,Aviation,Romanticism,Israel,European History,Productivity,Management,Fighters,Psychological Thriller,Mythology And Fairy Tales,Outdoors,Murder Mystery,Shapeshifters,Marriage,Architecture,Animal Fiction,M M Romance,South American Countries,Fashion,Programming And Computer Science,Cults,Weird Fiction,Lovecraftian,Cultural,Dark Fantasy,North American Literature,Historical Mystery,Batman,Americana,Genetics,Romantic Suspense,Emotion,Womens Fiction,New Weird,Hugo Awards,Diary And Journal,Buisness,Sports Romance,Polygamy,Entrepreneurship,Money,Personal Finance,Baseball,Young Adult Paranormal,Crafts,Spy Thriller,Elves,Plants,Police,Archaeology,Gardening,Historical Fantasy,Conspiracy Theories,World History,Medieval History,Military History,Ecology,Sustainability,Technology,Gaming,Utopia,Linguistics,Rabbits,Manga,Comic Fantasy,Ghost Stories,Amazon,Poverty,Parenting,Hard Boiled,Aspergers,Social,Nordic Noir,Gender Studies,Wildlife,Anime,Shojo,Counter Culture,Illness,Time Travel Romance,Young Adult Historical Fiction,Cartoon,Artificial Intelligence,American Revolutionary War,Heroic Fantasy,Forgotten Realms,Dragonlance,Regency Romance,Amish,Modern,Geography,Doctors,Chess,Martial Arts,Engineering,Pop Culture,Pulp,Wizards,Adoption,Hockey,Teaching,Boarding School,Star Wars,Fitness,Fantasy Romance,Natural History,Fan Fiction,Mermaids,Society,Mormonism,Neuroscience,Poetry Plays,Discipleship,Mixed Martial Arts,Short Story Collection,Walking,Science Fiction Romance,Young Adult Science Fiction,Rock N 
Roll,Mysticism,Psychoanalysis,Hard Science Fiction,Health Care,Urban,Academia,Dying Earth,Fostering,Anarchism,Satanism,Human Development,Design,Conservation,Sexuality,Film,Medieval Romance,Western Romance,Drawing,How To,Research,Cars And Motorcycles,Shonen,Maritime,Anthropomorphic,Military Science Fiction,Favorites,Cities,Urban Planning,Vegan,Cozy Mystery,Deception,Princesses,Technical,Virtual Reality,Prayer,Photography,Harlequin,Reverse Harem,Cycling,Russian History,Own,Superman,Wicca,Josei,The World,Native American History,Love Inspired,Love Inspired Historical,Literary Criticism,Journal,Brain,Lesbian Fiction,Military Romance,Sewing And Crafts,Cinderella,Prostitution,Divorce,Birds,Epic Poetry,Marathi,Swashbuckling,Transport,Government,New Adult Romance,Football,Counselling,Cthulhu Mythos,Mine,Dictionaries,Prehistory,Spanish Civil War,Wilderness,Number,International,Surreal,Us Presidents,Naval History,Light Novel,Terrorism,Seinen,Classical Studies,Futurism,Singularity,Quantum Mechanics,Fat Studies,Gothic Romance,Tasmania,Humanities,Recreation,Basketball,Female Authors,Marvel,Psychiatry,Sci Fi Fantasy,X Men,Microhistory,Elizabethan Period,Teachers,Climbing,Gay Fiction,Soccer,Paranormal Mystery,Class,Judaica,Zen,Oral History,Punk,Lesbian Romance,Holland,Splatterpunk,Interracial Romance,Urban Studies,Jazz,Paganism,Victor Frankenstein,Slice Of Life,Near Future,Chemistry,M M Fantasy,Nursery Rhymes,Trains,Puzzles,Hip Hop,Alternate Universe,Climate Change,Palaeontology,Social Media,Tea,Western Historical Romance,American Classics,Firefighters,Alexandria,Geology,Romanovs,Drinking,Polyamory,Bizarro Fiction,Climate Change Fiction,Disease,Post Colonial,Asexual,Wine,Baha I,Manhwa,Nerd,Soviet History,Russian Revolution,International Relations,Soldiers,Musicals,Labor,Doctor Who,Feminist Theory,Fire Services,Egyptology,Webcomic,Tv And Series,Paranormal Urban Fantasy,Slash Fiction,Yaoi,Roman Britain,Buffy The Vampire Slayer,Amish Fiction,Komik,Lenin,International 
Development,Angola,Pilots,Star Trek,Alchemy,Edwardian,Role Playing Games,Personal Growth,Mary Shelley,Weird West,Witchcraft,Libya,Planetary Romance,Shounen Ai,Alcohol,Mali,Rus,Spider Man,Moroccan,Erotic Horror,Vegetarian,Cryptozoology,Trivia,Victorian Romance,Harem,Ethnography,Cultural Studies,Frugal,Alternative Medicine,Reportage,Booze,Museums,Agriculture,Horticulture,Battle Of Gettysburg,Lie,Mistery,Stories,Sewing,Canon,M M Contemporary,Students,Stuart,M M Sports Romance,Star Trek The Next Generation,Academics,Green,Bicycles,Helicopters,Amateur Sleuth,M M Historical Romance,Nazi Party,Futuristic Romance,Maps And Cartography,Hqn,Graphic Novels Comics Manga,Mail Order Brides,Yuri,Nursing,Traditional Chinese Medicine,Georgian Romance,Viking Romance,Stand Up,Ornithology,Beer,Soviet Union,Civil War Eastern Theater,Latin American History,M M Paranormal,Manga Romance,Creation Science,Naval Historical Fiction,Star Trek Deep Space Nine,Silhouette,Gothic Horror,Gamebooks,Choose Your Own Adventure,Japanese History,World Of Darkness,Railways,Veganism And Vegetarianism,Mira,Wonder Woman,Herbs,Low Fantasy,Christian Contemporary Fiction,Battle Of Britain,Aircraft,Go,Civil War History,Racing,Led Zeppelin,Spanish History,World War II,19th Century,Asian countries,LGBT,"Gastronomy, Food and Nutrition",20th Century,Music and Musicians,Memoires and Biographies,Eastern Religions and Faith,LGTBI and Queer,Graphic Novel and Comics,BDSM,Art and Photography,18th Century,Guides and Travel,Social Justice and Activism,Business and Finance,Beauty and The Beast,Mythology and Fairy Tales,Programming and Computer Science,14th Century,Diary and Journal,15th Century,Unknown,16th Century,Sword and Sorcery,Dungeons and Dragons,17th Century,21st Century,13th Century,12th Century,Cars and Motorcycles,Bande Dessinée,Sewing and Crafts,Sao Tome and Principe,Food and Drink,History and Politics,Sword and Planet,2nd Grade,40k,1st Grade,TV and Series,NSFW,Mills and Boon,Maps and Cartography,Gender and 
Sexuality,11th Century,漫画,Veganism and Vegetarianism,10th Century
0,0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,1,1.0,1.0,,1.0,1.0,,1.0,,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,2,,,,1.0,1.0,,,,,,,1.0,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,3,,,,,1.0,,,1.0,,,,,1.0,1.0,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,4,1.0,1.0,,1.0,1.0,,,1.0,,,,,,,,,,,,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


(47855, 639)

In [148]:
gr_data['genres'][0]

"['Fantasy', 'Science Fiction', 'Dystopia', 'Young Adult', 'Fiction', 'Action', 'Adventure', 'Romance']"

In [149]:
gr_data['genres'][1]

"['Fantasy', 'Science Fiction', 'Magic', 'Young Adult', 'Children', 'Fiction', 'Audiobook', 'School', 'Adventure', 'Classics']"

##### 'Unnamed: 0'

In [150]:
# The 'Unnamed: 0' column read from the CSV carries each row's index in gr_data;
# give it an explicit name so it can be used to merge with gr_data later.
genres_df2 = genres_df2.rename({'Unnamed: 0': 'index_gr_data'}, axis='columns')

##### Columns with only '0' as values

In [151]:
# Title-cased genre labels whose columns will be removed from genres_df2
# (this section's columns holding only 0 values). One label per line, original order kept.
to_delete = [
    'World War Ii',
    '19Th Century',
    'Lgbt',
    '20Th Century',
    'Bdsm',
    '18Th Century',
    'Beauty And The Beast',
    '14Th Century',
    '15Th Century',
    '16Th Century',
    'Sword And Sorcery',
    'Dungeons And Dragons',
    '17Th Century',
    '21St Century',
    '13Th Century',
    '12Th Century',
    'Sao Tome And Principe',
    'Food And Drink',
    'History And Politics',
    'Sword And Planet',
    'Art And Photography',
    '2Nd Grade',
    '40K',
    '1St Grade',
    'Nsfw',
    'Mills And Boon',
    'Gender And Sexuality',
    '11Th Century',
    '10Th Century',
]

len(to_delete)

29

In [152]:
# Lower-case every name in 'to_delete' (the list is updated in place);
# the dataframe's column names are lower-cased in the next cell.
to_delete[:] = [name.lower() for name in to_delete]

#to_delete

In [153]:
# Lower-case all column labels in a single assignment. The previous version issued one
# `rename(..., inplace=True)` call per column (hundreds of full-frame renames) to reach
# the same labels.
genres_df2.columns = [col.lower() for col in genres_df2.columns]

genres_df2.columns

Index(['index_gr_data', 'fantasy', 'science fiction', 'dystopia',
       'young adult', 'fiction', 'action', 'adventure', 'romance', 'magic',
       ...
       '1st grade', 'tv and series', 'nsfw', 'mills and boon',
       'maps and cartography', 'gender and sexuality', '11th century', '漫画',
       'veganism and vegetarianism', '10th century'],
      dtype='object', length=639)

In [154]:
# Remove every column whose (lower-cased) name appears in to_delete
genres_df2 = genres_df2.drop(columns=to_delete)

In [155]:
genres_df2.shape

(47855, 610)

##### Difference in the number of rows between the original and new dataframes

In [156]:
print("There's a difference of", len(gr_data)-len(genres_df2), "rows between dataframes.")

There's a difference of 4623 rows between dataframes.


In [157]:
# Checking the rows of gr_data that have no counterpart in genres_df2
# (expected to be the books whose genres list is empty, i.e. [])

# True for gr_data rows whose index appears in genres_df2['index_gr_data']
has_genre_row = gr_data.index.isin(genres_df2['index_gr_data'])

# Keep only the rows that are missing from genres_df2
diff_rows = gr_data[~has_genre_row]

display(diff_rows.head(3), diff_rows.shape)


Unnamed: 0,title,series,author,rating,description,language,isbn,genres,characters,bookFormat,edition,pages,publisher,publishDate,firstPublishDate,awards,numRatings,ratingsByStars,likedPercent,setting,bbeScore,bbeVotes,price
1483,Beg For Mercy,Mercy #3,Lucian Bane (Goodreads Author),4.29,"The fight is on in this installment, Mercy is ...",English,10000000000000.0,[],[],Kindle Edition,,,,August 18th 2015,08/17/15,[],714,"['439', '130', '87', '27', '31']",92.0,[],3246,33,
1567,سیمای شکسته پدر سالار,,سید مرتضی مصطفوی (Goodreads Author),3.56,"رمان بلند ""سیمای شکسته پدر سالار"" که از تعلیق...",Persian,9786010000000.0,[],[],ebook,فارسی,367.0,نشر داستان,March 6th 2017,10/28/16,[],700,"['332', '99', '79', '6', '184']",73.0,[],2943,30,
2040,Life Song,,Christine M. Knight (Goodreads Author),4.18,Overview: Mavis was born to be a songbird. Her...,,9780990000000.0,[],[],Paperback,,338.0,Highlight Publishing,October 14th 2013,10-01-2013,[],74,"['44', '11', '11', '4', '4']",89.0,[],1983,20,18.8


(4623, 23)

In [158]:
diff_rows['genres'].value_counts()

[]    4623
Name: genres, dtype: int64

In [159]:
genres_df2['unknown'].value_counts(dropna=False)

1.0    47835
NaN       20
Name: unknown, dtype: int64

In [160]:
# Correcting the 'unknown' flag: every row currently in genres_df2 belongs to a book that
# has at least one genre (the genre-less books are the rows missing from this frame),
# so the flag is reset to 0.0 for all of them.
genres_df2 = genres_df2.assign(unknown=0.0)
genres_df2['unknown'].value_counts(dropna=False)

0.0    47855
Name: unknown, dtype: int64

In [161]:
index_num = diff_rows.index[0]
index_num

1483

In [162]:
diff_rows_indexes = diff_rows.index.tolist()
len(diff_rows_indexes)

4623

In [163]:
genres_df2.shape

(47855, 610)

###### Adding missing rows to genres_df2 (index and 'unknown' = 1)


In [164]:
# Disabled earlier attempt, kept for reference only: it writes each row at label index_num.
# NOTE(review): if that label already exists in genres_df2 this would overwrite a row
# instead of adding one - confirm, or delete this cell.
#for index_num in diff_rows_indexes:
#    genres_df2.loc[index_num] = 0
#    genres_df2.loc[index_num, 'index_gr_data'] = index_num

In [165]:
# Append one all-zero row per gr_data row that is missing from genres_df2,
# recording its gr_data index label and flagging it with 'unknown' = 1.0.
#
# The rows are built in one block and appended with a single concat: enlarging
# the frame row by row with .loc copies the whole 610-column frame on every
# iteration. Rows whose gr_data index is already present are skipped, so
# re-running this cell does not append duplicates.
already_present = set(genres_df2['index_gr_data'])
missing_indexes = [idx for idx in diff_rows_indexes if idx not in already_present]

if missing_indexes:
    # New rows continue the positional labelling, exactly as .loc[len(genres_df2)] did
    first_new_label = len(genres_df2)
    missing_rows = pd.DataFrame(
        0.0,
        index=range(first_new_label, first_new_label + len(missing_indexes)),
        columns=genres_df2.columns,
    )
    # Link each new row back to its row in gr_data
    missing_rows['index_gr_data'] = missing_indexes
    # These books have no genre at all, so they belong to the 'unknown' category
    missing_rows['unknown'] = 1.0
    genres_df2 = pd.concat([genres_df2, missing_rows])


In [169]:
# Checking that genres_df2 now has one row per gr_data row (52478 rows expected).
# The assertion makes the check fail loudly, e.g. if the append cell was run twice.
assert len(genres_df2) == len(gr_data), (
    f"genres_df2 has {len(genres_df2)} rows, expected {len(gr_data)}"
)
display(genres_df2.head(3), genres_df2.shape)

Unnamed: 0,index_gr_data,fantasy,science fiction,dystopia,young adult,fiction,action,adventure,romance,magic,children,audiobook,school,classics,historical fiction,novels,literature,historical,historical romance,adult,urban fantasy,paranormal,paranormal romance,vampires,holocaust,war,politics,christian fiction,christianity,epic fantasy,civil war,love,drama,coming of age,contemporary,comedy,humor,poetry,picture books,short stories,gothic,mystery,thriller,suspense,crime,mystery thriller,asian countries,asia,horror,european literature,european countries,plays,esoterica,philosophy,self help,inspirational,mental health,north american countries,angels,chick lit,animals,chapter books,magical realism,time travel,iberoamerican literature,fairy tales,greek mythology,mythology,dragons,epic,monsters,gastronomy,food and nutrition,feminism,unfinished,music and musicians,medieval,apocalyptic,detective,victorian,mental illness,psychology,family,african american literature,new york,religion,ireland,nonfiction,history,memoires and biographies,eastern religions and faith,africa,steampunk,economics,contemporary romance,womens,lgtbi and queer,young adult fantasy,travel,young adult contemporary,storytime,mathematics,counting,true crime,cats,westerns,superheroes,graphic novel and comics,world war i,theatre,australia,christmas,holiday,science,arthurian,banned books,pirates,erotica,prehistoric,witches,retellings,asian literature,tudor period,media tie in,dinosaurs,religion studies,werewolves,portugal,southern,southern gothic,journalism,race,speculative fiction,survival,college,tragedy,african countries,ancient history,abuse,guides and travel,the united states of america,reference,space,military fiction,anthologies,childrens classics,essays,cyberpunk,fae,african literature,legal thriller,physics,death,music,islam,ghosts,regency,germany,collections,judaism,true story,aliens,law,biology,evolution,anthropology,political science,futuristic,french revolution,alternate history,american 
history,christian romance,robots,ancient,dark,fairies,folklore,zombies,education,demons,mountaineering,sports,medical,medicine,theory,academic,unicorns,business,leadership,new age,personal development,horse racing,american civil war,espionage,social justice and activism,astronomy,american revolution,presidents,gender,greece,nobel prize,noir,native americans,writing,love story,sociology,business and finance,social science,health,disability,halloween,communication,relationships,aviation,romanticism,israel,european history,productivity,management,fighters,psychological thriller,mythology and fairy tales,outdoors,murder mystery,shapeshifters,marriage,architecture,animal fiction,m m romance,south american countries,fashion,programming and computer science,cults,weird fiction,lovecraftian,cultural,dark fantasy,north american literature,historical mystery,batman,americana,genetics,romantic suspense,emotion,womens fiction,new weird,hugo awards,diary and journal,buisness,sports romance,polygamy,entrepreneurship,money,personal finance,baseball,young adult paranormal,crafts,spy thriller,elves,plants,police,archaeology,gardening,historical fantasy,conspiracy theories,world history,medieval history,military history,ecology,sustainability,technology,gaming,utopia,linguistics,rabbits,manga,comic fantasy,ghost stories,amazon,poverty,parenting,hard boiled,aspergers,social,nordic noir,gender studies,wildlife,anime,shojo,counter culture,illness,time travel romance,young adult historical fiction,cartoon,artificial intelligence,american revolutionary war,heroic fantasy,forgotten realms,dragonlance,regency romance,amish,modern,geography,doctors,chess,martial arts,engineering,pop culture,pulp,wizards,adoption,hockey,teaching,boarding school,star wars,fitness,fantasy romance,natural history,fan fiction,mermaids,society,mormonism,neuroscience,poetry plays,discipleship,mixed martial arts,short story collection,walking,science fiction romance,young adult science fiction,rock n 
roll,mysticism,psychoanalysis,hard science fiction,health care,urban,academia,dying earth,fostering,anarchism,satanism,human development,design,conservation,sexuality,film,medieval romance,western romance,drawing,how to,research,cars and motorcycles,shonen,maritime,anthropomorphic,military science fiction,favorites,cities,urban planning,vegan,cozy mystery,deception,princesses,technical,virtual reality,prayer,photography,harlequin,reverse harem,cycling,russian history,own,superman,wicca,josei,the world,native american history,love inspired,love inspired historical,literary criticism,journal,brain,lesbian fiction,military romance,sewing and crafts,cinderella,prostitution,divorce,birds,epic poetry,marathi,swashbuckling,transport,government,new adult romance,football,counselling,cthulhu mythos,mine,dictionaries,prehistory,spanish civil war,wilderness,number,international,surreal,us presidents,naval history,light novel,terrorism,seinen,classical studies,futurism,singularity,quantum mechanics,fat studies,gothic romance,tasmania,humanities,recreation,basketball,female authors,marvel,psychiatry,sci fi fantasy,x men,microhistory,elizabethan period,teachers,climbing,gay fiction,soccer,paranormal mystery,class,judaica,zen,oral history,punk,lesbian romance,holland,splatterpunk,interracial romance,urban studies,jazz,paganism,victor frankenstein,slice of life,near future,chemistry,m m fantasy,nursery rhymes,trains,puzzles,hip hop,alternate universe,climate change,palaeontology,social media,tea,western historical romance,american classics,firefighters,alexandria,geology,romanovs,drinking,polyamory,bizarro fiction,climate change fiction,disease,post colonial,asexual,wine,baha i,manhwa,nerd,soviet history,russian revolution,international relations,soldiers,musicals,labor,doctor who,feminist theory,fire services,egyptology,webcomic,tv and series,paranormal urban fantasy,slash fiction,yaoi,roman britain,buffy the vampire slayer,amish fiction,komik,lenin,international 
development,angola,pilots,star trek,alchemy,edwardian,role playing games,personal growth,mary shelley,weird west,witchcraft,libya,planetary romance,shounen ai,alcohol,mali,rus,spider man,moroccan,erotic horror,vegetarian,cryptozoology,trivia,victorian romance,harem,ethnography,cultural studies,frugal,alternative medicine,reportage,booze,museums,agriculture,horticulture,battle of gettysburg,lie,mistery,stories,sewing,canon,m m contemporary,students,stuart,m m sports romance,star trek the next generation,academics,green,bicycles,helicopters,amateur sleuth,m m historical romance,nazi party,futuristic romance,maps and cartography,hqn,graphic novels comics manga,mail order brides,yuri,nursing,traditional chinese medicine,georgian romance,viking romance,stand up,ornithology,beer,soviet union,civil war eastern theater,latin american history,m m paranormal,manga romance,creation science,naval historical fiction,star trek deep space nine,silhouette,gothic horror,gamebooks,choose your own adventure,japanese history,world of darkness,railways,veganism and vegetarianism,mira,wonder woman,herbs,low fantasy,christian contemporary fiction,battle of britain,aircraft,go,civil war history,racing,led zeppelin,spanish history,asian countries.1,"gastronomy, food and nutrition",music and musicians.1,memoires and biographies.1,eastern religions and faith.1,lgtbi and queer.1,graphic novel and comics.1,guides and travel.1,social justice and activism.1,business and finance.1,mythology and fairy tales.1,programming and computer science.1,diary and journal.1,unknown,cars and motorcycles.1,bande dessinée,sewing and crafts.1,tv and series.1,maps and cartography.1,漫画,veganism and vegetarianism.1
0,0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,1,1.0,1.0,,1.0,1.0,,1.0,,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,2,,,,1.0,1.0,,,,,,,1.0,1.0,1.0,1.0,1.0,1.0,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


(52478, 610)

In [167]:
# Saving the genre dataframe (now covering every gr_data row) to csv.
# The index is written as well; it comes back as an 'Unnamed: 0' column on reload.
genres_df2.to_csv('genres_df_allrows.csv')

#### Dealing with NaN

In [177]:
# Reload the genre dataframe saved above
genres_df3 = pd.read_csv('genres_df_allrows.csv')

In [178]:
# Discard the index column that the csv round-trip brought back
genres_df3 = genres_df3.drop(columns=['Unnamed: 0'])

In [179]:
# Shape after reloading and dropping the saved index column
genres_df3.shape

(52478, 610)

In [180]:
# Total number of NaNs in the dataframe (must be 0 once the NaNs have been filled)
genres_df3.isna().sum().sum()

28618575

In [181]:
# Replace every NaN with 0.0
# NOTE(review): presumably NaN means "book does not have this genre" - confirm
genres_df3 = genres_df3.fillna(0.0)

In [182]:
# Re-count NaNs after filling
genres_df3.isna().sum().sum()

0

In [184]:
# Preview the first rows after the NaNs were filled
genres_df3.head()

Unnamed: 0,index_gr_data,fantasy,science fiction,dystopia,young adult,fiction,action,adventure,romance,magic,children,audiobook,school,classics,historical fiction,novels,literature,historical,historical romance,adult,urban fantasy,paranormal,paranormal romance,vampires,holocaust,war,politics,christian fiction,christianity,epic fantasy,civil war,love,drama,coming of age,contemporary,comedy,humor,poetry,picture books,short stories,gothic,mystery,thriller,suspense,crime,mystery thriller,asian countries,asia,horror,european literature,european countries,plays,esoterica,philosophy,self help,inspirational,mental health,north american countries,angels,chick lit,animals,chapter books,magical realism,time travel,iberoamerican literature,fairy tales,greek mythology,mythology,dragons,epic,monsters,gastronomy,food and nutrition,feminism,unfinished,music and musicians,medieval,apocalyptic,detective,victorian,mental illness,psychology,family,african american literature,new york,religion,ireland,nonfiction,history,memoires and biographies,eastern religions and faith,africa,steampunk,economics,contemporary romance,womens,lgtbi and queer,young adult fantasy,travel,young adult contemporary,storytime,mathematics,counting,true crime,cats,westerns,superheroes,graphic novel and comics,world war i,theatre,australia,christmas,holiday,science,arthurian,banned books,pirates,erotica,prehistoric,witches,retellings,asian literature,tudor period,media tie in,dinosaurs,religion studies,werewolves,portugal,southern,southern gothic,journalism,race,speculative fiction,survival,college,tragedy,african countries,ancient history,abuse,guides and travel,the united states of america,reference,space,military fiction,anthologies,childrens classics,essays,cyberpunk,fae,african literature,legal thriller,physics,death,music,islam,ghosts,regency,germany,collections,judaism,true story,aliens,law,biology,evolution,anthropology,political science,futuristic,french revolution,alternate history,american 
history,christian romance,robots,ancient,dark,fairies,folklore,zombies,education,demons,mountaineering,sports,medical,medicine,theory,academic,unicorns,business,leadership,new age,personal development,horse racing,american civil war,espionage,social justice and activism,astronomy,american revolution,presidents,gender,greece,nobel prize,noir,native americans,writing,love story,sociology,business and finance,social science,health,disability,halloween,communication,relationships,aviation,romanticism,israel,european history,productivity,management,fighters,psychological thriller,mythology and fairy tales,outdoors,murder mystery,shapeshifters,marriage,architecture,animal fiction,m m romance,south american countries,fashion,programming and computer science,cults,weird fiction,lovecraftian,cultural,dark fantasy,north american literature,historical mystery,batman,americana,genetics,romantic suspense,emotion,womens fiction,new weird,hugo awards,diary and journal,buisness,sports romance,polygamy,entrepreneurship,money,personal finance,baseball,young adult paranormal,crafts,spy thriller,elves,plants,police,archaeology,gardening,historical fantasy,conspiracy theories,world history,medieval history,military history,ecology,sustainability,technology,gaming,utopia,linguistics,rabbits,manga,comic fantasy,ghost stories,amazon,poverty,parenting,hard boiled,aspergers,social,nordic noir,gender studies,wildlife,anime,shojo,counter culture,illness,time travel romance,young adult historical fiction,cartoon,artificial intelligence,american revolutionary war,heroic fantasy,forgotten realms,dragonlance,regency romance,amish,modern,geography,doctors,chess,martial arts,engineering,pop culture,pulp,wizards,adoption,hockey,teaching,boarding school,star wars,fitness,fantasy romance,natural history,fan fiction,mermaids,society,mormonism,neuroscience,poetry plays,discipleship,mixed martial arts,short story collection,walking,science fiction romance,young adult science fiction,rock n 
roll,mysticism,psychoanalysis,hard science fiction,health care,urban,academia,dying earth,fostering,anarchism,satanism,human development,design,conservation,sexuality,film,medieval romance,western romance,drawing,how to,research,cars and motorcycles,shonen,maritime,anthropomorphic,military science fiction,favorites,cities,urban planning,vegan,cozy mystery,deception,princesses,technical,virtual reality,prayer,photography,harlequin,reverse harem,cycling,russian history,own,superman,wicca,josei,the world,native american history,love inspired,love inspired historical,literary criticism,journal,brain,lesbian fiction,military romance,sewing and crafts,cinderella,prostitution,divorce,birds,epic poetry,marathi,swashbuckling,transport,government,new adult romance,football,counselling,cthulhu mythos,mine,dictionaries,prehistory,spanish civil war,wilderness,number,international,surreal,us presidents,naval history,light novel,terrorism,seinen,classical studies,futurism,singularity,quantum mechanics,fat studies,gothic romance,tasmania,humanities,recreation,basketball,female authors,marvel,psychiatry,sci fi fantasy,x men,microhistory,elizabethan period,teachers,climbing,gay fiction,soccer,paranormal mystery,class,judaica,zen,oral history,punk,lesbian romance,holland,splatterpunk,interracial romance,urban studies,jazz,paganism,victor frankenstein,slice of life,near future,chemistry,m m fantasy,nursery rhymes,trains,puzzles,hip hop,alternate universe,climate change,palaeontology,social media,tea,western historical romance,american classics,firefighters,alexandria,geology,romanovs,drinking,polyamory,bizarro fiction,climate change fiction,disease,post colonial,asexual,wine,baha i,manhwa,nerd,soviet history,russian revolution,international relations,soldiers,musicals,labor,doctor who,feminist theory,fire services,egyptology,webcomic,tv and series,paranormal urban fantasy,slash fiction,yaoi,roman britain,buffy the vampire slayer,amish fiction,komik,lenin,international 
development,angola,pilots,star trek,alchemy,edwardian,role playing games,personal growth,mary shelley,weird west,witchcraft,libya,planetary romance,shounen ai,alcohol,mali,rus,spider man,moroccan,erotic horror,vegetarian,cryptozoology,trivia,victorian romance,harem,ethnography,cultural studies,frugal,alternative medicine,reportage,booze,museums,agriculture,horticulture,battle of gettysburg,lie,mistery,stories,sewing,canon,m m contemporary,students,stuart,m m sports romance,star trek the next generation,academics,green,bicycles,helicopters,amateur sleuth,m m historical romance,nazi party,futuristic romance,maps and cartography,hqn,graphic novels comics manga,mail order brides,yuri,nursing,traditional chinese medicine,georgian romance,viking romance,stand up,ornithology,beer,soviet union,civil war eastern theater,latin american history,m m paranormal,manga romance,creation science,naval historical fiction,star trek deep space nine,silhouette,gothic horror,gamebooks,choose your own adventure,japanese history,world of darkness,railways,veganism and vegetarianism,mira,wonder woman,herbs,low fantasy,christian contemporary fiction,battle of britain,aircraft,go,civil war history,racing,led zeppelin,spanish history,asian countries.1,"gastronomy, food and nutrition",music and musicians.1,memoires and biographies.1,eastern religions and faith.1,lgtbi and queer.1,graphic novel and comics.1,guides and travel.1,social justice and activism.1,business and finance.1,mythology and fairy tales.1,programming and computer science.1,diary and journal.1,unknown,cars and motorcycles.1,bande dessinée,sewing and crafts.1,tv and series.1,maps and cartography.1,漫画,veganism and vegetarianism.1
0,0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,
0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
1,1,1.0,1.0,0.0,1.0,1.0,0.0,1.0,0.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,
0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
2,2,0.0,0.0,0.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,
0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
3,3,0.0,0.0,0.0,0.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,
0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0
4,4,1.0,1.0,0.0,1.0,1.0,0.0,0.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1.0,1.0,1.0,1.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,
0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0


In [185]:
# Raw genres string of gr_data row 1 - presumably a manual spot-check against the encoded rows
gr_data['genres'][1]

"['Fantasy', 'Science Fiction', 'Magic', 'Young Adult', 'Children', 'Fiction', 'Audiobook', 'School', 'Adventure', 'Classics']"

In [186]:
# NOTE(review): repeats the previous cell verbatim - candidate for removal
gr_data['genres'][1]

"['Fantasy', 'Science Fiction', 'Magic', 'Young Adult', 'Children', 'Fiction', 'Audiobook', 'School', 'Adventure', 'Classics']"

In [187]:
# Final shape check before saving
genres_df3.shape

(52478, 610)

### Saving clean genre dataframe

In [188]:
# Write the cleaned genre dataframe to csv (the index is written too, as with the earlier save).
# NOTE(review): the column list still contains '.1'-suffixed names (e.g. 'asian countries.1')
# next to their unsuffixed counterparts - presumably duplicates; confirm whether they
# should be merged before this file is used downstream.
genres_df3.to_csv('genres_clean_dataset.csv')