# <font color='blue'>Análise de Dados com Linguagem Python</font>

## <font color='blue'>Projeto 7</font>
## <font color='blue'>Web Data Analytics - Limpeza e Formatação de Dados</font>

## Instalando e Carregando os Pacotes

In [1]:
# Report the Python version running this notebook
from platform import python_version
print('Versão da Linguagem Python Usada Neste Jupyter Notebook:', python_version())

Versão da Linguagem Python Usada Neste Jupyter Notebook: 3.9.7


In [3]:
# Imports
import re
import numpy as np
import pandas as pd
import warnings
warnings.filterwarnings('ignore')

## Carregando o Dataset

In [5]:
# Load the CSV file into the main DataFrame
df = pd.read_csv("dados/Processamento/animeInfoCombination.csv")

In [6]:
# Raise the number of columns pandas is allowed to display
pd.set_option("display.max_columns", 97)

In [7]:
# Preview the first rows of the loaded data
df.head()

Unnamed: 0,name,producers,ranking,votersCount,score,popularity,members,favorite,episodes,animeType,premiredDate,animeSource,genres,studios,licenses,rating,voiceActorNameandLanguage,staffNameandOccupation
0,Fullmetal Alchemist: Brotherhood,"['Aniplex', 'SquareEnix', 'MainichiBroadcastin...",1,1650275,9.15,3,2713695,191501,64.0,TV,Spring 2009,Manga,"['ActionAction', 'AdventureAdventure', 'Comedy...",Bones,"['Funimation', 'AniplexofAmerica']",R-17+,"[['Kugimiya,Rie', 'Japanese'], ['Ponticelli,Be...","[['Cook,Justin', 'Producer'], ['Yonai,Noritomo..."
1,Gintama°,"['TVTokyo', 'Aniplex', 'Dentsu']",2,173906,9.09,337,493336,13063,51.0,TV,Spring 2015,Manga,"['ActionAction', 'ComedyComedy', 'Sci-FiSci-Fi']",Bandai Namco Pictures,"['Funimation', 'Crunchyroll']",PG-13-Teens,"[['Kugimiya,Rie', 'Japanese'], ['Ishii,Kouji',...","[['Fujita,Youichi', 'Director,Storyboard,Plann..."
2,Shingeki no Kyojin Season 3 Part 2,"['ProductionI.G', 'Dentsu', 'MainichiBroadcast...",3,1127900,9.09,33,1635976,46238,10.0,TV,Spring 2019,Manga,"['ActionAction', 'DramaDrama', 'FantasyFantasy...",Wit Studio,['Funimation'],R-17+,"[['Ishikawa,Yui', 'Japanese'], ['Perino,Elena'...","[['Morishita,Katsuji', 'Producer,Planning'], [..."
3,Steins;Gate,"['FrontierWorks', 'MediaFactory', 'Movic', 'AT...",4,1128557,9.09,12,2117018,162324,24.0,TV,Spring 2011,Visual novel,"['DramaDrama', 'Sci-FiSci-Fi', 'SuspenseSuspen...",White Fox,['Funimation'],PG-13-Teens,"[['Seki,Tomokazu', 'Japanese'], ['Rinehart,Tys...","[['Iwasa,Gaku', 'Producer'], ['Yasuda,Takeshi'..."
4,Fruits Basket: The Final,"['TVTokyo', 'TVOsaka', 'NihonAdSystems', 'Haku...",5,124091,9.06,619,288314,13330,13.0,TV,Spring 2021,Manga,"['ComedyComedy', 'DramaDrama', 'RomanceRomance...",TMS Entertainment,['Funimation'],PG-13-Teens,"[['Iwami,Manaka', 'Japanese'], ['Ruis,Carolina...","[['Ibata,Yoshihide', 'Director'], ['Aketagawa,..."


## Funções de Limpeza e Formatação

In [8]:
# Inspect the producers column before it is cleaned
df["producers"]

0      ['Aniplex', 'SquareEnix', 'MainichiBroadcastin...
1                       ['TVTokyo', 'Aniplex', 'Dentsu']
2      ['ProductionI.G', 'Dentsu', 'MainichiBroadcast...
3      ['FrontierWorks', 'MediaFactory', 'Movic', 'AT...
4      ['TVTokyo', 'TVOsaka', 'NihonAdSystems', 'Haku...
                             ...                        
495                                              ['NHK']
496                                          ['TVAsahi']
497                                ['NHK', 'SogoVision']
498    ['TVTokyo', 'GeneonUniversalEntertainment', 'S...
499                             ['Nonefound', 'addsome']
Name: producers, Length: 500, dtype: object

In [9]:
def remove_quote(word):
    """Return `word` with every single-quote character removed.

    `word` only needs a ``replace(old, new)`` method; this notebook calls the
    helper with a Series ``.str`` accessor.
    """
    quote, nothing = "'", ""
    return word.replace(quote, nothing)

In [10]:
def remove_openBracket(word):
    """Return `word` with every "[" removed.

    `word` only needs a ``replace(old, new)`` method; this notebook calls the
    helper with a Series ``.str`` accessor.
    """
    open_bracket, nothing = "[", ""
    return word.replace(open_bracket, nothing)

In [11]:
def remove_closeBracket(word):
    """Return `word` with every "]" removed.

    `word` only needs a ``replace(old, new)`` method; this notebook calls the
    helper both with a Series ``.str`` accessor and with plain strings.
    """
    close_bracket, nothing = "]", ""
    return word.replace(close_bracket, nothing)

In [12]:
def remove_commaWithSemicolon(word):
    """Return `word` with every "," replaced by ";".

    `word` only needs a ``replace(old, new)`` method; this notebook calls the
    helper with a Series ``.str`` accessor.
    """
    comma, semicolon = ",", ";"
    return word.replace(comma, semicolon)

In [13]:
def remove_space(word):
    """Return `word` with every space character removed.

    `word` only needs a ``replace(old, new)`` method; this notebook calls the
    helper with a Series ``.str`` accessor.
    """
    space, nothing = " ", ""
    return word.replace(space, nothing)

## Limpeza e Formatação dos Dados

In [14]:
# Clean the producers column: strip quotes and brackets, turn commas into
# semicolons, then drop spaces. The helpers run in this exact order.
for clean_step in (
    remove_quote,
    remove_openBracket,
    remove_closeBracket,
    remove_commaWithSemicolon,
    remove_space,
):
    df["producers"] = clean_step(df["producers"].str)

In [15]:
# Spot-check the cleaned producers value at index label 0
df["producers"][0]

'Aniplex;SquareEnix;MainichiBroadcastingSystem;StudioMoriken'

In [16]:
# Inspect the genres column before it is cleaned
df["genres"]

0      ['ActionAction', 'AdventureAdventure', 'Comedy...
1       ['ActionAction', 'ComedyComedy', 'Sci-FiSci-Fi']
2      ['ActionAction', 'DramaDrama', 'FantasyFantasy...
3      ['DramaDrama', 'Sci-FiSci-Fi', 'SuspenseSuspen...
4      ['ComedyComedy', 'DramaDrama', 'RomanceRomance...
                             ...                        
495                   ['RomanceRomance', 'SportsSports']
496    ['ActionAction', 'AdventureAdventure', 'DramaD...
497    ['ActionAction', 'AdventureAdventure', 'Fantas...
498    ['ComedyComedy', 'RomanceRomance', 'Supernatur...
499    ['AdventureAdventure', 'ComedyComedy', 'Fantas...
Name: genres, Length: 500, dtype: object

In [17]:
# Clean the genres column: strip quotes and brackets, turn commas into
# semicolons, then drop spaces. The helpers run in this exact order.
for clean_step in (
    remove_quote,
    remove_openBracket,
    remove_closeBracket,
    remove_commaWithSemicolon,
    remove_space,
):
    df["genres"] = clean_step(df["genres"].str)

In [18]:
# Spot-check the cleaned genres value at index label 0
df["genres"][0]

'ActionAction;AdventureAdventure;ComedyComedy;DramaDrama;FantasyFantasy'

In [19]:
# Inspect the licenses column before it is cleaned
df["licenses"]

0                  ['Funimation', 'AniplexofAmerica']
1                       ['Funimation', 'Crunchyroll']
2                                      ['Funimation']
3                                      ['Funimation']
4                                      ['Funimation']
                            ...                      
495                                               NaN
496                                               NaN
497    ['MediaBlasters', 'DiscotekMedia', 'Tokyopop']
498                               ['SentaiFilmworks']
499                                 ['DiscotekMedia']
Name: licenses, Length: 500, dtype: object

In [20]:
# Clean the licenses column: strip quotes and brackets, turn commas into
# semicolons, then drop spaces. The helpers run in this exact order.
for clean_step in (
    remove_quote,
    remove_openBracket,
    remove_closeBracket,
    remove_commaWithSemicolon,
    remove_space,
):
    df["licenses"] = clean_step(df["licenses"].str)

In [21]:
# Spot-check the cleaned licenses value at index label 0
df["licenses"][0]

'Funimation;AniplexofAmerica'

In [22]:
# Preview the data after cleaning producers, genres and licenses
df.head()

Unnamed: 0,name,producers,ranking,votersCount,score,popularity,members,favorite,episodes,animeType,premiredDate,animeSource,genres,studios,licenses,rating,voiceActorNameandLanguage,staffNameandOccupation
0,Fullmetal Alchemist: Brotherhood,Aniplex;SquareEnix;MainichiBroadcastingSystem;...,1,1650275,9.15,3,2713695,191501,64.0,TV,Spring 2009,Manga,ActionAction;AdventureAdventure;ComedyComedy;D...,Bones,Funimation;AniplexofAmerica,R-17+,"[['Kugimiya,Rie', 'Japanese'], ['Ponticelli,Be...","[['Cook,Justin', 'Producer'], ['Yonai,Noritomo..."
1,Gintama°,TVTokyo;Aniplex;Dentsu,2,173906,9.09,337,493336,13063,51.0,TV,Spring 2015,Manga,ActionAction;ComedyComedy;Sci-FiSci-Fi,Bandai Namco Pictures,Funimation;Crunchyroll,PG-13-Teens,"[['Kugimiya,Rie', 'Japanese'], ['Ishii,Kouji',...","[['Fujita,Youichi', 'Director,Storyboard,Plann..."
2,Shingeki no Kyojin Season 3 Part 2,ProductionI.G;Dentsu;MainichiBroadcastingSyste...,3,1127900,9.09,33,1635976,46238,10.0,TV,Spring 2019,Manga,ActionAction;DramaDrama;FantasyFantasy;Mystery...,Wit Studio,Funimation,R-17+,"[['Ishikawa,Yui', 'Japanese'], ['Perino,Elena'...","[['Morishita,Katsuji', 'Producer,Planning'], [..."
3,Steins;Gate,FrontierWorks;MediaFactory;Movic;AT-X;Kadokawa...,4,1128557,9.09,12,2117018,162324,24.0,TV,Spring 2011,Visual novel,DramaDrama;Sci-FiSci-Fi;SuspenseSuspense,White Fox,Funimation,PG-13-Teens,"[['Seki,Tomokazu', 'Japanese'], ['Rinehart,Tys...","[['Iwasa,Gaku', 'Producer'], ['Yasuda,Takeshi'..."
4,Fruits Basket: The Final,TVTokyo;TVOsaka;NihonAdSystems;Hakusensha;Avex...,5,124091,9.06,619,288314,13330,13.0,TV,Spring 2021,Manga,ComedyComedy;DramaDrama;RomanceRomance;Sliceof...,TMS Entertainment,Funimation,PG-13-Teens,"[['Iwami,Manaka', 'Japanese'], ['Ruis,Carolina...","[['Ibata,Yoshihide', 'Director'], ['Aketagawa,..."


> Precisamos limpar um pouco mais a coluna genres (gêneros).

- Removeremos `[ '`  

- Removeremos todos os gêneros duplicados

- Atribuiremos o novo dataframe de gêneros ao dataframe original

In [23]:
# Build a one-column frame whose cells hold the list obtained by splitting
# each genres string on ";"
genre_lists = df["genres"].str.split(";")
newdf = genre_lists.to_frame()

In [24]:
# Preview the split genres
newdf.head()

Unnamed: 0,genres
0,"[ActionAction, AdventureAdventure, ComedyComed..."
1,"[ActionAction, ComedyComedy, Sci-FiSci-Fi]"
2,"[ActionAction, DramaDrama, FantasyFantasy, Mys..."
3,"[DramaDrama, Sci-FiSci-Fi, SuspenseSuspense]"
4,"[ComedyComedy, DramaDrama, RomanceRomance, Sli..."


In [25]:
# Collect every distinct raw genre label, in first-seen order, so that all of
# them can be replaced later
unique_values = []
for genre_list in newdf["genres"]:
    if type(genre_list) == float:
        # A float cell is a missing value (NaN), not a list of labels
        continue
    for label in genre_list:
        already_seen = label in unique_values
        if not already_seen:
            unique_values.append(label)

In [26]:
# All distinct raw genre labels
unique_values

['ActionAction',
 'AdventureAdventure',
 'ComedyComedy',
 'DramaDrama',
 'FantasyFantasy',
 'Sci-FiSci-Fi',
 'MysteryMystery',
 'SuspenseSuspense',
 'RomanceRomance',
 'SliceofLifeSliceofLife',
 'SupernaturalSupernatural',
 'SportsSports',
 'HorrorHorror',
 'EcchiEcchi',
 'AvantGardeAvantGarde',
 'BoysLoveBoysLove',
 'GourmetGourmet']

In [27]:
# Translate each doubled raw label (e.g. "ActionAction") into its clean name and
# glue the names of a row together. Every clean name carries exactly one
# uppercase letter, at its start ("Sci-fi", "Sliceoflife", "Avant_garde"),
# because the next cell separates the glued names with the regex '[A-Z][^A-Z]*'.
GENRE_NAMES = {
    "ActionAction": "Action",
    "AdventureAdventure": "Adventure",
    "ComedyComedy": "Comedy",
    "DramaDrama": "Drama",
    "FantasyFantasy": "Fantasy",
    "Sci-FiSci-Fi": "Sci-fi",
    "MysteryMystery": "Mystery",
    "SuspenseSuspense": "Suspense",
    "RomanceRomance": "Romance",
    "SliceofLifeSliceofLife": "Sliceoflife",
    "SupernaturalSupernatural": "Supernatural",
    "SportsSports": "Sports",
    "HorrorHorror": "Horror",
    "EcchiEcchi": "Ecchi",
    "AvantGardeAvantGarde": "Avant_garde",
    "BoysLoveBoysLove": "Boys_love",
    "GourmetGourmet": "Gourmet",
    "GirlsLoveGirlsLove": "Girls_love",
    "WorkLifeWorkLife": "Work_life",
}


def _concat_clean_genres(genres):
    """Return the clean genre names of one row glued together.

    A float cell (missing value) yields an empty string. Labels that have no
    entry in GENRE_NAMES contribute nothing to the result.
    """
    if type(genres) == float:
        return ""
    return "".join(GENRE_NAMES.get(genre, "") for genre in genres)


# Replace the whole column in one assignment. Writing cell by cell through
# newdf["genres"][index] = ... is chained assignment, which pandas warns about
# and which does not update the frame when Copy-on-Write is active.
newdf["genres"] = newdf["genres"].map(_concat_clean_genres)

In [28]:
def _split_on_capitals(genres):
    """Cut a glued genre string before each uppercase letter and join the pieces with ";".

    Float cells (missing values) are returned unchanged.
    """
    if type(genres) == float:
        return genres
    return ";".join(re.findall('[A-Z][^A-Z]*', genres))


# Replace the whole column in one assignment rather than cell by cell through
# newdf["genres"][index] = ..., which is chained assignment and does not update
# the frame when Copy-on-Write is active.
newdf["genres"] = newdf["genres"].map(_split_on_capitals)

In [29]:
# Preview the cleaned genres
newdf.head()

Unnamed: 0,genres
0,Action;Adventure;Comedy;Drama;Fantasy
1,Action;Comedy;Sci-fi
2,Action;Drama;Fantasy;Mystery
3,Drama;Sci-fi;Suspense
4,Comedy;Drama;Romance;Sliceoflife;Supernatural


In [30]:
# Overwrite the genres column of the main frame with the cleaned values
df["genres"] = newdf["genres"]

In [31]:
# Preview the main frame with the cleaned genres
df.head()

Unnamed: 0,name,producers,ranking,votersCount,score,popularity,members,favorite,episodes,animeType,premiredDate,animeSource,genres,studios,licenses,rating,voiceActorNameandLanguage,staffNameandOccupation
0,Fullmetal Alchemist: Brotherhood,Aniplex;SquareEnix;MainichiBroadcastingSystem;...,1,1650275,9.15,3,2713695,191501,64.0,TV,Spring 2009,Manga,Action;Adventure;Comedy;Drama;Fantasy,Bones,Funimation;AniplexofAmerica,R-17+,"[['Kugimiya,Rie', 'Japanese'], ['Ponticelli,Be...","[['Cook,Justin', 'Producer'], ['Yonai,Noritomo..."
1,Gintama°,TVTokyo;Aniplex;Dentsu,2,173906,9.09,337,493336,13063,51.0,TV,Spring 2015,Manga,Action;Comedy;Sci-fi,Bandai Namco Pictures,Funimation;Crunchyroll,PG-13-Teens,"[['Kugimiya,Rie', 'Japanese'], ['Ishii,Kouji',...","[['Fujita,Youichi', 'Director,Storyboard,Plann..."
2,Shingeki no Kyojin Season 3 Part 2,ProductionI.G;Dentsu;MainichiBroadcastingSyste...,3,1127900,9.09,33,1635976,46238,10.0,TV,Spring 2019,Manga,Action;Drama;Fantasy;Mystery,Wit Studio,Funimation,R-17+,"[['Ishikawa,Yui', 'Japanese'], ['Perino,Elena'...","[['Morishita,Katsuji', 'Producer,Planning'], [..."
3,Steins;Gate,FrontierWorks;MediaFactory;Movic;AT-X;Kadokawa...,4,1128557,9.09,12,2117018,162324,24.0,TV,Spring 2011,Visual novel,Drama;Sci-fi;Suspense,White Fox,Funimation,PG-13-Teens,"[['Seki,Tomokazu', 'Japanese'], ['Rinehart,Tys...","[['Iwasa,Gaku', 'Producer'], ['Yasuda,Takeshi'..."
4,Fruits Basket: The Final,TVTokyo;TVOsaka;NihonAdSystems;Hakusensha;Avex...,5,124091,9.06,619,288314,13330,13.0,TV,Spring 2021,Manga,Comedy;Drama;Romance;Sliceoflife;Supernatural,TMS Entertainment,Funimation,PG-13-Teens,"[['Iwami,Manaka', 'Japanese'], ['Ruis,Carolina...","[['Ibata,Yoshihide', 'Director'], ['Aketagawa,..."


> Agora limpamos e formatamos os dados de voiceActorNameandLanguage

- Removeremos `[ '` 

- Precisamos garantir que cada dublador fique na coluna do seu idioma (por exemplo, os dubladores japoneses na coluna `Japanese`)

- Precisamos mesclar as colunas de idioma dos dubladores ao dataframe original

In [32]:
# Work on a separate one-column frame for voiceActorNameandLanguage: the changes
# are made here first and merged into the original frame afterwards.
# The explicit .copy() guarantees that edits to newdf never reach df, whatever
# copy behaviour the DataFrame constructor has in the installed pandas version.
newdf = df[["voiceActorNameandLanguage"]].copy()

In [33]:
# Collapse every "[[" to "[" and every "]]" to "]" in voiceActorNameandLanguage.
# regex=False makes both patterns literal text. Missing values pass through
# untouched. The column is replaced in one assignment instead of cell by cell
# through newdf[col][index] = ..., which is chained assignment and does not
# update the frame when Copy-on-Write is active.
actor_text = newdf["voiceActorNameandLanguage"]
actor_text = actor_text.str.replace("[[", "[", regex=False)
actor_text = actor_text.str.replace("]]", "]", regex=False)
newdf["voiceActorNameandLanguage"] = actor_text

In [34]:
# Strip single quotes, then "[", from voiceActorNameandLanguage
for strip_step in (remove_quote, remove_openBracket):
    newdf["voiceActorNameandLanguage"] = strip_step(newdf["voiceActorNameandLanguage"].str)

In [35]:
def _parse_actor_entries(data):
    """Turn one cleaned voice-actor string into a list of [name, language] lists.

    "], " becomes ";", any remaining "]" is removed, the text is split on ";"
    into entries, and each entry is split on ", ". Float cells (missing values)
    are returned unchanged.
    """
    if type(data) == float:
        return data
    entries = remove_closeBracket(re.sub(r"], ", ";", data)).split(";")
    return [entry.split(", ") for entry in entries]


# Replace the whole column in one assignment rather than cell by cell through
# newdf[col][index] = ..., which is chained assignment and does not update the
# frame when Copy-on-Write is active.
newdf["voiceActorNameandLanguage"] = newdf["voiceActorNameandLanguage"].map(_parse_actor_entries)

In [36]:
# Collect the distinct languages found across all animes, in first-seen order;
# they become the column names later on
unique_languages = []
for row_entries in newdf["voiceActorNameandLanguage"]:
    for data in row_entries:
        # Entries without a second field carry no language
        if len(data) > 1 and data[1] not in unique_languages:
            unique_languages.append(data[1])

In [37]:
# Distinct languages
unique_languages

['Japanese',
 'Italian',
 'Portuguese(BR)',
 'German',
 'Hungarian',
 'English',
 'Korean',
 'Spanish',
 'French',
 'Mandarin',
 'Hebrew']

In [38]:
# One empty list per language; the dictionary is turned into a dataframe later
new_dic = {language: [] for language in unique_languages}

In [39]:
# Show the empty per-language dictionary
new_dic

{'Japanese': [],
 'Italian': [],
 'Portuguese(BR)': [],
 'German': [],
 'Hungarian': [],
 'English': [],
 'Korean': [],
 'Spanish': [],
 'French': [],
 'Mandarin': [],
 'Hebrew': []}

In [40]:
# Fill new_dic with one value per anime and per language: the actors of that
# language joined with ";", or NaN for every language when the row carries no
# (actor, language) pair at all.
for info in newdf["voiceActorNameandLanguage"]:
    # A row counts as populated when it has several entries or when its only
    # entry is a real [name, language] pair. Checking len(info) > 1 alone would
    # discard animes that list exactly one voice actor.
    has_actor_data = len(info) > 1 or any(len(entry) > 1 for entry in info)
    if not has_actor_data:
        for language in new_dic:
            new_dic[language].append(np.nan)
        continue

    # Languages come from the keys of new_dic, so no language is hard-coded here
    actors_by_language = {language: [] for language in new_dic}
    for entry in info:
        # Skip entries that lack a language field instead of raising IndexError
        if len(entry) > 1 and entry[1] in actors_by_language:
            actors_by_language[entry[1]].append(entry[0])

    # Languages with no actor in this row get an empty string
    for language, actors in actors_by_language.items():
        new_dic[language].append(";".join(actors))

In [41]:
# Convert the per-language dictionary into a dataframe
newestdf = pd.DataFrame(new_dic)

In [42]:
# Preview the per-language voice-actor columns
newestdf.head()

Unnamed: 0,Japanese,Italian,Portuguese(BR),German,Hungarian,English,Korean,Spanish,French,Mandarin,Hebrew
0,"Kugimiya,Rie;Park,Romi;Utsumi,Kenji;Utsumi,Ken...","Ponticelli,Benedetta;Novara,Renato;Scianca,Pat...","Andreatto,Rodrigo;Campos,Marcelo;Zink,Mariana;...","Gerick,Wanja;Turba,David;Häcke,Maximiliane;Mai...","Baráth,István;Szabó,Máté;Faragó,András;Varga,R...","Whitehead,Maxey;Truncale,Lily;Mignogna,Vic;Hof...","Yun,MiNa;O,InSeong;Yang,JeongHwa;Lee,JiYeong;H...","Torres,Jhonny;Vieira,JoseManuel;Perez,LuisMigu...","Pic,Audrey;Boudonnat,Lucille;Pestel,Arthur;Cre...",,
1,"Kugimiya,Rie;Ishii,Kouji;Sugita,Tomokazu;Tomat...",,,,,"Loewen,Jocelyne;Daingerfield,Michael;Pitre,Sab...",,,,,
2,"Ishikawa,Yui;Inoue,Marina;Kamiya,Hiroshi;Kaji,...","Perino,Elena;Bolognesi,Gaia;Raffaeli,Daniele;C...","Stefane,Mayara;Volpato,Pedro;Sangregório,Bruno...",,,"Nishimura,Trina;Grelle,Josh;Mercer,Matthew;Pap...",,,"Bienaimé,Nathalie;Niverd,Victor;Méyère,Bruno;G...",,
3,"Seki,Tomokazu;Imai,Asami;Miyano,Mamoru;Hanazaw...","Vivio,Paolo;Paolelli,Rachele;Chevalier,Davide;...","Casemiro,Bruno;Cunha,Maitê;Rinaldi,André;Lua,B...","Wirthgen,Jesco;Bäcker,Manuela;Gavrilis,Marios;...",,"Rinehart,Tyson;Nishimura,Trina;Tatum,JohnMicha...","Wu,JeongSin;Hong,SiHo;Yeo,MinJeong;Kim,SeoYeon...","Naro,Jordi","Pasquier,Laurent;Cornibert,Sarah;Wilhelm,Marc;...",,
4,"Iwami,Manaka;Uchida,Yuuma;Shimazaki,Nobunaga;S...",,"Ruis,Carolina;Campos,Fábio;Volpato,Pedro;Caval...",,,"Yeung,Suzie;Sabat,Christopher;Leigh,Cherami",,,,,


In [43]:
# Attach the per-language voice-actor columns to the main frame, matching rows
# on the index of both frames
df = pd.merge(df, newestdf, left_index=True, right_index=True, sort=False)

In [44]:
# Preview the main frame with the per-language columns added
df.head()

Unnamed: 0,name,producers,ranking,votersCount,score,popularity,members,favorite,episodes,animeType,premiredDate,animeSource,genres,studios,licenses,rating,voiceActorNameandLanguage,staffNameandOccupation,Japanese,Italian,Portuguese(BR),German,Hungarian,English,Korean,Spanish,French,Mandarin,Hebrew
0,Fullmetal Alchemist: Brotherhood,Aniplex;SquareEnix;MainichiBroadcastingSystem;...,1,1650275,9.15,3,2713695,191501,64.0,TV,Spring 2009,Manga,Action;Adventure;Comedy;Drama;Fantasy,Bones,Funimation;AniplexofAmerica,R-17+,"[['Kugimiya,Rie', 'Japanese'], ['Ponticelli,Be...","[['Cook,Justin', 'Producer'], ['Yonai,Noritomo...","Kugimiya,Rie;Park,Romi;Utsumi,Kenji;Utsumi,Ken...","Ponticelli,Benedetta;Novara,Renato;Scianca,Pat...","Andreatto,Rodrigo;Campos,Marcelo;Zink,Mariana;...","Gerick,Wanja;Turba,David;Häcke,Maximiliane;Mai...","Baráth,István;Szabó,Máté;Faragó,András;Varga,R...","Whitehead,Maxey;Truncale,Lily;Mignogna,Vic;Hof...","Yun,MiNa;O,InSeong;Yang,JeongHwa;Lee,JiYeong;H...","Torres,Jhonny;Vieira,JoseManuel;Perez,LuisMigu...","Pic,Audrey;Boudonnat,Lucille;Pestel,Arthur;Cre...",,
1,Gintama°,TVTokyo;Aniplex;Dentsu,2,173906,9.09,337,493336,13063,51.0,TV,Spring 2015,Manga,Action;Comedy;Sci-fi,Bandai Namco Pictures,Funimation;Crunchyroll,PG-13-Teens,"[['Kugimiya,Rie', 'Japanese'], ['Ishii,Kouji',...","[['Fujita,Youichi', 'Director,Storyboard,Plann...","Kugimiya,Rie;Ishii,Kouji;Sugita,Tomokazu;Tomat...",,,,,"Loewen,Jocelyne;Daingerfield,Michael;Pitre,Sab...",,,,,
2,Shingeki no Kyojin Season 3 Part 2,ProductionI.G;Dentsu;MainichiBroadcastingSyste...,3,1127900,9.09,33,1635976,46238,10.0,TV,Spring 2019,Manga,Action;Drama;Fantasy;Mystery,Wit Studio,Funimation,R-17+,"[['Ishikawa,Yui', 'Japanese'], ['Perino,Elena'...","[['Morishita,Katsuji', 'Producer,Planning'], [...","Ishikawa,Yui;Inoue,Marina;Kamiya,Hiroshi;Kaji,...","Perino,Elena;Bolognesi,Gaia;Raffaeli,Daniele;C...","Stefane,Mayara;Volpato,Pedro;Sangregório,Bruno...",,,"Nishimura,Trina;Grelle,Josh;Mercer,Matthew;Pap...",,,"Bienaimé,Nathalie;Niverd,Victor;Méyère,Bruno;G...",,
3,Steins;Gate,FrontierWorks;MediaFactory;Movic;AT-X;Kadokawa...,4,1128557,9.09,12,2117018,162324,24.0,TV,Spring 2011,Visual novel,Drama;Sci-fi;Suspense,White Fox,Funimation,PG-13-Teens,"[['Seki,Tomokazu', 'Japanese'], ['Rinehart,Tys...","[['Iwasa,Gaku', 'Producer'], ['Yasuda,Takeshi'...","Seki,Tomokazu;Imai,Asami;Miyano,Mamoru;Hanazaw...","Vivio,Paolo;Paolelli,Rachele;Chevalier,Davide;...","Casemiro,Bruno;Cunha,Maitê;Rinaldi,André;Lua,B...","Wirthgen,Jesco;Bäcker,Manuela;Gavrilis,Marios;...",,"Rinehart,Tyson;Nishimura,Trina;Tatum,JohnMicha...","Wu,JeongSin;Hong,SiHo;Yeo,MinJeong;Kim,SeoYeon...","Naro,Jordi","Pasquier,Laurent;Cornibert,Sarah;Wilhelm,Marc;...",,
4,Fruits Basket: The Final,TVTokyo;TVOsaka;NihonAdSystems;Hakusensha;Avex...,5,124091,9.06,619,288314,13330,13.0,TV,Spring 2021,Manga,Comedy;Drama;Romance;Sliceoflife;Supernatural,TMS Entertainment,Funimation,PG-13-Teens,"[['Iwami,Manaka', 'Japanese'], ['Ruis,Carolina...","[['Ibata,Yoshihide', 'Director'], ['Aketagawa,...","Iwami,Manaka;Uchida,Yuuma;Shimazaki,Nobunaga;S...",,"Ruis,Carolina;Campos,Fábio;Volpato,Pedro;Caval...",,,"Yeung,Suzie;Sabat,Christopher;Leigh,Cherami",,,,,


> Limpeza e formatação dos dados de staffNameandOccupation

- Removeremos `[ '` 

- Precisamos organizá-los com base em sua profissão

- Precisamos atribuir o novo dataframe staffNameandOccupation ao dataframe original

In [45]:
# Work on a separate one-column frame for staffNameandOccupation.
# The explicit .copy() guarantees that edits to staffNnO never reach df,
# whatever copy behaviour the DataFrame constructor has in the installed
# pandas version.
staffNnO = df[["staffNameandOccupation"]].copy()

In [46]:
# Clean the staff strings with literal (regex=False) replacements, applied in
# this exact order. Afterwards entries are separated by ";" and, inside an
# entry, the name is separated from its occupations by ", ".
# The column is replaced in one assignment instead of cell by cell through
# staffNnO[col][index] = ..., which is chained assignment and does not update
# the frame when Copy-on-Write is active.
staff_text = staffNnO["staffNameandOccupation"]
for old, new in (
    ("[[", "["),
    ("]]", "]"),
    ("['", ""),
    ("'", ""),
    ("], ", ";"),
    ("]", ""),
):
    staff_text = staff_text.str.replace(old, new, regex=False)
staffNnO["staffNameandOccupation"] = staff_text

In [47]:
def _split_staff_entries(staff_text):
    """Split one cleaned staff string on ";" into entries, and each entry on ", "."""
    return [entry.split(", ") for entry in staff_text.split(";")]


# Replace the whole column in one assignment rather than cell by cell through
# staffNnO[col][index] = ..., which is chained assignment and does not update
# the frame when Copy-on-Write is active.
staffNnO["staffNameandOccupation"] = staffNnO["staffNameandOccupation"].map(_split_staff_entries)

In [48]:
# Turn the occupations field of every staff entry (index 1) into a list by
# splitting it on ",". The nested lists are modified in place.
for staff_entries in staffNnO["staffNameandOccupation"]:
    for job in staff_entries:
        # Write back to index 1, the same field that is read here and by the
        # cells below (they iterate job[1]). The isinstance check skips fields
        # that are already lists, so running this cell twice does not fail.
        if len(job) > 1 and isinstance(job[1], str):
            job[1] = job[1].split(",")

In [49]:
# Show the parsed staff entries
staffNnO

Unnamed: 0,staffNameandOccupation
0,"[[Cook,Justin, [Producer]], [Yonai,Noritomo, [..."
1,"[[Fujita,Youichi, [Director, Storyboard, Plann..."
2,"[[Morishita,Katsuji, [Producer, Planning]], [N..."
3,"[[Iwasa,Gaku, [Producer]], [Yasuda,Takeshi, [P..."
4,"[[Ibata,Yoshihide, [Director]], [Aketagawa,Jin..."
...,...
495,"[[Murata,Masahiko, [Director]], [Takakuwa,Haji..."
496,"[[Katsumata,Tomoharu, [Director]], [Nishizawa,..."
497,"[[Kobayashi,Tsuneo, [Director]], [Kon,Chiaki, ..."
498,"[[Matsuda,Akio, [Producer]], [Osedo,Satoshi, [..."


In [50]:
# Collect the distinct occupations found across all animes, in first-seen order
unique_profes = []
for staff_entries in staffNnO["staffNameandOccupation"]:
    for job in staff_entries:
        if len(job) <= 1:
            # Entry has no occupations field
            continue
        for profes in job[1]:
            if profes not in unique_profes:
                unique_profes.append(profes)

In [51]:
# Distinct occupations
unique_profes

['Producer',
 'Director',
 'EpisodeDirector',
 'Storyboard',
 'SoundDirector',
 'KeyAnimation',
 '2ndKeyAnimation',
 'CharacterDesign',
 'Script',
 'SeriesComposition',
 'ThemeSongLyrics',
 'ThemeSongPerformance',
 'ThemeSongArrangement',
 'ThemeSongComposition',
 'AnimationDirector',
 'OriginalCreator',
 'ADRDirector',
 'ExecutiveProducer',
 'ChiefAnimationDirector',
 'DirectorofPhotography',
 'In-BetweenAnimation',
 'BackgroundArt',
 'Planning',
 'ColorDesign',
 'AssistantAnimationDirector',
 'Editing',
 'ArtDirector',
 'Music',
 'ProductionCoordination',
 'DigitalPaint',
 'ColorSetting',
 'AssistantDirector',
 'SoundEffects',
 'InsertedSongPerformance',
 'OriginalCharacterDesign',
 'Setting',
 'Screenplay',
 'AssociateProducer',
 'SpecialEffects',
 'AnimationCheck',
 'ProductionAssistant',
 'SoundSupervisor',
 'PrincipleDrawing',
 'AssistantProducer',
 'ProductionManager',
 'SoundManager',
 'Co-Director',
 'SeriesProductionDirector',
 'MechanicalDesign',
 'PlanningProducer',
 'Layou

In [52]:
# One empty list per occupation; the dictionary is turned into a dataframe later
profes_dic = {occupation: [] for occupation in unique_profes}

In [53]:
# Show the empty per-occupation dictionary
profes_dic

{'Producer': [],
 'Director': [],
 'EpisodeDirector': [],
 'Storyboard': [],
 'SoundDirector': [],
 'KeyAnimation': [],
 '2ndKeyAnimation': [],
 'CharacterDesign': [],
 'Script': [],
 'SeriesComposition': [],
 'ThemeSongLyrics': [],
 'ThemeSongPerformance': [],
 'ThemeSongArrangement': [],
 'ThemeSongComposition': [],
 'AnimationDirector': [],
 'OriginalCreator': [],
 'ADRDirector': [],
 'ExecutiveProducer': [],
 'ChiefAnimationDirector': [],
 'DirectorofPhotography': [],
 'In-BetweenAnimation': [],
 'BackgroundArt': [],
 'Planning': [],
 'ColorDesign': [],
 'AssistantAnimationDirector': [],
 'Editing': [],
 'ArtDirector': [],
 'Music': [],
 'ProductionCoordination': [],
 'DigitalPaint': [],
 'ColorSetting': [],
 'AssistantDirector': [],
 'SoundEffects': [],
 'InsertedSongPerformance': [],
 'OriginalCharacterDesign': [],
 'Setting': [],
 'Screenplay': [],
 'AssociateProducer': [],
 'SpecialEffects': [],
 'AnimationCheck': [],
 'ProductionAssistant': [],
 'SoundSupervisor': [],
 'Princi

In [54]:
# Gerando o dataframe
for i in range(len(staffNnO["staffNameandOccupation"])):
    Producer = []
    Director = []
    EpisodeDirector = []
    Storyboard = []
    SoundDirector = []
    KeyAnimation = []
    KeyAnimation2nd = []
    CharacterDesign = []
    Script = []
    SeriesComposition = []
    ThemeSongLyrics = []
    ThemeSongPerformance = []
    ThemeSongArrangement = []
    ThemeSongComposition = []
    AnimationDirector = []
    OriginalCreator = []
    ADRDirector = []
    ExecutiveProducer = []
    ChiefAnimationDirector = []
    DirectorofPhotography = []
    In_BetweenAnimation = []
    BackgroundArt = []
    Planning = []
    ColorDesign = []
    AssistantAnimationDirector = []
    Editing = []
    ArtDirector = []
    Music = []
    ProductionCoordination = []
    DigitalPaint = []
    ColorSetting = []
    AssistantDirector = []
    SoundEffects = []
    InsertedSongPerformance = []
    OriginalCharacterDesign = []
    Setting = []
    Screenplay = []
    AssociateProducer = []
    SpecialEffects = []
    AnimationCheck = []
    ProductionAssistant = []
    SoundSupervisor = []
    PrincipleDrawing = []
    AssistantProducer = []
    ProductionManager = []
    SoundManager = []
    Co_Director = []
    SeriesProductionDirector = []
    MechanicalDesign = []
    PlanningProducer = []
    Layout = []
    ChiefProducer = []
    Recording = []
    DialogueEditing = []
    RecordingEngineer = []
    Creator = []
    RecordingAssistant = []
    Publicity = []
    Co_Producer = []
    CastingDirector = []
    Re_RecordingMixing = []
    AssistantProductionCoordinat = []
    SettingManager = []
    
    # One entry per occupation label, pointing at the list that collects the staff
    # names for row i. Insertion order doubles as the order in which the columns
    # of profes_dic are filled further down.
    role_buckets = {
        "Producer": Producer,
        "Director": Director,
        "EpisodeDirector": EpisodeDirector,
        "Storyboard": Storyboard,
        "SoundDirector": SoundDirector,
        "KeyAnimation": KeyAnimation,
        "2ndKeyAnimation": KeyAnimation2nd,
        "CharacterDesign": CharacterDesign,
        "Script": Script,
        "SeriesComposition": SeriesComposition,
        "ThemeSongLyrics": ThemeSongLyrics,
        "ThemeSongPerformance": ThemeSongPerformance,
        "ThemeSongArrangement": ThemeSongArrangement,
        "ThemeSongComposition": ThemeSongComposition,
        "AnimationDirector": AnimationDirector,
        "OriginalCreator": OriginalCreator,
        "ADRDirector": ADRDirector,
        "ExecutiveProducer": ExecutiveProducer,
        "ChiefAnimationDirector": ChiefAnimationDirector,
        "DirectorofPhotography": DirectorofPhotography,
        "In-BetweenAnimation": In_BetweenAnimation,
        "BackgroundArt": BackgroundArt,
        "Planning": Planning,
        "ColorDesign": ColorDesign,
        "AssistantAnimationDirector": AssistantAnimationDirector,
        "Editing": Editing,
        "ArtDirector": ArtDirector,
        "Music": Music,
        "ProductionCoordination": ProductionCoordination,
        "DigitalPaint": DigitalPaint,
        "ColorSetting": ColorSetting,
        "AssistantDirector": AssistantDirector,
        "SoundEffects": SoundEffects,
        "InsertedSongPerformance": InsertedSongPerformance,
        "OriginalCharacterDesign": OriginalCharacterDesign,
        "Setting": Setting,
        "Screenplay": Screenplay,
        "AssociateProducer": AssociateProducer,
        "SpecialEffects": SpecialEffects,
        "AnimationCheck": AnimationCheck,
        "ProductionAssistant": ProductionAssistant,
        "SoundSupervisor": SoundSupervisor,
        "PrincipleDrawing": PrincipleDrawing,
        "AssistantProducer": AssistantProducer,
        "ProductionManager": ProductionManager,
        "SoundManager": SoundManager,
        "Co-Director": Co_Director,
        "SeriesProductionDirector": SeriesProductionDirector,
        "MechanicalDesign": MechanicalDesign,
        "PlanningProducer": PlanningProducer,
        "Layout": Layout,
        "ChiefProducer": ChiefProducer,
        "Recording": Recording,
        "DialogueEditing": DialogueEditing,
        "RecordingEngineer": RecordingEngineer,
        "Creator": Creator,
        "RecordingAssistant": RecordingAssistant,
        "Publicity": Publicity,
        "Co-Producer": Co_Producer,
        "CastingDirector": CastingDirector,
        "Re-RecordingMixing": Re_RecordingMixing,
        "AssistantProductionCoordinat": AssistantProductionCoordinat,
        "SettingManager": SettingManager,
    }

    # Route each staff entry (job[0] = name, job[1] = its occupation labels) into the
    # bucket of every occupation it lists. Entries with fewer than two elements and
    # labels that have no bucket are ignored.
    for job in staffNnO["staffNameandOccupation"][i]:
        if len(job) <= 1:
            continue
        for profes in job[1]:
            bucket = role_buckets.get(profes)
            if bucket is not None:
                bucket.append(job[0])

    # Append one ";"-joined cell per occupation to the dictionary (empty string when
    # nobody held that occupation in this row).
    for role_key, role_names in role_buckets.items():
        profes_dic[role_key].append(";".join(role_names))

In [55]:
# Size of unique_profes (presumably the distinct occupation labels gathered earlier;
# confirm where it is built). It should equal the number of keys filled in profes_dic.
len(unique_profes)

63

In [56]:
# Turn the dictionary into a dataframe: each key becomes a column and each list
# position becomes a row.
occupation = pd.DataFrame.from_dict(profes_dic, orient="columns")

In [57]:
# Preview the first 10 rows of the occupation table
occupation.head(10)

Unnamed: 0,Producer,Director,EpisodeDirector,Storyboard,SoundDirector,KeyAnimation,2ndKeyAnimation,CharacterDesign,Script,SeriesComposition,ThemeSongLyrics,ThemeSongPerformance,ThemeSongArrangement,ThemeSongComposition,AnimationDirector,OriginalCreator,ADRDirector,ExecutiveProducer,ChiefAnimationDirector,DirectorofPhotography,In-BetweenAnimation,BackgroundArt,Planning,ColorDesign,AssistantAnimationDirector,Editing,ArtDirector,Music,ProductionCoordination,DigitalPaint,ColorSetting,AssistantDirector,SoundEffects,InsertedSongPerformance,OriginalCharacterDesign,Setting,Screenplay,AssociateProducer,SpecialEffects,AnimationCheck,ProductionAssistant,SoundSupervisor,PrincipleDrawing,AssistantProducer,ProductionManager,SoundManager,Co-Director,SeriesProductionDirector,MechanicalDesign,PlanningProducer,Layout,ChiefProducer,Recording,DialogueEditing,RecordingEngineer,Creator,RecordingAssistant,Publicity,Co-Producer,CastingDirector,Re-RecordingMixing,AssistantProductionCoordinat,SettingManager
0,"Cook,Justin;Yonai,Noritomo","Irie,Yasuhiro","Irie,Yasuhiro;Ikehata,Hiroshi;Ikezoe,Takahiro;...","Irie,Yasuhiro;Ikezoe,Takahiro;Kinutani,Soushi;...","Mima,Masafumi","Ikezoe,Takahiro;Kinutani,Soushi;Morii,Kenshiro...","Ikezoe,Takahiro;Akasaka,Shunji;Kameda,Yoshimic...","Morii,Kenshirou;Kanno,Hiroki","Burgmeier,John;Minakami,Seishi;Oonogi,Hiroshi;...","Oonogi,Hiroshi",CHEMISTRY;NICOTouchestheWalls;SCANDAL;SID;Suki...,"CHEMISTRY;Fukuhara,Miho;[""LilB"";NICOTouchesthe...","Kameda,Seiji;NICOTouchestheWalls;SID;SukimaSwitch",NICOTouchestheWalls;SID;SukimaSwitch;Yui,"Aono,Atsushi;Iijima,Hiroya;Ishino,Satoshi;Koba...","Arakawa,Hiromu","Bezerra,Úrsula;Campos,Marcelo;Glass,Caitlin;Ka...","Fukunaga,Gen","Fukuoka,Hidenori;Kameda,Yoshimichi;Kaneda,Naomi","Furumoto,Mayuko","Kameda,Yoshimichi;Oosawa,Mina;Saitou,Kengo;Yok...","Kanehira,Kazushige;Nakajima,Mika;Ooizumi,Anna;...","Minami,Masahiko;Ueda,Masuo","Nakao,Fusako","Park,Seong-Hu;Yoshioka,Takeshi","Sadamatsu,Gou","Satou,Takeshi","Senju,Akira","Shinya,Une","Uemura,Takako",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,,"Fujita,Youichi;Miyawaki,Chizuru","Asami,Matsuo;Koshida,Tomoaki;Minami,Yasuhiro;M...","Fujita,Youichi;Miyawaki,Chizuru;Minami,Yasuhiro","Takamatsu,Shinji","Miyawaki,Chizuru;Abe,Miyuki;Hayashi,Kanako;Hay...","Hayashi,Kanako;Honjou,Keiichirou;Sasaki,Youhei","Takeuchi,Shinji","Kishimoto,Taku;Matsubara,Shuu;Mieno,Hitomi",,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks,AquaTimez;BLUEENCOUNT;CHiCO;DOES;HoneyWorks;Ne...,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks;Swimy,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks,"Honjou,Keiichirou;Ikeuchi,Naoko;Ishikawa,Marik...","Sorachi,Hideaki",,,,"Teramoto,Yuuki",,,"Fujita,Youichi","Utagawa,Ritsuko","Nakamura,Yumi","Seyama,Takeshi","Fukushima,Takayoshi;Maniwa,Nami",AudioHighs,,,"Utagawa,Ritsuko",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,"Morishita,Katsuji;Nakatake,Tetsuya;Wada,Jouji;...","Araki,Tetsurou;Koizuka,Masashi","Araki,Tetsurou;Itoga,Shintaro;Tanaka,Hiroyuki;...","Araki,Tetsurou;Akamatsu,Yasuhiro;Komatsuda,Dai...","Mima,Masafumi","Imai,Arifumi;Izawa,Tamami;Oota,Emi;Yamauchi,Ryou",,"Asano,Kyouji","Kobayashi,Yasuko;Seko,Hiroshi","Kobayashi,Yasuko",,CinemaStaff;LinkedHorizon,,,"Koizuka,Masashi;Chiba,Takaaki;Ebisu,Takuma;Has...","Isayama,Hajime","Sangregório,Bruno","Ishikawa,Mitsuhisa","Asano,Kyouji;Kadowaki,Satoshi","Yamada,Kazuhiro",,"Fujii,Kazushi","Morishita,Katsuji","Hashimoto,Satoshi",,"Hida,Aya","Yoshihara,Shunichirou","Sawano,Hiroyuki",,,,"Koizuka,Masashi;Tanaka,Hiroyuki","Kurahashi,Shizuo",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,"Iwasa,Gaku;Yasuda,Takeshi","Hamasaki,Hiroshi;Satou,Takuya","Hamasaki,Hiroshi;Satou,Takuya;Kobayashi,Kouji;...","Hamasaki,Hiroshi;Satou,Takuya;Kobayashi,Tomoki...","Fujiyama,Fusanobu","Hamasaki,Hiroshi;Aono,Atsushi;Arai,Nobuhiro;Hi...","Hamaguchi,Akira;Satou,Hiroaki","Sakai,Kyuuta","Hanada,Jukki;Nemoto,Toshizou;Tatum,JohnMichael...","Hanada,Jukki","Shikura,Chiyomaru","Itou,Kanako;Sakakibara,Yui",,"Shikura,Chiyomaru","Aono,Atsushi;Arai,Nobuhiro;Igari,Takashi;Ikega...","Shikura,Chiyomaru;5pb.;Nitroplus","Clinkenbeard,Colleen;Rinaldi,André","Fukunaga,Gen","Sakai,Kyuuta","Nakamura,Keisuke",,"Kanehira,Kazushige;Kouji,Etou;Maeda,Yuki;Nemot...","Yasuda,Takeshi;Shikura,Chiyomaru","Satou,Miyuki","Ikegami,Tarou;Nakamura,Kazuhisa;Sakai,Kyuuta;Y...",,"Kouji,Etou","Abo,Takeshi",,,,,,JunjounoAfilia,huke,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,,"Ibata,Yoshihide",,,"Aketagawa,Jin",,,"Shindou,Yuu",,"Kishimoto,Taku",,GENIC;WARPsUP,,,,"Takaya,Natsuki","Falcão,Jonas",,,"Cai,Bolun;Shitara,Nozomi",,"Fujii,Yuuta",,"Sugawara,Mika",,"Hida,Aya","Kamiyama,Youko","Yokoyama,Masaru",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5,,"Fujita,Youichi","Fujita,Youichi;Minami,Yasuhiro;Miyawaki,Chizur...","Fujita,Youichi;Minami,Yasuhiro;Miyawaki,Chizur...","Kobayashi,Katsuyoshi","Miyawaki,Chizuru;Abe,Shingo;Habe,Takashi;Haseg...","Miyawaki,Chizuru;Matsuyama,Kouji;Taniguchi,Yos...","Takeuchi,Shinji","Shimoyama,Kento;Yamatoya,Akatsuki;Yokote,Michiko","Yamatoya,Akatsuki",Prague;SPYAIR;ecosystem,FLiP;Prague;SPYAIR;ecosystem;serialTVdrama,Prague;SPYAIR;ecosystem,Prague;SPYAIR;ecosystem,"Hisayuki,Hirokazu;Honjou,Keiichirou;Ishikawa,M...","Sorachi,Hideaki",,,,,,"Kanai,Shingo",,"Utagawa,Ritsuko",,"Seyama,Takeshi",,AudioHighs,,,"Utagawa,Ritsuko",,"Mutou,Akiko","Anri;Arai,Masahito;DOES",,,,,,,,,,,,,,,,,,,,,,,,,,,,,
6,"Maruyama,Masao;Nakatani,Toshio","Koujina,Hiroshi","Aoki,Hiroyasu;Kawamura,Kenichi;Nakayama,Naomi;...","Aoki,Hiroyasu;Kawamura,Kenichi;Nakayama,Naomi;...","Yamada,Chiaki","Yoshida,Daisuke;Abe,Misao;Abiru,Takahiko;Chiba...","Hatta,Yousuke;Kato,Miho;Liang,Boya;Nagasaka,Ke...","Yoshimatsu,Takahiro","Hirano,Yasushi;Hirota,Mitsutaka;Kamio,Ryuu;Mae...","Kamio,Ryuu;Maekawa,Atsushi","Fear,andLoathinginLasVegas;Galneryus;Hyadain","Fear,andLoathinginLasVegas;Galneryus;Ono,Masat...","Fear,andLoathinginLasVegas;Galneryus;Hyadain","Fear,andLoathinginLasVegas;Galneryus;Hyadain","Ushijima,Shinichirou;Yoshida,Daisuke;Abiru,Tak...","Togashi,Yoshihiro","Laisné,Grégory;Méyère,Bruno;Oliver,Tony",,"Yoshida,Daisuke;Yoshimatsu,Takahiro","Arahata,Kazuya","Lee,Mi-Yeong","Ikeda,Yuuji",,"Horikawa,Yoshinori",,,"Ishiki,Mio","Hirano,Yoshihisa;Mozart,WolfgangAmadeus",,,,"Aoki,Hiroyasu;Ushijima,Shinichirou","Wada,Toshiya",,,"Ushijima,Shinichirou","Kamio,Ryuu;Maekawa,Atsushi",,,,,,,,,,,,,,,,,,,,,,,,,,
7,,"Ishiguro,Noboru","Ishiguro,Noboru;Asami,Takashi;Hata,Yoshito;Ima...","Ishiguro,Noboru;Asami,Takashi;Maejima,Kenichi;...","Aketagawa,Susumu","Imaizumi,Kenichi;Suzuki,Toshimasa;Aoki,Mariko;...",,"Kise,Kazuchika;Nakura,Yasuhiro;Onda,Naoyuki;Su...","Endo,Akinori;Shudou,Takeshi;Yanagawa,Shigeru",,LISA,"Konno,Hiromi;LISA;Ogura,Kei","Mori,Hideharu",,"Imaizumi,Kenichi;Maejima,Kenichi;Arai,Yutaka;K...","Tanaka,Yoshiki",,,"Motoki,Hisatoshi","Ishikawa,Kinichi;Okazaki,Hideo","Imaizumi,Kenichi;Ishii,Hisashi;Itou,Hideki","Kamikubo,Yoshihiro;Kaneko,Hidetoshi;Matsudaira...",,,"Maejima,Kenichi",,"Ikeda,Yuuji;Kaneko,Hidetoshi;Nagao,Hitoshi;Shi...","Bach,JohannSebastian;Brahms,Johannes;Bruckner,...",,,"Seki,Mieko",,"Kurahashi,Shizuo",,"Kogawa,Tomonori;Kawajiri,Yoshiaki;Motoki,Hisat...",,,"Anzai,Tetsuo","Maekawa,Takashi","Matsuoka,Hideaki","Ochi,Koujin",,,,,,,,,,,,,,,,,,,,,,
8,,"Fujita,Youichi","Fujita,Youichi;Miyawaki,Chizuru","Fujita,Youichi;Miyawaki,Chizuru",,"Inada,Toshiko;Murata,Noriyasu;Saitou,Kazuya;Sa...",,"Takeuchi,Shinji","Shimoyama,Kento;Yamatoya,Akatsuki;Yokote,Michiko","Yamatoya,Akatsuki",SPYAIR,"AMOYAMO;SPYAIR;Takahashi,Mikako",SPYAIR,SPYAIR,"Sasaki,Youhei;Suzuki,Hiromi","Sorachi,Hideaki",,,,,,"Nakajima,Yuichiro;Nuibe,Fumie",,"Utagawa,Ritsuko",,"Seyama,Takeshi",,AudioHighs,,,,,"Mutou,Akiko",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
9,,"Fujita,Youichi;Miyawaki,Chizuru",,,"Takamatsu,Shinji","Yoshida,Wakako",,"Takeuchi,Shinji",,"Miyawaki,Chizuru",,SPYAIR,,,,"Sorachi,Hideaki",,,"Takeuchi,Shinji",,,,,,,,,,,,,,,DOES,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


## Gerando o Dataframe Final

In [58]:
# Attach the occupation columns to the main frame, pairing rows by index label.
# Inner join: only labels present in both frames survive; join keys are not sorted.
df1 = pd.merge(
    df,
    occupation,
    how="inner",
    left_index=True,
    right_index=True,
    sort=False,
)

In [59]:
# Preview the merged frame
df1.head()

Unnamed: 0,name,producers,ranking,votersCount,score,popularity,members,favorite,episodes,animeType,premiredDate,animeSource,genres,studios,licenses,rating,voiceActorNameandLanguage,staffNameandOccupation,Japanese,Italian,Portuguese(BR),German,Hungarian,English,Korean,Spanish,French,Mandarin,Hebrew,Producer,Director,EpisodeDirector,Storyboard,SoundDirector,KeyAnimation,2ndKeyAnimation,CharacterDesign,Script,SeriesComposition,ThemeSongLyrics,ThemeSongPerformance,ThemeSongArrangement,ThemeSongComposition,AnimationDirector,OriginalCreator,ADRDirector,ExecutiveProducer,ChiefAnimationDirector,DirectorofPhotography,In-BetweenAnimation,BackgroundArt,Planning,ColorDesign,AssistantAnimationDirector,Editing,ArtDirector,Music,ProductionCoordination,DigitalPaint,ColorSetting,AssistantDirector,SoundEffects,InsertedSongPerformance,OriginalCharacterDesign,Setting,Screenplay,AssociateProducer,SpecialEffects,AnimationCheck,ProductionAssistant,SoundSupervisor,PrincipleDrawing,AssistantProducer,ProductionManager,SoundManager,Co-Director,SeriesProductionDirector,MechanicalDesign,PlanningProducer,Layout,ChiefProducer,Recording,DialogueEditing,RecordingEngineer,Creator,RecordingAssistant,Publicity,Co-Producer,CastingDirector,Re-RecordingMixing,AssistantProductionCoordinat,SettingManager
0,Fullmetal Alchemist: Brotherhood,Aniplex;SquareEnix;MainichiBroadcastingSystem;...,1,1650275,9.15,3,2713695,191501,64.0,TV,Spring 2009,Manga,Action;Adventure;Comedy;Drama;Fantasy,Bones,Funimation;AniplexofAmerica,R-17+,"[['Kugimiya,Rie', 'Japanese'], ['Ponticelli,Be...","[['Cook,Justin', 'Producer'], ['Yonai,Noritomo...","Kugimiya,Rie;Park,Romi;Utsumi,Kenji;Utsumi,Ken...","Ponticelli,Benedetta;Novara,Renato;Scianca,Pat...","Andreatto,Rodrigo;Campos,Marcelo;Zink,Mariana;...","Gerick,Wanja;Turba,David;Häcke,Maximiliane;Mai...","Baráth,István;Szabó,Máté;Faragó,András;Varga,R...","Whitehead,Maxey;Truncale,Lily;Mignogna,Vic;Hof...","Yun,MiNa;O,InSeong;Yang,JeongHwa;Lee,JiYeong;H...","Torres,Jhonny;Vieira,JoseManuel;Perez,LuisMigu...","Pic,Audrey;Boudonnat,Lucille;Pestel,Arthur;Cre...",,,"Cook,Justin;Yonai,Noritomo","Irie,Yasuhiro","Irie,Yasuhiro;Ikehata,Hiroshi;Ikezoe,Takahiro;...","Irie,Yasuhiro;Ikezoe,Takahiro;Kinutani,Soushi;...","Mima,Masafumi","Ikezoe,Takahiro;Kinutani,Soushi;Morii,Kenshiro...","Ikezoe,Takahiro;Akasaka,Shunji;Kameda,Yoshimic...","Morii,Kenshirou;Kanno,Hiroki","Burgmeier,John;Minakami,Seishi;Oonogi,Hiroshi;...","Oonogi,Hiroshi",CHEMISTRY;NICOTouchestheWalls;SCANDAL;SID;Suki...,"CHEMISTRY;Fukuhara,Miho;[""LilB"";NICOTouchesthe...","Kameda,Seiji;NICOTouchestheWalls;SID;SukimaSwitch",NICOTouchestheWalls;SID;SukimaSwitch;Yui,"Aono,Atsushi;Iijima,Hiroya;Ishino,Satoshi;Koba...","Arakawa,Hiromu","Bezerra,Úrsula;Campos,Marcelo;Glass,Caitlin;Ka...","Fukunaga,Gen","Fukuoka,Hidenori;Kameda,Yoshimichi;Kaneda,Naomi","Furumoto,Mayuko","Kameda,Yoshimichi;Oosawa,Mina;Saitou,Kengo;Yok...","Kanehira,Kazushige;Nakajima,Mika;Ooizumi,Anna;...","Minami,Masahiko;Ueda,Masuo","Nakao,Fusako","Park,Seong-Hu;Yoshioka,Takeshi","Sadamatsu,Gou","Satou,Takeshi","Senju,Akira","Shinya,Une","Uemura,Takako",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,Gintama°,TVTokyo;Aniplex;Dentsu,2,173906,9.09,337,493336,13063,51.0,TV,Spring 2015,Manga,Action;Comedy;Sci-fi,Bandai Namco Pictures,Funimation;Crunchyroll,PG-13-Teens,"[['Kugimiya,Rie', 'Japanese'], ['Ishii,Kouji',...","[['Fujita,Youichi', 'Director,Storyboard,Plann...","Kugimiya,Rie;Ishii,Kouji;Sugita,Tomokazu;Tomat...",,,,,"Loewen,Jocelyne;Daingerfield,Michael;Pitre,Sab...",,,,,,,"Fujita,Youichi;Miyawaki,Chizuru","Asami,Matsuo;Koshida,Tomoaki;Minami,Yasuhiro;M...","Fujita,Youichi;Miyawaki,Chizuru;Minami,Yasuhiro","Takamatsu,Shinji","Miyawaki,Chizuru;Abe,Miyuki;Hayashi,Kanako;Hay...","Hayashi,Kanako;Honjou,Keiichirou;Sasaki,Youhei","Takeuchi,Shinji","Kishimoto,Taku;Matsubara,Shuu;Mieno,Hitomi",,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks,AquaTimez;BLUEENCOUNT;CHiCO;DOES;HoneyWorks;Ne...,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks;Swimy,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks,"Honjou,Keiichirou;Ikeuchi,Naoko;Ishikawa,Marik...","Sorachi,Hideaki",,,,"Teramoto,Yuuki",,,"Fujita,Youichi","Utagawa,Ritsuko","Nakamura,Yumi","Seyama,Takeshi","Fukushima,Takayoshi;Maniwa,Nami",AudioHighs,,,"Utagawa,Ritsuko",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,Shingeki no Kyojin Season 3 Part 2,ProductionI.G;Dentsu;MainichiBroadcastingSyste...,3,1127900,9.09,33,1635976,46238,10.0,TV,Spring 2019,Manga,Action;Drama;Fantasy;Mystery,Wit Studio,Funimation,R-17+,"[['Ishikawa,Yui', 'Japanese'], ['Perino,Elena'...","[['Morishita,Katsuji', 'Producer,Planning'], [...","Ishikawa,Yui;Inoue,Marina;Kamiya,Hiroshi;Kaji,...","Perino,Elena;Bolognesi,Gaia;Raffaeli,Daniele;C...","Stefane,Mayara;Volpato,Pedro;Sangregório,Bruno...",,,"Nishimura,Trina;Grelle,Josh;Mercer,Matthew;Pap...",,,"Bienaimé,Nathalie;Niverd,Victor;Méyère,Bruno;G...",,,"Morishita,Katsuji;Nakatake,Tetsuya;Wada,Jouji;...","Araki,Tetsurou;Koizuka,Masashi","Araki,Tetsurou;Itoga,Shintaro;Tanaka,Hiroyuki;...","Araki,Tetsurou;Akamatsu,Yasuhiro;Komatsuda,Dai...","Mima,Masafumi","Imai,Arifumi;Izawa,Tamami;Oota,Emi;Yamauchi,Ryou",,"Asano,Kyouji","Kobayashi,Yasuko;Seko,Hiroshi","Kobayashi,Yasuko",,CinemaStaff;LinkedHorizon,,,"Koizuka,Masashi;Chiba,Takaaki;Ebisu,Takuma;Has...","Isayama,Hajime","Sangregório,Bruno","Ishikawa,Mitsuhisa","Asano,Kyouji;Kadowaki,Satoshi","Yamada,Kazuhiro",,"Fujii,Kazushi","Morishita,Katsuji","Hashimoto,Satoshi",,"Hida,Aya","Yoshihara,Shunichirou","Sawano,Hiroyuki",,,,"Koizuka,Masashi;Tanaka,Hiroyuki","Kurahashi,Shizuo",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,Steins;Gate,FrontierWorks;MediaFactory;Movic;AT-X;Kadokawa...,4,1128557,9.09,12,2117018,162324,24.0,TV,Spring 2011,Visual novel,Drama;Sci-fi;Suspense,White Fox,Funimation,PG-13-Teens,"[['Seki,Tomokazu', 'Japanese'], ['Rinehart,Tys...","[['Iwasa,Gaku', 'Producer'], ['Yasuda,Takeshi'...","Seki,Tomokazu;Imai,Asami;Miyano,Mamoru;Hanazaw...","Vivio,Paolo;Paolelli,Rachele;Chevalier,Davide;...","Casemiro,Bruno;Cunha,Maitê;Rinaldi,André;Lua,B...","Wirthgen,Jesco;Bäcker,Manuela;Gavrilis,Marios;...",,"Rinehart,Tyson;Nishimura,Trina;Tatum,JohnMicha...","Wu,JeongSin;Hong,SiHo;Yeo,MinJeong;Kim,SeoYeon...","Naro,Jordi","Pasquier,Laurent;Cornibert,Sarah;Wilhelm,Marc;...",,,"Iwasa,Gaku;Yasuda,Takeshi","Hamasaki,Hiroshi;Satou,Takuya","Hamasaki,Hiroshi;Satou,Takuya;Kobayashi,Kouji;...","Hamasaki,Hiroshi;Satou,Takuya;Kobayashi,Tomoki...","Fujiyama,Fusanobu","Hamasaki,Hiroshi;Aono,Atsushi;Arai,Nobuhiro;Hi...","Hamaguchi,Akira;Satou,Hiroaki","Sakai,Kyuuta","Hanada,Jukki;Nemoto,Toshizou;Tatum,JohnMichael...","Hanada,Jukki","Shikura,Chiyomaru","Itou,Kanako;Sakakibara,Yui",,"Shikura,Chiyomaru","Aono,Atsushi;Arai,Nobuhiro;Igari,Takashi;Ikega...","Shikura,Chiyomaru;5pb.;Nitroplus","Clinkenbeard,Colleen;Rinaldi,André","Fukunaga,Gen","Sakai,Kyuuta","Nakamura,Keisuke",,"Kanehira,Kazushige;Kouji,Etou;Maeda,Yuki;Nemot...","Yasuda,Takeshi;Shikura,Chiyomaru","Satou,Miyuki","Ikegami,Tarou;Nakamura,Kazuhisa;Sakai,Kyuuta;Y...",,"Kouji,Etou","Abo,Takeshi",,,,,,JunjounoAfilia,huke,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,Fruits Basket: The Final,TVTokyo;TVOsaka;NihonAdSystems;Hakusensha;Avex...,5,124091,9.06,619,288314,13330,13.0,TV,Spring 2021,Manga,Comedy;Drama;Romance;Sliceoflife;Supernatural,TMS Entertainment,Funimation,PG-13-Teens,"[['Iwami,Manaka', 'Japanese'], ['Ruis,Carolina...","[['Ibata,Yoshihide', 'Director'], ['Aketagawa,...","Iwami,Manaka;Uchida,Yuuma;Shimazaki,Nobunaga;S...",,"Ruis,Carolina;Campos,Fábio;Volpato,Pedro;Caval...",,,"Yeung,Suzie;Sabat,Christopher;Leigh,Cherami",,,,,,,"Ibata,Yoshihide",,,"Aketagawa,Jin",,,"Shindou,Yuu",,"Kishimoto,Taku",,GENIC;WARPsUP,,,,"Takaya,Natsuki","Falcão,Jonas",,,"Cai,Bolun;Shitara,Nozomi",,"Fujii,Yuuta",,"Sugawara,Mika",,"Hida,Aya","Kamiyama,Youko","Yokoyama,Masaru",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [60]:
# Drop the raw nested-list columns that no longer make sense to keep.
# The result is rebound instead of using inplace=True, and errors="ignore" skips
# columns that are already gone, so re-running this cell does not raise KeyError.
df1 = df1.drop(
    columns=['voiceActorNameandLanguage', 'staffNameandOccupation'],
    errors="ignore",
)

In [61]:
# Re-index the dataframe by "ranking".
# Once "ranking" has become the index it is no longer a column, and a second
# set_index("ranking") would raise KeyError; the guard keeps the cell re-runnable.
if "ranking" in df1.columns:
    df1 = df1.set_index("ranking")

In [62]:
# Preview the final frame after the column drop and the re-indexing by ranking
df1.head()

Unnamed: 0_level_0,name,producers,votersCount,score,popularity,members,favorite,episodes,animeType,premiredDate,animeSource,genres,studios,licenses,rating,Japanese,Italian,Portuguese(BR),German,Hungarian,English,Korean,Spanish,French,Mandarin,Hebrew,Producer,Director,EpisodeDirector,Storyboard,SoundDirector,KeyAnimation,2ndKeyAnimation,CharacterDesign,Script,SeriesComposition,ThemeSongLyrics,ThemeSongPerformance,ThemeSongArrangement,ThemeSongComposition,AnimationDirector,OriginalCreator,ADRDirector,ExecutiveProducer,ChiefAnimationDirector,DirectorofPhotography,In-BetweenAnimation,BackgroundArt,Planning,ColorDesign,AssistantAnimationDirector,Editing,ArtDirector,Music,ProductionCoordination,DigitalPaint,ColorSetting,AssistantDirector,SoundEffects,InsertedSongPerformance,OriginalCharacterDesign,Setting,Screenplay,AssociateProducer,SpecialEffects,AnimationCheck,ProductionAssistant,SoundSupervisor,PrincipleDrawing,AssistantProducer,ProductionManager,SoundManager,Co-Director,SeriesProductionDirector,MechanicalDesign,PlanningProducer,Layout,ChiefProducer,Recording,DialogueEditing,RecordingEngineer,Creator,RecordingAssistant,Publicity,Co-Producer,CastingDirector,Re-RecordingMixing,AssistantProductionCoordinat,SettingManager
ranking,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1,Unnamed: 23_level_1,Unnamed: 24_level_1,Unnamed: 25_level_1,Unnamed: 26_level_1,Unnamed: 27_level_1,Unnamed: 28_level_1,Unnamed: 29_level_1,Unnamed: 30_level_1,Unnamed: 31_level_1,Unnamed: 32_level_1,Unnamed: 33_level_1,Unnamed: 34_level_1,Unnamed: 35_level_1,Unnamed: 36_level_1,Unnamed: 37_level_1,Unnamed: 38_level_1,Unnamed: 39_level_1,Unnamed: 40_level_1,Unnamed: 41_level_1,Unnamed: 42_level_1,Unnamed: 43_level_1,Unnamed: 44_level_1,Unnamed: 45_level_1,Unnamed: 46_level_1,Unnamed: 47_level_1,Unnamed: 48_level_1,Unnamed: 49_level_1,Unnamed: 50_level_1,Unnamed: 51_level_1,Unnamed: 52_level_1,Unnamed: 53_level_1,Unnamed: 54_level_1,Unnamed: 55_level_1,Unnamed: 56_level_1,Unnamed: 57_level_1,Unnamed: 58_level_1,Unnamed: 59_level_1,Unnamed: 60_level_1,Unnamed: 61_level_1,Unnamed: 62_level_1,Unnamed: 63_level_1,Unnamed: 64_level_1,Unnamed: 65_level_1,Unnamed: 66_level_1,Unnamed: 67_level_1,Unnamed: 68_level_1,Unnamed: 69_level_1,Unnamed: 70_level_1,Unnamed: 71_level_1,Unnamed: 72_level_1,Unnamed: 73_level_1,Unnamed: 74_level_1,Unnamed: 75_level_1,Unnamed: 76_level_1,Unnamed: 77_level_1,Unnamed: 78_level_1,Unnamed: 79_level_1,Unnamed: 80_level_1,Unnamed: 81_level_1,Unnamed: 82_level_1,Unnamed: 83_level_1,Unnamed: 84_level_1,Unnamed: 85_level_1,Unnamed: 86_level_1,Unnamed: 87_level_1,Unnamed: 88_level_1,Unnamed: 89_level_1
1,Fullmetal Alchemist: Brotherhood,Aniplex;SquareEnix;MainichiBroadcastingSystem;...,1650275,9.15,3,2713695,191501,64.0,TV,Spring 2009,Manga,Action;Adventure;Comedy;Drama;Fantasy,Bones,Funimation;AniplexofAmerica,R-17+,"Kugimiya,Rie;Park,Romi;Utsumi,Kenji;Utsumi,Ken...","Ponticelli,Benedetta;Novara,Renato;Scianca,Pat...","Andreatto,Rodrigo;Campos,Marcelo;Zink,Mariana;...","Gerick,Wanja;Turba,David;Häcke,Maximiliane;Mai...","Baráth,István;Szabó,Máté;Faragó,András;Varga,R...","Whitehead,Maxey;Truncale,Lily;Mignogna,Vic;Hof...","Yun,MiNa;O,InSeong;Yang,JeongHwa;Lee,JiYeong;H...","Torres,Jhonny;Vieira,JoseManuel;Perez,LuisMigu...","Pic,Audrey;Boudonnat,Lucille;Pestel,Arthur;Cre...",,,"Cook,Justin;Yonai,Noritomo","Irie,Yasuhiro","Irie,Yasuhiro;Ikehata,Hiroshi;Ikezoe,Takahiro;...","Irie,Yasuhiro;Ikezoe,Takahiro;Kinutani,Soushi;...","Mima,Masafumi","Ikezoe,Takahiro;Kinutani,Soushi;Morii,Kenshiro...","Ikezoe,Takahiro;Akasaka,Shunji;Kameda,Yoshimic...","Morii,Kenshirou;Kanno,Hiroki","Burgmeier,John;Minakami,Seishi;Oonogi,Hiroshi;...","Oonogi,Hiroshi",CHEMISTRY;NICOTouchestheWalls;SCANDAL;SID;Suki...,"CHEMISTRY;Fukuhara,Miho;[""LilB"";NICOTouchesthe...","Kameda,Seiji;NICOTouchestheWalls;SID;SukimaSwitch",NICOTouchestheWalls;SID;SukimaSwitch;Yui,"Aono,Atsushi;Iijima,Hiroya;Ishino,Satoshi;Koba...","Arakawa,Hiromu","Bezerra,Úrsula;Campos,Marcelo;Glass,Caitlin;Ka...","Fukunaga,Gen","Fukuoka,Hidenori;Kameda,Yoshimichi;Kaneda,Naomi","Furumoto,Mayuko","Kameda,Yoshimichi;Oosawa,Mina;Saitou,Kengo;Yok...","Kanehira,Kazushige;Nakajima,Mika;Ooizumi,Anna;...","Minami,Masahiko;Ueda,Masuo","Nakao,Fusako","Park,Seong-Hu;Yoshioka,Takeshi","Sadamatsu,Gou","Satou,Takeshi","Senju,Akira","Shinya,Une","Uemura,Takako",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,Gintama°,TVTokyo;Aniplex;Dentsu,173906,9.09,337,493336,13063,51.0,TV,Spring 2015,Manga,Action;Comedy;Sci-fi,Bandai Namco Pictures,Funimation;Crunchyroll,PG-13-Teens,"Kugimiya,Rie;Ishii,Kouji;Sugita,Tomokazu;Tomat...",,,,,"Loewen,Jocelyne;Daingerfield,Michael;Pitre,Sab...",,,,,,,"Fujita,Youichi;Miyawaki,Chizuru","Asami,Matsuo;Koshida,Tomoaki;Minami,Yasuhiro;M...","Fujita,Youichi;Miyawaki,Chizuru;Minami,Yasuhiro","Takamatsu,Shinji","Miyawaki,Chizuru;Abe,Miyuki;Hayashi,Kanako;Hay...","Hayashi,Kanako;Honjou,Keiichirou;Sasaki,Youhei","Takeuchi,Shinji","Kishimoto,Taku;Matsubara,Shuu;Mieno,Hitomi",,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks,AquaTimez;BLUEENCOUNT;CHiCO;DOES;HoneyWorks;Ne...,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks;Swimy,AquaTimez;BLUEENCOUNT;DOES;HoneyWorks,"Honjou,Keiichirou;Ikeuchi,Naoko;Ishikawa,Marik...","Sorachi,Hideaki",,,,"Teramoto,Yuuki",,,"Fujita,Youichi","Utagawa,Ritsuko","Nakamura,Yumi","Seyama,Takeshi","Fukushima,Takayoshi;Maniwa,Nami",AudioHighs,,,"Utagawa,Ritsuko",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,Shingeki no Kyojin Season 3 Part 2,ProductionI.G;Dentsu;MainichiBroadcastingSyste...,1127900,9.09,33,1635976,46238,10.0,TV,Spring 2019,Manga,Action;Drama;Fantasy;Mystery,Wit Studio,Funimation,R-17+,"Ishikawa,Yui;Inoue,Marina;Kamiya,Hiroshi;Kaji,...","Perino,Elena;Bolognesi,Gaia;Raffaeli,Daniele;C...","Stefane,Mayara;Volpato,Pedro;Sangregório,Bruno...",,,"Nishimura,Trina;Grelle,Josh;Mercer,Matthew;Pap...",,,"Bienaimé,Nathalie;Niverd,Victor;Méyère,Bruno;G...",,,"Morishita,Katsuji;Nakatake,Tetsuya;Wada,Jouji;...","Araki,Tetsurou;Koizuka,Masashi","Araki,Tetsurou;Itoga,Shintaro;Tanaka,Hiroyuki;...","Araki,Tetsurou;Akamatsu,Yasuhiro;Komatsuda,Dai...","Mima,Masafumi","Imai,Arifumi;Izawa,Tamami;Oota,Emi;Yamauchi,Ryou",,"Asano,Kyouji","Kobayashi,Yasuko;Seko,Hiroshi","Kobayashi,Yasuko",,CinemaStaff;LinkedHorizon,,,"Koizuka,Masashi;Chiba,Takaaki;Ebisu,Takuma;Has...","Isayama,Hajime","Sangregório,Bruno","Ishikawa,Mitsuhisa","Asano,Kyouji;Kadowaki,Satoshi","Yamada,Kazuhiro",,"Fujii,Kazushi","Morishita,Katsuji","Hashimoto,Satoshi",,"Hida,Aya","Yoshihara,Shunichirou","Sawano,Hiroyuki",,,,"Koizuka,Masashi;Tanaka,Hiroyuki","Kurahashi,Shizuo",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,Steins;Gate,FrontierWorks;MediaFactory;Movic;AT-X;Kadokawa...,1128557,9.09,12,2117018,162324,24.0,TV,Spring 2011,Visual novel,Drama;Sci-fi;Suspense,White Fox,Funimation,PG-13-Teens,"Seki,Tomokazu;Imai,Asami;Miyano,Mamoru;Hanazaw...","Vivio,Paolo;Paolelli,Rachele;Chevalier,Davide;...","Casemiro,Bruno;Cunha,Maitê;Rinaldi,André;Lua,B...","Wirthgen,Jesco;Bäcker,Manuela;Gavrilis,Marios;...",,"Rinehart,Tyson;Nishimura,Trina;Tatum,JohnMicha...","Wu,JeongSin;Hong,SiHo;Yeo,MinJeong;Kim,SeoYeon...","Naro,Jordi","Pasquier,Laurent;Cornibert,Sarah;Wilhelm,Marc;...",,,"Iwasa,Gaku;Yasuda,Takeshi","Hamasaki,Hiroshi;Satou,Takuya","Hamasaki,Hiroshi;Satou,Takuya;Kobayashi,Kouji;...","Hamasaki,Hiroshi;Satou,Takuya;Kobayashi,Tomoki...","Fujiyama,Fusanobu","Hamasaki,Hiroshi;Aono,Atsushi;Arai,Nobuhiro;Hi...","Hamaguchi,Akira;Satou,Hiroaki","Sakai,Kyuuta","Hanada,Jukki;Nemoto,Toshizou;Tatum,JohnMichael...","Hanada,Jukki","Shikura,Chiyomaru","Itou,Kanako;Sakakibara,Yui",,"Shikura,Chiyomaru","Aono,Atsushi;Arai,Nobuhiro;Igari,Takashi;Ikega...","Shikura,Chiyomaru;5pb.;Nitroplus","Clinkenbeard,Colleen;Rinaldi,André","Fukunaga,Gen","Sakai,Kyuuta","Nakamura,Keisuke",,"Kanehira,Kazushige;Kouji,Etou;Maeda,Yuki;Nemot...","Yasuda,Takeshi;Shikura,Chiyomaru","Satou,Miyuki","Ikegami,Tarou;Nakamura,Kazuhisa;Sakai,Kyuuta;Y...",,"Kouji,Etou","Abo,Takeshi",,,,,,JunjounoAfilia,huke,,,,,,,,,,,,,,,,,,,,,,,,,,,,
5,Fruits Basket: The Final,TVTokyo;TVOsaka;NihonAdSystems;Hakusensha;Avex...,124091,9.06,619,288314,13330,13.0,TV,Spring 2021,Manga,Comedy;Drama;Romance;Sliceoflife;Supernatural,TMS Entertainment,Funimation,PG-13-Teens,"Iwami,Manaka;Uchida,Yuuma;Shimazaki,Nobunaga;S...",,"Ruis,Carolina;Campos,Fábio;Volpato,Pedro;Caval...",,,"Yeung,Suzie;Sabat,Christopher;Leigh,Cherami",,,,,,,"Ibata,Yoshihide",,,"Aketagawa,Jin",,,"Shindou,Yuu",,"Kishimoto,Taku",,GENIC;WARPsUP,,,,"Takaya,Natsuki","Falcão,Jonas",,,"Cai,Bolun;Shitara,Nozomi",,"Fujii,Yuuta",,"Sugawara,Mika",,"Hida,Aya","Kamiyama,Youko","Yokoyama,Masaru",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [63]:
# Persist the processed DataFrame to disk as a CSV file.
# pandas' default index=True applies here, so the row index is written as the first column.
df1.to_csv(path_or_buf="dados/Processamento/animeData.csv")

# Fim