<a href="https://colab.research.google.com/github/sheilta/orbitgeny/blob/main/Pandas_Library.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

# **Import library**

In [1]:
import pandas as pd
import numpy as np

## Manipulating Data with Series

In [2]:
s = pd.Series([3, -5, 7, 4], index=['a', 'b', 'c', 'd']) # membuat 1 kolom dengan berindex a, b, c, d
s

a    3
b   -5
c    7
d    4
dtype: int64

In [3]:
series = pd.Series([1, 0.5, 4, 5.5, 'lima']) # membuat 1 kolom yang berisi beberapa type data
series

0       1
1     0.5
2       4
3     5.5
4    lima
dtype: object

In [4]:
ss = pd.Series([1.4, 5.6, 3, 3, 6], [1, 2, -3, 4, 5])
ss

 1    1.4
 2    5.6
-3    3.0
 4    3.0
 5    6.0
dtype: float64

### Mengambil atau memilih kolom tertentu pada series

In [5]:
s

a    3
b   -5
c    7
d    4
dtype: int64

In [6]:
s[~(s < 1)] # mengambil nilai, dimana negasi dari s > 1 atau s bukan > 1

a    3
c    7
d    4
dtype: int64

In [7]:
s[(s < -1) | (s > 3)] # mengambil nilai, dimana s < -1 atau s > 3

b   -5
c    7
d    4
dtype: int64

In [8]:
s['a'] = 6 # merubah nilai pada label a
s

a    6
b   -5
c    7
d    4
dtype: int64

In [9]:
s.drop(['a', 'c']) # menghapus label a dan c

b   -5
d    4
dtype: int64

In [10]:
s['b'] # memilih var s index b

-5

## Manipulating Data with Data Frame

### Membuat dataframe dari suatu series

In [11]:
df1 = pd.DataFrame(ss)
df1

Unnamed: 0,0
1,1.4
2,5.6
-3,3.0
4,3.0
5,6.0


### Membuat dataframe dengan key dan value

In [12]:
data = {'Country': ['Belgium', 'India', 'Brazil'], 'Capital': ['Brussels', 'New Delhi', 'Brasília'], 'Population': [11190846, 1303171035, 207847528]}
df = pd.DataFrame(data, columns=['Country', 'Capital', 'Population'])
df

Unnamed: 0,Country,Capital,Population
0,Belgium,Brussels,11190846
1,India,New Delhi,1303171035
2,Brazil,Brasília,207847528


### Selection

In [13]:
df[1:] # memilih kolom 1 sampai terakhir

Unnamed: 0,Country,Capital,Population
1,India,New Delhi,1303171035
2,Brazil,Brasília,207847528


In [14]:
df.iloc[[0],[0]] # memilih kolom index 0 dan kolom 0

Unnamed: 0,Country
0,Belgium


In [15]:
df.iloc[1:,[0]] # memilih kolom 1 sampai terakhir, dan baris index ke-0

Unnamed: 0,Country
1,India
2,Brazil


In [16]:
df.iat[0,0] # memilih baris index 0 dan kolom 0

'Belgium'

In [17]:
df.iat[1,0] # memilih baris index 1 dan kolom 0

'India'

In [18]:
df.loc[[0], ['Country']] # memilih baris index ke-0 pada kolom Country

Unnamed: 0,Country
0,Belgium


In [19]:
df.loc[:,['Capital']] # memilih baris semua index pada kolom Capital

Unnamed: 0,Capital
0,Brussels
1,New Delhi
2,Brasília


In [20]:
df.at[0,'Country'] # sama halnya dengan .loc tetapi bedanya 0 merupakan nilai skalar, jadi pengambilan nilai hanya satu

'Belgium'

In [21]:
df.at[1,'Capital']

'New Delhi'

In [22]:
df[df['Population'] > 1200000000] # memilih baris (atau kolom) dengan populasi >  1,2 M

Unnamed: 0,Country,Capital,Population
1,India,New Delhi,1303171035


In [23]:
# df.ix[1,'Capital']
df.loc[1,'Capital']

'New Delhi'

In [24]:
print(pd.__version__)

1.1.5


Atribut dan Method Data Frame lainnya

In [25]:
df

Unnamed: 0,Country,Capital,Population
0,Belgium,Brussels,11190846
1,India,New Delhi,1303171035
2,Brazil,Brasília,207847528


In [26]:
df.drop('Country', axis=1) # menghapus kolom Country

Unnamed: 0,Capital,Population
0,Brussels,11190846
1,New Delhi,1303171035
2,Brasília,207847528


In [27]:
df.drop([1], axis=0) # menghapus baris di index ke-1

Unnamed: 0,Country,Capital,Population
0,Belgium,Brussels,11190846
2,Brazil,Brasília,207847528


In [28]:
df.sort_index() # mengurutkan berdasarkan index

Unnamed: 0,Country,Capital,Population
0,Belgium,Brussels,11190846
1,India,New Delhi,1303171035
2,Brazil,Brasília,207847528


In [29]:
df.rank() # menentukan peringkat

Unnamed: 0,Country,Capital,Population
0,1.0,2.0,1.0
1,3.0,3.0,3.0
2,2.0,1.0,2.0


In [30]:
df.sort_values(by='Capital') # mengurutkan kolom Capital berdasarkan abjad

Unnamed: 0,Country,Capital,Population
2,Brazil,Brasília,207847528
0,Belgium,Brussels,11190846
1,India,New Delhi,1303171035


In [31]:
df.shape # untuk mengetahui jumlah baris dan kolom

(3, 3)

In [32]:
df.index # untuk mengetahui index

RangeIndex(start=0, stop=3, step=1)

In [33]:
df.columns # untuk mengetahui nilai kolom

Index(['Country', 'Capital', 'Population'], dtype='object')

In [34]:
df.info() # untuk mengetahui info 

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 3 entries, 0 to 2
Data columns (total 3 columns):
 #   Column      Non-Null Count  Dtype 
---  ------      --------------  ----- 
 0   Country     3 non-null      object
 1   Capital     3 non-null      object
 2   Population  3 non-null      int64 
dtypes: int64(1), object(2)
memory usage: 200.0+ bytes


In [35]:
df.count() # menghitung jumlah elemen bukan NA / None

Country       3
Capital       3
Population    3
dtype: int64

In [36]:
df.sum() # menentukan jumlah

Country              BelgiumIndiaBrazil
Capital       BrusselsNew DelhiBrasília
Population                   1522209409
dtype: object

In [37]:
df.cumsum() # menentukan jumlah komulatif berdasarkan grup

Unnamed: 0,Country,Capital,Population
0,Belgium,Brussels,11190846
1,BelgiumIndia,BrusselsNew Delhi,1314361881
2,BelgiumIndiaBrazil,BrusselsNew DelhiBrasília,1522209409


In [38]:
df.min() # menentukan nilai minimum

Country        Belgium
Capital       Brasília
Population    11190846
dtype: object

In [39]:
df.max() # menentukan nilai maximum

Country            India
Capital        New Delhi
Population    1303171035
dtype: object

In [40]:
df.describe() # menampilkan statistik data

Unnamed: 0,Population
count,3.0
mean,507403100.0
std,696134600.0
min,11190850.0
25%,109519200.0
50%,207847500.0
75%,755509300.0
max,1303171000.0


In [41]:
df.mean() # menentukan rata-rata

Population    5.074031e+08
dtype: float64

In [42]:
df.median() # menentukan nilai tengah

Population    207847528.0
dtype: float64

### Mengimport Data ke Data Frame

In [43]:
#Contoh mengimport dari web
url = 'https://people.sc.fsu.edu/~jburkardt/data/csv/freshman_kgs.csv'
df2 = pd.read_csv(url)
df2

Unnamed: 0,Sex,"""Weight (Sep)""","""Weight (Apr)""","""BMI (Sep)""","""BMI (Apr)"""
0,M,72,59,22.02,18.14
1,M,97,86,19.70,17.44
2,M,74,69,24.09,22.43
3,M,93,88,26.97,25.57
4,F,68,64,21.51,20.10
...,...,...,...,...,...
62,M,65,71,22.51,24.45
63,M,75,82,23.69,25.80
64,F,42,49,15.08,17.74
65,M,74,82,22.64,25.33


In [45]:
disney = '/content/walt-disne-movies.csv'
data = pd.read_csv(disney, sep=";")
data
# Sumber data: Kaggle

Unnamed: 0.1,Unnamed: 0,title,Production company,Country,Language,Running time,Budget,Box office,Release date,imdb,metascore,rotten_tomatoes,Directed by,Produced by,Based on,Starring,Music by,Distributed by,Cinematography,Edited by,Screenplay by
0,0,Academy Award Review of,Walt Disney Productions,United States,English,41.0,,4.547200e+01,19/05/1937,7.2,,,,,,,,,,,
1,1,Snow White and the Seven Dwarfs,Walt Disney Productions,United States,English,83.0,1490000.0,4.180000e+08,21/12/1937,7.6,95.0,,"['David Hand (supervising)', 'William Cottrell...",Walt Disney,"['Snow White', 'by The', 'Brothers Grimm']","['Adriana Caselotti', 'Lucille La Verne', 'Har...","['Frank Churchill', 'Paul Smith', 'Leigh Harli...",RKO Radio Pictures,,,
2,2,Pinocchio,Walt Disney Productions,United States,English,88.0,2600000.0,1.640000e+08,07/02/1940,7.4,99.0,73%,"['Ben Sharpsteen', 'Hamilton Luske', 'Bill Rob...",Walt Disney,"['The Adventures of Pinocchio', 'by', 'Carlo C...","['Cliff Edwards', 'Dickie Jones', 'Christian R...","['Leigh Harline', 'Paul J. Smith']",RKO Radio Pictures,,,
3,3,Fantasia,Walt Disney Productions,United States,English,126.0,2280000.0,8.330000e+07,13/11/1940,7.7,96.0,95%,"['Samuel Armstrong', 'James Algar', 'Bill Robe...","['Walt Disney', 'Ben Sharpsteen']",,"['Leopold Stokowski', 'Deems Taylor']",See program,RKO Radio Pictures,James Wong Howe,,
4,4,The Reluctant Dragon,Walt Disney Productions,United States,English,74.0,600000.0,9.600000e+05,20/06/1941,6.9,,68%,"['Alfred Werker', '(live action)', 'Hamilton L...",Walt Disney,,"['Robert Benchley', 'Frances Gifford', 'Buddy ...","['Frank Churchill', 'Larry Morey']",RKO Radio Pictures,Bert Giennon,Paul Weatherwax,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
439,439,The Little Mermaid,"['Walt Disney Pictures', 'Lucamar Productions'...",United States,English,,,,,7.6,88.0,93%,Rob Marshall,"['Rob Marshall', 'John DeLuca', 'Marc Platt', ...","['Disney', ""'s"", 'The Little Mermaid', 'by', '...","['Halle Bailey', 'Jonah Hauer-King', 'Daveed D...","['Alan Menken (score and songs)', 'Howard Ashm...","['Walt Disney Studios', 'Motion Pictures']",Dion Beebe,Wyatt Smith,"['Jane Goldman', 'David Magee']"
440,440,Peter Pan & Wendy,"['Walt Disney Pictures', 'Whitaker Entertainme...",United States,English,,,,,,,,David Lowery,"['Jim Whitaker', 'Joe Roth']","[""Disney 's Peter Pan"", 'Peter and Wendy by J....","['Alexander Molony', 'Ever Anderson', 'Jude La...",,Walt Disney Studios Motion Pictures,Bojan Bazelli,,"['David Lowery', 'Toby Halbrooks']"
441,441,Home Alone,"['20th Century Studios', 'Hutch Parker Enterta...",United States,English,,,,,7.6,63.0,66%,Dan Mazer,"['Hutch Parker', 'Dan Wilson']","['Home Alone', 'by', 'John Hughes']","['Archie Yates', 'Rob Delaney', 'Ellie Kemper'...",John Debney,Disney+,Mitchell Amundsen,,"['Mikey Day', 'Streeter Seidell']"
442,442,Shrunk,"['Walt Disney Pictures', 'Mandeville Films']",United States,English,,,,,,,,Joe Johnston,"['David Hoberman', 'Todd Lieberman']","['Characters', 'by', 'Stuart Gordon', ',', 'Br...","['Josh Gad', 'Rick Moranis']",,"['Walt Disney Studios', 'Motion Pictures']",,,Todd Rosenberg


In [46]:
data.head() 
# Fungsi head() digunakan untuk mendapatkan n baris pertama. Ini berguna untuk menguji dengan cepat apakah objek Anda- 
# memiliki tipe data yang tepat di dalamnya. Untuk nilai negatif n , fungsi head() mengembalikan semua baris kecuali 
# n baris terakhir, setara dengan df[:-n].

Unnamed: 0.1,Unnamed: 0,title,Production company,Country,Language,Running time,Budget,Box office,Release date,imdb,metascore,rotten_tomatoes,Directed by,Produced by,Based on,Starring,Music by,Distributed by,Cinematography,Edited by,Screenplay by
0,0,Academy Award Review of,Walt Disney Productions,United States,English,41.0,,45.472,19/05/1937,7.2,,,,,,,,,,,
1,1,Snow White and the Seven Dwarfs,Walt Disney Productions,United States,English,83.0,1490000.0,418000000.0,21/12/1937,7.6,95.0,,"['David Hand (supervising)', 'William Cottrell...",Walt Disney,"['Snow White', 'by The', 'Brothers Grimm']","['Adriana Caselotti', 'Lucille La Verne', 'Har...","['Frank Churchill', 'Paul Smith', 'Leigh Harli...",RKO Radio Pictures,,,
2,2,Pinocchio,Walt Disney Productions,United States,English,88.0,2600000.0,164000000.0,07/02/1940,7.4,99.0,73%,"['Ben Sharpsteen', 'Hamilton Luske', 'Bill Rob...",Walt Disney,"['The Adventures of Pinocchio', 'by', 'Carlo C...","['Cliff Edwards', 'Dickie Jones', 'Christian R...","['Leigh Harline', 'Paul J. Smith']",RKO Radio Pictures,,,
3,3,Fantasia,Walt Disney Productions,United States,English,126.0,2280000.0,83300000.0,13/11/1940,7.7,96.0,95%,"['Samuel Armstrong', 'James Algar', 'Bill Robe...","['Walt Disney', 'Ben Sharpsteen']",,"['Leopold Stokowski', 'Deems Taylor']",See program,RKO Radio Pictures,James Wong Howe,,
4,4,The Reluctant Dragon,Walt Disney Productions,United States,English,74.0,600000.0,960000.0,20/06/1941,6.9,,68%,"['Alfred Werker', '(live action)', 'Hamilton L...",Walt Disney,,"['Robert Benchley', 'Frances Gifford', 'Buddy ...","['Frank Churchill', 'Larry Morey']",RKO Radio Pictures,Bert Giennon,Paul Weatherwax,


In [47]:
data.tail()
# Fungsi ini mengembalikan n baris terakhir dari objek berdasarkan posisi. Ini berguna untuk 
# memverifikasi data dengan cepat, misalnya, setelah menyortir atau menambahkan baris.

Unnamed: 0.1,Unnamed: 0,title,Production company,Country,Language,Running time,Budget,Box office,Release date,imdb,metascore,rotten_tomatoes,Directed by,Produced by,Based on,Starring,Music by,Distributed by,Cinematography,Edited by,Screenplay by
439,439,The Little Mermaid,"['Walt Disney Pictures', 'Lucamar Productions'...",United States,English,,,,,7.6,88.0,93%,Rob Marshall,"['Rob Marshall', 'John DeLuca', 'Marc Platt', ...","['Disney', ""'s"", 'The Little Mermaid', 'by', '...","['Halle Bailey', 'Jonah Hauer-King', 'Daveed D...","['Alan Menken (score and songs)', 'Howard Ashm...","['Walt Disney Studios', 'Motion Pictures']",Dion Beebe,Wyatt Smith,"['Jane Goldman', 'David Magee']"
440,440,Peter Pan & Wendy,"['Walt Disney Pictures', 'Whitaker Entertainme...",United States,English,,,,,,,,David Lowery,"['Jim Whitaker', 'Joe Roth']","[""Disney 's Peter Pan"", 'Peter and Wendy by J....","['Alexander Molony', 'Ever Anderson', 'Jude La...",,Walt Disney Studios Motion Pictures,Bojan Bazelli,,"['David Lowery', 'Toby Halbrooks']"
441,441,Home Alone,"['20th Century Studios', 'Hutch Parker Enterta...",United States,English,,,,,7.6,63.0,66%,Dan Mazer,"['Hutch Parker', 'Dan Wilson']","['Home Alone', 'by', 'John Hughes']","['Archie Yates', 'Rob Delaney', 'Ellie Kemper'...",John Debney,Disney+,Mitchell Amundsen,,"['Mikey Day', 'Streeter Seidell']"
442,442,Shrunk,"['Walt Disney Pictures', 'Mandeville Films']",United States,English,,,,,,,,Joe Johnston,"['David Hoberman', 'Todd Lieberman']","['Characters', 'by', 'Stuart Gordon', ',', 'Br...","['Josh Gad', 'Rick Moranis']",,"['Walt Disney Studios', 'Motion Pictures']",,,Todd Rosenberg
443,443,Night at the Museum,"['21 Laps Entertainment', 'Ingenious Film Part...",United States,English,306.0,387000000.0,1310000000.0,,6.4,48.0,43%,Shawn Levy,"['Shawn Levy', 'Chris Columbus', 'Michael Barn...","['The Night at the Museum', 'by', 'Milan Trenc']","['Ben Stiller', 'Robin Williams', 'Owen Wilson...",Alan Silvestri,"['20th Century Studios', 'Disney+']",,,


In [48]:
data.columns

Index(['Unnamed: 0', 'title', 'Production company', 'Country', 'Language',
       'Running time', 'Budget', 'Box office', 'Release date', 'imdb',
       'metascore', 'rotten_tomatoes', 'Directed by', 'Produced by',
       'Based on', 'Starring', 'Music by', 'Distributed by', 'Cinematography',
       'Edited by', 'Screenplay by'],
      dtype='object')

In [49]:
data.describe

<bound method NDFrame.describe of      Unnamed: 0  ...                       Screenplay by
0             0  ...                                 NaN
1             1  ...                                 NaN
2             2  ...                                 NaN
3             3  ...                                 NaN
4             4  ...                                 NaN
..          ...  ...                                 ...
439         439  ...     ['Jane Goldman', 'David Magee']
440         440  ...  ['David Lowery', 'Toby Halbrooks']
441         441  ...   ['Mikey Day', 'Streeter Seidell']
442         442  ...                      Todd Rosenberg
443         443  ...                                 NaN

[444 rows x 21 columns]>

In [50]:
data.dtypes

Unnamed: 0              int64
title                  object
Production company     object
Country                object
Language               object
Running time          float64
Budget                float64
Box office            float64
Release date           object
imdb                  float64
metascore             float64
rotten_tomatoes        object
Directed by            object
Produced by            object
Based on               object
Starring               object
Music by               object
Distributed by         object
Cinematography         object
Edited by              object
Screenplay by          object
dtype: object

**boleh dicoba untuk analisis data di atas yaaa....**

In [51]:
# MENGANALISIS DATA MULAI DARI SINI

data.describe()  # menampilkan statistik data

Unnamed: 0.1,Unnamed: 0,Running time,Budget,Box office,imdb,metascore
count,444.0,430.0,278.0,358.0,424.0,293.0
mean,221.5,98.076744,56385950.0,170241700.0,6.566274,61.860068
std,128.316016,21.418924,71114270.0,280354100.0,0.965122,16.756236
min,0.0,40.0,4.4,7.7,1.5,18.0
25%,110.75,86.25,6000000.0,10425000.0,6.1,49.0
50%,221.5,96.0,25000000.0,44700000.0,6.6,61.0
75%,332.25,107.0,85000000.0,186775000.0,7.2,74.0
max,443.0,306.0,410600000.0,1657000000.0,8.6,99.0


In [52]:
data.sort_values(by='Budget') # mengurutkan kolom Budget dari nilai terkecil ke terbesar

Unnamed: 0.1,Unnamed: 0,title,Production company,Country,Language,Running time,Budget,Box office,Release date,imdb,metascore,rotten_tomatoes,Directed by,Produced by,Based on,Starring,Music by,Distributed by,Cinematography,Edited by,Screenplay by
72,72,Mary Poppins,Walt Disney Productions,United States,English,139.0,4.4,103100000.0,27/08/1964,7.8,88.0,100%,Robert Stevenson,Walt Disney,"['Mary Poppins', 'by', 'P. L. Travers']","['Julie Andrews', 'Dick Van Dyke', 'David Toml...","['Richard M. Sherman', 'Robert B. Sherman']",Buena Vista Distribution,Edward Colman,Cotton Warburton,"['Bill Walsh', 'Don DaGradi']"
379,379,Monkey Kingdom,"['Disneynature', 'Silverback Films']",United States,English,82.0,5.0,17100000.0,17/04/2015,7.3,72.0,93%,"['Mark Linfield', 'Alastair Fothergill']","['Mark Linfield', 'Alastair Fothergill']",,,Harry Gregson-Williams,Walt Disney Studios Motion Pictures,"['Martyn Colbeck', 'Gavin Thurston']",Andy Netley,
397,397,Born in China,"['Disneynature', 'Shanghai Media Group', 'Chua...","['United States', 'China', 'France']","['English', 'Mandarin', 'French']",76.0,5.0,25100000.0,12/08/2016,7.2,57.0,85%,Lu Chuan,"['Roy Conli', 'Brian Leith', 'Phil Chapman']",,,Barnaby Taylor,"['Walt Disney Studios Motion Pictures', 'Shang...",,Matthew Meech,"['David Fowler', 'Brian Leith', 'Phil Chapman'..."
254,254,Spirited Away,Studio Ghibli,Japan,Japanese,125.0,15.0,,20/07/2001,8.6,96.0,97%,Hayao Miyazaki,Toshio Suzuki,,"['Rumi Hiiragi', 'Miyu Irino', 'Mari Natsuki',...",Joe Hisaishi,Toho,Atsushi Okui,Takeshi Seyama,
300,300,Bridge to Terabithia,,United States,English,95.0,20.0,138000000.0,16/02/2007,7.1,74.0,85%,Gábor Csupó,"['David L. Paterson', 'Lauren Levine', 'Hal Li...","['Bridge to Terabithia', 'by', 'Katherine Pate...","['Josh Hutcherson', 'AnnaSophia Robb', 'Bailee...",Aaron Zigman,"['Buena Vista Pictures Distribution', '(United...",Michael Chapman,John Gilbert,"['David L. Paterson', 'Jeff Stockwell']"
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
438,438,Encanto,"['Walt Disney Pictures', 'Walt Disney Animatio...",United States,English,,,,24/11/2021,,,,"['Byron Howard', 'Jared Bush']","['Clark Spencer', 'Yvett Merino Flores']",,,Lin-Manuel Miranda,"['Walt Disney Studios', 'Motion Pictures']",,,
439,439,The Little Mermaid,"['Walt Disney Pictures', 'Lucamar Productions'...",United States,English,,,,,7.6,88.0,93%,Rob Marshall,"['Rob Marshall', 'John DeLuca', 'Marc Platt', ...","['Disney', ""'s"", 'The Little Mermaid', 'by', '...","['Halle Bailey', 'Jonah Hauer-King', 'Daveed D...","['Alan Menken (score and songs)', 'Howard Ashm...","['Walt Disney Studios', 'Motion Pictures']",Dion Beebe,Wyatt Smith,"['Jane Goldman', 'David Magee']"
440,440,Peter Pan & Wendy,"['Walt Disney Pictures', 'Whitaker Entertainme...",United States,English,,,,,,,,David Lowery,"['Jim Whitaker', 'Joe Roth']","[""Disney 's Peter Pan"", 'Peter and Wendy by J....","['Alexander Molony', 'Ever Anderson', 'Jude La...",,Walt Disney Studios Motion Pictures,Bojan Bazelli,,"['David Lowery', 'Toby Halbrooks']"
441,441,Home Alone,"['20th Century Studios', 'Hutch Parker Enterta...",United States,English,,,,,7.6,63.0,66%,Dan Mazer,"['Hutch Parker', 'Dan Wilson']","['Home Alone', 'by', 'John Hughes']","['Archie Yates', 'Rob Delaney', 'Ellie Kemper'...",John Debney,Disney+,Mitchell Amundsen,,"['Mikey Day', 'Streeter Seidell']"


In [54]:
data.info() # untuk mengetahui info 

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 444 entries, 0 to 443
Data columns (total 21 columns):
 #   Column              Non-Null Count  Dtype  
---  ------              --------------  -----  
 0   Unnamed: 0          444 non-null    int64  
 1   title               444 non-null    object 
 2   Production company  399 non-null    object 
 3   Country             441 non-null    object 
 4   Language            443 non-null    object 
 5   Running time        430 non-null    float64
 6   Budget              278 non-null    float64
 7   Box office          358 non-null    float64
 8   Release date        435 non-null    object 
 9   imdb                424 non-null    float64
 10  metascore           293 non-null    float64
 11  rotten_tomatoes     391 non-null    object 
 12  Directed by         443 non-null    object 
 13  Produced by         435 non-null    object 
 14  Based on            221 non-null    object 
 15  Starring            409 non-null    object 
 16  Music by

In [53]:
data.count() # hanya menghitung jumlah elemen selain NA / None

Unnamed: 0            444
title                 444
Production company    399
Country               441
Language              443
Running time          430
Budget                278
Box office            358
Release date          435
imdb                  424
metascore             293
rotten_tomatoes       391
Directed by           443
Produced by           435
Based on              221
Starring              409
Music by              433
Distributed by        441
Cinematography        352
Edited by             404
Screenplay by         204
dtype: int64

##ThankYou