# Package Pandas  

Digunakan untuk pengolahan data yang berkaitan dengan data frame. 

In [3]:
# Lakukan import pandas sebagai pd
import pandas as pd

In [4]:
# Lakukan import numpy sebagai np
import numpy as np

## 1. Membuat dataframe

Untuk membuat data frame, digunakan sintaks berikut: `pandas.DataFrame( data, index, columns, dtype, copy)`  
1. index merupakan label untuk baris   
2. columns merupakan label untuk kolom
3. dtype merupakan tipe data yang dipaksakan untuk seluruh data (hanya satu tipe data yang dapat diberikan)
4. copy digunakan untuk menyalin data, defaultnya False

In [5]:
# Build a range of 9 consecutive month-end dates, starting from September 2020.
# An explicit MonthEnd offset object is passed instead of the "M" string alias:
# newer pandas releases deprecate that alias (renamed "ME"), while older
# releases do not know "ME". The offset object is accepted by both.
tanggal = pd.date_range("20200901", freq=pd.offsets.MonthEnd(), periods=9)
print(tanggal)

DatetimeIndex(['2020-09-30', '2020-10-31', '2020-11-30', '2020-12-31',
               '2021-01-31', '2021-02-28', '2021-03-31', '2021-04-30',
               '2021-05-31'],
              dtype='datetime64[ns]', freq='M')


In [6]:
# Build a 9x4 DataFrame of random values drawn from the standard normal
# distribution, using the dates in `tanggal` as row labels and A, B, C, D as
# column labels.
# The global NumPy generator is seeded first so that re-running the notebook
# produces the same numbers every time.
np.random.seed(42)
contoh1 = pd.DataFrame(np.random.randn(9, 4), index=tanggal, columns=["A", "B", "C", "D"])
contoh1

Unnamed: 0,A,B,C,D
2020-09-30,1.807234,-0.546344,-0.393466,-0.353618
2020-10-31,-0.899886,-0.892469,0.614704,0.280939
2020-11-30,1.750727,0.016294,1.136336,0.70357
2020-12-31,2.480358,0.908032,-0.76774,-1.299337
2021-01-31,-1.225295,0.117517,-0.489437,0.488737
2021-02-28,-0.930417,-0.995462,-0.74258,-0.211376
2021-03-31,-0.090109,0.330262,1.023413,0.787451
2021-04-30,2.088013,-0.772923,1.308658,0.619509
2021-05-31,0.294834,1.541281,0.73346,0.886389


In [7]:
# Build a DataFrame from a dict that maps column names to their contents.
# The scalar entries ("A", "B") are repeated for every row, while the
# array-like entries ("C", "D", "E") supply one value per row.
contoh2 = pd.DataFrame(
    data={
        "A": 1.0,
        "B": pd.Timestamp("20180925"),
        "C": np.full(4, 3, dtype="int32"),
        "D": pd.Categorical(["test", "train", "test", "train"]),
        "E": np.array([1, 12, 32, 14]),
    },
    index=["satu", "dua", "tiga", "empat"],
)
contoh2

Unnamed: 0,A,B,C,D,E
satu,1.0,2018-09-25,3,test,1
dua,1.0,2018-09-25,3,train,12
tiga,1.0,2018-09-25,3,test,32
empat,1.0,2018-09-25,3,train,14


## 2. Menambah, menghapus, dan menyeleksi kolom data frame

Menghapus kolom dengan fungsi:  
1. `del(data_frame["kolom"])` 
2. `.pop("kolom")`
3. `.drop("kolom", axis=1)`; axis=1 berarti menghapus sepanjang kolom yang dimaksud

Menambahkan kolom baru dengan operasi matematis "+"

In [8]:
# Add a new column "F" holding the element-wise sum of columns "C" and "E".
contoh2["F"] = contoh2["C"].add(contoh2["E"])
print(contoh2)

         A          B  C      D   E   F
satu   1.0 2018-09-25  3   test   1   4
dua    1.0 2018-09-25  3  train  12  15
tiga   1.0 2018-09-25  3   test  32  35
empat  1.0 2018-09-25  3  train  14  17


In [10]:
# Add a new column "G" from a Series that is labelled only with "satu",
# "tiga" and "empat". Values are matched to rows by index label, so the row
# "dua", which has no entry in the Series, ends up as NaN.
contoh2["G"] = pd.Series({"satu": 10, "tiga": 20, "empat": 30})
print(contoh2)

         A          B  C      D   E   F     G
satu   1.0 2018-09-25  3   test   1   4  10.0
dua    1.0 2018-09-25  3  train  12  15   NaN
tiga   1.0 2018-09-25  3   test  32  35  20.0
empat  1.0 2018-09-25  3  train  14  17  30.0


In [11]:
# Remove column "B" in place with the `del` statement.
# NOTE: this mutates contoh2, so the cell fails with a KeyError if it is run twice.
del contoh2["B"]
contoh2

Unnamed: 0,A,C,D,E,F,G
satu,1.0,3,test,1,4,10.0
dua,1.0,3,train,12,15,
tiga,1.0,3,test,32,35,20.0
empat,1.0,3,train,14,17,30.0


In [12]:
# Remove column "C" in place with pop(); the value returned by pop() is not kept here.
# NOTE: this mutates contoh2, so the cell fails with a KeyError if it is run twice.
contoh2.pop("C")
contoh2

Unnamed: 0,A,D,E,F,G
satu,1.0,test,1,4,10.0
dua,1.0,train,12,15,
tiga,1.0,test,32,35,20.0
empat,1.0,train,14,17,30.0


In [13]:
# Select column "A" (all rows) and keep it in `kolomA`; the result is a Series.
kolomA = contoh2.loc[:, "A"]
kolomA

satu     1.0
dua      1.0
tiga     1.0
empat    1.0
Name: A, dtype: float64

In [14]:
# Remove column "A" with drop(). The result is stored in a new variable
# (`contoh2_hapus`), so contoh2 itself still contains column "A" afterwards.
contoh2_hapus = contoh2.drop(labels="A", axis="columns")
contoh2_hapus.head()

Unnamed: 0,D,E,F,G
satu,test,1,4,10.0
dua,train,12,15,
tiga,test,32,35,20.0
empat,train,14,17,30.0


## 3. Menambah, mengurang, dan menyeleksi baris pada data frame

Menyeleksi/mengiris data frame dengan fungsi:
1. `loc`: untuk seleksi dengan menggunakan label indeks (nama baris/kolom)
2. `iloc`: untuk seleksi dengan menggunakan bilangan bulat

Menambah baris dengan fungsi: `.append()` (sudah dihapus sejak pandas 2.0; pada versi baru gunakan `pd.concat()`)

Menghapus baris dengan fungsi: `.drop("index", axis=0)`, axis=0 berarti menghapus sepanjang baris.

In [15]:
# Add rows to contoh2 by concatenating a second DataFrame below it.
# DataFrame.append() was removed in pandas 2.0; pd.concat() is the supported
# replacement and is also available in older pandas versions.
contoh3 = pd.DataFrame(
    [[1, "train", 4, 5, 6.0], [2, "test", 7, 12, 34]],
    columns=["A", "D", "E", "F", "G"],
)

# contoh3 keeps its default integer index (0, 1), so those labels appear
# after the labels of contoh2 in the combined frame.
contoh4 = pd.concat([contoh2, contoh3])
contoh4

Unnamed: 0,A,D,E,F,G
satu,1.0,test,1,4,10.0
dua,1.0,train,12,15,
tiga,1.0,test,32,35,20.0
empat,1.0,train,14,17,30.0
0,1.0,train,4,5,6.0
1,2.0,test,7,12,34.0


In [16]:
# Select the row whose index label is "tiga" (label-based selection with .loc).
contoh4.loc["tiga"]

A       1
D    test
E      32
F      35
G      20
Name: tiga, dtype: object

In [17]:
# Select the 2nd and 3rd rows by position (zero-based positions 1 and 2),
# then copy the selection into its own DataFrame.
contoh5 = contoh4.iloc[[1, 2]].copy()
contoh5

Unnamed: 0,A,D,E,F,G
dua,1.0,train,12,15,
tiga,1.0,test,32,35,20.0


In [18]:
# Remove the row labelled "tiga" and store the result as `contoh5_hapus`.
contoh5_hapus = contoh5.drop(labels=["tiga"], axis="index")
contoh5_hapus

Unnamed: 0,A,D,E,F,G
dua,1.0,train,12,15,


## 4. Menyeleksi/mengiris data frame berdasar baris dan kolom



In [19]:
# Display the current state of contoh2 before slicing it by rows and columns.
contoh2

Unnamed: 0,A,D,E,F,G
satu,1.0,test,1,4,10.0
dua,1.0,train,12,15,
tiga,1.0,test,32,35,20.0
empat,1.0,train,14,17,30.0


In [20]:
# Slice by position on both axes: rows at positions 1-2 and columns at
# positions 2-4 (the end of each slice is exclusive).
contoh2.iloc[1:3, 2:5]

Unnamed: 0,E,F,G
dua,12,15,
tiga,32,35,20.0


In [21]:
# Print a summary of the DataFrame: index, columns, non-null counts, dtypes and memory usage.
contoh2.info()

<class 'pandas.core.frame.DataFrame'>
Index: 4 entries, satu to empat
Data columns (total 5 columns):
A    4 non-null float64
D    4 non-null category
E    4 non-null int32
F    4 non-null int32
G    3 non-null float64
dtypes: category(1), float64(2), int32(2)
memory usage: 388.0+ bytes


### Fungsi dasar untuk series  


Berikut fungsi dasar untuk series (deret)  

No   | Fungsi   | Deskripsi
:---:|:---      |:---   
1    | axes     | Daftar label baris dan kolom |
2    | dtypes   | Daftar tipe data setiap kolom |
3    | empty    | Akan bernilai True jika deret kosong (tidak memiliki elemen sama sekali) |
4    | size     | Ukuran dari data |
5    | values   | Mengubah deret menjadi ndarray (n dimensional array) |
6    | head()   | Menampilkan n data pertama |
7    | tail()   | Menampilkan n data terakhir |

In [22]:
# Exercise: try axes, dtypes, empty, size, head and tail on contoh2

## 5. Mengimport atau membaca file (csv, xls)

In [24]:
# Read the .xls file into a DataFrame. The path is relative, so the file is
# expected to sit in the same folder as this notebook.
# NOTE(review): reading the legacy .xls format presumably needs the optional
# xlrd package to be installed — confirm for the target environment.
superstore = pd.read_excel("Superstore.xls")
superstore.head()

Unnamed: 0,Row ID,Order ID,Order Date,Ship Date,Ship Mode,Customer ID,Customer Name,Segment,Kota,State,Country,Region,Product ID,Category,Sub-Category,Product Name,Sales,Quantity,Discount,Profit
0,18,ID-2014-44908,2014-02-26,2014-03-04,Standard Class,AI-10855,Arianne Irving,Consumer,Bandung,Jawa Barat,Indonesia,Southeast Asia,OFF-SU-10004848,Office Supplies,Supplies,"Kleencut Shears, High Speed",123.9405,5,0.47,-84.2595
1,19,ID-2014-44908,2014-02-26,2014-03-04,Standard Class,AI-10855,Arianne Irving,Consumer,Bandung,Jawa Barat,Indonesia,Southeast Asia,OFF-PA-10003332,Office Supplies,Paper,"Xerox Cards & Envelopes, Recycled",47.5728,2,0.47,-15.3072
2,20,ID-2012-73146,2012-10-24,2012-10-30,Standard Class,HM-14980,Henry MacAllister,Consumer,Denpasar,Bali,Indonesia,Southeast Asia,OFF-AP-10000487,Office Supplies,Appliances,"Hoover Stove, Silver",1417.3578,3,0.17,-290.3022
3,21,ID-2012-73146,2012-10-24,2012-10-30,Standard Class,HM-14980,Henry MacAllister,Consumer,Denpasar,Bali,Indonesia,Southeast Asia,OFF-LA-10000095,Office Supplies,Labels,"Avery Round Labels, Laser Printer Compatible",22.7052,6,0.47,-4.2948
4,24,ID-2012-57809,2012-10-09,2012-10-13,Standard Class,AO-10810,Anthony O'Donnell,Corporate,Pekanbaru,Riau,Indonesia,Southeast Asia,FUR-TA-10000665,Furniture,Tables,"Bevis Computer Table, Fully Assembled",786.2868,3,0.47,-563.8032


In [25]:
# Use the basic attributes to inspect the table, starting with `empty`,
# which is True only when the DataFrame has no elements at all.
superstore.empty

False

In [26]:
# Data type of every column.
superstore.dtypes

Row ID                    int64
Order ID                 object
Order Date       datetime64[ns]
Ship Date        datetime64[ns]
Ship Mode                object
Customer ID              object
Customer Name            object
Segment                  object
Kota                     object
State                    object
Country                  object
Region                   object
Product ID               object
Category                 object
Sub-Category             object
Product Name             object
Sales                   float64
Quantity                  int64
Discount                float64
Profit                  float64
dtype: object

In [27]:
# Dimensions of the DataFrame as a (rows, columns) tuple.
superstore.shape

(1388, 20)

In [28]:
# Total number of elements in the DataFrame (rows x columns).
superstore.size

27760

In [29]:
# What kind of object is superstore? Check with the built-in type().
type(superstore)

pandas.core.frame.DataFrame

In [30]:
# Use .info() for an overview of superstore: index range, columns,
# non-null counts, dtypes and memory usage.
superstore.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1388 entries, 0 to 1387
Data columns (total 20 columns):
Row ID           1388 non-null int64
Order ID         1388 non-null object
Order Date       1388 non-null datetime64[ns]
Ship Date        1388 non-null datetime64[ns]
Ship Mode        1388 non-null object
Customer ID      1388 non-null object
Customer Name    1388 non-null object
Segment          1388 non-null object
Kota             1388 non-null object
State            1388 non-null object
Country          1388 non-null object
Region           1388 non-null object
Product ID       1388 non-null object
Category         1388 non-null object
Sub-Category     1388 non-null object
Product Name     1388 non-null object
Sales            1388 non-null float64
Quantity         1388 non-null int64
Discount         1388 non-null float64
Profit           1388 non-null float64
dtypes: datetime64[ns](2), float64(3), int64(2), object(13)
memory usage: 217.0+ KB


In [31]:
# Select the "Product Name" column, keep it in `produk`, and show its first 10 values.
produk = superstore.loc[:, "Product Name"]
produk.head(n=10)

0                     Kleencut Shears, High Speed
1               Xerox Cards & Envelopes, Recycled
2                            Hoover Stove, Silver
3    Avery Round Labels, Laser Printer Compatible
4           Bevis Computer Table, Fully Assembled
5                     Sanford Canvas, Fluorescent
6     Binney & Smith Pencil Sharpener, Easy-Erase
7                Novimex Swivel Stool, Adjustable
8                   Panasonic Calculator, Durable
9                         Stockwell Clamps, Metal
Name: Product Name, dtype: object

In [32]:
# Convert the Series to a NumPy array with .values.
produk.values

array(['Kleencut Shears, High Speed', 'Xerox Cards & Envelopes, Recycled',
       'Hoover Stove, Silver', ..., 'Hon Chairmat, Set of Two',
       'Rubbermaid Light Bulb, Black', 'Enermax Keyboard, Programmable'],
      dtype=object)

In [35]:
# Take every 5th row by position (0, 5, 10, ...) with all columns, then show the first 10 of them.
superstore.iloc[::5, :].head(10)

Unnamed: 0,Row ID,Order ID,Order Date,Ship Date,Ship Mode,Customer ID,Customer Name,Segment,Kota,State,Country,Region,Product ID,Category,Sub-Category,Product Name,Sales,Quantity,Discount,Profit
0,18,ID-2014-44908,2014-02-26,2014-03-04,Standard Class,AI-10855,Arianne Irving,Consumer,Bandung,Jawa Barat,Indonesia,Southeast Asia,OFF-SU-10004848,Office Supplies,Supplies,"Kleencut Shears, High Speed",123.9405,5,0.47,-84.2595
5,25,ID-2012-57809,2012-10-09,2012-10-13,Standard Class,AO-10810,Anthony O'Donnell,Corporate,Pekanbaru,Riau,Indonesia,Southeast Asia,OFF-AR-10001232,Office Supplies,Art,"Sanford Canvas, Fluorescent",75.5988,2,0.27,4.1388
10,98,ID-2011-74721,2011-05-04,2011-05-05,First Class,HG-14845,Harry Greene,Consumer,Yogyakarta,Yogyakarta,Indonesia,Southeast Asia,OFF-AP-10002017,Office Supplies,Appliances,"Cuisinart Blender, Red",55.6017,1,0.17,0.6417
15,115,ID-2011-36011,2011-01-26,2011-01-27,First Class,HK-14890,Heather Kirkland,Corporate,Depok,Jawa Barat,Indonesia,Southeast Asia,FUR-CH-10003950,Furniture,Chairs,"Novimex Executive Leather Armchair, Black",334.3035,1,0.27,-109.9365
20,158,IN-2014-17489,2014-12-22,2014-12-26,Standard Class,DF-13135,David Flashing,Consumer,Jember,Jawa Timur,Indonesia,Southeast Asia,OFF-AR-10000539,Office Supplies,Art,"Boston Markers, Easy-Erase",58.3416,3,0.27,-15.9984
25,199,IN-2014-76450,2014-11-17,2014-11-21,Standard Class,PJ-19015,Pauline Johnson,Consumer,Pontianak,Kalimantan Barat,Indonesia,Southeast Asia,OFF-BI-10004666,Office Supplies,Binders,"Wilson Jones Binding Machine, Durable",125.6454,3,0.17,42.3054
30,229,ID-2014-61169,2014-12-12,2014-12-16,Standard Class,EB-13930,Eric Barreto,Consumer,Jakarta,Jakarta,Indonesia,Southeast Asia,OFF-EN-10002700,Office Supplies,Envelopes,"Kraft Interoffice Envelope, with clear poly wi...",80.2314,3,0.47,-18.2286
35,298,ID-2013-22025,2013-10-09,2013-10-13,Standard Class,TS-21655,Trudy Schmidt,Consumer,Bandung,Jawa Barat,Indonesia,Southeast Asia,TEC-CO-10000821,Technology,Copiers,"Canon Ink, High-Speed",675.8775,5,0.07,-43.6725
40,307,ID-2013-70122,2013-06-11,2013-06-15,Standard Class,AD-10180,Alan Dominguez,Home Office,Jakarta,Jakarta,Indonesia,Southeast Asia,FUR-CH-10002061,Furniture,Chairs,"Harbour Creations Executive Leather Armchair, Red",3126.4002,9,0.27,-128.7198
45,326,IN-2014-54211,2014-01-16,2014-01-20,Standard Class,KB-16315,Karl Braun,Consumer,Bekasi,Jawa Barat,Indonesia,Southeast Asia,OFF-BI-10004869,Office Supplies,Binders,"Avery 3-Hole Punch, Recycled",93.7236,4,0.17,34.9236


In [33]:
# Take every 3rd row by position (0, 3, 6, ...) with all columns, then show the first 10 of them.
superstore.iloc[::3,:].head(10)

Unnamed: 0,Row ID,Order ID,Order Date,Ship Date,Ship Mode,Customer ID,Customer Name,Segment,Kota,State,Country,Region,Product ID,Category,Sub-Category,Product Name,Sales,Quantity,Discount,Profit
0,18,ID-2014-44908,2014-02-26,2014-03-04,Standard Class,AI-10855,Arianne Irving,Consumer,Bandung,Jawa Barat,Indonesia,Southeast Asia,OFF-SU-10004848,Office Supplies,Supplies,"Kleencut Shears, High Speed",123.9405,5,0.47,-84.2595
3,21,ID-2012-73146,2012-10-24,2012-10-30,Standard Class,HM-14980,Henry MacAllister,Consumer,Denpasar,Bali,Indonesia,Southeast Asia,OFF-LA-10000095,Office Supplies,Labels,"Avery Round Labels, Laser Printer Compatible",22.7052,6,0.47,-4.2948
6,26,IN-2013-76464,2013-06-12,2013-06-14,First Class,DK-13090,Dave Kipp,Consumer,Semarang,Jawa Tengah,Indonesia,Southeast Asia,OFF-AR-10000027,Office Supplies,Art,"Binney & Smith Pencil Sharpener, Easy-Erase",61.1667,3,0.27,10.0467
9,97,ID-2011-74721,2011-05-04,2011-05-05,First Class,HG-14845,Harry Greene,Consumer,Yogyakarta,Yogyakarta,Indonesia,Southeast Asia,OFF-FA-10001010,Office Supplies,Fasteners,"Stockwell Clamps, Metal",82.044,8,0.47,-32.676
12,110,ID-2012-10230,2012-07-06,2012-07-09,First Class,JC-16105,Julie Creighton,Corporate,Jakarta,Jakarta,Indonesia,Southeast Asia,OFF-LA-10004062,Office Supplies,Labels,"Hon Removable Labels, 5000 Label Set",16.3134,3,0.47,-0.3366
15,115,ID-2011-36011,2011-01-26,2011-01-27,First Class,HK-14890,Heather Kirkland,Corporate,Depok,Jawa Barat,Indonesia,Southeast Asia,FUR-CH-10003950,Furniture,Chairs,"Novimex Executive Leather Armchair, Black",334.3035,1,0.27,-109.9365
18,131,ID-2012-60427,2012-07-14,2012-07-20,Standard Class,RB-19795,Ross Baird,Home Office,Palembang,Sumatera Selatan,Indonesia,Southeast Asia,TEC-AC-10001022,Technology,Accessories,"SanDisk Flash Drive, USB",105.3375,5,0.47,-53.6625
21,178,ID-2013-52370,2013-05-29,2013-06-02,Standard Class,JR-15670,Jim Radford,Consumer,Jakarta,Jakarta,Indonesia,Southeast Asia,OFF-BI-10002881,Office Supplies,Binders,"Wilson Jones Binding Machine, Economy",40.6368,1,0.17,-7.3632
24,192,IN-2012-21297,2012-09-21,2012-09-28,Standard Class,ES-14080,Erin Smith,Corporate,Surakarta,Jawa Tengah,Indonesia,Southeast Asia,OFF-ST-10000485,Office Supplies,Storage,"Fellowes Folders, Single Width",87.7476,4,0.17,6.2676
27,211,IN-2013-29676,2013-01-17,2013-01-22,Standard Class,SS-20515,Shirley Schmidt,Home Office,Jayapura,Papua,Indonesia,Southeast Asia,FUR-CH-10003232,Furniture,Chairs,"Harbour Creations Executive Leather Armchair, ...",1375.8456,4,0.27,94.1256


In [34]:
# Keep only the rows whose "Kota" value is "Semarang", then show the first 5 of them.
semarang = superstore.loc[superstore["Kota"] == "Semarang"]
semarang.head(n=5)

Unnamed: 0,Row ID,Order ID,Order Date,Ship Date,Ship Mode,Customer ID,Customer Name,Segment,Kota,State,Country,Region,Product ID,Category,Sub-Category,Product Name,Sales,Quantity,Discount,Profit
6,26,IN-2013-76464,2013-06-12,2013-06-14,First Class,DK-13090,Dave Kipp,Consumer,Semarang,Jawa Tengah,Indonesia,Southeast Asia,OFF-AR-10000027,Office Supplies,Art,"Binney & Smith Pencil Sharpener, Easy-Erase",61.1667,3,0.27,10.0467
7,27,IN-2013-76464,2013-06-12,2013-06-14,First Class,DK-13090,Dave Kipp,Consumer,Semarang,Jawa Tengah,Indonesia,Southeast Asia,FUR-CH-10003009,Furniture,Chairs,"Novimex Swivel Stool, Adjustable",243.747,2,0.27,-6.693
16,126,IN-2012-53175,2012-06-18,2012-06-23,Standard Class,BO-11350,Bill Overfelt,Corporate,Semarang,Jawa Tengah,Indonesia,Southeast Asia,TEC-PH-10004509,Technology,Phones,"Nokia Audio Dock, Cordless",140.7597,1,0.17,25.4097
17,127,IN-2012-53175,2012-06-18,2012-06-23,Standard Class,BO-11350,Bill Overfelt,Corporate,Semarang,Jawa Tengah,Indonesia,Southeast Asia,OFF-FA-10002597,Office Supplies,Fasteners,"OIC Clamps, 12 Pack",142.464,14,0.47,-121.296
86,865,IN-2011-74070,2011-06-23,2011-06-25,First Class,CA-12265,Christina Anderson,Consumer,Semarang,Jawa Tengah,Indonesia,Southeast Asia,TEC-PH-10002916,Technology,Phones,"Apple Speaker Phone, with Caller ID",102.339,1,0.17,30.819


## 6. Menambahkan kolom baru pada data frame

In [36]:
# Add a "Garansi" column and fill every row with the string "Tidak bergaransi".
# NOTE: this adds the column to superstore in place; later cells that display
# superstore include it.
superstore["Garansi"] = "Tidak bergaransi"
superstore.head(3)

Unnamed: 0,Row ID,Order ID,Order Date,Ship Date,Ship Mode,Customer ID,Customer Name,Segment,Kota,State,...,Region,Product ID,Category,Sub-Category,Product Name,Sales,Quantity,Discount,Profit,Garansi
0,18,ID-2014-44908,2014-02-26,2014-03-04,Standard Class,AI-10855,Arianne Irving,Consumer,Bandung,Jawa Barat,...,Southeast Asia,OFF-SU-10004848,Office Supplies,Supplies,"Kleencut Shears, High Speed",123.9405,5,0.47,-84.2595,Tidak bergaransi
1,19,ID-2014-44908,2014-02-26,2014-03-04,Standard Class,AI-10855,Arianne Irving,Consumer,Bandung,Jawa Barat,...,Southeast Asia,OFF-PA-10003332,Office Supplies,Paper,"Xerox Cards & Envelopes, Recycled",47.5728,2,0.47,-15.3072,Tidak bergaransi
2,20,ID-2012-73146,2012-10-24,2012-10-30,Standard Class,HM-14980,Henry MacAllister,Consumer,Denpasar,Bali,...,Southeast Asia,OFF-AP-10000487,Office Supplies,Appliances,"Hoover Stove, Silver",1417.3578,3,0.17,-290.3022,Tidak bergaransi


In [37]:
# Select the Customer ID, Kota, Sub-Category and Profit columns (all rows)
# and store them in `superstore2`.
superstore2 = superstore.loc[:, ["Customer ID", "Kota", "Sub-Category", "Profit"]]
superstore2.head(n=5)

Unnamed: 0,Customer ID,Kota,Sub-Category,Profit
0,AI-10855,Bandung,Supplies,-84.2595
1,AI-10855,Bandung,Paper,-15.3072
2,HM-14980,Denpasar,Appliances,-290.3022
3,HM-14980,Denpasar,Labels,-4.2948
4,AO-10810,Pekanbaru,Tables,-563.8032


In [38]:
# Filter superstore2 down to the rows where Kota is "Semarang" AND Profit is
# greater than 20; store the result in `superstore2_filter`.
superstore2_filter = superstore2.loc[
    superstore2["Kota"].eq("Semarang") & superstore2["Profit"].gt(20)
]
superstore2_filter.head()

Unnamed: 0,Customer ID,Kota,Sub-Category,Profit
16,BO-11350,Semarang,Phones,25.4097
86,CA-12265,Semarang,Phones,30.819
99,CY-12745,Semarang,Chairs,28.4106
184,DP-13165,Semarang,Appliances,232.0011
230,MY-17380,Semarang,Appliances,70.7259


In [1]:
# How many rows satisfy the filter? count() reports the number of non-null
# values in each column of the filtered frame.
# NOTE(review): the recorded output is a NameError from an execution numbered
# In [1], i.e. the cell was last run on a fresh kernel before
# superstore2_filter was defined. Run the cells above first.
superstore2_filter.count()

NameError: name 'superstore2_filter' is not defined

In [49]:
superstore_ = superstore[(superstore.State == "Jawa Timur")| (superstore.Sales > 2000)]
superstore_
                         

Unnamed: 0,Row ID,Order ID,Order Date,Ship Date,Ship Mode,Customer ID,Customer Name,Segment,Kota,State,...,Region,Product ID,Category,Sub-Category,Product Name,Sales,Quantity,Discount,Profit,Garansi
19,157,IN-2014-17489,2014-12-22,2014-12-26,Standard Class,DF-13135,David Flashing,Consumer,Jember,Jawa Timur,...,Southeast Asia,OFF-BI-10004651,Office Supplies,Binders,"Cardinal Binding Machine, Clear",163.4436,4,0.17,57.0036,Tidak bergaransi
20,158,IN-2014-17489,2014-12-22,2014-12-26,Standard Class,DF-13135,David Flashing,Consumer,Jember,Jawa Timur,...,Southeast Asia,OFF-AR-10000539,Office Supplies,Art,"Boston Markers, Easy-Erase",58.3416,3,0.27,-15.9984,Tidak bergaransi
32,267,ID-2013-49143,2013-03-29,2013-04-02,Standard Class,RO-19780,Rose O'Brian,Consumer,Probolinggo,Jawa Timur,...,Southeast Asia,FUR-FU-10000735,Furniture,Furnishings,"Tenex Frame, Erganomic",158.5560,2,0.27,-26.0640,Tidak bergaransi
33,277,ID-2014-13135,2014-06-19,2014-06-25,Standard Class,JL-15235,Janet Lee,Consumer,Surabaya,Jawa Timur,...,Southeast Asia,OFF-LA-10001548,Office Supplies,Labels,"Avery Shipping Labels, Adjustable",20.6700,4,0.47,-8.9700,Tidak bergaransi
36,303,ID-2013-70122,2013-06-11,2013-06-15,Standard Class,AD-10180,Alan Dominguez,Home Office,Jakarta,Jakarta,...,Southeast Asia,FUR-TA-10001386,Furniture,Tables,"Lesro Conference Table, Fully Assembled",2276.4825,5,0.47,-472.5675,Tidak bergaransi
40,307,ID-2013-70122,2013-06-11,2013-06-15,Standard Class,AD-10180,Alan Dominguez,Home Office,Jakarta,Jakarta,...,Southeast Asia,FUR-CH-10002061,Furniture,Chairs,"Harbour Creations Executive Leather Armchair, Red",3126.4002,9,0.27,-128.7198,Tidak bergaransi
56,514,ID-2014-60854,2014-10-16,2014-10-22,Standard Class,AF-10885,Art Foster,Consumer,Surabaya,Jawa Timur,...,Southeast Asia,FUR-CH-10001203,Furniture,Chairs,"Novimex Steel Folding Chair, Set of Two",555.0336,9,0.27,-175.0464,Tidak bergaransi
57,563,IN-2014-66027,2014-12-15,2014-12-19,Standard Class,SV-20935,Susan Vittorini,Consumer,Surabaya,Jawa Timur,...,Southeast Asia,FUR-BO-10002387,Furniture,Bookcases,"Safco Library with Doors, Metal",2534.0175,7,0.07,136.2375,Tidak bergaransi
58,564,IN-2014-66027,2014-12-15,2014-12-19,Standard Class,SV-20935,Susan Vittorini,Consumer,Surabaya,Jawa Timur,...,Southeast Asia,OFF-AR-10002400,Office Supplies,Art,"Boston Highlighters, Water Color",32.1930,2,0.27,-8.4270,Tidak bergaransi
60,578,IN-2013-34170,2013-12-18,2013-12-25,Standard Class,FH-14275,Frank Hawley,Corporate,Palu,Sulawesi Tengah,...,Southeast Asia,FUR-BO-10002990,Furniture,Bookcases,"Dania Library with Doors, Traditional",3707.3520,11,0.07,1554.4320,Tidak bergaransi
