# Pandas 
Pandas is a popular open-source data analysis and manipulation library in Python. It provides data structures and functions needed to work efficiently with structured data, such as tables or time series.

Key Features of Pandas:
Data Structures

Series: A one-dimensional labeled array (like a column in Excel).

DataFrame: A two-dimensional table with labeled axes (like an Excel spreadsheet).

Data Manipulation:

Filtering, sorting, and transforming data.
Handling missing values.
Merging and joining datasets.

Reading & Writing Data:

Supports various formats like CSV, Excel, JSON, SQL, and more.

Statistical Analysis:

Supports descriptive statistics, group-by operations, and pivot tables.
Integration

Works well with NumPy, Matplotlib, and other data science libraries.

In [1]:
import numpy as np
import pandas as pd 

In [2]:
train=pd.read_csv('data/titanicdata.csv')
df=train.copy()

In [3]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked
0,1,0,3,"Braund, Mr. Owen Harris",male,22.0,1,0,A/5 21171,7.25,,S
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",female,38.0,1,0,PC 17599,71.2833,C85,C
2,3,1,3,"Heikkinen, Miss. Laina",female,26.0,0,0,STON/O2. 3101282,7.925,,S
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",female,35.0,1,0,113803,53.1,C123,S
4,5,0,3,"Allen, Mr. William Henry",male,35.0,0,0,373450,8.05,,S


In [4]:
df.tail()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked
886,887,0,2,"Montvila, Rev. Juozas",male,27.0,0,0,211536,13.0,,S
887,888,1,1,"Graham, Miss. Margaret Edith",female,19.0,0,0,112053,30.0,B42,S
888,889,0,3,"Johnston, Miss. Catherine Helen ""Carrie""",female,,1,2,W./C. 6607,23.45,,S
889,890,1,1,"Behr, Mr. Karl Howell",male,26.0,0,0,111369,30.0,C148,C
890,891,0,3,"Dooley, Mr. Patrick",male,32.0,0,0,370376,7.75,,Q


In [5]:
df.shape

(891, 12)

In [6]:
df.columns

Index(['PassengerId', 'Survived', 'Pclass', 'Name', 'Sex', 'Age', 'SibSp',
       'Parch', 'Ticket', 'Fare', 'Cabin', 'Embarked'],
      dtype='object')

In [7]:
df['Pclass'].value_counts()

Pclass
3    491
1    216
2    184
Name: count, dtype: int64

In [8]:
df.describe()

Unnamed: 0,PassengerId,Survived,Pclass,Age,SibSp,Parch,Fare
count,891.0,891.0,891.0,714.0,891.0,891.0,891.0
mean,446.0,0.383838,2.308642,29.699118,0.523008,0.381594,32.204208
std,257.353842,0.486592,0.836071,14.526497,1.102743,0.806057,49.693429
min,1.0,0.0,1.0,0.42,0.0,0.0,0.0
25%,223.5,0.0,2.0,20.125,0.0,0.0,7.9104
50%,446.0,0.0,3.0,28.0,0.0,0.0,14.4542
75%,668.5,1.0,3.0,38.0,1.0,0.0,31.0
max,891.0,1.0,3.0,80.0,8.0,6.0,512.3292


# 2. Make DataFrame¶


In [9]:
df_empty=pd.DataFrame()
df_empty.head()

In [10]:
df_empty.shape

(0, 0)

In [11]:
employee_dict={'Name':['A','B','C'],'Age':[24,34,28],'Roll':[1,2,3]}
employee_dict

{'Name': ['A', 'B', 'C'], 'Age': [24, 34, 28], 'Roll': [1, 2, 3]}

In [12]:
df_student=pd.DataFrame(employee_dict).reset_index(drop=True)
df_student.head()

Unnamed: 0,Name,Age,Roll
0,A,24,1
1,B,34,2
2,C,28,3


# 3. Handling null values¶


In [13]:
import numpy as np
import pandas as pd 

In [14]:

train=pd.read_csv('data/titanicdata.csv')
df=train.copy()

In [15]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked
0,1,0,3,"Braund, Mr. Owen Harris",male,22.0,1,0,A/5 21171,7.25,,S
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",female,38.0,1,0,PC 17599,71.2833,C85,C
2,3,1,3,"Heikkinen, Miss. Laina",female,26.0,0,0,STON/O2. 3101282,7.925,,S
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",female,35.0,1,0,113803,53.1,C123,S
4,5,0,3,"Allen, Mr. William Henry",male,35.0,0,0,373450,8.05,,S


In [16]:
df.isnull().sum()

PassengerId      0
Survived         0
Pclass           0
Name             0
Sex              0
Age            177
SibSp            0
Parch            0
Ticket           0
Fare             0
Cabin          687
Embarked         2
dtype: int64

In [17]:
df['Age'].isnull().sum()

177

In [18]:
df['Age'].fillna(df['Age'].mean(),inplace=True)

The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.

For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.


  df['Age'].fillna(df['Age'].mean(),inplace=True)


In [19]:
df['Age'].isnull().sum()

0

In [20]:
df['Sex'].fillna(df['Sex'].mode(),inplace=True)

The behavior will change in pandas 3.0. This inplace method will never work because the intermediate object on which we are setting values always behaves as a copy.

For example, when doing 'df[col].method(value, inplace=True)', try using 'df.method({col: value}, inplace=True)' or df[col] = df[col].method(value) instead, to perform the operation inplace on the original object.


  df['Sex'].fillna(df['Sex'].mode(),inplace=True)


In [21]:
df['Sex'].isnull().sum()

0

# 4. Update/Add new column(s).¶


In [22]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked
0,1,0,3,"Braund, Mr. Owen Harris",male,22.0,1,0,A/5 21171,7.25,,S
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",female,38.0,1,0,PC 17599,71.2833,C85,C
2,3,1,3,"Heikkinen, Miss. Laina",female,26.0,0,0,STON/O2. 3101282,7.925,,S
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",female,35.0,1,0,113803,53.1,C123,S
4,5,0,3,"Allen, Mr. William Henry",male,35.0,0,0,373450,8.05,,S


In [23]:
df['Sex']=df['Sex'].map({'male':'0','female':1})

In [24]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,A/5 21171,7.25,,S
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,PC 17599,71.2833,C85,C
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,STON/O2. 3101282,7.925,,S
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,113803,53.1,C123,S
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,373450,8.05,,S


In [25]:
df['last_name']=df['Name'].apply(lambda x:x.split(',')[0])

In [26]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked,last_name
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,A/5 21171,7.25,,S,Braund
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,PC 17599,71.2833,C85,C,Cumings
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,STON/O2. 3101282,7.925,,S,Heikkinen
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,113803,53.1,C123,S,Futrelle
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,373450,8.05,,S,Allen


In [27]:
df['first_name']=df['Name'].apply(lambda x:' '.join(x.split(',')[1:]))

In [28]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked,last_name,first_name
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,A/5 21171,7.25,,S,Braund,Mr. Owen Harris
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,PC 17599,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer)
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,STON/O2. 3101282,7.925,,S,Heikkinen,Miss. Laina
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,113803,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel)
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,373450,8.05,,S,Allen,Mr. William Henry


In [29]:
df['ThirdAndMen']=df.apply(lambda row:int(row['Pclass']==3 and row['Sex']=="0"),axis=1)
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,A/5 21171,7.25,,S,Braund,Mr. Owen Harris,1
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,PC 17599,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,STON/O2. 3101282,7.925,,S,Heikkinen,Miss. Laina,0
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,113803,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,373450,8.05,,S,Allen,Mr. William Henry,1


In [30]:
def findAgeGroupFun(ageValue):
    if ageValue<=18:
        return 1
    elif ageValue>=19 and ageValue<=45:
        return 2
    else:
        return 3

In [31]:
df['Age_group']=df['Age'].apply(lambda x:findAgeGroupFun(x))

In [32]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,A/5 21171,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,PC 17599,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,STON/O2. 3101282,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,113803,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,373450,8.05,,S,Allen,Mr. William Henry,1,2


# 5. Deleting columns¶


In [33]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Ticket,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,A/5 21171,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,PC 17599,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,STON/O2. 3101282,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,113803,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,373450,8.05,,S,Allen,Mr. William Henry,1,2


In [34]:
df=df.drop(['Ticket'],axis=1)

In [35]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


# 6. Renaming columns¶


In [36]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Name,Sex,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [37]:
df=df.rename(columns={'Sex':'Gender','Name':'Full Name'})

In [38]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


# 7 Slicing DataFrame¶


In [39]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [40]:
df_second_class=df[df['Pclass']==2].reset_index(drop=True)


In [41]:
df_second_class.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,10,1,2,"Nasser, Mrs. Nicholas (Adele Achem)",1,14.0,1,0,30.0708,,C,Nasser,Mrs. Nicholas (Adele Achem),0,1
1,16,1,2,"Hewlett, Mrs. (Mary D Kingcome)",1,55.0,0,0,16.0,,S,Hewlett,Mrs. (Mary D Kingcome),0,3
2,18,1,2,"Williams, Mr. Charles Eugene",0,29.699118,0,0,13.0,,S,Williams,Mr. Charles Eugene,0,2
3,21,0,2,"Fynney, Mr. Joseph J",0,35.0,0,0,26.0,,S,Fynney,Mr. Joseph J,0,2
4,22,1,2,"Beesley, Mr. Lawrence",0,34.0,0,0,13.0,D56,S,Beesley,Mr. Lawrence,0,2


# Female with age>65


In [42]:
df_aged=df[(df['Age']>60)]

In [43]:
df_aged.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
33,34,0,2,"Wheadon, Mr. Edward H",0,66.0,0,0,10.5,,S,Wheadon,Mr. Edward H,0,3
54,55,0,1,"Ostby, Mr. Engelhart Cornelius",0,65.0,0,1,61.9792,B30,C,Ostby,Mr. Engelhart Cornelius,0,3
96,97,0,1,"Goldschmidt, Mr. George B",0,71.0,0,0,34.6542,A5,C,Goldschmidt,Mr. George B,0,3
116,117,0,3,"Connors, Mr. Patrick",0,70.5,0,0,7.75,,Q,Connors,Mr. Patrick,1,3
170,171,0,1,"Van der hoef, Mr. Wyckoff",0,61.0,0,0,33.5,B19,S,Van der hoef,Mr. Wyckoff,0,3


In [44]:
df['Gender'].value_counts()

Gender
0    577
1    314
Name: count, dtype: int64

In [45]:
df_aged['Gender'].value_counts()

Gender
0    19
1     3
Name: count, dtype: int64

In [46]:
df_aged=df[(df['Age']>60) &(df['Gender']=="0")]
df_aged.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
33,34,0,2,"Wheadon, Mr. Edward H",0,66.0,0,0,10.5,,S,Wheadon,Mr. Edward H,0,3
54,55,0,1,"Ostby, Mr. Engelhart Cornelius",0,65.0,0,1,61.9792,B30,C,Ostby,Mr. Engelhart Cornelius,0,3
96,97,0,1,"Goldschmidt, Mr. George B",0,71.0,0,0,34.6542,A5,C,Goldschmidt,Mr. George B,0,3
116,117,0,3,"Connors, Mr. Patrick",0,70.5,0,0,7.75,,Q,Connors,Mr. Patrick,1,3
170,171,0,1,"Van der hoef, Mr. Wyckoff",0,61.0,0,0,33.5,B19,S,Van der hoef,Mr. Wyckoff,0,3


# 8  Slicing dataframe columns

In [47]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [48]:
df1=df[['Full Name','Age','Pclass','Gender']]

In [49]:
df1.head()

Unnamed: 0,Full Name,Age,Pclass,Gender
0,"Braund, Mr. Owen Harris",22.0,3,0
1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",38.0,1,1
2,"Heikkinen, Miss. Laina",26.0,3,1
3,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",35.0,1,1
4,"Allen, Mr. William Henry",35.0,3,0


In [50]:
data_types=['int16','int32','int64','float16','float32','float64']

In [51]:
df_num=df.select_dtypes(include=data_types)


In [52]:
df_num.head()

Unnamed: 0,PassengerId,Survived,Pclass,Age,SibSp,Parch,Fare,ThirdAndMen,Age_group
0,1,0,3,22.0,1,0,7.25,1,2
1,2,1,1,38.0,1,0,71.2833,0,2
2,3,1,3,26.0,0,0,7.925,0,2
3,4,1,1,35.0,1,0,53.1,0,2
4,5,0,3,35.0,0,0,8.05,1,2


In [53]:
df_categorical=df.select_dtypes(include=['object'])

In [54]:
df_categorical.head()

Unnamed: 0,Full Name,Gender,Cabin,Embarked,last_name,first_name
0,"Braund, Mr. Owen Harris",0,,S,Braund,Mr. Owen Harris
1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer)
2,"Heikkinen, Miss. Laina",1,,S,Heikkinen,Miss. Laina
3,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel)
4,"Allen, Mr. William Henry",0,,S,Allen,Mr. William Henry


# 9 . Slicing using iloc and loc¶


In [55]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [56]:
df_sub1=df.iloc[0:100,:]
df_sub1.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [57]:
df_sub1.shape

(100, 15)

In [64]:
df_sub1=df.iloc[0:300,[1,8]]

In [65]:
df_sub1.head()

Unnamed: 0,Survived,Fare
0,0,7.25
1,1,71.2833
2,1,7.925
3,1,53.1
4,0,8.05


In [66]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [67]:
df_sub2=df.loc[:500,:]

In [68]:
df_sub2.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [69]:
df_sub2.shape

(501, 15)

In [75]:
df_sub3=df.loc[(df['Age']>60),['Full Name','Gender','Age']].reset_index(drop=True)

In [76]:
df_sub3.head()

Unnamed: 0,Full Name,Gender,Age
0,"Wheadon, Mr. Edward H",0,66.0
1,"Ostby, Mr. Engelhart Cornelius",0,65.0
2,"Goldschmidt, Mr. George B",0,71.0
3,"Connors, Mr. Patrick",0,70.5
4,"Van der hoef, Mr. Wyckoff",0,61.0


# 10 . Adding a row¶


In [77]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1,0,3,"Braund, Mr. Owen Harris",0,22.0,1,0,7.25,,S,Braund,Mr. Owen Harris,1,2
1,2,1,1,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1,0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0,2
2,3,1,3,"Heikkinen, Miss. Laina",1,26.0,0,0,7.925,,S,Heikkinen,Miss. Laina,0,2
3,4,1,1,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1,0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0,2
4,5,0,3,"Allen, Mr. William Henry",0,35.0,0,0,8.05,,S,Allen,Mr. William Henry,1,2


In [78]:
row=dict({'Age':24,'Full Name':'Rahul Raj','Survived':'Y'})

In [80]:
df=pd.concat([df,pd.DataFrame([row])],ignore_index=True)

In [82]:
df.tail()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
887,888.0,1,1.0,"Graham, Miss. Margaret Edith",1.0,19.0,0.0,0.0,30.0,B42,S,Graham,Miss. Margaret Edith,0.0,2.0
888,889.0,0,3.0,"Johnston, Miss. Catherine Helen ""Carrie""",1.0,29.699118,1.0,2.0,23.45,,S,Johnston,"Miss. Catherine Helen ""Carrie""",0.0,2.0
889,890.0,1,1.0,"Behr, Mr. Karl Howell",0.0,26.0,0.0,0.0,30.0,C148,C,Behr,Mr. Karl Howell,0.0,2.0
890,891.0,0,3.0,"Dooley, Mr. Patrick",0.0,32.0,0.0,0.0,7.75,,Q,Dooley,Mr. Patrick,1.0,2.0
891,,Y,,Rahul Raj,,24.0,,,,,,,,,


In [83]:
df.shape

(892, 15)

# 11. Dropping row(s)¶


In [85]:
df=df.drop(df.index[-1],axis=0)
df.tail()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
885,886.0,0,3.0,"Rice, Mrs. William (Margaret Norton)",1,39.0,0.0,5.0,29.125,,Q,Rice,Mrs. William (Margaret Norton),0.0,2.0
886,887.0,0,2.0,"Montvila, Rev. Juozas",0,27.0,0.0,0.0,13.0,,S,Montvila,Rev. Juozas,0.0,2.0
887,888.0,1,1.0,"Graham, Miss. Margaret Edith",1,19.0,0.0,0.0,30.0,B42,S,Graham,Miss. Margaret Edith,0.0,2.0
888,889.0,0,3.0,"Johnston, Miss. Catherine Helen ""Carrie""",1,29.699118,1.0,2.0,23.45,,S,Johnston,"Miss. Catherine Helen ""Carrie""",0.0,2.0
889,890.0,1,1.0,"Behr, Mr. Karl Howell",0,26.0,0.0,0.0,30.0,C148,C,Behr,Mr. Karl Howell,0.0,2.0


In [86]:
df.shape

(890, 15)

# 12. Sorting¶


In [87]:
df.head()

Unnamed: 0,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,1.0,0,3.0,"Braund, Mr. Owen Harris",0,22.0,1.0,0.0,7.25,,S,Braund,Mr. Owen Harris,1.0,2.0
1,2.0,1,1.0,"Cumings, Mrs. John Bradley (Florence Briggs Th...",1,38.0,1.0,0.0,71.2833,C85,C,Cumings,Mrs. John Bradley (Florence Briggs Thayer),0.0,2.0
2,3.0,1,3.0,"Heikkinen, Miss. Laina",1,26.0,0.0,0.0,7.925,,S,Heikkinen,Miss. Laina,0.0,2.0
3,4.0,1,1.0,"Futrelle, Mrs. Jacques Heath (Lily May Peel)",1,35.0,1.0,0.0,53.1,C123,S,Futrelle,Mrs. Jacques Heath (Lily May Peel),0.0,2.0
4,5.0,0,3.0,"Allen, Mr. William Henry",0,35.0,0.0,0.0,8.05,,S,Allen,Mr. William Henry,1.0,2.0


In [96]:
df=df.sort_values(by=['Age'],ascending=False).reset_index(drop=True)

In [97]:
df.head()

Unnamed: 0,index,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,630,631.0,1,1.0,"Barkworth, Mr. Algernon Henry Wilson",0,80.0,0.0,0.0,30.0,A23,S,Barkworth,Mr. Algernon Henry Wilson,0.0,3.0
1,851,852.0,0,3.0,"Svensson, Mr. Johan",0,74.0,0.0,0.0,7.775,,S,Svensson,Mr. Johan,1.0,3.0
2,493,494.0,0,1.0,"Artagaveytia, Mr. Ramon",0,71.0,0.0,0.0,49.5042,,C,Artagaveytia,Mr. Ramon,0.0,3.0
3,96,97.0,0,1.0,"Goldschmidt, Mr. George B",0,71.0,0.0,0.0,34.6542,A5,C,Goldschmidt,Mr. George B,0.0,3.0
4,116,117.0,0,3.0,"Connors, Mr. Patrick",0,70.5,0.0,0.0,7.75,,Q,Connors,Mr. Patrick,1.0,3.0


# 13. Joins¶


In [101]:
serianlnum=[ i+1 for i in range(100)]
type(serianlnum)

list

In [100]:
marks=np.random.randint(100,size=100)
marks
type(marks)

numpy.ndarray

In [102]:
marks_dataframe=pd.DataFrame({'Serialnumb':serianlnum,'marks':marks})

In [103]:
marks_dataframe.head()

Unnamed: 0,Serialnumb,marks
0,1,86
1,2,72
2,3,56
3,4,85
4,5,45


In [116]:
marks_dataframe.shape

(100, 2)

In [112]:
serianlnum2=[ i+1 for i in range(100)]
age=np.random.randint(10,100,size=100)
age_dataframe=pd.DataFrame({'Serialnumb':serianlnum2,'Age':age})

In [113]:
age_dataframe.head()

Unnamed: 0,Serialnumb,Age
0,1,87
1,2,97
2,3,35
3,4,80
4,5,74


In [115]:
age_dataframe.shape

(100, 2)

In [114]:
cross_join_df=pd.merge(marks_dataframe,age_dataframe,how='cross')
cross_join_df.head()

Unnamed: 0,Serialnumb_x,marks,Serialnumb_y,Age
0,1,86,1,87
1,1,86,2,97
2,1,86,3,35
3,1,86,4,80
4,1,86,5,74


In [118]:
cross_join_df.tail()


Unnamed: 0,Serialnumb_x,marks,Serialnumb_y,Age
9995,100,39,96,48
9996,100,39,97,29
9997,100,39,98,94
9998,100,39,99,51
9999,100,39,100,31


In [117]:
cross_join_df.shape

(10000, 4)

In [125]:
serianlnum2=[ i+1 for i in range(200)]
age=np.random.randint(10,100,size=200)
age_dataframe=pd.DataFrame({'Serialnumb':serianlnum2,'Age':age})

In [126]:
age_dataframe.shape

(200, 2)

In [127]:
marks_dataframe.shape

(100, 2)

In [129]:
inner_join=pd.merge(marks_dataframe,age_dataframe,how='inner',on='Serialnumb')

In [130]:
inner_join.head()

Unnamed: 0,Serialnumb,marks,Age
0,1,86,89
1,2,72,67
2,3,56,83
3,4,85,99
4,5,45,94


In [131]:
inner_join.shape

(100, 3)

In [132]:
inner_join.tail()

Unnamed: 0,Serialnumb,marks,Age
95,96,56,86
96,97,76,57
97,98,77,90
98,99,80,12
99,100,39,47


In [136]:
left_join=pd.merge(age_dataframe,marks_dataframe,how='left',on='Serialnumb')

In [137]:
left_join.head()

Unnamed: 0,Serialnumb,Age,marks
0,1,89,86.0
1,2,67,72.0
2,3,83,56.0
3,4,99,85.0
4,5,94,45.0


In [138]:
left_join.shape

(200, 3)

In [139]:
right_join=pd.merge(age_dataframe,marks_dataframe,how='right',on='Serialnumb')

In [140]:
right_join.head()

Unnamed: 0,Serialnumb,Age,marks
0,1,89,86
1,2,67,72
2,3,83,56
3,4,99,85
4,5,94,45


In [141]:
right_join.shape

(100, 3)

# 14. Groupby¶


In [142]:
df.head()

Unnamed: 0,index,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,630,631.0,1,1.0,"Barkworth, Mr. Algernon Henry Wilson",0,80.0,0.0,0.0,30.0,A23,S,Barkworth,Mr. Algernon Henry Wilson,0.0,3.0
1,851,852.0,0,3.0,"Svensson, Mr. Johan",0,74.0,0.0,0.0,7.775,,S,Svensson,Mr. Johan,1.0,3.0
2,493,494.0,0,1.0,"Artagaveytia, Mr. Ramon",0,71.0,0.0,0.0,49.5042,,C,Artagaveytia,Mr. Ramon,0.0,3.0
3,96,97.0,0,1.0,"Goldschmidt, Mr. George B",0,71.0,0.0,0.0,34.6542,A5,C,Goldschmidt,Mr. George B,0.0,3.0
4,116,117.0,0,3.0,"Connors, Mr. Patrick",0,70.5,0.0,0.0,7.75,,Q,Connors,Mr. Patrick,1.0,3.0


In [None]:
group_pclass=df.groupby(['Pclass'])

In [151]:
group_pclass.get_group(1)

  group_pclass.get_group(1)


Unnamed: 0,index,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,630,631.0,1,1.0,"Barkworth, Mr. Algernon Henry Wilson",0,80.00,0.0,0.0,30.0000,A23,S,Barkworth,Mr. Algernon Henry Wilson,0.0,3.0
2,493,494.0,0,1.0,"Artagaveytia, Mr. Ramon",0,71.00,0.0,0.0,49.5042,,C,Artagaveytia,Mr. Ramon,0.0,3.0
3,96,97.0,0,1.0,"Goldschmidt, Mr. George B",0,71.00,0.0,0.0,34.6542,A5,C,Goldschmidt,Mr. George B,0.0,3.0
6,745,746.0,0,1.0,"Crosby, Capt. Edward Gifford",0,70.00,1.0,1.0,71.0000,B22,S,Crosby,Capt. Edward Gifford,0.0,3.0
9,54,55.0,0,1.0,"Ostby, Mr. Engelhart Cornelius",0,65.00,0.0,1.0,61.9792,B30,C,Ostby,Mr. Engelhart Cornelius,0.0,3.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
813,435,436.0,1,1.0,"Carter, Miss. Lucile Polk",1,14.00,1.0,2.0,120.0000,B96 B98,S,Carter,Miss. Lucile Polk,0.0,1.0
823,802,803.0,1,1.0,"Carter, Master. William Thornton II",0,11.00,1.0,2.0,120.0000,B96 B98,S,Carter,Master. William Thornton II,0.0,1.0
857,445,446.0,1,1.0,"Dodge, Master. Washington",0,4.00,0.0,2.0,81.8583,A34,S,Dodge,Master. Washington,0.0,1.0
873,297,298.0,0,1.0,"Allison, Miss. Helen Loraine",1,2.00,1.0,2.0,151.5500,C22 C26,S,Allison,Miss. Helen Loraine,0.0,1.0


In [152]:
group_pclass.get_group(2)

  group_pclass.get_group(2)


Unnamed: 0,index,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
5,672,673.0,0,2.0,"Mitchell, Mr. Henry Michael",0,70.00,0.0,0.0,10.5000,,S,Mitchell,Mr. Henry Michael,0.0,3.0
7,33,34.0,0,2.0,"Wheadon, Mr. Edward H",0,66.00,0.0,0.0,10.5000,,S,Wheadon,Mr. Edward H,0.0,3.0
15,570,571.0,1,2.0,"Harris, Mr. George",0,62.00,0.0,0.0,10.5000,,S,Harris,Mr. George,0.0,3.0
23,684,685.0,0,2.0,"Brown, Mr. Thomas William Solomon",0,60.00,1.0,1.0,39.0000,,S,Brown,Mr. Thomas William Solomon,0.0,3.0
26,232,233.0,0,2.0,"Sjostedt, Mr. Ernst Adolf",0,59.00,0.0,0.0,13.5000,,S,Sjostedt,Mr. Ernst Adolf,0.0,3.0
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
876,183,184.0,1,2.0,"Becker, Master. Richard F",0,1.00,2.0,1.0,39.0000,F4,S,Becker,Master. Richard F,0.0,1.0
877,827,828.0,1,2.0,"Mallet, Master. Andre",0,1.00,0.0,2.0,37.0042,,C,Mallet,Master. Andre,0.0,1.0
884,831,832.0,1,2.0,"Richards, Master. George Sibley",0,0.83,1.0,1.0,18.7500,,S,Richards,Master. George Sibley,0.0,1.0
885,78,79.0,1,2.0,"Caldwell, Master. Alden Gates",0,0.83,0.0,2.0,29.0000,,S,Caldwell,Master. Alden Gates,0.0,1.0


In [153]:
df1=df.groupby(['Pclass'])


In [154]:
df1.head()

Unnamed: 0,index,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,630,631.0,1,1.0,"Barkworth, Mr. Algernon Henry Wilson",0,80.0,0.0,0.0,30.0,A23,S,Barkworth,Mr. Algernon Henry Wilson,0.0,3.0
1,851,852.0,0,3.0,"Svensson, Mr. Johan",0,74.0,0.0,0.0,7.775,,S,Svensson,Mr. Johan,1.0,3.0
2,493,494.0,0,1.0,"Artagaveytia, Mr. Ramon",0,71.0,0.0,0.0,49.5042,,C,Artagaveytia,Mr. Ramon,0.0,3.0
3,96,97.0,0,1.0,"Goldschmidt, Mr. George B",0,71.0,0.0,0.0,34.6542,A5,C,Goldschmidt,Mr. George B,0.0,3.0
4,116,117.0,0,3.0,"Connors, Mr. Patrick",0,70.5,0.0,0.0,7.75,,Q,Connors,Mr. Patrick,1.0,3.0
5,672,673.0,0,2.0,"Mitchell, Mr. Henry Michael",0,70.0,0.0,0.0,10.5,,S,Mitchell,Mr. Henry Michael,0.0,3.0
6,745,746.0,0,1.0,"Crosby, Capt. Edward Gifford",0,70.0,1.0,1.0,71.0,B22,S,Crosby,Capt. Edward Gifford,0.0,3.0
7,33,34.0,0,2.0,"Wheadon, Mr. Edward H",0,66.0,0.0,0.0,10.5,,S,Wheadon,Mr. Edward H,0.0,3.0
8,280,281.0,0,3.0,"Duane, Mr. Frank",0,65.0,0.0,0.0,7.75,,Q,Duane,Mr. Frank,1.0,3.0
9,54,55.0,0,1.0,"Ostby, Mr. Engelhart Cornelius",0,65.0,0.0,1.0,61.9792,B30,C,Ostby,Mr. Engelhart Cornelius,0.0,3.0


In [156]:
df1['Age'].mean()

Pclass
1.0    37.048118
2.0    29.866958
3.0    26.391837
Name: Age, dtype: float64

In [157]:
df1['Age'].max()

Pclass
1.0    80.0
2.0    70.0
3.0    74.0
Name: Age, dtype: float64

In [158]:
df1['Age'].min()

Pclass
1.0    0.92
2.0    0.67
3.0    0.42
Name: Age, dtype: float64

In [160]:
df1['Pclass'].count()

Pclass
1.0    216
2.0    184
3.0    490
Name: Pclass, dtype: int64

In [161]:
df_grp2=df.groupby(['Pclass']).agg({'Age':lambda x: np.mean(x)})

In [162]:
df_grp2.head()

Unnamed: 0_level_0,Age
Pclass,Unnamed: 1_level_1
1.0,37.048118
2.0,29.866958
3.0,26.391837


In [163]:
df_grp2=df.groupby(['Pclass']).agg({'Age':lambda x: np.mean(x)}).rename(columns={'Age':'Mean Age'})

In [164]:
df_grp2.head()

Unnamed: 0_level_0,Mean Age
Pclass,Unnamed: 1_level_1
1.0,37.048118
2.0,29.866958
3.0,26.391837


In [166]:
df_group3=df.groupby(['Pclass']).agg({'Full Name':lambda x:", ".join(x)})

In [167]:
df_group3.head()

Unnamed: 0_level_0,Full Name
Pclass,Unnamed: 1_level_1
1.0,"Barkworth, Mr. Algernon Henry Wilson, Artagave..."
2.0,"Mitchell, Mr. Henry Michael, Wheadon, Mr. Edwa..."
3.0,"Svensson, Mr. Johan, Connors, Mr. Patrick, Dua..."


In [168]:
df_group4=df.groupby(['Pclass']).agg({'Age':['max','min']})

In [169]:
df_group4.head()

Unnamed: 0_level_0,Age,Age
Unnamed: 0_level_1,max,min
Pclass,Unnamed: 1_level_2,Unnamed: 2_level_2
1.0,80.0,0.92
2.0,70.0,0.67
3.0,74.0,0.42


# 15: Iterating over rows in dataframe¶


In [170]:
df.head()

Unnamed: 0,index,PassengerId,Survived,Pclass,Full Name,Gender,Age,SibSp,Parch,Fare,Cabin,Embarked,last_name,first_name,ThirdAndMen,Age_group
0,630,631.0,1,1.0,"Barkworth, Mr. Algernon Henry Wilson",0,80.0,0.0,0.0,30.0,A23,S,Barkworth,Mr. Algernon Henry Wilson,0.0,3.0
1,851,852.0,0,3.0,"Svensson, Mr. Johan",0,74.0,0.0,0.0,7.775,,S,Svensson,Mr. Johan,1.0,3.0
2,493,494.0,0,1.0,"Artagaveytia, Mr. Ramon",0,71.0,0.0,0.0,49.5042,,C,Artagaveytia,Mr. Ramon,0.0,3.0
3,96,97.0,0,1.0,"Goldschmidt, Mr. George B",0,71.0,0.0,0.0,34.6542,A5,C,Goldschmidt,Mr. George B,0.0,3.0
4,116,117.0,0,3.0,"Connors, Mr. Patrick",0,70.5,0.0,0.0,7.75,,Q,Connors,Mr. Patrick,1.0,3.0


In [172]:
for index,row in df.iterrows():
    print(row['Full Name'])

Barkworth, Mr. Algernon Henry Wilson
Svensson, Mr. Johan
Artagaveytia, Mr. Ramon
Goldschmidt, Mr. George B
Connors, Mr. Patrick
Mitchell, Mr. Henry Michael
Crosby, Capt. Edward Gifford
Wheadon, Mr. Edward H
Duane, Mr. Frank
Ostby, Mr. Engelhart Cornelius
Millet, Mr. Francis Davis
Fortune, Mr. Mark
Nicholson, Mr. Arthur Ernest
Turkula, Mrs. (Hedwig)
Andrews, Miss. Kornelia Theodosia
Harris, Mr. George
Wright, Mr. George
Stead, Mr. William Thomas
Stone, Mrs. George Nelson (Martha Evelyn)
Sutton, Mr. Frederick
Van der hoef, Mr. Wyckoff
Nysveen, Mr. Johan Hansen
Warren, Mrs. Frank Manley (Anna Sophia Atkinson)
Brown, Mr. Thomas William Solomon
Weir, Col. John
Frolicher-Stehli, Mr. Maxmillian
Sjostedt, Mr. Ernst Adolf
Coxon, Mr. Daniel
Lurette, Miss. Elise
Newell, Mr. Arthur Webster
Bonnell, Miss. Elizabeth
Kent, Mr. Edward Austin
Graham, Mrs. William Thompson (Edith Junkins)
Kirkland, Rev. Charles Leonard
Mack, Mrs. (Mary)
Simonius-Blumer, Col. Oberst Alfons
Smith, Mr. James Clinch
Smart, 