In [1]:
# import relevant libraries

import pandas as pd

In [2]:
# Load the raw contract records from the CSV file that sits next to this notebook

raw_csv_path = "./contract_data_ppa_gh.csv"
gh_contract_data = pd.read_csv(raw_csv_path)

In [3]:
# Preview the raw data: head() with no argument displays the first 5 rows
# (all columns), which is enough to spot the redundant 'Unnamed: 0' column
# and the trailing ':' on every column name.

gh_contract_data.head()

Unnamed: 0.1,Unnamed: 0,Awarding Agency:,Tender Package No:,Tender Type:,Contract Type:,Lot #:,Tender Description:,Approval Auth:,Justification:,Contract Date:,Completion Date:,Contract Currency:,Contract Award Price:,Contract Awarded To:,Company Email:,Company Address:,Company Tel:,Supplier #:
0,0.0,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 9-SAN-DAG/12/18,-,Restricted Tender,LOT 9,Construction of small earth dams to store wate...,ETC/PPA,40 (1)b - Urgency,"10th May, 2019","20th May, 2020",Ghana Cedi,Gh¢4962525.82,Ashcarl Investment Ltd,,P. O. Box 2310\r\nTamale\r,,-
1,1.0,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 1-VUN-NAM/12/18,-,Restricted Tender,LOT 1,Construction of Small earth dams at Vunania an...,ETC/PPA,40 (1)b - Urgency,"10th May, 2019","12th May, 2020",Ghana Cedi,Gh¢5087867.52,ALZAK COMPANY LIMITED,info@alzak.com,-,-,-
2,2.0,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 3-KATAA/12/18,-,Restricted Tender,LOT 3,Construction of small earth dam at Kataa for a...,ETC/PPA,40 (1)b - Urgency,"10th May, 2019","14th January, 2020",Ghana Cedi,Gh¢2489286.20,QUALITY ASSURED ENGINEERING COMPANY,info@qualityassured.com,-,0,-
3,3.0,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 4-DUONG/12/18,-,Restricted Tender,LOT 4,Construction of small earth dam at Doung to st...,ETC/PPA,40 (1)b - Urgency,"10th May, 2019","14th January, 2020",Ghana Cedi,Gh¢2576940.88,HANDOSKY INTERNATIONAL LIMITED,support@HANDOSKY.com,-,-,-
4,4.0,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 5-DOUSE/12/18,-,Restricted Tender,LOT 5,Construction of small earth dams at Douse to s...,ETC/PPA,40 (1)b - Urgency,"10th May, 2019","14th January, 2020",Ghana Cedi,Gh¢2435596.41,WAALE CONSTRUCTION WORKS LIMITED,WAALE@yahoo.com,-,-,-


In [4]:
# Drop the 'Unnamed: 0' column, which only duplicates the row index.
# errors='ignore' keeps this cell idempotent: re-running it after the column
# is already gone is a no-op instead of raising KeyError. The result is
# reassigned rather than mutated in place so the cell has no hidden side effect.

gh_contract_data = gh_contract_data.drop(columns=['Unnamed: 0'], errors='ignore')

In [5]:
# Strip the trailing ':' from column names (e.g. 'Contract Date:' -> 'Contract Date').
# Only names that actually end with ':' are shortened, so running this cell a
# second time (or meeting a column without the suffix) never chops a real
# character off the name. Names are still normalised to str, as before.

gh_contract_data = gh_contract_data.rename(
    columns=lambda name: str(name)[:-1] if str(name).endswith(':') else str(name)
)

In [6]:
# Parse the two date columns into datetime64 values.
# errors='coerce' turns any value that cannot be parsed into NaT instead of raising.

for date_column in ('Contract Date', 'Completion Date'):
    gh_contract_data[date_column] = pd.to_datetime(
        gh_contract_data[date_column], errors='coerce'
    )

In [7]:
# Strip the currency characters off the amount, keeping only the numeric text
# (e.g. 'Gh¢4962525.82' -> '4962525.82'). The column stays as strings here;
# the conversion to float happens in the next cell.
#
# - Raw string with an escaped '.', so the dot matches a literal decimal point
#   only and Python does not warn about the invalid '\d' escape sequence.
# - The fractional part is optional, so whole amounts of any length
#   (e.g. 'Gh¢50') are captured instead of becoming NaN.
# - Commas are removed first so a value such as '1,234.50' is read as 1234.50
#   rather than truncated at the separator.
#   NOTE(review): assumes ',' is only ever a thousands separator — confirm against the data.
# - expand=False returns a Series (not a one-column DataFrame) for the assignment.

gh_contract_data['Contract Award Price'] = (
    gh_contract_data['Contract Award Price']
    .str.replace(',', '', regex=False)
    .str.extract(r'(\d+(?:\.\d+)?)', expand=False)
)

In [8]:
# Cast the extracted amount strings to 64-bit floats so the column is numeric

price_col = 'Contract Award Price'
gh_contract_data[price_col] = gh_contract_data[price_col].astype('float64')

In [9]:
# View the data type of every column to confirm the conversions above:
# the two date columns should now be datetime64[ns] and
# 'Contract Award Price' should be float64.

gh_contract_data.dtypes

Awarding Agency                 object
Tender Package No               object
Tender Type                     object
Contract Type                   object
Lot #                           object
Tender Description              object
Approval Auth                   object
Justification                   object
Contract Date           datetime64[ns]
Completion Date         datetime64[ns]
Contract Currency               object
Contract Award Price           float64
Contract Awarded To             object
Company Email                   object
Company Address                 object
Company Tel                     object
Supplier #                      object
dtype: object

In [10]:
# Fill missing values in every object-dtype column with the '-' placeholder.
# Datetime and float columns are not selected, so their NaT/NaN values are left as they are.

is_object_col = gh_contract_data.dtypes.eq(object)
str_cols = gh_contract_data.columns[is_object_col]

gh_contract_data[str_cols] = gh_contract_data[str_cols].fillna(value='-')

In [11]:
# Preview the first 5 rows of the cleaned frame to check the renamed columns,
# parsed dates, numeric amounts and '-' placeholders.
gh_contract_data.head()

Unnamed: 0,Awarding Agency,Tender Package No,Tender Type,Contract Type,Lot #,Tender Description,Approval Auth,Justification,Contract Date,Completion Date,Contract Currency,Contract Award Price,Contract Awarded To,Company Email,Company Address,Company Tel,Supplier #
0,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 9-SAN-DAG/12/18,-,Restricted Tender,LOT 9,Construction of small earth dams to store wate...,ETC/PPA,40 (1)b - Urgency,2019-05-10,2020-05-20,Ghana Cedi,4962525.82,Ashcarl Investment Ltd,-,P. O. Box 2310\r\nTamale\r,-,-
1,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 1-VUN-NAM/12/18,-,Restricted Tender,LOT 1,Construction of Small earth dams at Vunania an...,ETC/PPA,40 (1)b - Urgency,2019-05-10,2020-05-12,Ghana Cedi,5087867.52,ALZAK COMPANY LIMITED,info@alzak.com,-,-,-
2,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 3-KATAA/12/18,-,Restricted Tender,LOT 3,Construction of small earth dam at Kataa for a...,ETC/PPA,40 (1)b - Urgency,2019-05-10,2020-01-14,Ghana Cedi,2489286.2,QUALITY ASSURED ENGINEERING COMPANY,info@qualityassured.com,-,0,-
3,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 4-DUONG/12/18,-,Restricted Tender,LOT 4,Construction of small earth dam at Doung to st...,ETC/PPA,40 (1)b - Urgency,2019-05-10,2020-01-14,Ghana Cedi,2576940.88,HANDOSKY INTERNATIONAL LIMITED,support@HANDOSKY.com,-,-,-
4,Ghana Irrigation Development Authority - Accra,MOFA/GIDA-IFT/LOT 5-DOUSE/12/18,-,Restricted Tender,LOT 5,Construction of small earth dams at Douse to s...,ETC/PPA,40 (1)b - Urgency,2019-05-10,2020-01-14,Ghana Cedi,2435596.41,WAALE CONSTRUCTION WORKS LIMITED,WAALE@yahoo.com,-,-,-


In [12]:
# Persist the cleaned dataframe as a CSV file in the current working directory.
# NOTE(review): to_csv writes the row index by default, so the file gains an
# unnamed leading column when read back; pass index=False if no downstream
# reader relies on that column — confirm before changing.

cleaned_csv_path = 'cleaned_gh_contract_data.csv'
gh_contract_data.to_csv(cleaned_csv_path)