#  Construction in Ireland: Cement Data 

CA2 (26/05/2023) - MSc in Data Analytics 
<b>Student ID: 2023063</b>

### Introduction 
**TODO:** write the introduction briefing.

### Data Preparation and Visualisation

In [1]:
# Import libraries

import pandas as pd

import warnings
# NOTE(review): with no category or module filter this hides every warning
# raised in the session, including deprecation notices from pandas.
warnings.filterwarnings('ignore') # To suppress the warnings
# Render figures inside the notebook output area.
%matplotlib inline 

In [2]:
# Load the cement dataset from its CSV file into a DataFrame

cement_data = pd.read_csv(filepath_or_buffer="cementdata.csv")

In [3]:
# Preview the first five rows of the dataset
cement_data.head(n=5)

Unnamed: 0,FACTOR,UNITS,2007,2008,2009,2010,2011,2012,2013,2014,2015,Country,Product
0,Consumption Volume,Thousand tons,3563.0,3489.0,1748.0,1704.0,1263.0,48.4,856.0,580.9,667.0,Ireland,Cement
1,Consumption Value,Million USD,264.3,267.4,159.1,160.8,137.1,7.7,101.4,69.2,83.4,Ireland,Cement
2,Production Volume,Thousand tons,4003.0,3900.0,2600.0,2600.0,2103.0,1198.0,2000.0,2000.0,2500.0,Ireland,Cement
3,Production Value,Million USD,146.7,160.2,175.1,191.3,209.0,228.4,234.9,237.6,323.7,Ireland,Cement
4,Import Volume,Thousand tons,684.4,735.4,204.1,138.7,104.3,90.7,92.3,106.7,89.8,Ireland,Cement


In [4]:
# Preview the last five rows of the dataset
cement_data.tail(n=5)

Unnamed: 0,FACTOR,UNITS,2007,2008,2009,2010,2011,2012,2013,2014,2015,Country,Product
125,Import Price,USD per Ton,81.5,97.6,225.8,343.0,773.8,189.3,330.6,225.8,275.3,Iran,Cement
126,Export Price,USD per Ton,91.9,97.2,76.4,76.5,62.5,62.5,59.6,74.5,59.7,Iran,Cement
127,Per Capita Consumption,Kg per Person,569.0,608.9,670.0,653.2,861.6,902.8,862.3,800.3,626.9,Iran,Cement
128,Net Export Volume,Thousand tons,11.1,43.8,631.5,1291.0,956.9,1227.0,1927.0,3951.0,8851.0,Iran,Cement
129,Net Export Value,Million USD,1.7,4.2,46.9,96.7,53.4,72.7,103.7,286.9,522.0,Iran,Cement


In [5]:
# Count of distinct countries present in the dataset

cement_data.loc[:, "Country"].nunique(dropna=True)

10

In [6]:
# Distinct country names, in order of first appearance

cement_data.loc[:, "Country"].unique()

array(['Ireland', 'USA', 'Brazil', 'China', 'Germany', 'Russia',
       'Australia', 'Vietnam', 'Japan', 'Iran'], dtype=object)

In [7]:
# Define function to split data by country

def cement_df(country, new_df=None, original_df=None):
    """Return one country's rows as a table indexed by the remaining columns.

    Rows of ``original_df`` whose ``"Country"`` value equals ``country`` are
    selected, the ``"Country"``, ``"Product"`` and ``"UNITS"`` columns are
    dropped, and the result is transposed. The first row of the transposed
    table (the first remaining column of the input, ``FACTOR`` in the cement
    data) is promoted to the column header and removed from the body, so the
    remaining column labels of the input (the year columns) form the index.

    Parameters
    ----------
    country : str
        Value to match in the ``"Country"`` column.
    new_df : object, optional
        Ignored. The function never used this value; it is kept only so that
        existing calls passing it keep working. Bind the return value to a
        variable instead.
    original_df : pandas.DataFrame
        Source table containing at least the ``"Country"``, ``"Product"`` and
        ``"UNITS"`` columns. The frame is not modified.

    Returns
    -------
    pandas.DataFrame
        A new transposed frame for the requested country.

    Raises
    ------
    TypeError
        If ``original_df`` is not supplied.
    ValueError
        If no row of ``original_df`` matches ``country``.
    """
    if original_df is None:
        raise TypeError("cement_df() missing required argument: 'original_df'")

    country_rows = original_df[original_df["Country"] == country]
    if country_rows.empty:
        # A misspelled country would otherwise yield a silent, empty table.
        raise ValueError(f"No rows found for country {country!r}")

    transposed = (
        country_rows
        .drop(columns=["Country", "Product", "UNITS"])
        .transpose()
    )
    # The first transposed row holds the labels that become the header.
    transposed.columns = transposed.iloc[0]
    # Non-mutating drop returns a fresh frame without the header row.
    return transposed.drop(index=transposed.index[0])

In [8]:
# Ireland cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
ireland_cement = cement_df(country="Ireland", new_df="ireland_cement", original_df=cement_data)
ireland_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,3563.0,264.3,4003.0,146.7,684.4,65.5,1124.0,105.5,95.7,93.9,810.1,439.6,40.0
2008,3489.0,267.4,3900.0,160.2,735.4,65.4,1146.0,112.0,88.9,97.7,777.2,410.8,46.6
2009,1748.0,159.1,2600.0,175.1,204.1,23.0,1056.0,101.9,112.6,96.5,382.6,852.0,78.9
2010,1704.0,160.8,2600.0,191.3,138.7,13.9,1035.0,104.7,99.9,101.2,368.2,896.5,90.9
2011,1263.0,137.1,2103.0,209.0,104.3,10.9,944.6,94.0,104.6,99.5,270.8,840.3,83.1
2012,48.4,7.7,1198.0,228.4,90.7,10.7,1240.0,111.2,118.5,89.6,10.4,1150.0,100.4
2013,856.0,101.4,2000.0,234.9,92.3,10.0,1236.0,110.6,107.8,89.5,182.8,1144.0,100.6
2014,580.9,69.2,2000.0,237.6,106.7,9.5,1526.0,148.0,88.9,97.0,124.0,1419.0,138.5
2015,667.0,83.4,2500.0,323.7,89.8,7.0,1923.0,145.4,78.1,75.6,141.9,1833.0,138.4


In [9]:
# United States cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
# NOTE(review): several negative values in the rendered output carry an
# invisible leading character (looks like U+FEFF) - presumably these are
# strings that need cleaning before numeric analysis; verify.
usa_cement = cement_df(country="USA", new_df="usa_cement", original_df=cement_data)
usa_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,117546.0,12055.0,96850.0,10153.0,21739.0,1693.0,1042.0,131.4,77.9,126.0,391.0,-20696.30,-1561.20
2008,97539.0,9737.0,87610.0,8915.0,10898.0,949.1,969.6,117.5,87.1,121.2,321.5,﻿-9928.3,﻿-831.6
2009,70200.0,6020.0,64843.0,5568.0,6338.0,561.4,980.2,117.5,88.6,119.9,229.4,﻿-5357.6,﻿-443.9
2010,71960.0,5503.0,67176.0,5064.0,6141.0,535.8,1357.0,184.3,87.3,135.8,233.1,﻿-4783.6,﻿-351.5
2011,72929.0,5674.0,68639.0,5278.0,5937.0,519.0,1646.0,211.3,87.4,128.3,234.5,﻿-4290.3,﻿-307.8
2012,79217.0,6069.0,74934.0,5661.0,6276.0,552.7,1993.0,259.1,88.1,130.0,252.8,﻿-4283,﻿-293.6
2013,82025.0,6901.0,77415.0,6506.0,6514.0,571.9,1904.0,257.7,87.8,135.4,260.0,﻿-4610,﻿-314.2
2014,86346.0,7237.0,83124.0,6956.0,6069.0,663.1,2847.0,264.2,109.3,92.8,271.8,﻿-3222,﻿-398.9
2015,101975.0,8547.0,93208.0,7800.0,10337.0,896.1,1571.0,240.1,86.7,152.9,318.7,﻿-8766.6,﻿-656


In [10]:
# Brazil cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
# NOTE(review): the rendered output shows '-74 8' for Net Export Value in
# 2010 - presumably a malformed '-74.8' in the CSV; verify and clean.
brazil_cement = cement_df(country="Brazil", new_df="brazil_cement", original_df=cement_data)
brazil_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,45592.0,3981.0,46551.0,3802.0,286.6,20.8,1246.0,62.3,72.5,50.0,238.7,959.20,41.50
2008,51654.0,5397.0,51970.0,5478.0,286.6,26.8,602.8,39.3,93.3,65.2,267.7,316.10,12.50
2009,52095.0,5174.0,51748.0,5086.0,397.0,39.4,49.6,5.1,99.3,102.9,267.3,﻿-347.4,﻿-34.3
2010,59937.0,6616.0,59118.0,6714.0,859.7,79.4,40.5,4.5,92.3,112.0,304.6,﻿-819.2,﻿-74 8
2011,65145.0,7906.0,64093.0,8250.0,1098.0,99.5,45.4,5.4,90.6,118.9,327.9,﻿-1052.3,-94.10
2012,70275.0,7580.0,69323.0,7631.0,985.6,92.1,33.5,4.4,93.4,131.2,350.4,﻿-952.1,﻿-87.7
2013,70976.0,7647.0,69975.0,7690.0,1034.0,92.9,32.7,4.2,89.8,129.3,350.7,﻿-1001.2,﻿-88.6
2014,72034.0,7739.0,71254.0,7801.0,823.9,77.0,43.7,5.5,93.4,126.5,352.7,﻿-780.2,﻿-71.4
2015,65649.0,5437.0,65283.0,4927.0,514.1,48.7,147.9,13.0,94.8,87.8,318.7,﻿-366.2,-35.70


In [11]:
# China cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
china_cement = cement_df(country="China", new_df="china_cement", original_df=cement_data)
china_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,1346507.0,58994.0,1361170.0,54201.0,532.4,22.4,15195.0,605.1,42.1,39.8,985.0,14663.0,582.6
2008,1387333.0,69244.0,1400000.0,66718.0,565.3,27.1,13232.0,630.6,47.9,47.7,1009.0,12667.0,603.5
2009,1636216.0,84842.0,1644000.0,82445.0,702.7,33.4,8487.0,425.6,47.5,50.1,1183.0,7784.0,392.2
2010,1870996.0,97491.0,1880000.0,94894.0,823.1,38.8,9827.0,496.0,47.2,50.5,1346.0,9004.0,457.2
2011,2091058.0,124781.0,2099000.0,126356.0,855.6,45.3,8798.0,529.6,52.9,60.2,1495.0,7943.0,484.4
2012,2201410.0,132310.0,2210000.0,134256.0,649.9,37.7,9240.0,561.3,57.9,60.7,1566.0,8590.0,523.7
2013,2400469.0,139494.0,2411000.0,140297.0,411.2,26.9,10942.0,636.7,65.3,58.2,1698.0,10531.0,609.9
2014,2482064.0,147064.0,2492000.0,148660.0,238.1,21.4,10174.0,606.9,89.8,59.7,1746.0,9936.0,585.5
2015,2349902.0,136241.0,2359000.0,136866.0,103.6,16.8,9202.0,533.9,162.3,58.0,1645.0,9098.0,517.1


In [12]:
# Germany cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
germany_cement = cement_df(country="Germany", new_df="germany_cement", original_df=cement_data)
germany_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,27566.0,2198.0,33382.0,2644.0,1144.0,160.9,6961.0,599.7,140.6,86.2,338.9,5816.0,438.8
2008,27452.0,2193.0,33581.0,2665.0,1064.0,173.2,7193.0,750.1,162.8,104.3,338.4,6129.0,576.9
2009,24918.0,2188.0,30441.0,2687.0,1025.0,159.6,6548.0,643.7,155.7,98.3,307.8,5523.0,484.0
2010,24756.0,2059.0,29894.0,2483.0,1046.0,166.2,6184.0,570.0,158.8,92.2,306.0,5138.0,403.8
2011,26766.0,2410.0,32779.0,2975.0,1117.0,184.3,7131.0,709.9,164.9,99.6,330.7,6014.0,525.6
2012,27169.0,2234.0,32432.0,2660.0,1277.0,181.1,6541.0,615.5,141.8,94.1,335.1,5263.0,434.3
2013,26602.0,2295.0,31308.0,2709.0,1344.0,203.5,6050.0,588.8,151.4,97.3,327.4,4706.0,385.3
2014,27677.0,2420.0,32099.0,2820.0,1325.0,208.8,5747.0,558.1,157.6,97.1,339.6,4422.0,349.3
2015,26207.0,1980.0,31160.0,2322.0,1308.0,177.2,6262.0,498.0,135.4,79.5,320.7,4953.0,320.8


In [13]:
# Russia cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
# NOTE(review): Production Value for 2007 renders as 61.46 while every other
# year is in the thousands - presumably a misplaced decimal in the CSV; verify.
russia_cement = cement_df(country="Russia", new_df="russia_cement", original_df=cement_data)
russia_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,60349.0,5694.0,59939.0,61.46,2066.0,206.6,1656.0,169.8,100.0,102.5,421.6,﻿-409.6,﻿-36.8
2008,58928.0,7027.0,53548.0,7563.0,5862.0,593.1,482.0,68.1,101.2,141.2,411.8,﻿-5380,﻿-525
2009,44046.0,3703.0,44266.0,3832.0,1124.0,88.6,1344.0,116.3,78.9,86.6,307.8,220.00,27.70
2010,50862.0,4133.0,50392.0,4142.0,1170.0,91.0,700.2,57.6,77.8,82.2,355.3,﻿-469.4,﻿-33.4
2011,58164.0,5168.0,56153.0,5279.0,2398.0,212.5,386.9,36.4,88.6,94.0,406.0,-2011.50,-176.10
2012,64461.0,6155.0,61691.0,6434.0,4234.0,348.4,1464.0,152.7,82.3,104.3,449.5,-2770.20,-195.70
2013,69128.0,6639.0,66549.0,6999.0,4338.0,347.3,1759.0,185.0,80.1,105.2,481.4,-2578.80,-162.30
2014,71772.0,5875.0,69139.0,5748.0,4501.0,337.9,1868.0,155.3,75.1,83.1,499.2,-2633.00,-182.60
2015,63262.0,3948.0,62103.0,3286.0,2883.0,169.2,1723.0,91.2,58.7,52.9,439.7,-1159.70,-78.00


In [14]:
# Australia cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
# NOTE(review): the rendered output shows '-414 9' for Net Export Volume in
# 2009 - presumably a malformed '-414.9' in the CSV; verify and clean.
australia_cement = cement_df(country="Australia", new_df="australia_cement", original_df=cement_data)
australia_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,9485.0,2604.0,9200.0,2333.0,306.6,38.2,21.9,5.6,124.7,253.6,452.8,-284.70,-32.70
2008,10086.0,3181.0,9400.0,3041.0,705.8,77.3,20.1,6.5,109.6,323.5,472.6,﻿-685.6,﻿-70.8
2009,9615.0,2947.0,9200.0,2836.0,431.5,46.2,16.6,5.1,107.1,308.3,442.3,﻿-414 9,﻿-41.1
2010,9415.0,2986.0,9000.0,2940.0,442.4,51.6,27.3,8.9,116.7,326.6,425.6,﻿-415,﻿-42.7
2011,9106.0,3268.0,8600.0,3423.0,530.5,45.6,24.6,9.8,85.9,398.0,405.1,﻿-505.9,﻿-35.8
2012,9109.0,2954.0,8500.0,2879.0,629.0,51.2,20.6,7.0,81.4,338.8,399.1,﻿-608.5,﻿-44.2
2013,8810.0,2726.0,8400.0,2631.0,423.8,40.3,13.7,4.3,95.0,313.3,380.6,﻿-410.1,﻿-36
2014,9376.0,3648.0,9000.0,4047.0,383.2,40.7,71.0,3.2,106.3,449.6,399.4,﻿-376.1,﻿-37.6
2015,9395.0,2713.0,9100.0,2530.0,303.1,31.6,8.5,2.4,104.2,278.0,394.7,﻿-294.6,﻿-29.2


In [15]:
# Vietnam cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
vietnam_cement = cement_df(country="Vietnam", new_df="vietnam_cement", original_df=cement_data)
vietnam_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,37076.0,3976.0,37102.0,4297.0,63.5,7.3,89.4,10.4,115.2,115.8,431.7,25.90,3.00
2008,40032.0,3958.0,40009.0,4209.0,115.4,12.2,92.7,9.7,105.8,105.2,461.7,﻿-22.7,﻿-2.5
2009,47930.0,4389.0,47900.0,4596.0,123.5,15.6,94.0,9.0,126.6,95.9,547.4,﻿-29.5,﻿-6.6
2010,55599.0,4804.0,55801.0,4987.0,92.6,11.5,294.5,26.3,124.3,89.4,628.4,201.90,14.80
2011,57914.0,4816.0,58271.0,4967.0,73.6,9.9,430.4,36.7,135.1,85.2,647.5,356.80,26.70
2012,55187.0,3663.0,56353.0,3603.0,52.0,5.6,1218.0,77.9,107.9,63.9,610.1,1166.00,72.30
2013,54111.0,4205.0,57516.0,4505.0,31.4,4.0,3437.0,269.2,125.9,78.3,591.4,3405.00,265.20
2014,57183.0,4356.0,60982.0,4658.0,34.4,6.5,3834.0,292.8,188.5,76.4,617.9,3799.00,286.30
2015,64521.0,5004.0,67427.0,5269.0,36.5,5.2,2942.0,229.9,141.9,78.1,689.5,2906.00,224.70


In [16]:
# Japan cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
japan_cement = cement_df(country="Japan", new_df="japan_cement", original_df=cement_data)
japan_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,58919,160.5,63705,138.6,1154.0,61.8,5940,174.4,53.6,29.4,458.5,4786,112.6
2008,57460,180.1,62810,170.0,935.4,61.5,6285,204.7,65.8,32.6,447.0,5350,143.2
2009,49529,184.9,54800,190.9,827.2,62.2,6099,215.9,75.2,35.4,385.2,5271,153.7
2010,46756,191.6,51526,203.8,628.9,56.5,5399,175.8,89.8,32.6,363.7,4770,119.3
2011,47096,244.9,51291,276.3,729.4,70.1,4924,165.7,96.1,33.7,366.5,4195,95.6
2012,50175,250.7,54737,280.4,846.4,79.1,5409,203.1,93.4,37.5,390.7,4562,124.0
2013,53572,229.6,57962,243.5,828.0,68.8,5218,203.7,83.0,39.0,417.5,4390,134.9
2014,53284,229.2,57913,244.4,609.0,56.1,5238,214.8,92.2,41.0,415.8,4629,158.6
2015,49441,214.1,54827,233.5,393.7,39.8,5779,235.8,101.1,40.8,386.3,5386,196.0


In [17]:
# Iran cement data

# Bind the result so later cells can reuse it; the bare name on the last
# line still renders the table as the cell output.
iran_cement = cement_df(country="Iran", new_df="iran_cement", original_df=cement_data)
iran_cement

FACTOR,Consumption Volume,Consumption Value,Production Volume,Production Value,Import Volume,Import Value,Export Volume,Export Value,Import Price,Export Price,Per Capita Consumption,Net Export Volume,Net Export Value
2007,40989,2185,41000,1588,64.2,5.2,75.3,6.9,81.5,91.9,569.0,11.1,1.7
2008,44356,2775,44400,2233,37.6,3.7,81.4,7.9,97.6,97.2,608.9,43.8,4.2
2009,49369,3124,50000,2559,9.0,2.0,640.5,49.0,225.8,76.4,670.0,631.5,46.9
2010,48709,3337,50000,2885,7.8,2.7,1298.0,99.4,343.0,76.5,653.2,1291.0,96.7
2011,65043,4129,66000,3394,9.0,7.0,965.9,60.4,773.8,62.5,861.6,956.9,53.4
2012,69023,4610,70250,3903,31.7,6.0,1258.0,78.7,189.3,62.5,902.8,1227.0,72.7
2013,66773,4984,68700,4489,41.1,13.6,1968.0,117.2,330.6,59.6,862.3,1927.0,103.7
2014,62749,5290,66700,5162,47.9,10.8,3999.0,297.8,225.8,74.5,800.3,3951.0,286.9
2015,49749,5148,58600,5936,31.2,8.6,8883.0,530.6,275.3,59.7,626.9,8851.0,522.0
