In [2]:
#import modules
import pandas as pd
import numpy as np
import seaborn as sns
import matplotlib.pyplot as plt
import os
import warnings

pd.set_option('Display.max_rows',None)
pd.set_option('display.max_columns', None)
warnings.filterwarnings('ignore')

**Dataset Description.**

This dataset contain details about oil and gas exploration and production activities, including geographical, operational, and geological information.

| Column Name                   | Description                                                                                           |
|-------------------------------|-------------------------------------------------------------------------------------------------------|
| `On offshore`                 | Indicates whether the operation is onshore or offshore.                                               |
| `Kaartbladindeling`           | Map sheet division, used for categorizing the area based on a mapping grid.                           |
| `Kaartblad`                   | Specific map sheet number or reference.                                                               |
| `Bloknummer`                  | Block number, typically refers to a specific area within a designated map grid.                       |
| `Provincie Code`              | Code for the province in which the drilling activity is located.                                      |
| `Provincie Naam`              | Name of the province.                                                                                 |
| `Gemeente Id`                 | Municipality ID where the activity is located.                                                        |
| `Gemeente Naam`               | Name of the municipality.                                                                             |
| `Postcode`                    | Postal code of the area.                                                                              |
| `Mijnbouwwerk Code`           | Mining work code, referring to specific codes assigned to mining structures or operations.            |
| `Mijnbouwwerk Naam`           | Name of the mining structure or operation.                                                            |
| `Aangeleverde X`              | Provided X coordinate.                                                                                |
| `Aangeleverde Y`              | Provided Y coordinate.                                                                                |
| `Aangeleverd Stelsel`         | Coordinate system in which X and Y are provided.                                                      |
| `X Rijksdriehoek`             | X coordinate in the Dutch national grid system (Rijksdriehoekstelsel).                                |
| `Y Rijksdriehoek`             | Y coordinate in the Dutch national grid system.                                                       |
| `X TM5_ED50`                  | X coordinate in TM5/ED50 system.                                                                      |
| `Y TM5_ED50`                  | Y coordinate in TM5/ED50 system.                                                                      |
| `X UTM31_ED50`                | X coordinate in UTM Zone 31 on the ED50 datum.                                                        |
| `Y UTM31_ED50`                | Y coordinate in UTM Zone 31 on the ED50 datum.                                                        |
| `Longitude ED50`              | Longitude in the ED50 datum.                                                                          |
| `Latitude ED50`               | Latitude in the ED50 datum.                                                                           |
| `X UTM31_WGS84`               | X coordinate in UTM Zone 31 on the WGS84 datum.                                                       |
| `Y UTM31_WGS84`               | Y coordinate in UTM Zone 31 on the WGS84 datum.                                                       |
| `Longitude WGS84`             | Longitude in the WGS84 datum.                                                                         |
| `Latitude WGS84`              | Latitude in the WGS84 datum.                                                                          |
| `Startdatum`                  | Start date of the drilling or operation.                                                              |
| `Einddatum`                   | End date of the drilling or operation.                                                                |
| `Boorgat / Sidetrack`         | Designates the main wellbore or a sidetrack.                                                          |
| `NITG nummer`                 | National Geological Institute number, possibly a unique identifier for the geological study or well.  |
| `UWI`                         | Universal Well Identifier, a unique identifier for each well.                                         |
| `Boorgatcode`                 | Well code, likely another identifier for the drilling operation.                                      |
| `Boorgatnaam`                 | Name of the well.                                                                                     |
| `Boorgatdoel Code`            | Code indicating the objective of the well.                                                            |
| `Boorgatdoel`                 | Objective or purpose of the well.                                                                     |
| `Boorgatresultaat Code`       | Code describing the outcome of the drilling.                                                          |
| `Boorgatresultaat`            | Result of the drilling operation.                                                                     |
| `Boorgatstatus`               | Current status of the well.                                                                           |
| `Boorgatvorm`                 | Shape or type of the well.                                                                            |
| `Kickoff diepte AH`           | Depth at which the well begins to deviate horizontally.                                               |
| `Boorgatdiepte AH`            | Total depth of the well from the surface (Along Hole).                                                |
| `Boorgatdiepte TVD`           | True Vertical Depth of the well.                                                                      |
| `X deviatie UTM31 ED50`       | X deviation in UTM Zone 31 ED50, used in directional drilling.                                        |
| `X_end UTM31_ED50`            | End X coordinate in UTM Zone 31 ED50.                                                                 |
| `Y deviatie UTM31 ED50`       | Y deviation in UTM Zone 31 ED50.                                                                      |
| `Y_end UTM31_ED50`            | End Y coordinate in UTM Zone 31 ED50.                                                                 |
| `Referentievlak`              | Reference level or datum used.                                                                        |
| `Hoogte referentievlak`       | Elevation of the reference level.                                                                     |
| `t.o.v.`                      | Relative to; used for specifying relative measurements.                                               |
| `Boorgatdiepte AH t.o.v. NAP / MSL` | Well depth relative to Normal Amsterdam Peil (NAP) or Mean Sea Level (MSL).                     |
| `Boorgatdiepte TVD t.o.v. NAP / MSL` | True vertical depth relative to NAP or MSL.                                                    |
| `Huidige eigenaar`            | Current owner of the well or operation.                                                               |
| `Opdrachtgever`               | Client or entity commissioning the drilling.                                                          |    
| `Boortoren/-platform`         | Drilling tower or platform used.                                                                      |
| `Boorfirma`                   | Drilling company or contractor.                                                                       |
| `Lithostratigrafie Code`      | Code related to the lithostratigraphy of the well.                                                    |
| `Chronotratigrafie Code`      | Code related to the chronostratigraphy of the well.                                                   |
| `Put Naam`                    | Name of the well or site.                                                                             |
| `Veld Code`                   | Field code, possibly indicating a specific field or area.                                             |
| `Veld Naam`                   | Name of the field or area.                                                                            |
| `Openbaar vanaf`              | Date from which the data becomes public.                                                              |


In [3]:
#load dataset
dutch_oil = pd.read_excel(r'C:\Users\admin\Documents\Conda files\Data Science Projects\Oil and Gas\Dutch oil and gas\data\boreholes.xlsx', sheet_name=0)

#save to parquet file format
dutch_oil.to_parquet('C:/Users/admin/Documents/Conda files/Data Science Projects/Oil and Gas/Dutch oil and gas/data/dutch_oil_borehole.pq')

dutch_oil.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6638 entries, 0 to 6637
Data columns (total 61 columns):
 #   Column                              Non-Null Count  Dtype         
---  ------                              --------------  -----         
 0   On offshore                         6638 non-null   object        
 1   Kaartbladindeling                   6638 non-null   object        
 2   Kaartblad                           4465 non-null   object        
 3   Bloknummer                          2425 non-null   object        
 4   Provincie Code                      4408 non-null   object        
 5   Provincie Naam                      4408 non-null   object        
 6   Gemeente Id                         4408 non-null   float64       
 7   Gemeente Naam                       4408 non-null   object        
 8   Postcode                            4373 non-null   float64       
 9   Mijnbouwwerk Code                   2990 non-null   object        
 10  Mijnbouwwerk Naam       

In [4]:
#clone the dataset

data = dutch_oil

In [5]:
data.tail(10)

Unnamed: 0,On offshore,Kaartbladindeling,Kaartblad,Bloknummer,Provincie Code,Provincie Naam,Gemeente Id,Gemeente Naam,Postcode,Mijnbouwwerk Code,Mijnbouwwerk Naam,Aangeleverde X,Aangeleverde Y,Aangeleverd Stelsel,X Rijksdriehoek,Y Rijksdriehoek,X TM5_ED50,Y TM5_ED50,X UTM31_ED50,Y UTM31_ED50,Longitude ED50,Latitude ED50,X UTM31_WGS84,Y UTM31_WGS84,Longitude WGS84,Latitude WGS84,Startdatum,Einddatum,Boorgat / Sidetrack,NITG nummer,UWI,Boorgatcode,Boorgatnaam,Boorgatdoel Code,Boorgatdoel,Boorgatresultaat Code,Boorgatresultaat,Boorgatstatus,Boorgatvorm,Kickoff diepte AH,Boorgatdiepte AH,Boorgatdiepte TVD,X deviatie UTM31 ED50,X_end UTM31_ED50,Y deviatie UTM31 ED50,Y_end UTM31_ED50,Referentievlak,Hoogte referentievlak,t.o.v.,Boorgatdiepte AH t.o.v. NAP / MSL,Boorgatdiepte TVD t.o.v. NAP / MSL,Huidige eigenaar,Opdrachtgever,Boortoren/-platform,Boorfirma,Lithostratigrafie Code,Chronotratigrafie Code,Put Naam,Veld Code,Veld Naam,Openbaar vanaf
6628,ON,Topografische kaart 1:25.000,12F,,GR,Groningen,45.0,Veendam,9644.0,ZWD KNZ,Zuidwending Zoutwinning,258215.0,567221.0,RD,258215,567221,629199,5883327,763119,5888805,6.928866,53.082636,763027,5888594,6.927617,53.081898,02-07-1968,26-07-1968,BRH,B12F0086,2363,ZWD-KNZ-05,ZUIDWENDING ZOUT-05,DEV-PS,Ontwikkeling zoutwinning,SALT,Zout,Producing/Injecting,Vertikaal,,1576.5,1576.43,-2.38,763117.0,9.85,5888815.0,Rotary Table,3.2,NAP,1573.3,1573.23,Nouryon Salt B.V.,KNZ,,,ZESA,,ZUIDWENDING ZOUT-05,ZWD,Zuidwending Zout,2003-01-01
6629,ON,Topografische kaart 1:25.000,12F,,GR,Groningen,45.0,Veendam,9644.0,ZWD KNZ,Zuidwending Zoutwinning,258333.0,567443.0,RD,258333,567443,629316,5883549,763230,5889031,6.930697,53.084608,763138,5888819,6.929449,53.083869,20-01-1969,15-02-1969,BRH,B12F0087,2364,ZWD-KNZ-06,ZUIDWENDING ZOUT-06,DEV-PS,Ontwikkeling zoutwinning,SALT,Zout,Producing/Injecting,Vertikaal,,1577.0,1576.93,6.66,763237.0,9.54,5889041.0,Rotary Table,2.4,NAP,1574.6,1574.53,Nouryon Salt B.V.,KNZ,,,ZESA,,ZUIDWENDING ZOUT-06,ZWD,Zuidwending Zout,2003-01-01
6630,ON,Topografische kaart 1:25.000,12F,,GR,Groningen,45.0,Veendam,9644.0,ZWD KNZ,Zuidwending Zoutwinning,258464.0,567666.0,RD,258464,567666,629446,5883773,763353,5889258,6.932723,53.086586,763262,5889047,6.931474,53.085847,15-02-1969,15-03-1969,BRH,B12F0088,2365,ZWD-KNZ-07,ZUIDWENDING ZOUT-07,DEV-PS,Ontwikkeling zoutwinning,SALT,Zout,Producing/Injecting,Vertikaal,,1580.0,1579.93,9.03,763362.0,6.73,5889265.0,Rotary Table,2.8,NAP,1577.2,1577.13,Nouryon Salt B.V.,KNZ,,,ZESA,,ZUIDWENDING ZOUT-07,ZWD,Zuidwending Zout,2003-01-01
6631,ON,Topografische kaart 1:25.000,12F,,GR,Groningen,45.0,Veendam,9644.0,ZWD KNZ,Zuidwending Zoutwinning,258870.0,567877.0,RD,258870,567877,629850,5883986,763752,5889483,6.938848,53.088403,763660,5889271,6.9376,53.087664,26-05-1988,29-07-1988,BRH,B12F0176,3681,ZWD-KNZ-08,ZUIDWENDING ZOUT-08,DEV-PS,Ontwikkeling zoutwinning,SALT,Zout,Producing/Injecting,Vertikaal,,1800.0,1799.92,2.96,763755.0,3.66,5889487.0,Rotary Table,2.02,NAP,1797.98,1797.9,Nouryon Salt B.V.,KNZ,ITAG-120,Deutsche Schachtbau-und Tiefbohrgesellschaft GmbH,ZESA,,ZUIDWENDING ZOUT-08,ZWD,Zuidwending Zout,2003-01-01
6632,ON,Topografische kaart 1:25.000,12F,,GR,Groningen,45.0,Veendam,9644.0,ZWD KNZ,Zuidwending Zoutwinning,258577.0,567886.0,RD,258577,567886,629557,5883993,763459,5889482,6.934479,53.08854,763367,5889271,6.933231,53.087802,20-10-1988,25-11-1988,BRH,B12F0177,3684,ZWD-KNZ-09,ZUIDWENDING ZOUT-09,DEV-PS,Ontwikkeling zoutwinning,SALT,Zout,Producing/Injecting,Vertikaal,,1200.0,1199.85,-0.59,763458.0,17.56,5889500.0,Rotary Table,2.68,NAP,1197.32,1197.17,Nouryon Salt B.V.,KNZ,,Deutsche Schachtbau-und Tiefbohrgesellschaft GmbH,ZESA,,ZUIDWENDING ZOUT-09,ZWD,Zuidwending Zout,2003-01-01
6633,ON,Topografische kaart 1:25.000,17G,,DR,Drenthe,71.0,Coevorden,7855.0,,,243781.14,532582.51,RD,243781,532583,614959,5848617,749844,5853690,6.704086,52.77402,749752,5853479,6.702839,52.773269,04-06-1952,23-08-1952,BRH,B17G0036,2366,ZWE-01,ZWEELO-01,EXP-HC,Exploratie koolwaterstof,DRY,Droog,Abandoned,Vertikaal,,1473.0,1472.88,-0.48,749844.0,14.39,5853704.0,Rotary Table,20.06,NAP,1452.94,1452.82,Nederlandse Aardolie Maatschappij B.V.,Nederlandse Aardolie Maatschappij B.V.,Ideal 50,Nederlandse Aardolie Maatschappij B.V.,RN,,,,,2003-01-01
6634,ON,Topografische kaart 1:25.000,17G,,DR,Drenthe,71.0,Coevorden,7854.0,,,245204.45,533388.72,RD,245204,533389,616378,5849431,751240,5854543,6.725393,52.781028,751148,5854332,6.724146,52.780278,10-08-1953,17-09-1953,BRH,B17G0037,2367,ZWE-02,ZWEELO-02,EXP-HC,Exploratie koolwaterstof,OIL,Olie,Abandoned,Vertikaal,,989.0,988.77,-0.63,751239.0,19.0,5854562.0,Rotary Table,21.46,NAP,967.54,967.31,Nederlandse Aardolie Maatschappij B.V.,Nederlandse Aardolie Maatschappij B.V.,Ideal 50,Nederlandse Aardolie Maatschappij B.V.,ATAL,,,,,2003-01-01
6635,ON,Topografische kaart 1:25.000,17G,,DR,Drenthe,71.0,Coevorden,7854.0,,,245199.37,533388.63,RD,245199,533389,616373,5849431,751235,5854543,6.725318,52.781028,751143,5854332,6.724071,52.780278,04-01-1974,17-01-1974,BRH,B17G0058,2368,ZWE-03,ZWEELO-03,EVA-HC,Evaluatie koolwaterstof,OIL,Olie,Abandoned,Gedevieerd,,990.0,911.85,-124.88,751110.0,259.89,5854803.0,Rotary Table,20.94,NAP,969.06,890.91,Nederlandse Aardolie Maatschappij B.V.,Nederlandse Aardolie Maatschappij B.V.,H525E FV,Nederlandse Aardolie Maatschappij B.V.,SKCF,,,,,2003-01-01
6636,ON,Topografische kaart 1:25.000,19G,,NH,Noord-Holland,102.0,Beemster,1464.0,,,120063.65,505233.84,RD,120064,505234,491426,5820609,627087,5822251,4.873605,52.534411,626996,5822041,4.872319,52.533637,29-02-2012,06-04-2012,BRH,B19G1127,5685,ZWK-01,ZUIDWIJK-01,EXP-HC,Exploratie koolwaterstof,GAS,Gas,Closed-in,Gedevieerd,,3300.0,3138.2,92.49,627179.0,-840.77,5821410.0,Rotary Table,5.57,NAP,3294.43,3132.63,Taqa Energy B.V.,Taqa Energy B.V.,T-45,KCA Deutag Drilling Ltd,ROSL,,,,,2017-04-06
6637,ON,Topografische kaart 1:25.000,21G,,OV,Overijssel,107.0,Zwolle,8026.0,,,209036.0,500421.0,RD,209036,500421,580397,5816275,716174,5820383,6.184029,52.489593,716083,5820172,6.182776,52.488829,22-07-1965,29-07-1965,BRH,B21G0290,2369,ZWO-01,ZWOLLE-01,EXP-HC,Exploratie koolwaterstof,DRY,Droog,Abandoned,Vertikaal,,1058.0,1057.74,-0.63,716173.0,18.98,5820402.0,Rotary Table,5.73,NAP,1052.27,1052.01,Nederlandse Aardolie Maatschappij B.V.,NAM,,,ATRT,,,,,2003-01-01


**Data Wrangling**

In [6]:
# check for null values
data.isna().sum().sort_index()

Aangeleverd Stelsel                      0
Aangeleverde X                           0
Aangeleverde Y                           0
Bloknummer                            4213
Boorfirma                             1322
Boorgat / Sidetrack                      0
Boorgatcode                              0
Boorgatdiepte AH                       128
Boorgatdiepte AH t.o.v. NAP / MSL      147
Boorgatdiepte TVD                      210
Boorgatdiepte TVD t.o.v. NAP / MSL     211
Boorgatdoel                              0
Boorgatdoel Code                         0
Boorgatnaam                              0
Boorgatresultaat                       166
Boorgatresultaat Code                  166
Boorgatstatus                          385
Boorgatvorm                              6
Boortoren/-platform                   2805
Chronotratigrafie Code                6489
Einddatum                                2
Gemeente Id                           2230
Gemeente Naam                         2230
Hoogte refe

In [7]:
# check columns in the dataset
data.columns

Index(['On offshore', 'Kaartbladindeling', 'Kaartblad', 'Bloknummer',
       'Provincie Code', 'Provincie Naam', 'Gemeente Id', 'Gemeente Naam',
       'Postcode', 'Mijnbouwwerk Code', 'Mijnbouwwerk Naam', 'Aangeleverde X',
       'Aangeleverde Y', 'Aangeleverd Stelsel', 'X Rijksdriehoek',
       'Y Rijksdriehoek', 'X TM5_ED50', 'Y TM5_ED50', 'X UTM31_ED50',
       'Y UTM31_ED50', 'Longitude ED50', 'Latitude ED50', 'X UTM31_WGS84',
       'Y UTM31_WGS84', 'Longitude WGS84', 'Latitude WGS84', 'Startdatum',
       'Einddatum', 'Boorgat / Sidetrack', 'NITG nummer', 'UWI', 'Boorgatcode',
       'Boorgatnaam', 'Boorgatdoel Code', 'Boorgatdoel',
       'Boorgatresultaat Code', 'Boorgatresultaat', 'Boorgatstatus',
       'Boorgatvorm', 'Kickoff diepte AH', 'Boorgatdiepte AH',
       'Boorgatdiepte TVD', 'X deviatie UTM31 ED50', 'X_end UTM31_ED50',
       'Y deviatie UTM31 ED50', 'Y_end UTM31_ED50', 'Referentievlak',
       'Hoogte referentievlak', 't.o.v.', 'Boorgatdiepte AH t.o.v. NAP / MSL'

In [8]:
# check for categorical variables in the dataset
for col in data.select_dtypes(include=['object']).columns:
    print(f"{col}: {data[col].unique()}")

On offshore: ['OFF' 'ON']
Kaartbladindeling: ['RWS Blokindeling' 'Topografische kaart 1:25.000']
Kaartblad: [nan '52D' '15C' '40B' '37H' '11B' '11A' '11E' '11G' '38C' '26A' '19B'
 '44E' '11F' '31C' '39G' '02D' '02C' '01H' '02B' '28G' '28D' '07F' '25G'
 '12E' '44F' '06E' '12G' '12F' '33B' '12C' '52F' '31B' '12D' '52C' '19C'
 '05G' '05F' '07B' '58E' '17D' '30H' '19A' '42E' '22G' '13A' '33H' '34E'
 '31E' '38F' '51A' '26C' '16B' '37F' '06A' '38D' '10G' '22E' '32E' '07H'
 '10F' '06H' '09D' '07E' '37D' '16D' '58B' '08A' '34F' '08C' '37G' '12H'
 '39C' '17H' '10E' '52G' '22D' '22B' '58G' '09E' '41E' '22F' '17G' '62B'
 '62E' '62A' '60D' '60C' '60G' '59H' '62D' '61H' '62C' '61F' '37E' '29A'
 '28H' '16E' '16F' '11H' '44G' '21C' '05H' '27A' '28E' '17A' '03C' '34G'
 '07G' '18C' '18A' '16C' '35A' '29C' '27D' '26G' '15F' '16G' '17F' '07C'
 '08D' '28F' '37B' '34D' '41B' '38B' '11D' '06F' '14C' '45B' '30D' '07D'
 '10A' '21H' '31F' '28A' '28C' '31A' '03H' '01G' '19F' '20A' '06C' '45A'
 '10B' '45D' '06B'

In [9]:
#rename columns into proper syntax and also from Dutch to English.
columns_rename_map = {
    'On offshore': 'Onshore_Offshore',
    'Kaartbladindeling': 'Map_Sheet_Division',
    'Kaartblad': 'Map_Sheet',
    'Bloknummer': 'Block_Number',
    'Provincie Code': 'Province_Code',
    'Provincie Naam': 'Province_Name',
    'Gemeente Id': 'Municipality_ID',
    'Gemeente Naam': 'Municipality_Name',
    'Postcode': 'Postal_Code',
    'Mijnbouwwerk Code': 'Mining_Work_Code',
    'Mijnbouwwerk Naam': 'Mining_Work_Name',
    'Aangeleverde X': 'Provided_X',
    'Aangeleverde Y': 'Provided_Y',
    'Aangeleverd Stelsel': 'Coordinate_System',
    'X Rijksdriehoek': 'X_Rijksdriehoek',
    'Y Rijksdriehoek': 'Y_Rijksdriehoek',
    'X TM5_ED50': 'X_TM5_ED50',
    'Y TM5_ED50': 'Y_TM5_ED50',
    'X UTM31_ED50': 'X_UTM31_ED50',
    'Y UTM31_ED50': 'Y_UTM31_ED50',
    'Longitude ED50': 'Longitude_ED50',
    'Latitude ED50': 'Latitude_ED50',
    'X UTM31_WGS84': 'X_UTM31_WGS84',
    'Y UTM31_WGS84': 'Y_UTM31_WGS84',
    'Longitude WGS84': 'Longitude_WGS84',
    'Latitude WGS84': 'Latitude_WGS84',
    'Startdatum': 'Start_Date',
    'Einddatum': 'End_Date',
    'Boorgat / Sidetrack': 'Wellbore_Sidetrack',
    'NITG nummer': 'NITG_Number',
    'UWI': 'UWI',
    'Boorgatcode': 'Wellbore_Code',
    'Boorgatnaam': 'Wellbore_Name',
    'Boorgatdoel Code': 'Wellbore_Objective_Code',
    'Boorgatdoel': 'Wellbore_Objective',
    'Boorgatresultaat Code': 'Wellbore_Result_Code',
    'Boorgatresultaat': 'Wellbore_Result',
    'Boorgatstatus': 'Wellbore_Status',
    'Boorgatvorm': 'Wellbore_Shape',
    'Kickoff diepte AH': 'Kickoff_Depth_AH',
    'Boorgatdiepte AH': 'Wellbore_Depth_AH',
    'Boorgatdiepte TVD': 'Wellbore_Depth_TVD',
    'X deviatie UTM31 ED50': 'X_Deviation_UTM31_ED50',
    'X_end UTM31_ED50': 'X_End_UTM31_ED50',
    'Y deviatie UTM31 ED50': 'Y_Deviation_UTM31_ED50',
    'Y_end UTM31_ED50': 'Y_End_UTM31_ED50',
    'Referentievlak': 'Reference_Level',
    'Hoogte referentievlak': 'Reference_Level_Height',
    't.o.v.': 'Relative_To',
    'Boorgatdiepte AH t.o.v. NAP / MSL': 'Wellbore_Depth_AH_Relative_To_NAP_MSL',
    'Boorgatdiepte TVD t.o.v. NAP / MSL': 'Wellbore_Depth_TVD_Relative_To_NAP_MSL',
    'Huidige eigenaar': 'Current_Owner',
    'Opdrachtgever': 'Client',
    'Boortoren/-platform': 'Drilling_Tower_Platform',
    'Boorfirma': 'Drilling_Company',
    'Lithostratigrafie Code': 'Lithostratigraphy_Code',
    'Chronotratigrafie Code': 'Chronostratigraphy_Code',
    'Put Naam': 'Well_Name',
    'Veld Code': 'Field_Code',
    'Veld Naam': 'Field_Name',
    'Openbaar vanaf': 'Public_Access_From'
}

# Rename the columns
data.rename(columns=columns_rename_map, inplace=True)

# Display the updated columns
print(data.columns)


Index(['Onshore_Offshore', 'Map_Sheet_Division', 'Map_Sheet', 'Block_Number',
       'Province_Code', 'Province_Name', 'Municipality_ID',
       'Municipality_Name', 'Postal_Code', 'Mining_Work_Code',
       'Mining_Work_Name', 'Provided_X', 'Provided_Y', 'Coordinate_System',
       'X_Rijksdriehoek', 'Y_Rijksdriehoek', 'X_TM5_ED50', 'Y_TM5_ED50',
       'X_UTM31_ED50', 'Y_UTM31_ED50', 'Longitude_ED50', 'Latitude_ED50',
       'X_UTM31_WGS84', 'Y_UTM31_WGS84', 'Longitude_WGS84', 'Latitude_WGS84',
       'Start_Date', 'End_Date', 'Wellbore_Sidetrack', 'NITG_Number', 'UWI',
       'Wellbore_Code', 'Wellbore_Name', 'Wellbore_Objective_Code',
       'Wellbore_Objective', 'Wellbore_Result_Code', 'Wellbore_Result',
       'Wellbore_Status', 'Wellbore_Shape', 'Kickoff_Depth_AH',
       'Wellbore_Depth_AH', 'Wellbore_Depth_TVD', 'X_Deviation_UTM31_ED50',
       'X_End_UTM31_ED50', 'Y_Deviation_UTM31_ED50', 'Y_End_UTM31_ED50',
       'Reference_Level', 'Reference_Level_Height', 'Relative_To',
 

In [10]:
data.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 6638 entries, 0 to 6637
Data columns (total 61 columns):
 #   Column                                  Non-Null Count  Dtype         
---  ------                                  --------------  -----         
 0   Onshore_Offshore                        6638 non-null   object        
 1   Map_Sheet_Division                      6638 non-null   object        
 2   Map_Sheet                               4465 non-null   object        
 3   Block_Number                            2425 non-null   object        
 4   Province_Code                           4408 non-null   object        
 5   Province_Name                           4408 non-null   object        
 6   Municipality_ID                         4408 non-null   float64       
 7   Municipality_Name                       4408 non-null   object        
 8   Postal_Code                             4373 non-null   float64       
 9   Mining_Work_Code                        2990 non-nul

In [11]:
data.to_csv("C:/Users/admin/Documents/Conda files/Data Science Projects/Oil and Gas/Dutch oil and gas/data/dutch_oil.csv")

In [12]:
# dutch_oil.drop(columns=['X Rijksdriehoek','Y Rijksdriehoek','Aangeleverde X','Aangeleverde Y','X TM5_ED50',
#                         'Y TM5_ED50', 'X UTM31_ED50','Y UTM31_ED50', 'Longitude ED50', 
#                         'Latitude ED50', 'X UTM31_WGS84','Y UTM31_WGS84','Gemeente Id'], inplace=True)

- After data wrangling
- create a database for the cleaned data.