PROJECT - MAPPING OF "US" HEALTHCARE DATA

In [0]:
dbutils.fs.rm("dbfs:/FileStore/tables/Demographics_mock_data.txt", recurse = True)
dbutils.fs.rm("dbfs:/FileStore/tables/Enrollment_mock_data.txt", recurse = True)
dbutils.fs.rm("dbfs:/FileStore/tables/Coverage_crosswalk.txt", recurse = True)
dbutils.fs.rm("dbfs:/FileStore/tables/Gender_crosswalk.txt", recurse = True)
dbutils.fs.rm("dbfs:/FileStore/tables/Group_crosswalk.txt", recurse = True)
dbutils.fs.rm("dbfs:/FileStore/tables/Plan_crosswalk.txt", recurse = True)
dbutils.fs.rm("dbfs:/FileStore/tables/Relationship_crosswalk.txt", recurse = True)

Out[1]: False

In [0]:
from pyspark.sql import SparkSession
spark = SparkSession.builder.getOrCreate()
spark

IMPORTING ALL FILES INTO DBFS

In [0]:
%fs ls dbfs:///FileStore/Healthcare/

path,name,size,modificationTime
dbfs:/FileStore/Healthcare/Coverage_crosswalk.txt,Coverage_crosswalk.txt,174,1709544367000
dbfs:/FileStore/Healthcare/Demographics_mock_data.txt,Demographics_mock_data.txt,13215,1709544367000
dbfs:/FileStore/Healthcare/Enrollment_mock_data.txt,Enrollment_mock_data.txt,5010,1709544368000
dbfs:/FileStore/Healthcare/Gender_crosswalk.txt,Gender_crosswalk.txt,72,1709544368000
dbfs:/FileStore/Healthcare/Group_crosswalk.txt,Group_crosswalk.txt,115,1709544368000
dbfs:/FileStore/Healthcare/Plan_crosswalk-1.txt,Plan_crosswalk-1.txt,874,1709552257000
dbfs:/FileStore/Healthcare/Plan_crosswalk.txt,Plan_crosswalk.txt,874,1709544368000
dbfs:/FileStore/Healthcare/Relationship_crosswalk.txt,Relationship_crosswalk.txt,264,1709544369000


LOADING THE FILES AND RENAMING IT

In [0]:
enrollment = spark.read.format("csv") \
                              .option("inferSchema", True) \
                              .option("delimiter", "\t") \
                              .option("header", True) \
                              .load("dbfs:/FileStore/Healthcare/Enrollment_mock_data.txt")

demographics = spark.read.format("csv") \
                              .option("inferSchema", True) \
                              .option("delimiter", "\t") \
                              .option("header", True) \
                              .load("dbfs:/FileStore/Healthcare/Demographics_mock_data.txt")

gender = spark.read.format("csv") \
                              .option("inferSchema", True) \
                              .option("delimiter", "\t") \
                              .option("header", True) \
                              .load("dbfs:/FileStore/Healthcare/Gender_crosswalk.txt")

group = spark.read.format("csv") \
                              .option("inferSchema", True) \
                              .option("delimiter", "\t") \
                              .option("header", True) \
                              .load("dbfs:/FileStore/Healthcare/Group_crosswalk.txt")

plan = spark.read.format("csv") \
                              .option("inferSchema", True) \
                              .option("delimiter", "\t") \
                              .option("header", True) \
                              .load("dbfs:/FileStore/Healthcare/Plan_crosswalk-1.txt")

relationship = spark.read.format("csv") \
                              .option("inferSchema", True) \
                              .option("delimiter", "\t") \
                              .option("header", True) \
                              .load("dbfs:/FileStore/Healthcare/Relationship_crosswalk.txt")


coverage = spark.read.format("csv") \
                              .option("inferSchema", True) \
                              .option("delimiter", "\t") \
                              .option("header", True) \
                              .load("dbfs:/FileStore/Healthcare/Coverage_crosswalk.txt")



CREATING TABLES OF ALL IMPORTED FILES

In [0]:
enrollment.createOrReplaceTempView("enrollment")
demographics.createOrReplaceTempView("demographics")
gender.createOrReplaceTempView("gender")
group.createOrReplaceTempView("group")
plan.createOrReplaceTempView("plan")
relationship.createOrReplaceTempView("relationship")
coverage.createOrReplaceTempView("coverage")

In [0]:
%sql
select * from enrollment

MEMBER_ID,MEMBER_STATUS,GROUP_ID,COVERAGE_TYPE,PLAN_ID,VENDOR,EFFECTIVE_DATE,TERMINATION_DATE
173400,ACTIVE,1,E1C,11,Cigna,2021-01-01,2021-02-28
83300,ACTIVE,1,ES,0,Cigna,2019-12-01,2020-01-31
106800,ACTIVE,1,U,4,Aetna,2020-09-01,2020-10-31
52900,ACTIVE,1,ES,15,Aetna,2021-02-01,2021-03-31
97600,ACTIVE,1,E,10,Aetna,2021-01-01,2021-01-31
22000,ACTIVE,1,EC,15,Cigna,2020-03-01,2020-04-30
22900,ACTIVE,1,E,1,Aetna,2020-07-01,2020-07-31
122500,ACTIVE,1,F,10,Cigna,2020-11-01,2020-12-31
21800,ACTIVE,8,E1C,4,Aetna,2020-12-01,2021-01-31
145000,ACTIVE,1,F,1,Cigna,2020-03-01,2020-04-30


In [0]:
%sql
select * from demographics

MEMBER_ID,EMPLOYEE_ID,FIRST_NAME,LAST_NAME,MIDDLE_NAME,GENDER,DOB,RELATIONSHIP,PERSON_CODE,RACE,ETHNICITY,ADDRESS_1,ADDRESS_2,CITY,STATE,COUNTY,ZIP
173400,160951,Freya,Lynn,Marlys,0,1988-02-23,S,2,white,nonhispanic,771 Kirlin Haven,,Attleboro,Massachusetts,Bristol County,2703.0
83300,160951,Candice,Padilla,,0,1964-12-10,F,3,white,nonhispanic,182 Trantow Mission Unit 20,,Bellingham,Massachusetts,Norfolk County,
106800,111325,Leanne,Swanson,,0,2015-05-28,D2,16,white,nonhispanic,686 Shields Dam,,Easthampton,Massachusetts,Hampshire County,
52900,114177,Millicent,Byrne,,0,1948-04-22,N,13,white,nonhispanic,1009 DuBuque Ville Unit 54,,Springfield,Massachusetts,Hampden County,1106.0
97600,117067,Charley,Lynn,,0,1976-01-12,A1,11,white,nonhispanic,114 Cummerata Parade,,West Tisbury,Massachusetts,Dukes County,
22000,12745,Flynn,Morrison,,0,1989-03-30,M,4,white,nonhispanic,164 Stokes Lodge Apt 34,,Winchendon,Massachusetts,Worcester County,1475.0
22900,13466,Pauline,Knight,,0,2019-05-09,N,13,white,nonhispanic,376 Skiles Forge Suite 48,,Westminster,Massachusetts,Worcester County,
122500,135688,Elspeth,Gonzalez,Marliss,0,2014-09-09,C2,6,asian,hispanic,570 Nikolaus Wynd,,Cambridge,Massachusetts,Middlesex County,2139.0
21800,13587,Amelie,Harmon,,0,1984-04-08,D2,16,other,nonhispanic,958 Robel Run Unit 83,,Carver,Massachusetts,Plymouth County,
145000,138507,Laura,Montoya,,0,2010-03-29,F,3,white,nonhispanic,1094 Keebler Grove,,Gardner,Massachusetts,Worcester County,1440.0


In [0]:
%sql
select * from plan

PLAN_ID,Plan_Name,BENEFIT_TYPE,EFFECTIVE_DATE,TERMINATION_DATE
0,Plan A,Medical,2018-01-01,2018-12-31
1,Plan B,Medical and Dental,2018-01-01,2018-12-31
2,Plan C,Medical and Vision,2018-01-01,2018-12-31
3,Plan D,"Medical, Dental and Vision",2018-01-01,2018-12-31
4,Plan E,Medical,2019-01-01,2019-12-31
5,Plan F,Medical and Dental,2019-01-01,2019-12-31
6,Plan G,Medical and Vision,2019-01-01,2019-12-31
7,Plan H,"Medical, Dental and Vision",2019-01-01,2019-12-31
8,Plan I,Medical,2020-01-01,2020-12-31
9,Plan J,Medical and Dental,2020-01-01,2020-12-31


In [0]:
%sql
select * from group

GROUP_ID,GROUP_NAME
8,TechKraft Inc
1,Abacus Insights
4,Digital Convergence Technologies
3,Facebook
2,Google


In [0]:
%sql
select * from relationship

Rollup_Code,Rollup_Description
E,Self
S,Spouse
F,Father
M,Mother
C1,Son
C2,Daughter
G1,Grand Father
G2,Grand Mother
G3,Grand Son
G4,Grand Daughter


In [0]:
%sql
select * from coverage

Coverage_ID,Coverage_Description
E,Employee Only
ES,Employee and Spouse
F,Family
E1C,Employee and 1 Child
EC,Employee and Childrens
EP,Employee and Parents
U,Unknown


In [0]:
%sql
select * from gender

Code,Rollup_Code,Rollup_Description
0,F,Female
1,M,Male
2,U,Unknown


JOINING ALL TABLES FOR MAPPING

In [0]:
%sql
SELECT *
FROM enrollment a
LEFT JOIN demographics b ON a.MEMBER_ID = b.MEMBER_ID
LEFT JOIN gender c ON c.code = b.gender
LEFT JOIN coverage d ON d.Coverage_ID = a.COVERAGE_TYPE
LEFT JOIN relationship e ON e.Rollup_Code = b.RELATIONSHIP
LEFT JOIN group f ON f.GROUP_ID = a.GROUP_ID
LEFT JOIN plan g ON g.PLAN_ID = a.PLAN_ID;


MEMBER_ID,MEMBER_STATUS,GROUP_ID,COVERAGE_TYPE,PLAN_ID,VENDOR,EFFECTIVE_DATE,TERMINATION_DATE,MEMBER_ID.1,EMPLOYEE_ID,FIRST_NAME,LAST_NAME,MIDDLE_NAME,GENDER,DOB,RELATIONSHIP,PERSON_CODE,RACE,ETHNICITY,ADDRESS_1,ADDRESS_2,CITY,STATE,COUNTY,ZIP,Code,Rollup_Code,Rollup_Description,Coverage_ID,Coverage_Description,Rollup_Code.1,Rollup_Description.1,GROUP_ID.1,GROUP_NAME,PLAN_ID.1,Plan_Name,BENEFIT_TYPE,EFFECTIVE_DATE.1,TERMINATION_DATE.1
173400,ACTIVE,1,E1C,11,Cigna,2021-01-01,2021-02-28,173400,160951,Freya,Lynn,Marlys,0,1988-02-23,S,2,white,nonhispanic,771 Kirlin Haven,,Attleboro,Massachusetts,Bristol County,2703.0,0,F,Female,E1C,Employee and 1 Child,S,Spouse,1,Abacus Insights,11,Plan L,"Medical, Dental and Vision",2020-01-01,2020-12-31
83300,ACTIVE,1,ES,0,Cigna,2019-12-01,2020-01-31,83300,160951,Candice,Padilla,,0,1964-12-10,F,3,white,nonhispanic,182 Trantow Mission Unit 20,,Bellingham,Massachusetts,Norfolk County,,0,F,Female,ES,Employee and Spouse,F,Fiance,1,Abacus Insights,0,Plan A,Medical,2018-01-01,2018-12-31
83300,ACTIVE,1,ES,0,Cigna,2019-12-01,2020-01-31,83300,160951,Candice,Padilla,,0,1964-12-10,F,3,white,nonhispanic,182 Trantow Mission Unit 20,,Bellingham,Massachusetts,Norfolk County,,0,F,Female,ES,Employee and Spouse,F,Father,1,Abacus Insights,0,Plan A,Medical,2018-01-01,2018-12-31
106800,ACTIVE,1,U,4,Aetna,2020-09-01,2020-10-31,106800,111325,Leanne,Swanson,,0,2015-05-28,D2,16,white,nonhispanic,686 Shields Dam,,Easthampton,Massachusetts,Hampshire County,,0,F,Female,U,Unknown,D2,Divorced Wife,1,Abacus Insights,4,Plan E,Medical,2019-01-01,2019-12-31
52900,ACTIVE,1,ES,15,Aetna,2021-02-01,2021-03-31,52900,114177,Millicent,Byrne,,0,1948-04-22,N,13,white,nonhispanic,1009 DuBuque Ville Unit 54,,Springfield,Massachusetts,Hampden County,1106.0,0,F,Female,ES,Employee and Spouse,N,Niece,1,Abacus Insights,15,Plan P,"Medical, Dental and Vision",2021-01-01,2021-12-31
97600,ACTIVE,1,E,10,Aetna,2021-01-01,2021-01-31,97600,117067,Charley,Lynn,,0,1976-01-12,A1,11,white,nonhispanic,114 Cummerata Parade,,West Tisbury,Massachusetts,Dukes County,,0,F,Female,E,Employee Only,A1,Adopted Son,1,Abacus Insights,10,Plan K,Medical and Vision,2020-01-01,2020-12-31
22000,ACTIVE,1,EC,15,Cigna,2020-03-01,2020-04-30,22000,12745,Flynn,Morrison,,0,1989-03-30,M,4,white,nonhispanic,164 Stokes Lodge Apt 34,,Winchendon,Massachusetts,Worcester County,1475.0,0,F,Female,EC,Employee and Childrens,M,Mother,1,Abacus Insights,15,Plan P,"Medical, Dental and Vision",2021-01-01,2021-12-31
22900,ACTIVE,1,E,1,Aetna,2020-07-01,2020-07-31,22900,13466,Pauline,Knight,,0,2019-05-09,N,13,white,nonhispanic,376 Skiles Forge Suite 48,,Westminster,Massachusetts,Worcester County,,0,F,Female,E,Employee Only,N,Niece,1,Abacus Insights,1,Plan B,Medical and Dental,2018-01-01,2018-12-31
122500,ACTIVE,1,F,10,Cigna,2020-11-01,2020-12-31,122500,135688,Elspeth,Gonzalez,Marliss,0,2014-09-09,C2,6,asian,hispanic,570 Nikolaus Wynd,,Cambridge,Massachusetts,Middlesex County,2139.0,0,F,Female,F,Family,C2,Daughter,1,Abacus Insights,10,Plan K,Medical and Vision,2020-01-01,2020-12-31
21800,ACTIVE,8,E1C,4,Aetna,2020-12-01,2021-01-31,21800,13587,Amelie,Harmon,,0,1984-04-08,D2,16,other,nonhispanic,958 Robel Run Unit 83,,Carver,Massachusetts,Plymouth County,,0,F,Female,E1C,Employee and 1 Child,D2,Divorced Wife,8,TechKraft Inc,4,Plan E,Medical,2019-01-01,2019-12-31


PROJECTING OUR REQUARED FIELDS

In [0]:
%sql
SELECT 
    CONCAT(a.MEMBER_ID, " ", b.EMPLOYEE_ID, " ", e.Rollup_Code, " ", e.Rollup_Description) AS Abacus_Member_ID,
    a.MEMBER_ID,
    b.EMPLOYEE_ID AS SUBSCRIBER_ID,
    b.FIRST_NAME AS MEMBER_FIRST_NAME,
    b.LAST_NAME AS MEMBER_LAST_NAME,
    b.MIDDLE_NAME AS MEMBER_MIDDLE_NAME,
    "NULL" AS Member_Prefix_Name,
    "NULL" AS Member_Suffix_Name,
    c.Rollup_Description AS MEMBER_GENDER,
    DATE_FORMAT(DOB, 'MM-dd-yyyy') AS Member_Date_of_Birth,
    e.Rollup_Code AS Member_Relationship_Code,
    e.Rollup_Description AS Member_Relationship_Description,
    b.PERSON_CODE AS Member_Person_Code,
    b.ADDRESS_1 AS Member_Address_Line_1,
    b.ADDRESS_2 AS Member_Address_Line_2,
    b.CITY AS Member_City,
    b.STATE AS Member_State,
    b.COUNTY AS Member_County,
    b.ZIP AS Member_Postal_Code,
    "US" AS Member_Country,
    "NULL" AS Member_Home_Phone,
    "NULL" AS Member_Work_Phone,
    "NULL" AS Member_Mobile_Phone,
    "NULL" AS Member_Email,
    "NULL" AS Member_Is_Deceased,
    "NULL" AS Member_Date_of_Death,
    "NULL" AS Member_Deceased_Reason,
    a.GROUP_ID AS Enrollment_Group_ID,
    f.GROUP_NAME AS Enrollment_Group_Name,
    "NULL" AS Enrollment_SubGroup_ID,
    "NULL" AS Enrollment_SubGroup_Name,
    d.Coverage_ID AS Enrollment_Coverage_Code,
    d.Coverage_Description AS Enrollment_Coverage_Description,
    g.PLAN_ID AS Enrollment_Plan_ID,
    g.Plan_Name AS Enrollment_Plan_Name,
    g.BENEFIT_TYPE AS Enrollment_Plan_Coverage,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Medical%" THEN g.EFFECTIVE_DATE
    END AS Enrollment_Medical_Effective_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Medical%" OR g.BENEFIT_TYPE LIKE "Medical and Vision" OR g.BENEFIT_TYPE LIKE "Medical, Dental and Vision" THEN g.TERMINATION_DATE
    END AS Enrollment_Medical_Termination_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Dental%" THEN g.EFFECTIVE_DATE
    END AS Enrollment_Dental_Effective_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Dental%" THEN g.TERMINATION_DATE
    END AS Enrollment_Dental_Termination_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Vision%" THEN g.EFFECTIVE_DATE
    END AS Enrollment_Vision_Effective_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Vision%" THEN g.TERMINATION_DATE
    END AS Enrollment_Vision_Termination_Date,
    a.VENDOR AS Enrollment_Vendor_Name,
    "Member Enrollment Data Dictionary" AS Souce_File_Name,
    CURRENT_DATE() AS File_Ingestion_Date
FROM
    enrollment a
    LEFT JOIN demographics b ON a.MEMBER_ID = b.MEMBER_ID
    LEFT JOIN gender c ON c.code = b.gender
    LEFT JOIN coverage d ON d.Coverage_ID = a.COVERAGE_TYPE
    LEFT JOIN relationship e ON e.Rollup_Code = b.RELATIONSHIP
    LEFT JOIN group f ON f.GROUP_ID = a.GROUP_ID
    LEFT JOIN plan g ON g.PLAN_ID = a.PLAN_ID;


Abacus_Member_ID,MEMBER_ID,SUBSCRIBER_ID,MEMBER_FIRST_NAME,MEMBER_LAST_NAME,MEMBER_MIDDLE_NAME,Member_Prefix_Name,Member_Suffix_Name,MEMBER_GENDER,Member_Date_of_Birth,Member_Relationship_Code,Member_Relationship_Description,Member_Person_Code,Member_Address_Line_1,Member_Address_Line_2,Member_City,Member_State,Member_County,Member_Postal_Code,Member_Country,Member_Home_Phone,Member_Work_Phone,Member_Mobile_Phone,Member_Email,Member_Is_Deceased,Member_Date_of_Death,Member_Deceased_Reason,Enrollment_Group_ID,Enrollment_Group_Name,Enrollment_SubGroup_ID,Enrollment_SubGroup_Name,Enrollment_Coverage_Code,Enrollment_Coverage_Description,Enrollment_Plan_ID,Enrollment_Plan_Name,Enrollment_Plan_Coverage,Enrollment_Medical_Effective_Date,Enrollment_Medical_Termination_Date,Enrollment_Dental_Effective_Date,Enrollment_Dental_Termination_Date,Enrollment_Vision_Effective_Date,Enrollment_Vision_Termination_Date,Enrollment_Vendor_Name,Souce_File_Name,File_Ingestion_Date
173400 160951 S Spouse,173400,160951,Freya,Lynn,Marlys,,,Female,02-23-1988,S,Spouse,2,771 Kirlin Haven,,Attleboro,Massachusetts,Bristol County,2703.0,US,,,,,,,,1,Abacus Insights,,,E1C,Employee and 1 Child,11,Plan L,"Medical, Dental and Vision",2020-01-01,2020-12-31,2020-01-01,2020-12-31,2020-01-01,2020-12-31,Cigna,Member Enrollment Data Dictionary,2024-03-08
83300 160951 F Fiance,83300,160951,Candice,Padilla,,,,Female,12-10-1964,F,Fiance,3,182 Trantow Mission Unit 20,,Bellingham,Massachusetts,Norfolk County,,US,,,,,,,,1,Abacus Insights,,,ES,Employee and Spouse,0,Plan A,Medical,2018-01-01,2018-12-31,,,,,Cigna,Member Enrollment Data Dictionary,2024-03-08
83300 160951 F Father,83300,160951,Candice,Padilla,,,,Female,12-10-1964,F,Father,3,182 Trantow Mission Unit 20,,Bellingham,Massachusetts,Norfolk County,,US,,,,,,,,1,Abacus Insights,,,ES,Employee and Spouse,0,Plan A,Medical,2018-01-01,2018-12-31,,,,,Cigna,Member Enrollment Data Dictionary,2024-03-08
106800 111325 D2 Divorced Wife,106800,111325,Leanne,Swanson,,,,Female,05-28-2015,D2,Divorced Wife,16,686 Shields Dam,,Easthampton,Massachusetts,Hampshire County,,US,,,,,,,,1,Abacus Insights,,,U,Unknown,4,Plan E,Medical,2019-01-01,2019-12-31,,,,,Aetna,Member Enrollment Data Dictionary,2024-03-08
52900 114177 N Niece,52900,114177,Millicent,Byrne,,,,Female,04-22-1948,N,Niece,13,1009 DuBuque Ville Unit 54,,Springfield,Massachusetts,Hampden County,1106.0,US,,,,,,,,1,Abacus Insights,,,ES,Employee and Spouse,15,Plan P,"Medical, Dental and Vision",2021-01-01,2021-12-31,2021-01-01,2021-12-31,2021-01-01,2021-12-31,Aetna,Member Enrollment Data Dictionary,2024-03-08
97600 117067 A1 Adopted Son,97600,117067,Charley,Lynn,,,,Female,01-12-1976,A1,Adopted Son,11,114 Cummerata Parade,,West Tisbury,Massachusetts,Dukes County,,US,,,,,,,,1,Abacus Insights,,,E,Employee Only,10,Plan K,Medical and Vision,2020-01-01,2020-12-31,,,2020-01-01,2020-12-31,Aetna,Member Enrollment Data Dictionary,2024-03-08
22000 12745 M Mother,22000,12745,Flynn,Morrison,,,,Female,03-30-1989,M,Mother,4,164 Stokes Lodge Apt 34,,Winchendon,Massachusetts,Worcester County,1475.0,US,,,,,,,,1,Abacus Insights,,,EC,Employee and Childrens,15,Plan P,"Medical, Dental and Vision",2021-01-01,2021-12-31,2021-01-01,2021-12-31,2021-01-01,2021-12-31,Cigna,Member Enrollment Data Dictionary,2024-03-08
22900 13466 N Niece,22900,13466,Pauline,Knight,,,,Female,05-09-2019,N,Niece,13,376 Skiles Forge Suite 48,,Westminster,Massachusetts,Worcester County,,US,,,,,,,,1,Abacus Insights,,,E,Employee Only,1,Plan B,Medical and Dental,2018-01-01,2018-12-31,2018-01-01,2018-12-31,,,Aetna,Member Enrollment Data Dictionary,2024-03-08
122500 135688 C2 Daughter,122500,135688,Elspeth,Gonzalez,Marliss,,,Female,09-09-2014,C2,Daughter,6,570 Nikolaus Wynd,,Cambridge,Massachusetts,Middlesex County,2139.0,US,,,,,,,,1,Abacus Insights,,,F,Family,10,Plan K,Medical and Vision,2020-01-01,2020-12-31,,,2020-01-01,2020-12-31,Cigna,Member Enrollment Data Dictionary,2024-03-08
21800 13587 D2 Divorced Wife,21800,13587,Amelie,Harmon,,,,Female,04-08-1984,D2,Divorced Wife,16,958 Robel Run Unit 83,,Carver,Massachusetts,Plymouth County,,US,,,,,,,,8,TechKraft Inc,,,E1C,Employee and 1 Child,4,Plan E,Medical,2019-01-01,2019-12-31,,,,,Aetna,Member Enrollment Data Dictionary,2024-03-08


CREATING 1 TABLE FROM JOING 7 TABLES WITH THE HELP OF OUR ABOVE QUERY

In [0]:
%sql
CREATE OR REPLACE TABLE healthcare AS 
( 
SELECT 
    monotonically_increasing_id() AS Abacus_Record_ID,
    CONCAT(a.MEMBER_ID, " ", b.EMPLOYEE_ID, " ", e.Rollup_Code, " ", e.Rollup_Description) AS Abacus_Member_ID,
    a.MEMBER_ID,
    b.EMPLOYEE_ID AS SUBSCRIBER_ID,
    b.FIRST_NAME AS MEMBER_FIRST_NAME,
    b.LAST_NAME AS MEMBER_LAST_NAME,
    b.MIDDLE_NAME AS MEMBER_MIDDLE_NAME,
    "NULL" AS Member_Prefix_Name,
    "NULL" AS Member_Suffix_Name,
    c.Rollup_Description AS MEMBER_GENDER,
    DATE_FORMAT(DOB, 'MM-dd-yyyy') AS Member_Date_of_Birth,
    e.Rollup_Code AS Member_Relationship_Code,
    e.Rollup_Description AS Member_Relationship_Description,
    b.PERSON_CODE AS Member_Person_Code,
    b.ADDRESS_1 AS Member_Address_Line_1,
    b.ADDRESS_2 AS Member_Address_Line_2,
    b.CITY AS Member_City,
    b.STATE AS Member_State,
    b.COUNTY AS Member_County,
    b.ZIP AS Member_Postal_Code,
    "US" AS Member_Country,
    "NULL" AS Member_Home_Phone,
    "NULL" AS Member_Work_Phone,
    "NULL" AS Member_Mobile_Phone,
    "NULL" AS Member_Email,
    "NULL" AS Member_Is_Deceased,
    "NULL" AS Member_Date_of_Death,
    "NULL" AS Member_Deceased_Reason,
    a.GROUP_ID AS Enrollment_Group_ID,
    f.GROUP_NAME AS Enrollment_Group_Name,
    "NULL" AS Enrollment_SubGroup_ID,
    "NULL" AS Enrollment_SubGroup_Name,
    d.Coverage_ID AS Enrollment_Coverage_Code,
    d.Coverage_Description AS Enrollment_Coverage_Description,
    g.PLAN_ID AS Enrollment_Plan_ID,
    g.Plan_Name AS Enrollment_Plan_Name,
    g.BENEFIT_TYPE AS Enrollment_Plan_Coverage,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Medical%" THEN g.EFFECTIVE_DATE
    END AS Enrollment_Medical_Effective_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Medical%" OR g.BENEFIT_TYPE LIKE "Medical and Vision" OR g.BENEFIT_TYPE LIKE "Medical, Dental and Vision" THEN g.TERMINATION_DATE
    END AS Enrollment_Medical_Termination_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Dental%" THEN g.EFFECTIVE_DATE
    END AS Enrollment_Dental_Effective_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Dental%" THEN g.TERMINATION_DATE
    END AS Enrollment_Dental_Termination_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Vision%" THEN g.EFFECTIVE_DATE
    END AS Enrollment_Vision_Effective_Date,
    CASE
        WHEN g.BENEFIT_TYPE LIKE "%Vision%" THEN g.TERMINATION_DATE
    END AS Enrollment_Vision_Termination_Date,
    a.VENDOR AS Enrollment_Vendor_Name,
    "Member Enrollment Data Dictionary" AS Souce_File_Name,
    CURRENT_DATE() AS File_Ingestion_Date
FROM
    enrollment a
    LEFT JOIN demographics b ON a.MEMBER_ID = b.MEMBER_ID
    LEFT JOIN gender c ON c.code = b.gender
    LEFT JOIN coverage d ON d.Coverage_ID = a.COVERAGE_TYPE
    LEFT JOIN relationship e ON e.Rollup_Code = b.RELATIONSHIP
    LEFT JOIN group f ON f.GROUP_ID = a.GROUP_ID
    LEFT JOIN plan g ON g.PLAN_ID = a.PLAN_ID
)


num_affected_rows,num_inserted_rows


SHOWING OUR FINAL OUTPUT

In [0]:
%sql
select * from healthcare

Abacus_Record_ID,Abacus_Member_ID,MEMBER_ID,SUBSCRIBER_ID,MEMBER_FIRST_NAME,MEMBER_LAST_NAME,MEMBER_MIDDLE_NAME,Member_Prefix_Name,Member_Suffix_Name,MEMBER_GENDER,Member_Date_of_Birth,Member_Relationship_Code,Member_Relationship_Description,Member_Person_Code,Member_Address_Line_1,Member_Address_Line_2,Member_City,Member_State,Member_County,Member_Postal_Code,Member_Country,Member_Home_Phone,Member_Work_Phone,Member_Mobile_Phone,Member_Email,Member_Is_Deceased,Member_Date_of_Death,Member_Deceased_Reason,Enrollment_Group_ID,Enrollment_Group_Name,Enrollment_SubGroup_ID,Enrollment_SubGroup_Name,Enrollment_Coverage_Code,Enrollment_Coverage_Description,Enrollment_Plan_ID,Enrollment_Plan_Name,Enrollment_Plan_Coverage,Enrollment_Medical_Effective_Date,Enrollment_Medical_Termination_Date,Enrollment_Dental_Effective_Date,Enrollment_Dental_Termination_Date,Enrollment_Vision_Effective_Date,Enrollment_Vision_Termination_Date,Enrollment_Vendor_Name,Souce_File_Name,File_Ingestion_Date
0,173400 160951 S Spouse,173400,160951,Freya,Lynn,Marlys,,,Female,02-23-1988,S,Spouse,2,771 Kirlin Haven,,Attleboro,Massachusetts,Bristol County,2703.0,US,,,,,,,,1,Abacus Insights,,,E1C,Employee and 1 Child,11,Plan L,"Medical, Dental and Vision",2020-01-01,2020-12-31,2020-01-01,2020-12-31,2020-01-01,2020-12-31,Cigna,Member Enrollment Data Dictionary,2024-03-08
1,83300 160951 F Fiance,83300,160951,Candice,Padilla,,,,Female,12-10-1964,F,Fiance,3,182 Trantow Mission Unit 20,,Bellingham,Massachusetts,Norfolk County,,US,,,,,,,,1,Abacus Insights,,,ES,Employee and Spouse,0,Plan A,Medical,2018-01-01,2018-12-31,,,,,Cigna,Member Enrollment Data Dictionary,2024-03-08
2,83300 160951 F Father,83300,160951,Candice,Padilla,,,,Female,12-10-1964,F,Father,3,182 Trantow Mission Unit 20,,Bellingham,Massachusetts,Norfolk County,,US,,,,,,,,1,Abacus Insights,,,ES,Employee and Spouse,0,Plan A,Medical,2018-01-01,2018-12-31,,,,,Cigna,Member Enrollment Data Dictionary,2024-03-08
3,106800 111325 D2 Divorced Wife,106800,111325,Leanne,Swanson,,,,Female,05-28-2015,D2,Divorced Wife,16,686 Shields Dam,,Easthampton,Massachusetts,Hampshire County,,US,,,,,,,,1,Abacus Insights,,,U,Unknown,4,Plan E,Medical,2019-01-01,2019-12-31,,,,,Aetna,Member Enrollment Data Dictionary,2024-03-08
4,52900 114177 N Niece,52900,114177,Millicent,Byrne,,,,Female,04-22-1948,N,Niece,13,1009 DuBuque Ville Unit 54,,Springfield,Massachusetts,Hampden County,1106.0,US,,,,,,,,1,Abacus Insights,,,ES,Employee and Spouse,15,Plan P,"Medical, Dental and Vision",2021-01-01,2021-12-31,2021-01-01,2021-12-31,2021-01-01,2021-12-31,Aetna,Member Enrollment Data Dictionary,2024-03-08
5,97600 117067 A1 Adopted Son,97600,117067,Charley,Lynn,,,,Female,01-12-1976,A1,Adopted Son,11,114 Cummerata Parade,,West Tisbury,Massachusetts,Dukes County,,US,,,,,,,,1,Abacus Insights,,,E,Employee Only,10,Plan K,Medical and Vision,2020-01-01,2020-12-31,,,2020-01-01,2020-12-31,Aetna,Member Enrollment Data Dictionary,2024-03-08
6,22000 12745 M Mother,22000,12745,Flynn,Morrison,,,,Female,03-30-1989,M,Mother,4,164 Stokes Lodge Apt 34,,Winchendon,Massachusetts,Worcester County,1475.0,US,,,,,,,,1,Abacus Insights,,,EC,Employee and Childrens,15,Plan P,"Medical, Dental and Vision",2021-01-01,2021-12-31,2021-01-01,2021-12-31,2021-01-01,2021-12-31,Cigna,Member Enrollment Data Dictionary,2024-03-08
7,22900 13466 N Niece,22900,13466,Pauline,Knight,,,,Female,05-09-2019,N,Niece,13,376 Skiles Forge Suite 48,,Westminster,Massachusetts,Worcester County,,US,,,,,,,,1,Abacus Insights,,,E,Employee Only,1,Plan B,Medical and Dental,2018-01-01,2018-12-31,2018-01-01,2018-12-31,,,Aetna,Member Enrollment Data Dictionary,2024-03-08
8,122500 135688 C2 Daughter,122500,135688,Elspeth,Gonzalez,Marliss,,,Female,09-09-2014,C2,Daughter,6,570 Nikolaus Wynd,,Cambridge,Massachusetts,Middlesex County,2139.0,US,,,,,,,,1,Abacus Insights,,,F,Family,10,Plan K,Medical and Vision,2020-01-01,2020-12-31,,,2020-01-01,2020-12-31,Cigna,Member Enrollment Data Dictionary,2024-03-08
9,21800 13587 D2 Divorced Wife,21800,13587,Amelie,Harmon,,,,Female,04-08-1984,D2,Divorced Wife,16,958 Robel Run Unit 83,,Carver,Massachusetts,Plymouth County,,US,,,,,,,,8,TechKraft Inc,,,E1C,Employee and 1 Child,4,Plan E,Medical,2019-01-01,2019-12-31,,,,,Aetna,Member Enrollment Data Dictionary,2024-03-08
