In [1]:
# Dependencies and Setup
import matplotlib.pyplot as plt
import requests
import pandas as pd
import json
import numpy as np
import time

In [2]:
# URL for GET requests to retrieve vehicle data

url = "https://data.cms.gov/resource/97k6-zzx3.json"

# Create a variable for and print the response object to the console to make sure we have a connection to the API
Response = requests.get(url)
print(Response)

<Response [200]>


In [3]:
# Create a variable to hold the response data in json format
Response_Data = Response.json()

print(json.dumps(Response_Data, indent=4, sort_keys=True))

[
    {
        "average_covered_charges": "32963.07",
        "average_medicare_payments": "5777.24",
        "average_medicare_payments_2": "4763.73",
        "drg_definition": "039 - EXTRACRANIAL PROCEDURES W/O CC/MCC",
        "hospital_referral_region_description": "AL - Dothan",
        "provider_city": "DOTHAN",
        "provider_id": "10001",
        "provider_name": "SOUTHEAST ALABAMA MEDICAL CENTER",
        "provider_state": "AL",
        "provider_street_address": "1108 ROSS CLARK CIRCLE",
        "provider_zip_code": "36301",
        "total_discharges": "91"
    },
    {
        "average_covered_charges": "15131.85",
        "average_medicare_payments": "5787.57",
        "average_medicare_payments_2": "4976.71",
        "drg_definition": "039 - EXTRACRANIAL PROCEDURES W/O CC/MCC",
        "hospital_referral_region_description": "AL - Birmingham",
        "provider_city": "BOAZ",
        "provider_id": "10005",
        "provider_name": "MARSHALL MEDICAL CENTER SOUTH",
    

In [4]:
# Print the first row of data
print(Response_Data[0])

{'drg_definition': '039 - EXTRACRANIAL PROCEDURES W/O CC/MCC', 'provider_id': '10001', 'provider_name': 'SOUTHEAST ALABAMA MEDICAL CENTER', 'provider_street_address': '1108 ROSS CLARK CIRCLE', 'provider_city': 'DOTHAN', 'provider_state': 'AL', 'provider_zip_code': '36301', 'hospital_referral_region_description': 'AL - Dothan', 'total_discharges': '91', 'average_covered_charges': '32963.07', 'average_medicare_payments': '5777.24', 'average_medicare_payments_2': '4763.73'}


In [5]:
# Generate a DataFrame from the response data
DataFrame = pd.DataFrame(Response_Data)

# Display top 5 rows of dataframe for reference

DataFrame.head()

Unnamed: 0,drg_definition,provider_id,provider_name,provider_street_address,provider_city,provider_state,provider_zip_code,hospital_referral_region_description,total_discharges,average_covered_charges,average_medicare_payments,average_medicare_payments_2
0,039 - EXTRACRANIAL PROCEDURES W/O CC/MCC,10001,SOUTHEAST ALABAMA MEDICAL CENTER,1108 ROSS CLARK CIRCLE,DOTHAN,AL,36301,AL - Dothan,91,32963.07,5777.24,4763.73
1,039 - EXTRACRANIAL PROCEDURES W/O CC/MCC,10005,MARSHALL MEDICAL CENTER SOUTH,2505 U S HIGHWAY 431 NORTH,BOAZ,AL,35957,AL - Birmingham,14,15131.85,5787.57,4976.71
2,039 - EXTRACRANIAL PROCEDURES W/O CC/MCC,10006,ELIZA COFFEE MEMORIAL HOSPITAL,205 MARENGO STREET,FLORENCE,AL,35631,AL - Birmingham,24,37560.37,5434.95,4453.79
3,039 - EXTRACRANIAL PROCEDURES W/O CC/MCC,10011,ST VINCENT'S EAST,50 MEDICAL PARK EAST DRIVE,BIRMINGHAM,AL,35235,AL - Birmingham,25,13998.28,5417.56,4129.16
4,039 - EXTRACRANIAL PROCEDURES W/O CC/MCC,10016,SHELBY BAPTIST MEDICAL CENTER,1000 FIRST STREET NORTH,ALABASTER,AL,35007,AL - Birmingham,18,31633.27,5658.33,4851.44


In [6]:
# Display a statistical overview of the DataFrame for reference

DataFrame.describe()

Unnamed: 0,drg_definition,provider_id,provider_name,provider_street_address,provider_city,provider_state,provider_zip_code,hospital_referral_region_description,total_discharges,average_covered_charges,average_medicare_payments,average_medicare_payments_2
count,1000,1000,1000,1000,1000,1000,1000,1000,1000,1000.0,1000.0,1000.0
unique,1,1000,974,999,683,47,957,282,92,1000.0,994.0,998.0
top,039 - EXTRACRANIAL PROCEDURES W/O CC/MCC,70028,GOOD SAMARITAN HOSPITAL,800 WASHINGTON STREET,SPRINGFIELD,FL,76104,MA - Boston,11,30355.22,6710.81,4847.08
freq,1000,1,6,2,8,81,3,19,57,1.0,2.0,2.0


In [7]:
# Check to see if there are any incomplete rows
DataFrame.count()

drg_definition                          1000
provider_id                             1000
provider_name                           1000
provider_street_address                 1000
provider_city                           1000
provider_state                          1000
provider_zip_code                       1000
hospital_referral_region_description    1000
total_discharges                        1000
average_covered_charges                 1000
average_medicare_payments               1000
average_medicare_payments_2             1000
dtype: int64

In [8]:
# Calculate the Number of Unique Diagnosis Related Groups (DRGs): 
Unique_DRGs = len(DataFrame["drg_definition"].unique())
Unique_DRGs

1

In [9]:
# Calculate the Number of Unique Providers: 
Unique_Provider_count = len(DataFrame["provider_id"].unique())
Unique_Provider_count

1000

In [10]:
# Calculate the Total Number of Unique States in the DataFrame
Unique_State_Count = len(DataFrame["provider_state"].unique())
Unique_State_Count

47

In [11]:
# Calculate the Total Number of Unique Provider Zip Codes in the DataFrame
Unique_Provider_ZipCode_Count = len(DataFrame["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count

957

In [12]:
# Calculate the Unique Number of hospital_referral_region_description in the DataFrame
Unique_Hospital_Referral_Region_count = len(DataFrame["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count

282

In [13]:
# Calculate the Total Number of Discharges in the DataFrame
Discharge_Count = (DataFrame["total_discharges"].sum())
Discharge_Count

'911424251867513213534144543211527273118332966192311401812422820151842136217253627151112131426256439551248194176173526121813922276648161727262156155211401328663434671226271616152320191334121831111213752217111213171732171719212811192735162039111341531314401466154813161120335638171920255038141122191529232457203416129013411114222340937055513633533320112414885420301330287141564917161927166692103514324115921141713231317273116382320271549361110811883512762415141675222223255025292022233836133411632621114082151286502634175322954327611222523325291112242418381718111171163131371221152315611222142612313019163415141966192017171127181414181228192822162114142436462133391415242830165722232615213323301428408254135268132011252613254218112273251114302637292112194640211275764757261624302647345639271517190181217575031651948284626171422683584366616453512192445171615111119131480271633321926134348110913975281216242236278162427941111230423611561523141837143129182391495033145414125024181617512317155340143411221

In [14]:
# Observe the DataTypes of each column
DataFrame.dtypes

drg_definition                          object
provider_id                             object
provider_name                           object
provider_street_address                 object
provider_city                           object
provider_state                          object
provider_zip_code                       object
hospital_referral_region_description    object
total_discharges                        object
average_covered_charges                 object
average_medicare_payments               object
average_medicare_payments_2             object
dtype: object

In [15]:
# Use pd.to_numeric() method to convert the datatype of the Discharge Count column
DataFrame['total_discharges'] = pd.to_numeric(DataFrame['total_discharges'])

# Use pd.to_numeric() method to convert the datatype of the Average Covered Charges column
DataFrame['average_covered_charges'] = pd.to_numeric(DataFrame['average_covered_charges'])

# Use pd.to_numeric() method to convert the datatype of the Average Medicare Payments column
DataFrame['average_medicare_payments'] = pd.to_numeric(DataFrame['average_medicare_payments'])

# Use pd.to_numeric() method to convert the datatype of the Average Medicare Payments 2 column
DataFrame['average_medicare_payments_2'] = pd.to_numeric(DataFrame['average_medicare_payments_2'])

In [16]:
# Verify that the Discharge column datatype has been made numeric
# DataFrame['total_discharges'].dtype

# Observe the updated DataTypes of each column
DataFrame.dtypes

drg_definition                           object
provider_id                              object
provider_name                            object
provider_street_address                  object
provider_city                            object
provider_state                           object
provider_zip_code                        object
hospital_referral_region_description     object
total_discharges                          int64
average_covered_charges                 float64
average_medicare_payments               float64
average_medicare_payments_2             float64
dtype: object

In [17]:
# Calculate the Total Number of Discharges in the DataFrame
Discharge_Count = (DataFrame["total_discharges"].sum())
Discharge_Count

31334

In [18]:
# Cacluate the average covered charges amount
Average_Covered_Charges = DataFrame["average_covered_charges"].mean()
Average_Covered_Charges

30764.52741

In [19]:
# Cacluate the max covered charge amount
Max_Covered_Charges = DataFrame["average_covered_charges"].max()
Max_Covered_Charges

146892.0

In [20]:
# Cacluate the min covered charge amount
Min_Covered_Charges = DataFrame["average_covered_charges"].min()
Min_Covered_Charges

5981.05

In [21]:
# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df = pd.DataFrame([
    {"Unique DRGs": Unique_DRGs, 
     "Unique Providers": Unique_Provider_count, 
     "Unique Provider States": Unique_State_Count, 
     "Unique Provider Zip Codes": Unique_Provider_ZipCode_Count, 
     "Unique Regions": Unique_Hospital_Referral_Region_count,
     "Total Discharge Count": Discharge_Count,
     "Average Charge": Average_Covered_Charges,
     "Max Charge": Max_Covered_Charges,
     "Min Charge": Min_Covered_Charges
    }
])
DRG_Analysis_df

Unnamed: 0,Unique DRGs,Unique Providers,Unique Provider States,Unique Provider Zip Codes,Unique Regions,Total Discharge Count,Average Charge,Max Charge,Min Charge
0,1,1000,47,957,282,31334,30764.52741,146892.0,5981.05


In [22]:
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df = DRG_Analysis_df

DRG_Analysis_Formatted_df["Average Charge"] = DRG_Analysis_df["Average Charge"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df["Max Charge"] = DRG_Analysis_df["Max Charge"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df["Min Charge"] = DRG_Analysis_df["Min Charge"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df

Unnamed: 0,Unique DRGs,Unique Providers,Unique Provider States,Unique Provider Zip Codes,Unique Regions,Total Discharge Count,Average Charge,Max Charge,Min Charge
0,1,1000,47,957,282,31334,"$30,764.53","$146,892.00","$5,981.05"


In [23]:
#MT
DataFrame_MT = DataFrame.loc[DataFrame["provider_state"] == "MT", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in MT: 
Unique_DRGs_MT = len(DataFrame_MT["drg_definition"].unique())
Unique_DRGs_MT

# Calculate the Number of Unique Providers in MT: 
Unique_Provider_count_MT = len(DataFrame_MT["provider_id"].unique())
Unique_Provider_count_MT

# Calculate the Total Number of Unique Provider Zip Codes in MT 
Unique_Provider_ZipCode_Count_MT = len(DataFrame_MT["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_MT
# Calculate the Unique Number of hospital_referral_region_description in MT 
Unique_Hospital_Referral_Region_count_MT = len(DataFrame_MT["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_MT
# Calculate the Total Number of Discharges in MT 
Discharge_Count_MT = (DataFrame_MT["total_discharges"].sum())
Discharge_Count_MT
# Cacluate the average covered charges amount in MT
Average_Covered_Charges_MT = DataFrame_MT["average_covered_charges"].mean()
Average_Covered_Charges_MT
# Cacluate the max covered charge amount in MT
Max_Covered_Charges_MT = DataFrame_MT["average_covered_charges"].max()
Max_Covered_Charges_MT
# Cacluate the min covered charge amount in MT
Min_Covered_Charges_MT = DataFrame_MT["average_covered_charges"].min()
Min_Covered_Charges_MT

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_MT = pd.DataFrame([
    {"Unique DRGs in MT": Unique_DRGs_MT, 
     "Unique Providers in MT": Unique_Provider_count_MT, 
     "Unique Provider Zip Codes in MT": Unique_Provider_ZipCode_Count_MT, 
     "Unique Regions in MT": Unique_Hospital_Referral_Region_count_MT,
     "Total Discharge Count in MT": Discharge_Count_MT,
     "Average Charge in MT": Average_Covered_Charges_MT,
     "Max Charge in MT": Max_Covered_Charges_MT,
     "Min Charge in MT": Min_Covered_Charges_MT
    }
])
DRG_Analysis_df_MT
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_MT = DRG_Analysis_df_MT

DRG_Analysis_Formatted_df_MT["Average Charge in MT"] = DRG_Analysis_df_MT["Average Charge in MT"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_MT["Max Charge in MT"] = DRG_Analysis_df_MT["Max Charge in MT"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_MT["Min Charge in MT"] = DRG_Analysis_df_MT["Min Charge in MT"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_MT




Unnamed: 0,Unique DRGs in MT,Unique Providers in MT,Unique Provider Zip Codes in MT,Unique Regions in MT,Total Discharge Count in MT,Average Charge in MT,Max Charge in MT,Min Charge in MT
0,1,5,5,3,174,"$18,199.58","$22,178.94","$14,227.39"


In [24]:
#NC
DataFrame_NC = DataFrame.loc[DataFrame["provider_state"] == "NC", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in NC: 
Unique_DRGs_NC = len(DataFrame_NC["drg_definition"].unique())
Unique_DRGs_NC

# Calculate the Number of Unique Providers in NC: 
Unique_Provider_count_NC = len(DataFrame_NC["provider_id"].unique())
Unique_Provider_count_NC

# Calculate the Total Number of Unique Provider Zip Codes in NC 
Unique_Provider_ZipCode_Count_NC = len(DataFrame_NC["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_NC
# Calculate the Unique Number of hospital_referral_region_description in NC 
Unique_Hospital_Referral_Region_count_NC = len(DataFrame_NC["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_NC
# Calculate the Total Number of Discharges in NC 
Discharge_Count_NC = (DataFrame_NC["total_discharges"].sum())
Discharge_Count_NC
# Cacluate the average covered charges amount in NC
Average_Covered_Charges_NC = DataFrame_NC["average_covered_charges"].mean()
Average_Covered_Charges_NC
# Cacluate the max covered charge amount in NC
Max_Covered_Charges_NC = DataFrame_NC["average_covered_charges"].max()
Max_Covered_Charges_NC
# Cacluate the min covered charge amount in NC
Min_Covered_Charges_NC = DataFrame_NC["average_covered_charges"].min()
Min_Covered_Charges_NC

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_NC = pd.DataFrame([
    {"Unique DRGs in NC": Unique_DRGs_NC, 
     "Unique Providers in NC": Unique_Provider_count_NC, 
     "Unique Provider Zip Codes in NC": Unique_Provider_ZipCode_Count_NC, 
     "Unique Regions in NC": Unique_Hospital_Referral_Region_count_NC,
     "Total Discharge Count in NC": Discharge_Count_NC,
     "Average Charge in NC": Average_Covered_Charges_NC,
     "Max Charge in NC": Max_Covered_Charges_NC,
     "Min Charge in NC": Min_Covered_Charges_NC
    }
])
DRG_Analysis_df_NC
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_NC = DRG_Analysis_df_NC

DRG_Analysis_Formatted_df_NC["Average Charge in NC"] = DRG_Analysis_df_NC["Average Charge in NC"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NC["Max Charge in NC"] = DRG_Analysis_df_NC["Max Charge in NC"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NC["Min Charge in NC"] = DRG_Analysis_df_NC["Min Charge in NC"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_NC


Unnamed: 0,Unique DRGs in NC,Unique Providers in NC,Unique Provider Zip Codes in NC,Unique Regions in NC,Total Discharge Count in NC,Average Charge in NC,Max Charge in NC,Min Charge in NC
0,1,26,26,10,1141,"$21,999.21","$40,611.73","$11,461.06"


In [25]:
#ND
DataFrame_ND = DataFrame.loc[DataFrame["provider_state"] == "ND", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in ND: 
Unique_DRGs_ND = len(DataFrame_ND["drg_definition"].unique())
Unique_DRGs_ND

# Calculate the Number of Unique Providers in ND: 
Unique_Provider_count_ND = len(DataFrame_ND["provider_id"].unique())
Unique_Provider_count_ND

# Calculate the Total Number of Unique Provider Zip Codes in ND 
Unique_Provider_ZipCode_Count_ND = len(DataFrame_ND["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_ND
# Calculate the Unique Number of hospital_referral_region_description in ND 
Unique_Hospital_Referral_Region_count_ND = len(DataFrame_ND["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_ND
# Calculate the Total Number of Discharges in ND 
Discharge_Count_ND = (DataFrame_ND["total_discharges"].sum())
Discharge_Count_ND
# Cacluate the average covered charges amount in ND
Average_Covered_Charges_ND = DataFrame_ND["average_covered_charges"].mean()
Average_Covered_Charges_ND
# Cacluate the max covered charge amount in ND
Max_Covered_Charges_ND = DataFrame_ND["average_covered_charges"].max()
Max_Covered_Charges_ND
# Cacluate the min covered charge amount in ND
Min_Covered_Charges_ND = DataFrame_ND["average_covered_charges"].min()
Min_Covered_Charges_ND

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_ND = pd.DataFrame([
    {"Unique DRGs in ND": Unique_DRGs_ND, 
     "Unique Providers in ND": Unique_Provider_count_ND, 
     "Unique Provider Zip Codes in ND": Unique_Provider_ZipCode_Count_ND, 
     "Unique Regions in ND": Unique_Hospital_Referral_Region_count_ND,
     "Total Discharge Count in ND": Discharge_Count_ND,
     "Average Charge in ND": Average_Covered_Charges_ND,
     "Max Charge in ND": Max_Covered_Charges_ND,
     "Min Charge in ND": Min_Covered_Charges_ND
    }
])
DRG_Analysis_df_ND
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_ND = DRG_Analysis_df_ND

DRG_Analysis_Formatted_df_ND["Average Charge in ND"] = DRG_Analysis_df_ND["Average Charge in ND"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_ND["Max Charge in ND"] = DRG_Analysis_df_ND["Max Charge in ND"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_ND["Min Charge in ND"] = DRG_Analysis_df_ND["Min Charge in ND"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_ND


Unnamed: 0,Unique DRGs in ND,Unique Providers in ND,Unique Provider Zip Codes in ND,Unique Regions in ND,Total Discharge Count in ND,Average Charge in ND,Max Charge in ND,Min Charge in ND
0,1,6,6,4,178,"$14,450.35","$16,553.17","$11,360.66"


In [26]:
#NE
DataFrame_NE = DataFrame.loc[DataFrame["provider_state"] == "NE", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in NE: 
Unique_DRGs_NE = len(DataFrame_NE["drg_definition"].unique())
Unique_DRGs_NE

# Calculate the Number of Unique Providers in NE: 
Unique_Provider_count_NE = len(DataFrame_NE["provider_id"].unique())
Unique_Provider_count_NE

# Calculate the Total Number of Unique Provider Zip Codes in NE 
Unique_Provider_ZipCode_Count_NE = len(DataFrame_NE["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_NE
# Calculate the Unique Number of hospital_referral_region_description in NE 
Unique_Hospital_Referral_Region_count_NE = len(DataFrame_NE["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_NE
# Calculate the Total Number of Discharges in NE 
Discharge_Count_NE = (DataFrame_NE["total_discharges"].sum())
Discharge_Count_NE
# Cacluate the average covered charges amount in NE
Average_Covered_Charges_NE = DataFrame_NE["average_covered_charges"].mean()
Average_Covered_Charges_NE
# Cacluate the max covered charge amount in NE
Max_Covered_Charges_NE = DataFrame_NE["average_covered_charges"].max()
Max_Covered_Charges_NE
# Cacluate the min covered charge amount in NE
Min_Covered_Charges_NE = DataFrame_NE["average_covered_charges"].min()
Min_Covered_Charges_NE

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_NE = pd.DataFrame([
    {"Unique DRGs in NE": Unique_DRGs_NE, 
     "Unique Providers in NE": Unique_Provider_count_NE, 
     "Unique Provider Zip Codes in NE": Unique_Provider_ZipCode_Count_NE, 
     "Unique Regions in NE": Unique_Hospital_Referral_Region_count_NE,
     "Total Discharge Count in NE": Discharge_Count_NE,
     "Average Charge in NE": Average_Covered_Charges_NE,
     "Max Charge in NE": Max_Covered_Charges_NE,
     "Min Charge in NE": Min_Covered_Charges_NE
    }
])
DRG_Analysis_df_NE
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_NE = DRG_Analysis_df_NE

DRG_Analysis_Formatted_df_NE["Average Charge in NE"] = DRG_Analysis_df_NE["Average Charge in NE"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NE["Max Charge in NE"] = DRG_Analysis_df_NE["Max Charge in NE"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NE["Min Charge in NE"] = DRG_Analysis_df_NE["Min Charge in NE"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_NE


Unnamed: 0,Unique DRGs in NE,Unique Providers in NE,Unique Provider Zip Codes in NE,Unique Regions in NE,Total Discharge Count in NE,Average Charge in NE,Max Charge in NE,Min Charge in NE
0,1,9,9,3,318,"$23,804.48","$35,408.75","$6,994.06"


In [27]:
#NH
DataFrame_NH = DataFrame.loc[DataFrame["provider_state"] == "NH", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in NH: 
Unique_DRGs_NH = len(DataFrame_NH["drg_definition"].unique())
Unique_DRGs_NH

# Calculate the Number of Unique Providers in NH: 
Unique_Provider_count_NH = len(DataFrame_NH["provider_id"].unique())
Unique_Provider_count_NH

# Calculate the Total Number of Unique Provider Zip Codes in NH 
Unique_Provider_ZipCode_Count_NH = len(DataFrame_NH["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_NH
# Calculate the Unique Number of hospital_referral_region_description in NH 
Unique_Hospital_Referral_Region_count_NH = len(DataFrame_NH["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_NH
# Calculate the Total Number of Discharges in NH 
Discharge_Count_NH = (DataFrame_NH["total_discharges"].sum())
Discharge_Count_NH
# Cacluate the average covered charges amount in NH
Average_Covered_Charges_NH = DataFrame_NH["average_covered_charges"].mean()
Average_Covered_Charges_NH
# Cacluate the max covered charge amount in NH
Max_Covered_Charges_NH = DataFrame_NH["average_covered_charges"].max()
Max_Covered_Charges_NH
# Cacluate the min covered charge amount in NH
Min_Covered_Charges_NH = DataFrame_NH["average_covered_charges"].min()
Min_Covered_Charges_NH

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_NH = pd.DataFrame([
    {"Unique DRGs in NH": Unique_DRGs_NH, 
     "Unique Providers in NH": Unique_Provider_count_NH, 
     "Unique Provider Zip Codes in NH": Unique_Provider_ZipCode_Count_NH, 
     "Unique Regions in NH": Unique_Hospital_Referral_Region_count_NH,
     "Total Discharge Count in NH": Discharge_Count_NH,
     "Average Charge in NH": Average_Covered_Charges_NH,
     "Max Charge in NH": Max_Covered_Charges_NH,
     "Min Charge in NH": Min_Covered_Charges_NH
    }
])
DRG_Analysis_df_NH
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_NH = DRG_Analysis_df_NH

DRG_Analysis_Formatted_df_NH["Average Charge in NH"] = DRG_Analysis_df_NH["Average Charge in NH"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NH["Max Charge in NH"] = DRG_Analysis_df_NH["Max Charge in NH"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NH["Min Charge in NH"] = DRG_Analysis_df_NH["Min Charge in NH"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_NH


Unnamed: 0,Unique DRGs in NH,Unique Providers in NH,Unique Provider Zip Codes in NH,Unique Regions in NH,Total Discharge Count in NH,Average Charge in NH,Max Charge in NH,Min Charge in NH
0,1,8,8,2,216,"$24,200.00","$32,770.57","$14,912.42"


In [28]:
#NJ
DataFrame_NJ = DataFrame.loc[DataFrame["provider_state"] == "NJ", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in NJ: 
Unique_DRGs_NJ = len(DataFrame_NJ["drg_definition"].unique())
Unique_DRGs_NJ

# Calculate the Number of Unique Providers in NJ: 
Unique_Provider_count_NJ = len(DataFrame_NJ["provider_id"].unique())
Unique_Provider_count_NJ

# Calculate the Total Number of Unique Provider Zip Codes in NJ 
Unique_Provider_ZipCode_Count_NJ = len(DataFrame_NJ["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_NJ
# Calculate the Unique Number of hospital_referral_region_description in NJ 
Unique_Hospital_Referral_Region_count_NJ = len(DataFrame_NJ["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_NJ
# Calculate the Total Number of Discharges in NJ 
Discharge_Count_NJ = (DataFrame_NJ["total_discharges"].sum())
Discharge_Count_NJ
# Cacluate the average covered charges amount in NJ
Average_Covered_Charges_NJ = DataFrame_NJ["average_covered_charges"].mean()
Average_Covered_Charges_NJ
# Cacluate the max covered charge amount in NJ
Max_Covered_Charges_NJ = DataFrame_NJ["average_covered_charges"].max()
Max_Covered_Charges_NJ
# Cacluate the min covered charge amount in NJ
Min_Covered_Charges_NJ = DataFrame_NJ["average_covered_charges"].min()
Min_Covered_Charges_NJ

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_NJ = pd.DataFrame([
    {"Unique DRGs in NJ": Unique_DRGs_NJ, 
     "Unique Providers in NJ": Unique_Provider_count_NJ, 
     "Unique Provider Zip Codes in NJ": Unique_Provider_ZipCode_Count_NJ, 
     "Unique Regions in NJ": Unique_Hospital_Referral_Region_count_NJ,
     "Total Discharge Count in NJ": Discharge_Count_NJ,
     "Average Charge in NJ": Average_Covered_Charges_NJ,
     "Max Charge in NJ": Max_Covered_Charges_NJ,
     "Min Charge in NJ": Min_Covered_Charges_NJ
    }
])
DRG_Analysis_df_NJ
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_NJ = DRG_Analysis_df_NJ

DRG_Analysis_Formatted_df_NJ["Average Charge in NJ"] = DRG_Analysis_df_NJ["Average Charge in NJ"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NJ["Max Charge in NJ"] = DRG_Analysis_df_NJ["Max Charge in NJ"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NJ["Min Charge in NJ"] = DRG_Analysis_df_NJ["Min Charge in NJ"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_NJ


Unnamed: 0,Unique DRGs in NJ,Unique Providers in NJ,Unique Provider Zip Codes in NJ,Unique Regions in NJ,Total Discharge Count in NJ,Average Charge in NJ,Max Charge in NJ,Min Charge in NJ
0,1,31,29,8,819,"$35,103.81","$53,243.83","$15,980.13"


In [29]:
#NM
DataFrame_NM = DataFrame.loc[DataFrame["provider_state"] == "NM", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in NM: 
Unique_DRGs_NM = len(DataFrame_NM["drg_definition"].unique())
Unique_DRGs_NM

# Calculate the Number of Unique Providers in NM: 
Unique_Provider_count_NM = len(DataFrame_NM["provider_id"].unique())
Unique_Provider_count_NM

# Calculate the Total Number of Unique Provider Zip Codes in NM 
Unique_Provider_ZipCode_Count_NM = len(DataFrame_NM["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_NM
# Calculate the Unique Number of hospital_referral_region_description in NM 
Unique_Hospital_Referral_Region_count_NM = len(DataFrame_NM["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_NM
# Calculate the Total Number of Discharges in NM 
Discharge_Count_NM = (DataFrame_NM["total_discharges"].sum())
Discharge_Count_NM
# Cacluate the average covered charges amount in NM
Average_Covered_Charges_NM = DataFrame_NM["average_covered_charges"].mean()
Average_Covered_Charges_NM
# Cacluate the max covered charge amount in NM
Max_Covered_Charges_NM = DataFrame_NM["average_covered_charges"].max()
Max_Covered_Charges_NM
# Cacluate the min covered charge amount in NM
Min_Covered_Charges_NM = DataFrame_NM["average_covered_charges"].min()
Min_Covered_Charges_NM

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_NM = pd.DataFrame([
    {"Unique DRGs in NM": Unique_DRGs_NM, 
     "Unique Providers in NM": Unique_Provider_count_NM, 
     "Unique Provider Zip Codes in NM": Unique_Provider_ZipCode_Count_NM, 
     "Unique Regions in NM": Unique_Hospital_Referral_Region_count_NM,
     "Total Discharge Count in NM": Discharge_Count_NM,
     "Average Charge in NM": Average_Covered_Charges_NM,
     "Max Charge in NM": Max_Covered_Charges_NM,
     "Min Charge in NM": Min_Covered_Charges_NM
    }
])
DRG_Analysis_df_NM
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_NM = DRG_Analysis_df_NM

DRG_Analysis_Formatted_df_NM["Average Charge in NM"] = DRG_Analysis_df_NM["Average Charge in NM"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NM["Max Charge in NM"] = DRG_Analysis_df_NM["Max Charge in NM"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NM["Min Charge in NM"] = DRG_Analysis_df_NM["Min Charge in NM"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_NM


Unnamed: 0,Unique DRGs in NM,Unique Providers in NM,Unique Provider Zip Codes in NM,Unique Regions in NM,Total Discharge Count in NM,Average Charge in NM,Max Charge in NM,Min Charge in NM
0,1,7,5,3,128,"$32,472.88","$42,012.72","$26,606.38"


In [30]:
#NV
DataFrame_NV = DataFrame.loc[DataFrame["provider_state"] == "NV", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in NV: 
Unique_DRGs_NV = len(DataFrame_NV["drg_definition"].unique())
Unique_DRGs_NV

# Calculate the Number of Unique Providers in NV: 
Unique_Provider_count_NV = len(DataFrame_NV["provider_id"].unique())
Unique_Provider_count_NV

# Calculate the Total Number of Unique Provider Zip Codes in NV 
Unique_Provider_ZipCode_Count_NV = len(DataFrame_NV["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_NV
# Calculate the Unique Number of hospital_referral_region_description in NV 
Unique_Hospital_Referral_Region_count_NV = len(DataFrame_NV["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_NV
# Calculate the Total Number of Discharges in NV 
Discharge_Count_NV = (DataFrame_NV["total_discharges"].sum())
Discharge_Count_NV
# Cacluate the average covered charges amount in NV
Average_Covered_Charges_NV = DataFrame_NV["average_covered_charges"].mean()
Average_Covered_Charges_NV
# Cacluate the max covered charge amount in NV
Max_Covered_Charges_NV = DataFrame_NV["average_covered_charges"].max()
Max_Covered_Charges_NV
# Cacluate the min covered charge amount in NV
Min_Covered_Charges_NV = DataFrame_NV["average_covered_charges"].min()
Min_Covered_Charges_NV

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_NV = pd.DataFrame([
    {"Unique DRGs in NV": Unique_DRGs_NV, 
     "Unique Providers in NV": Unique_Provider_count_NV, 
     "Unique Provider Zip Codes in NV": Unique_Provider_ZipCode_Count_NV, 
     "Unique Regions in NV": Unique_Hospital_Referral_Region_count_NV,
     "Total Discharge Count in NV": Discharge_Count_NV,
     "Average Charge in NV": Average_Covered_Charges_NV,
     "Max Charge in NV": Max_Covered_Charges_NV,
     "Min Charge in NV": Min_Covered_Charges_NV
    }
])
DRG_Analysis_df_NV
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_NV = DRG_Analysis_df_NV

DRG_Analysis_Formatted_df_NV["Average Charge in NV"] = DRG_Analysis_df_NV["Average Charge in NV"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NV["Max Charge in NV"] = DRG_Analysis_df_NV["Max Charge in NV"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NV["Min Charge in NV"] = DRG_Analysis_df_NV["Min Charge in NV"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_NV


Unnamed: 0,Unique DRGs in NV,Unique Providers in NV,Unique Provider Zip Codes in NV,Unique Regions in NV,Total Discharge Count in NV,Average Charge in NV,Max Charge in NV,Min Charge in NV
0,1,11,11,2,311,"$47,518.48","$82,666.26","$23,482.86"


In [31]:
#NY
DataFrame_NY = DataFrame.loc[DataFrame["provider_state"] == "NY", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in NY: 
Unique_DRGs_NY = len(DataFrame_NY["drg_definition"].unique())
Unique_DRGs_NY

# Calculate the Number of Unique Providers in NY: 
Unique_Provider_count_NY = len(DataFrame_NY["provider_id"].unique())
Unique_Provider_count_NY

# Calculate the Total Number of Unique Provider Zip Codes in NY 
Unique_Provider_ZipCode_Count_NY = len(DataFrame_NY["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_NY
# Calculate the Unique Number of hospital_referral_region_description in NY 
Unique_Hospital_Referral_Region_count_NY = len(DataFrame_NY["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_NY
# Calculate the Total Number of Discharges in NY 
Discharge_Count_NY = (DataFrame_NY["total_discharges"].sum())
Discharge_Count_NY
# Cacluate the average covered charges amount in NY
Average_Covered_Charges_NY = DataFrame_NY["average_covered_charges"].mean()
Average_Covered_Charges_NY
# Cacluate the max covered charge amount in NY
Max_Covered_Charges_NY = DataFrame_NY["average_covered_charges"].max()
Max_Covered_Charges_NY
# Cacluate the min covered charge amount in NY
Min_Covered_Charges_NY = DataFrame_NY["average_covered_charges"].min()
Min_Covered_Charges_NY

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_NY = pd.DataFrame([
    {"Unique DRGs in NY": Unique_DRGs_NY, 
     "Unique Providers in NY": Unique_Provider_count_NY, 
     "Unique Provider Zip Codes in NY": Unique_Provider_ZipCode_Count_NY, 
     "Unique Regions in NY": Unique_Hospital_Referral_Region_count_NY,
     "Total Discharge Count in NY": Discharge_Count_NY,
     "Average Charge in NY": Average_Covered_Charges_NY,
     "Max Charge in NY": Max_Covered_Charges_NY,
     "Min Charge in NY": Min_Covered_Charges_NY
    }
])
DRG_Analysis_df_NY
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_NY = DRG_Analysis_df_NY

DRG_Analysis_Formatted_df_NY["Average Charge in NY"] = DRG_Analysis_df_NY["Average Charge in NY"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NY["Max Charge in NY"] = DRG_Analysis_df_NY["Max Charge in NY"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_NY["Min Charge in NY"] = DRG_Analysis_df_NY["Min Charge in NY"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_NY


Unnamed: 0,Unique DRGs in NY,Unique Providers in NY,Unique Provider Zip Codes in NY,Unique Regions in NY,Total Discharge Count in NY,Average Charge in NY,Max Charge in NY,Min Charge in NY
0,1,46,42,12,1336,"$23,260.68","$58,074.18","$7,468.00"


In [32]:
#OH
DataFrame_OH = DataFrame.loc[DataFrame["provider_state"] == "OH", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in OH: 
Unique_DRGs_OH = len(DataFrame_OH["drg_definition"].unique())
Unique_DRGs_OH

# Calculate the Number of Unique Providers in OH: 
Unique_Provider_count_OH = len(DataFrame_OH["provider_id"].unique())
Unique_Provider_count_OH

# Calculate the Total Number of Unique Provider Zip Codes in OH 
Unique_Provider_ZipCode_Count_OH = len(DataFrame_OH["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_OH
# Calculate the Unique Number of hospital_referral_region_description in OH 
Unique_Hospital_Referral_Region_count_OH = len(DataFrame_OH["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_OH
# Calculate the Total Number of Discharges in OH 
Discharge_Count_OH = (DataFrame_OH["total_discharges"].sum())
Discharge_Count_OH
# Cacluate the average covered charges amount in OH
Average_Covered_Charges_OH = DataFrame_OH["average_covered_charges"].mean()
Average_Covered_Charges_OH
# Cacluate the max covered charge amount in OH
Max_Covered_Charges_OH = DataFrame_OH["average_covered_charges"].max()
Max_Covered_Charges_OH
# Cacluate the min covered charge amount in OH
Min_Covered_Charges_OH = DataFrame_OH["average_covered_charges"].min()
Min_Covered_Charges_OH

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_OH = pd.DataFrame([
    {"Unique DRGs in OH": Unique_DRGs_OH, 
     "Unique Providers in OH": Unique_Provider_count_OH, 
     "Unique Provider Zip Codes in OH": Unique_Provider_ZipCode_Count_OH, 
     "Unique Regions in OH": Unique_Hospital_Referral_Region_count_OH,
     "Total Discharge Count in OH": Discharge_Count_OH,
     "Average Charge in OH": Average_Covered_Charges_OH,
     "Max Charge in OH": Max_Covered_Charges_OH,
     "Min Charge in OH": Min_Covered_Charges_OH
    }
])
DRG_Analysis_df_OH
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_OH = DRG_Analysis_df_OH

DRG_Analysis_Formatted_df_OH["Average Charge in OH"] = DRG_Analysis_df_OH["Average Charge in OH"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_OH["Max Charge in OH"] = DRG_Analysis_df_OH["Max Charge in OH"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_OH["Min Charge in OH"] = DRG_Analysis_df_OH["Min Charge in OH"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_OH


Unnamed: 0,Unique DRGs in OH,Unique Providers in OH,Unique Provider Zip Codes in OH,Unique Regions in OH,Total Discharge Count in OH,Average Charge in OH,Max Charge in OH,Min Charge in OH
0,1,48,48,11,1186,"$28,181.94","$59,512.24","$9,973.26"


In [33]:
#OK
DataFrame_OK = DataFrame.loc[DataFrame["provider_state"] == "OK", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in OK: 
Unique_DRGs_OK = len(DataFrame_OK["drg_definition"].unique())
Unique_DRGs_OK

# Calculate the Number of Unique Providers in OK: 
Unique_Provider_count_OK = len(DataFrame_OK["provider_id"].unique())
Unique_Provider_count_OK

# Calculate the Total Number of Unique Provider Zip Codes in OK 
Unique_Provider_ZipCode_Count_OK = len(DataFrame_OK["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_OK
# Calculate the Unique Number of hospital_referral_region_description in OK 
Unique_Hospital_Referral_Region_count_OK = len(DataFrame_OK["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_OK
# Calculate the Total Number of Discharges in OK 
Discharge_Count_OK = (DataFrame_OK["total_discharges"].sum())
Discharge_Count_OK
# Cacluate the average covered charges amount in OK
Average_Covered_Charges_OK = DataFrame_OK["average_covered_charges"].mean()
Average_Covered_Charges_OK
# Cacluate the max covered charge amount in OK
Max_Covered_Charges_OK = DataFrame_OK["average_covered_charges"].max()
Max_Covered_Charges_OK
# Cacluate the min covered charge amount in OK
Min_Covered_Charges_OK = DataFrame_OK["average_covered_charges"].min()
Min_Covered_Charges_OK

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_OK = pd.DataFrame([
    {"Unique DRGs in OK": Unique_DRGs_OK, 
     "Unique Providers in OK": Unique_Provider_count_OK, 
     "Unique Provider Zip Codes in OK": Unique_Provider_ZipCode_Count_OK, 
     "Unique Regions in OK": Unique_Hospital_Referral_Region_count_OK,
     "Total Discharge Count in OK": Discharge_Count_OK,
     "Average Charge in OK": Average_Covered_Charges_OK,
     "Max Charge in OK": Max_Covered_Charges_OK,
     "Min Charge in OK": Min_Covered_Charges_OK
    }
])
DRG_Analysis_df_OK
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_OK = DRG_Analysis_df_OK

DRG_Analysis_Formatted_df_OK["Average Charge in OK"] = DRG_Analysis_df_OK["Average Charge in OK"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_OK["Max Charge in OK"] = DRG_Analysis_df_OK["Max Charge in OK"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_OK["Min Charge in OK"] = DRG_Analysis_df_OK["Min Charge in OK"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_OK


Unnamed: 0,Unique DRGs in OK,Unique Providers in OK,Unique Provider Zip Codes in OK,Unique Regions in OK,Total Discharge Count in OK,Average Charge in OK,Max Charge in OK,Min Charge in OK
0,1,10,9,3,463,"$23,915.59","$38,192.26","$16,458.95"


In [34]:
#OR
DataFrame_OR = DataFrame.loc[DataFrame["provider_state"] == "OR", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in OR: 
Unique_DRGs_OR = len(DataFrame_OR["drg_definition"].unique())
Unique_DRGs_OR

# Calculate the Number of Unique Providers in OR: 
Unique_Provider_count_OR = len(DataFrame_OR["provider_id"].unique())
Unique_Provider_count_OR

# Calculate the Total Number of Unique Provider Zip Codes in OR 
Unique_Provider_ZipCode_Count_OR = len(DataFrame_OR["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_OR
# Calculate the Unique Number of hospital_referral_region_description in OR 
Unique_Hospital_Referral_Region_count_OR = len(DataFrame_OR["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_OR
# Calculate the Total Number of Discharges in OR 
Discharge_Count_OR = (DataFrame_OR["total_discharges"].sum())
Discharge_Count_OR
# Cacluate the average covered charges amount in OR
Average_Covered_Charges_OR = DataFrame_OR["average_covered_charges"].mean()
Average_Covered_Charges_OR
# Cacluate the max covered charge amount in OR
Max_Covered_Charges_OR = DataFrame_OR["average_covered_charges"].max()
Max_Covered_Charges_OR
# Cacluate the min covered charge amount in OR
Min_Covered_Charges_OR = DataFrame_OR["average_covered_charges"].min()
Min_Covered_Charges_OR

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_OR = pd.DataFrame([
    {"Unique DRGs in OR": Unique_DRGs_OR, 
     "Unique Providers in OR": Unique_Provider_count_OR, 
     "Unique Provider Zip Codes in OR": Unique_Provider_ZipCode_Count_OR, 
     "Unique Regions in OR": Unique_Hospital_Referral_Region_count_OR,
     "Total Discharge Count in OR": Discharge_Count_OR,
     "Average Charge in OR": Average_Covered_Charges_OR,
     "Max Charge in OR": Max_Covered_Charges_OR,
     "Min Charge in OR": Min_Covered_Charges_OR
    }
])
DRG_Analysis_df_OR
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_OR = DRG_Analysis_df_OR

DRG_Analysis_Formatted_df_OR["Average Charge in OR"] = DRG_Analysis_df_OR["Average Charge in OR"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_OR["Max Charge in OR"] = DRG_Analysis_df_OR["Max Charge in OR"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_OR["Min Charge in OR"] = DRG_Analysis_df_OR["Min Charge in OR"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_OR


Unnamed: 0,Unique DRGs in OR,Unique Providers in OR,Unique Provider Zip Codes in OR,Unique Regions in OR,Total Discharge Count in OR,Average Charge in OR,Max Charge in OR,Min Charge in OR
0,1,12,10,5,354,"$24,634.94","$33,958.90","$16,988.91"


In [35]:
#PA
DataFrame_PA = DataFrame.loc[DataFrame["provider_state"] == "PA", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in PA: 
Unique_DRGs_PA = len(DataFrame_PA["drg_definition"].unique())
Unique_DRGs_PA

# Calculate the Number of Unique Providers in PA: 
Unique_Provider_count_PA = len(DataFrame_PA["provider_id"].unique())
Unique_Provider_count_PA

# Calculate the Total Number of Unique Provider Zip Codes in PA 
Unique_Provider_ZipCode_Count_PA = len(DataFrame_PA["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_PA
# Calculate the Unique Number of hospital_referral_region_description in PA 
Unique_Hospital_Referral_Region_count_PA = len(DataFrame_PA["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_PA
# Calculate the Total Number of Discharges in PA 
Discharge_Count_PA = (DataFrame_PA["total_discharges"].sum())
Discharge_Count_PA
# Cacluate the average covered charges amount in PA
Average_Covered_Charges_PA = DataFrame_PA["average_covered_charges"].mean()
Average_Covered_Charges_PA
# Cacluate the max covered charge amount in PA
Max_Covered_Charges_PA = DataFrame_PA["average_covered_charges"].max()
Max_Covered_Charges_PA
# Cacluate the min covered charge amount in PA
Min_Covered_Charges_PA = DataFrame_PA["average_covered_charges"].min()
Min_Covered_Charges_PA

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_PA = pd.DataFrame([
    {"Unique DRGs in PA": Unique_DRGs_PA, 
     "Unique Providers in PA": Unique_Provider_count_PA, 
     "Unique Provider Zip Codes in PA": Unique_Provider_ZipCode_Count_PA, 
     "Unique Regions in PA": Unique_Hospital_Referral_Region_count_PA,
     "Total Discharge Count in PA": Discharge_Count_PA,
     "Average Charge in PA": Average_Covered_Charges_PA,
     "Max Charge in PA": Max_Covered_Charges_PA,
     "Min Charge in PA": Min_Covered_Charges_PA
    }
])
DRG_Analysis_df_PA
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_PA = DRG_Analysis_df_PA

DRG_Analysis_Formatted_df_PA["Average Charge in PA"] = DRG_Analysis_df_PA["Average Charge in PA"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_PA["Max Charge in PA"] = DRG_Analysis_df_PA["Max Charge in PA"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_PA["Min Charge in PA"] = DRG_Analysis_df_PA["Min Charge in PA"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_PA


Unnamed: 0,Unique DRGs in PA,Unique Providers in PA,Unique Provider Zip Codes in PA,Unique Regions in PA,Total Discharge Count in PA,Average Charge in PA,Max Charge in PA,Min Charge in PA
0,1,44,42,13,1003,"$33,175.99","$116,349.84","$10,425.36"


In [36]:
#RI
DataFrame_RI = DataFrame.loc[DataFrame["provider_state"] == "RI", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in RI: 
Unique_DRGs_RI = len(DataFrame_RI["drg_definition"].unique())
Unique_DRGs_RI

# Calculate the Number of Unique Providers in RI: 
Unique_Provider_count_RI = len(DataFrame_RI["provider_id"].unique())
Unique_Provider_count_RI

# Calculate the Total Number of Unique Provider Zip Codes in RI 
Unique_Provider_ZipCode_Count_RI = len(DataFrame_RI["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_RI
# Calculate the Unique Number of hospital_referral_region_description in RI 
Unique_Hospital_Referral_Region_count_RI = len(DataFrame_RI["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_RI
# Calculate the Total Number of Discharges in RI 
Discharge_Count_RI = (DataFrame_RI["total_discharges"].sum())
Discharge_Count_RI
# Cacluate the average covered charges amount in RI
Average_Covered_Charges_RI = DataFrame_RI["average_covered_charges"].mean()
Average_Covered_Charges_RI
# Cacluate the max covered charge amount in RI
Max_Covered_Charges_RI = DataFrame_RI["average_covered_charges"].max()
Max_Covered_Charges_RI
# Cacluate the min covered charge amount in RI
Min_Covered_Charges_RI = DataFrame_RI["average_covered_charges"].min()
Min_Covered_Charges_RI

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_RI = pd.DataFrame([
    {"Unique DRGs in RI": Unique_DRGs_RI, 
     "Unique Providers in RI": Unique_Provider_count_RI, 
     "Unique Provider Zip Codes in RI": Unique_Provider_ZipCode_Count_RI, 
     "Unique Regions in RI": Unique_Hospital_Referral_Region_count_RI,
     "Total Discharge Count in RI": Discharge_Count_RI,
     "Average Charge in RI": Average_Covered_Charges_RI,
     "Max Charge in RI": Max_Covered_Charges_RI,
     "Min Charge in RI": Min_Covered_Charges_RI
    }
])
DRG_Analysis_df_RI
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_RI = DRG_Analysis_df_RI

DRG_Analysis_Formatted_df_RI["Average Charge in RI"] = DRG_Analysis_df_RI["Average Charge in RI"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_RI["Max Charge in RI"] = DRG_Analysis_df_RI["Max Charge in RI"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_RI["Min Charge in RI"] = DRG_Analysis_df_RI["Min Charge in RI"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_RI


Unnamed: 0,Unique DRGs in RI,Unique Providers in RI,Unique Provider Zip Codes in RI,Unique Regions in RI,Total Discharge Count in RI,Average Charge in RI,Max Charge in RI,Min Charge in RI
0,1,3,3,1,76,"$24,913.80","$27,174.00","$23,619.86"


In [37]:
#SC
DataFrame_SC = DataFrame.loc[DataFrame["provider_state"] == "SC", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in SC: 
Unique_DRGs_SC = len(DataFrame_SC["drg_definition"].unique())
Unique_DRGs_SC

# Calculate the Number of Unique Providers in SC: 
Unique_Provider_count_SC = len(DataFrame_SC["provider_id"].unique())
Unique_Provider_count_SC

# Calculate the Total Number of Unique Provider Zip Codes in SC 
Unique_Provider_ZipCode_Count_SC = len(DataFrame_SC["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_SC
# Calculate the Unique Number of hospital_referral_region_description in SC 
Unique_Hospital_Referral_Region_count_SC = len(DataFrame_SC["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_SC
# Calculate the Total Number of Discharges in SC 
Discharge_Count_SC = (DataFrame_SC["total_discharges"].sum())
Discharge_Count_SC
# Cacluate the average covered charges amount in SC
Average_Covered_Charges_SC = DataFrame_SC["average_covered_charges"].mean()
Average_Covered_Charges_SC
# Cacluate the max covered charge amount in SC
Max_Covered_Charges_SC = DataFrame_SC["average_covered_charges"].max()
Max_Covered_Charges_SC
# Cacluate the min covered charge amount in SC
Min_Covered_Charges_SC = DataFrame_SC["average_covered_charges"].min()
Min_Covered_Charges_SC

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_SC = pd.DataFrame([
    {"Unique DRGs in SC": Unique_DRGs_SC, 
     "Unique Providers in SC": Unique_Provider_count_SC, 
     "Unique Provider Zip Codes in SC": Unique_Provider_ZipCode_Count_SC, 
     "Unique Regions in SC": Unique_Hospital_Referral_Region_count_SC,
     "Total Discharge Count in SC": Discharge_Count_SC,
     "Average Charge in SC": Average_Covered_Charges_SC,
     "Max Charge in SC": Max_Covered_Charges_SC,
     "Min Charge in SC": Min_Covered_Charges_SC
    }
])
DRG_Analysis_df_SC
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_SC = DRG_Analysis_df_SC

DRG_Analysis_Formatted_df_SC["Average Charge in SC"] = DRG_Analysis_df_SC["Average Charge in SC"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_SC["Max Charge in SC"] = DRG_Analysis_df_SC["Max Charge in SC"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_SC["Min Charge in SC"] = DRG_Analysis_df_SC["Min Charge in SC"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_SC


Unnamed: 0,Unique DRGs in SC,Unique Providers in SC,Unique Provider Zip Codes in SC,Unique Regions in SC,Total Discharge Count in SC,Average Charge in SC,Max Charge in SC,Min Charge in SC
0,1,19,19,8,721,"$33,864.17","$72,954.62","$16,748.91"


In [38]:
#SD
DataFrame_SD = DataFrame.loc[DataFrame["provider_state"] == "SD", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in SD: 
Unique_DRGs_SD = len(DataFrame_SD["drg_definition"].unique())
Unique_DRGs_SD

# Calculate the Number of Unique Providers in SD: 
Unique_Provider_count_SD = len(DataFrame_SD["provider_id"].unique())
Unique_Provider_count_SD

# Calculate the Total Number of Unique Provider Zip Codes in SD 
Unique_Provider_ZipCode_Count_SD = len(DataFrame_SD["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_SD
# Calculate the Unique Number of hospital_referral_region_description in SD 
Unique_Hospital_Referral_Region_count_SD = len(DataFrame_SD["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_SD
# Calculate the Total Number of Discharges in SD 
Discharge_Count_SD = (DataFrame_SD["total_discharges"].sum())
Discharge_Count_SD
# Cacluate the average covered charges amount in SD
Average_Covered_Charges_SD = DataFrame_SD["average_covered_charges"].mean()
Average_Covered_Charges_SD
# Cacluate the max covered charge amount in SD
Max_Covered_Charges_SD = DataFrame_SD["average_covered_charges"].max()
Max_Covered_Charges_SD
# Cacluate the min covered charge amount in SD
Min_Covered_Charges_SD = DataFrame_SD["average_covered_charges"].min()
Min_Covered_Charges_SD

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_SD = pd.DataFrame([
    {"Unique DRGs in SD": Unique_DRGs_SD, 
     "Unique Providers in SD": Unique_Provider_count_SD, 
     "Unique Provider Zip Codes in SD": Unique_Provider_ZipCode_Count_SD, 
     "Unique Regions in SD": Unique_Hospital_Referral_Region_count_SD,
     "Total Discharge Count in SD": Discharge_Count_SD,
     "Average Charge in SD": Average_Covered_Charges_SD,
     "Max Charge in SD": Max_Covered_Charges_SD,
     "Min Charge in SD": Min_Covered_Charges_SD
    }
])
DRG_Analysis_df_SD
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_SD = DRG_Analysis_df_SD

DRG_Analysis_Formatted_df_SD["Average Charge in SD"] = DRG_Analysis_df_SD["Average Charge in SD"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_SD["Max Charge in SD"] = DRG_Analysis_df_SD["Max Charge in SD"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_SD["Min Charge in SD"] = DRG_Analysis_df_SD["Min Charge in SD"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_SD


Unnamed: 0,Unique DRGs in SD,Unique Providers in SD,Unique Provider Zip Codes in SD,Unique Regions in SD,Total Discharge Count in SD,Average Charge in SD,Max Charge in SD,Min Charge in SD
0,1,4,4,2,156,"$21,836.92","$30,355.22","$12,715.56"


In [39]:
#TN
DataFrame_TN = DataFrame.loc[DataFrame["provider_state"] == "TN", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in TN: 
Unique_DRGs_TN = len(DataFrame_TN["drg_definition"].unique())
Unique_DRGs_TN

# Calculate the Number of Unique Providers in TN: 
Unique_Provider_count_TN = len(DataFrame_TN["provider_id"].unique())
Unique_Provider_count_TN

# Calculate the Total Number of Unique Provider Zip Codes in TN 
Unique_Provider_ZipCode_Count_TN = len(DataFrame_TN["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_TN
# Calculate the Unique Number of hospital_referral_region_description in TN 
Unique_Hospital_Referral_Region_count_TN = len(DataFrame_TN["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_TN
# Calculate the Total Number of Discharges in TN 
Discharge_Count_TN = (DataFrame_TN["total_discharges"].sum())
Discharge_Count_TN
# Cacluate the average covered charges amount in TN
Average_Covered_Charges_TN = DataFrame_TN["average_covered_charges"].mean()
Average_Covered_Charges_TN
# Cacluate the max covered charge amount in TN
Max_Covered_Charges_TN = DataFrame_TN["average_covered_charges"].max()
Max_Covered_Charges_TN
# Cacluate the min covered charge amount in TN
Min_Covered_Charges_TN = DataFrame_TN["average_covered_charges"].min()
Min_Covered_Charges_TN

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_TN = pd.DataFrame([
    {"Unique DRGs in TN": Unique_DRGs_TN, 
     "Unique Providers in TN": Unique_Provider_count_TN, 
     "Unique Provider Zip Codes in TN": Unique_Provider_ZipCode_Count_TN, 
     "Unique Regions in TN": Unique_Hospital_Referral_Region_count_TN,
     "Total Discharge Count in TN": Discharge_Count_TN,
     "Average Charge in TN": Average_Covered_Charges_TN,
     "Max Charge in TN": Max_Covered_Charges_TN,
     "Min Charge in TN": Min_Covered_Charges_TN
    }
])
DRG_Analysis_df_TN
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_TN = DRG_Analysis_df_TN

DRG_Analysis_Formatted_df_TN["Average Charge in TN"] = DRG_Analysis_df_TN["Average Charge in TN"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_TN["Max Charge in TN"] = DRG_Analysis_df_TN["Max Charge in TN"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_TN["Min Charge in TN"] = DRG_Analysis_df_TN["Min Charge in TN"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_TN


Unnamed: 0,Unique DRGs in TN,Unique Providers in TN,Unique Provider Zip Codes in TN,Unique Regions in TN,Total Discharge Count in TN,Average Charge in TN,Max Charge in TN,Min Charge in TN
0,1,32,31,7,986,"$26,417.38","$56,329.57","$10,904.81"


In [40]:
#TX
DataFrame_TX = DataFrame.loc[DataFrame["provider_state"] == "TX", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in TX: 
Unique_DRGs_TX = len(DataFrame_TX["drg_definition"].unique())
Unique_DRGs_TX

# Calculate the Number of Unique Providers in TX: 
Unique_Provider_count_TX = len(DataFrame_TX["provider_id"].unique())
Unique_Provider_count_TX

# Calculate the Total Number of Unique Provider Zip Codes in TX 
Unique_Provider_ZipCode_Count_TX = len(DataFrame_TX["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_TX
# Calculate the Unique Number of hospital_referral_region_description in TX 
Unique_Hospital_Referral_Region_count_TX = len(DataFrame_TX["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_TX
# Calculate the Total Number of Discharges in TX 
Discharge_Count_TX = (DataFrame_TX["total_discharges"].sum())
Discharge_Count_TX
# Cacluate the average covered charges amount in TX
Average_Covered_Charges_TX = DataFrame_TX["average_covered_charges"].mean()
Average_Covered_Charges_TX
# Cacluate the max covered charge amount in TX
Max_Covered_Charges_TX = DataFrame_TX["average_covered_charges"].max()
Max_Covered_Charges_TX
# Cacluate the min covered charge amount in TX
Min_Covered_Charges_TX = DataFrame_TX["average_covered_charges"].min()
Min_Covered_Charges_TX

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_TX = pd.DataFrame([
    {"Unique DRGs in TX": Unique_DRGs_TX, 
     "Unique Providers in TX": Unique_Provider_count_TX, 
     "Unique Provider Zip Codes in TX": Unique_Provider_ZipCode_Count_TX, 
     "Unique Regions in TX": Unique_Hospital_Referral_Region_count_TX,
     "Total Discharge Count in TX": Discharge_Count_TX,
     "Average Charge in TX": Average_Covered_Charges_TX,
     "Max Charge in TX": Max_Covered_Charges_TX,
     "Min Charge in TX": Min_Covered_Charges_TX
    }
])
DRG_Analysis_df_TX
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_TX = DRG_Analysis_df_TX

DRG_Analysis_Formatted_df_TX["Average Charge in TX"] = DRG_Analysis_df_TX["Average Charge in TX"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_TX["Max Charge in TX"] = DRG_Analysis_df_TX["Max Charge in TX"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_TX["Min Charge in TX"] = DRG_Analysis_df_TX["Min Charge in TX"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_TX


Unnamed: 0,Unique DRGs in TX,Unique Providers in TX,Unique Provider Zip Codes in TX,Unique Regions in TX,Total Discharge Count in TX,Average Charge in TX,Max Charge in TX,Min Charge in TX
0,1,76,67,23,2759,"$31,299.57","$81,126.90","$11,835.57"


In [41]:
#UT
DataFrame_UT = DataFrame.loc[DataFrame["provider_state"] == "UT", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in UT: 
Unique_DRGs_UT = len(DataFrame_UT["drg_definition"].unique())
Unique_DRGs_UT

# Calculate the Number of Unique Providers in UT: 
Unique_Provider_count_UT = len(DataFrame_UT["provider_id"].unique())
Unique_Provider_count_UT

# Calculate the Total Number of Unique Provider Zip Codes in UT 
Unique_Provider_ZipCode_Count_UT = len(DataFrame_UT["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_UT
# Calculate the Unique Number of hospital_referral_region_description in UT 
Unique_Hospital_Referral_Region_count_UT = len(DataFrame_UT["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_UT
# Calculate the Total Number of Discharges in UT 
Discharge_Count_UT = (DataFrame_UT["total_discharges"].sum())
Discharge_Count_UT
# Cacluate the average covered charges amount in UT
Average_Covered_Charges_UT = DataFrame_UT["average_covered_charges"].mean()
Average_Covered_Charges_UT
# Cacluate the max covered charge amount in UT
Max_Covered_Charges_UT = DataFrame_UT["average_covered_charges"].max()
Max_Covered_Charges_UT
# Cacluate the min covered charge amount in UT
Min_Covered_Charges_UT = DataFrame_UT["average_covered_charges"].min()
Min_Covered_Charges_UT

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_UT = pd.DataFrame([
    {"Unique DRGs in UT": Unique_DRGs_UT, 
     "Unique Providers in UT": Unique_Provider_count_UT, 
     "Unique Provider Zip Codes in UT": Unique_Provider_ZipCode_Count_UT, 
     "Unique Regions in UT": Unique_Hospital_Referral_Region_count_UT,
     "Total Discharge Count in UT": Discharge_Count_UT,
     "Average Charge in UT": Average_Covered_Charges_UT,
     "Max Charge in UT": Max_Covered_Charges_UT,
     "Min Charge in UT": Min_Covered_Charges_UT
    }
])
DRG_Analysis_df_UT
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_UT = DRG_Analysis_df_UT

DRG_Analysis_Formatted_df_UT["Average Charge in UT"] = DRG_Analysis_df_UT["Average Charge in UT"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_UT["Max Charge in UT"] = DRG_Analysis_df_UT["Max Charge in UT"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_UT["Min Charge in UT"] = DRG_Analysis_df_UT["Min Charge in UT"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_UT


Unnamed: 0,Unique DRGs in UT,Unique Providers in UT,Unique Provider Zip Codes in UT,Unique Regions in UT,Total Discharge Count in UT,Average Charge in UT,Max Charge in UT,Min Charge in UT
0,1,6,6,3,109,"$20,597.69","$25,490.15","$14,939.52"


In [42]:
#VA
DataFrame_VA = DataFrame.loc[DataFrame["provider_state"] == "VA", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in VA: 
Unique_DRGs_VA = len(DataFrame_VA["drg_definition"].unique())
Unique_DRGs_VA

# Calculate the Number of Unique Providers in VA: 
Unique_Provider_count_VA = len(DataFrame_VA["provider_id"].unique())
Unique_Provider_count_VA

# Calculate the Total Number of Unique Provider Zip Codes in VA 
Unique_Provider_ZipCode_Count_VA = len(DataFrame_VA["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_VA
# Calculate the Unique Number of hospital_referral_region_description in VA 
Unique_Hospital_Referral_Region_count_VA = len(DataFrame_VA["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_VA
# Calculate the Total Number of Discharges in VA 
Discharge_Count_VA = (DataFrame_VA["total_discharges"].sum())
Discharge_Count_VA
# Cacluate the average covered charges amount in VA
Average_Covered_Charges_VA = DataFrame_VA["average_covered_charges"].mean()
Average_Covered_Charges_VA
# Cacluate the max covered charge amount in VA
Max_Covered_Charges_VA = DataFrame_VA["average_covered_charges"].max()
Max_Covered_Charges_VA
# Cacluate the min covered charge amount in VA
Min_Covered_Charges_VA = DataFrame_VA["average_covered_charges"].min()
Min_Covered_Charges_VA

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_VA = pd.DataFrame([
    {"Unique DRGs in VA": Unique_DRGs_VA, 
     "Unique Providers in VA": Unique_Provider_count_VA, 
     "Unique Provider Zip Codes in VA": Unique_Provider_ZipCode_Count_VA, 
     "Unique Regions in VA": Unique_Hospital_Referral_Region_count_VA,
     "Total Discharge Count in VA": Discharge_Count_VA,
     "Average Charge in VA": Average_Covered_Charges_VA,
     "Max Charge in VA": Max_Covered_Charges_VA,
     "Min Charge in VA": Min_Covered_Charges_VA
    }
])
DRG_Analysis_df_VA
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_VA = DRG_Analysis_df_VA

DRG_Analysis_Formatted_df_VA["Average Charge in VA"] = DRG_Analysis_df_VA["Average Charge in VA"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_VA["Max Charge in VA"] = DRG_Analysis_df_VA["Max Charge in VA"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_VA["Min Charge in VA"] = DRG_Analysis_df_VA["Min Charge in VA"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_VA


Unnamed: 0,Unique DRGs in VA,Unique Providers in VA,Unique Provider Zip Codes in VA,Unique Regions in VA,Total Discharge Count in VA,Average Charge in VA,Max Charge in VA,Min Charge in VA
0,1,7,7,4,207,"$22,684.29","$35,318.41","$12,007.86"


In [43]:
#VT
DataFrame_VT = DataFrame.loc[DataFrame["provider_state"] == "VT", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in VT: 
Unique_DRGs_VT = len(DataFrame_VT["drg_definition"].unique())
Unique_DRGs_VT

# Calculate the Number of Unique Providers in VT: 
Unique_Provider_count_VT = len(DataFrame_VT["provider_id"].unique())
Unique_Provider_count_VT

# Calculate the Total Number of Unique Provider Zip Codes in VT 
Unique_Provider_ZipCode_Count_VT = len(DataFrame_VT["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_VT
# Calculate the Unique Number of hospital_referral_region_description in VT 
Unique_Hospital_Referral_Region_count_VT = len(DataFrame_VT["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_VT
# Calculate the Total Number of Discharges in VT 
Discharge_Count_VT = (DataFrame_VT["total_discharges"].sum())
Discharge_Count_VT
# Cacluate the average covered charges amount in VT
Average_Covered_Charges_VT = DataFrame_VT["average_covered_charges"].mean()
Average_Covered_Charges_VT
# Cacluate the max covered charge amount in VT
Max_Covered_Charges_VT = DataFrame_VT["average_covered_charges"].max()
Max_Covered_Charges_VT
# Cacluate the min covered charge amount in VT
Min_Covered_Charges_VT = DataFrame_VT["average_covered_charges"].min()
Min_Covered_Charges_VT

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_VT = pd.DataFrame([
    {"Unique DRGs in VT": Unique_DRGs_VT, 
     "Unique Providers in VT": Unique_Provider_count_VT, 
     "Unique Provider Zip Codes in VT": Unique_Provider_ZipCode_Count_VT, 
     "Unique Regions in VT": Unique_Hospital_Referral_Region_count_VT,
     "Total Discharge Count in VT": Discharge_Count_VT,
     "Average Charge in VT": Average_Covered_Charges_VT,
     "Max Charge in VT": Max_Covered_Charges_VT,
     "Min Charge in VT": Min_Covered_Charges_VT
    }
])
DRG_Analysis_df_VT
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_VT = DRG_Analysis_df_VT

DRG_Analysis_Formatted_df_VT["Average Charge in VT"] = DRG_Analysis_df_VT["Average Charge in VT"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_VT["Max Charge in VT"] = DRG_Analysis_df_VT["Max Charge in VT"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_VT["Min Charge in VT"] = DRG_Analysis_df_VT["Min Charge in VT"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_VT


Unnamed: 0,Unique DRGs in VT,Unique Providers in VT,Unique Provider Zip Codes in VT,Unique Regions in VT,Total Discharge Count in VT,Average Charge in VT,Max Charge in VT,Min Charge in VT
0,1,1,1,1,57,"$17,934.35","$17,934.35","$17,934.35"


In [44]:
#WA
DataFrame_WA = DataFrame.loc[DataFrame["provider_state"] == "WA", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in WA: 
Unique_DRGs_WA = len(DataFrame_WA["drg_definition"].unique())
Unique_DRGs_WA

# Calculate the Number of Unique Providers in WA: 
Unique_Provider_count_WA = len(DataFrame_WA["provider_id"].unique())
Unique_Provider_count_WA

# Calculate the Total Number of Unique Provider Zip Codes in WA 
Unique_Provider_ZipCode_Count_WA = len(DataFrame_WA["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_WA
# Calculate the Unique Number of hospital_referral_region_description in WA 
Unique_Hospital_Referral_Region_count_WA = len(DataFrame_WA["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_WA
# Calculate the Total Number of Discharges in WA 
Discharge_Count_WA = (DataFrame_WA["total_discharges"].sum())
Discharge_Count_WA
# Cacluate the average covered charges amount in WA
Average_Covered_Charges_WA = DataFrame_WA["average_covered_charges"].mean()
Average_Covered_Charges_WA
# Cacluate the max covered charge amount in WA
Max_Covered_Charges_WA = DataFrame_WA["average_covered_charges"].max()
Max_Covered_Charges_WA
# Cacluate the min covered charge amount in WA
Min_Covered_Charges_WA = DataFrame_WA["average_covered_charges"].min()
Min_Covered_Charges_WA

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_WA = pd.DataFrame([
    {"Unique DRGs in WA": Unique_DRGs_WA, 
     "Unique Providers in WA": Unique_Provider_count_WA, 
     "Unique Provider Zip Codes in WA": Unique_Provider_ZipCode_Count_WA, 
     "Unique Regions in WA": Unique_Hospital_Referral_Region_count_WA,
     "Total Discharge Count in WA": Discharge_Count_WA,
     "Average Charge in WA": Average_Covered_Charges_WA,
     "Max Charge in WA": Max_Covered_Charges_WA,
     "Min Charge in WA": Min_Covered_Charges_WA
    }
])
DRG_Analysis_df_WA
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_WA = DRG_Analysis_df_WA

DRG_Analysis_Formatted_df_WA["Average Charge in WA"] = DRG_Analysis_df_WA["Average Charge in WA"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WA["Max Charge in WA"] = DRG_Analysis_df_WA["Max Charge in WA"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WA["Min Charge in WA"] = DRG_Analysis_df_WA["Min Charge in WA"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_WA


Unnamed: 0,Unique DRGs in WA,Unique Providers in WA,Unique Provider Zip Codes in WA,Unique Regions in WA,Total Discharge Count in WA,Average Charge in WA,Max Charge in WA,Min Charge in WA
0,0,0,0,0,0,$nan,$nan,$nan


In [45]:
#WI
DataFrame_WI = DataFrame.loc[DataFrame["provider_state"] == "WI", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in WI: 
Unique_DRGs_WI = len(DataFrame_WI["drg_definition"].unique())
Unique_DRGs_WI

# Calculate the Number of Unique Providers in WI: 
Unique_Provider_count_WI = len(DataFrame_WI["provider_id"].unique())
Unique_Provider_count_WI

# Calculate the Total Number of Unique Provider Zip Codes in WI 
Unique_Provider_ZipCode_Count_WI = len(DataFrame_WI["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_WI
# Calculate the Unique Number of hospital_referral_region_description in WI 
Unique_Hospital_Referral_Region_count_WI = len(DataFrame_WI["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_WI
# Calculate the Total Number of Discharges in WI 
Discharge_Count_WI = (DataFrame_WI["total_discharges"].sum())
Discharge_Count_WI
# Cacluate the average covered charges amount in WI
Average_Covered_Charges_WI = DataFrame_WI["average_covered_charges"].mean()
Average_Covered_Charges_WI
# Cacluate the max covered charge amount in WI
Max_Covered_Charges_WI = DataFrame_WI["average_covered_charges"].max()
Max_Covered_Charges_WI
# Cacluate the min covered charge amount in WI
Min_Covered_Charges_WI = DataFrame_WI["average_covered_charges"].min()
Min_Covered_Charges_WI

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_WI = pd.DataFrame([
    {"Unique DRGs in WI": Unique_DRGs_WI, 
     "Unique Providers in WI": Unique_Provider_count_WI, 
     "Unique Provider Zip Codes in WI": Unique_Provider_ZipCode_Count_WI, 
     "Unique Regions in WI": Unique_Hospital_Referral_Region_count_WI,
     "Total Discharge Count in WI": Discharge_Count_WI,
     "Average Charge in WI": Average_Covered_Charges_WI,
     "Max Charge in WI": Max_Covered_Charges_WI,
     "Min Charge in WI": Min_Covered_Charges_WI
    }
])
DRG_Analysis_df_WI
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_WI = DRG_Analysis_df_WI

DRG_Analysis_Formatted_df_WI["Average Charge in WI"] = DRG_Analysis_df_WI["Average Charge in WI"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WI["Max Charge in WI"] = DRG_Analysis_df_WI["Max Charge in WI"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WI["Min Charge in WI"] = DRG_Analysis_df_WI["Min Charge in WI"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_WI


Unnamed: 0,Unique DRGs in WI,Unique Providers in WI,Unique Provider Zip Codes in WI,Unique Regions in WI,Total Discharge Count in WI,Average Charge in WI,Max Charge in WI,Min Charge in WI
0,0,0,0,0,0,$nan,$nan,$nan


In [46]:
#WV
DataFrame_WV = DataFrame.loc[DataFrame["provider_state"] == "WV", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in WV: 
Unique_DRGs_WV = len(DataFrame_WV["drg_definition"].unique())
Unique_DRGs_WV

# Calculate the Number of Unique Providers in WV: 
Unique_Provider_count_WV = len(DataFrame_WV["provider_id"].unique())
Unique_Provider_count_WV

# Calculate the Total Number of Unique Provider Zip Codes in WV 
Unique_Provider_ZipCode_Count_WV = len(DataFrame_WV["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_WV
# Calculate the Unique Number of hospital_referral_region_description in WV 
Unique_Hospital_Referral_Region_count_WV = len(DataFrame_WV["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_WV
# Calculate the Total Number of Discharges in WV 
Discharge_Count_WV = (DataFrame_WV["total_discharges"].sum())
Discharge_Count_WV
# Cacluate the average covered charges amount in WV
Average_Covered_Charges_WV = DataFrame_WV["average_covered_charges"].mean()
Average_Covered_Charges_WV
# Cacluate the max covered charge amount in WV
Max_Covered_Charges_WV = DataFrame_WV["average_covered_charges"].max()
Max_Covered_Charges_WV
# Cacluate the min covered charge amount in WV
Min_Covered_Charges_WV = DataFrame_WV["average_covered_charges"].min()
Min_Covered_Charges_WV

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_WV = pd.DataFrame([
    {"Unique DRGs in WV": Unique_DRGs_WV, 
     "Unique Providers in WV": Unique_Provider_count_WV, 
     "Unique Provider Zip Codes in WV": Unique_Provider_ZipCode_Count_WV, 
     "Unique Regions in WV": Unique_Hospital_Referral_Region_count_WV,
     "Total Discharge Count in WV": Discharge_Count_WV,
     "Average Charge in WV": Average_Covered_Charges_WV,
     "Max Charge in WV": Max_Covered_Charges_WV,
     "Min Charge in WV": Min_Covered_Charges_WV
    }
])
DRG_Analysis_df_WV
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_WV = DRG_Analysis_df_WV

DRG_Analysis_Formatted_df_WV["Average Charge in WV"] = DRG_Analysis_df_WV["Average Charge in WV"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WV["Max Charge in WV"] = DRG_Analysis_df_WV["Max Charge in WV"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WV["Min Charge in WV"] = DRG_Analysis_df_WV["Min Charge in WV"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_WV


Unnamed: 0,Unique DRGs in WV,Unique Providers in WV,Unique Provider Zip Codes in WV,Unique Regions in WV,Total Discharge Count in WV,Average Charge in WV,Max Charge in WV,Min Charge in WV
0,0,0,0,0,0,$nan,$nan,$nan


In [47]:
#WY
DataFrame_WY = DataFrame.loc[DataFrame["provider_state"] == "WY", :]
# Calculate the Number of Unique Diagnosis Related Groups (DRGs) in WY: 
Unique_DRGs_WY = len(DataFrame_WY["drg_definition"].unique())
Unique_DRGs_WY

# Calculate the Number of Unique Providers in WY: 
Unique_Provider_count_WY = len(DataFrame_WY["provider_id"].unique())
Unique_Provider_count_WY

# Calculate the Total Number of Unique Provider Zip Codes in WY 
Unique_Provider_ZipCode_Count_WY = len(DataFrame_WY["provider_zip_code"].unique())
Unique_Provider_ZipCode_Count_WY
# Calculate the Unique Number of hospital_referral_region_description in WY 
Unique_Hospital_Referral_Region_count_WY = len(DataFrame_WY["hospital_referral_region_description"].unique())
Unique_Hospital_Referral_Region_count_WY
# Calculate the Total Number of Discharges in WY 
Discharge_Count_WY = (DataFrame_WY["total_discharges"].sum())
Discharge_Count_WY
# Cacluate the average covered charges amount in WY
Average_Covered_Charges_WY = DataFrame_WY["average_covered_charges"].mean()
Average_Covered_Charges_WY
# Cacluate the max covered charge amount in WY
Max_Covered_Charges_WY = DataFrame_WY["average_covered_charges"].max()
Max_Covered_Charges_WY
# Cacluate the min covered charge amount in WY
Min_Covered_Charges_WY = DataFrame_WY["average_covered_charges"].min()
Min_Covered_Charges_WY

# Create a summary data frame to hold the Analysis Results

DRG_Analysis_df_WY = pd.DataFrame([
    {"Unique DRGs in WY": Unique_DRGs_WY, 
     "Unique Providers in WY": Unique_Provider_count_WY, 
     "Unique Provider Zip Codes in WY": Unique_Provider_ZipCode_Count_WY, 
     "Unique Regions in WY": Unique_Hospital_Referral_Region_count_WY,
     "Total Discharge Count in WY": Discharge_Count_WY,
     "Average Charge in WY": Average_Covered_Charges_WY,
     "Max Charge in WY": Max_Covered_Charges_WY,
     "Min Charge in WY": Min_Covered_Charges_WY
    }
])
DRG_Analysis_df_WY
# Give the displayed data cleaner formatting

DRG_Analysis_Formatted_df_WY = DRG_Analysis_df_WY

DRG_Analysis_Formatted_df_WY["Average Charge in WY"] = DRG_Analysis_df_WY["Average Charge in WY"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WY["Max Charge in WY"] = DRG_Analysis_df_WY["Max Charge in WY"].map("${:,.2f}".format)
DRG_Analysis_Formatted_df_WY["Min Charge in WY"] = DRG_Analysis_df_WY["Min Charge in WY"].map("${:,.2f}".format)

DRG_Analysis_Formatted_df_WY


Unnamed: 0,Unique DRGs in WY,Unique Providers in WY,Unique Provider Zip Codes in WY,Unique Regions in WY,Total Discharge Count in WY,Average Charge in WY,Max Charge in WY,Min Charge in WY
0,0,0,0,0,0,$nan,$nan,$nan
