In [1]:
import pandas as pd
import sqlite3
import numpy as np
from tqdm.notebook import tqdm
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', 300)

In [2]:
#db = sqlite3.connect('data/hop_team.sqlite')
#db.execute('CREATE INDEX from_npi ON calls(from_npi)')
#db.close()

In [3]:
query = '''WITH tax_nucc AS(
            SELECT * 
            FROM taxonomy as t
            JOIN nucc as n
            ON t.taxonomy_code=n.code
            WHERE taxonomy_switch = 'Y' 
            ),
            trim_npi AS(
            SELECT npi, entity_type_code, `provider_organization_name_(legal_business_name)`,`provider_last_name_(legal_name)`,provider_first_name,provider_middle_name,provider_name_prefix_text,provider_name_suffix_text,provider_credential_text,provider_other_organization_name,provider_first_line_business_mailing_address,provider_second_line_business_mailing_address,provider_business_mailing_address_city_name,provider_business_mailing_address_state_name,provider_business_mailing_address_postal_code,
                CASE WHEN `provider_organization_name_(legal_business_name)` LIKE '%Vanderbilt%' THEN 'Vanderbilt'
                ELSE '-' END AS facility_consolidation
            FROM npi
            WHERE provider_business_mailing_address_state_name = 'TN'
            ),
            best_npi AS(
                        SELECT*
                        FROM trim_npi
                        JOIN tax_nucc
                        on trim_npi.npi= tax_nucc.NPI
                        )
            SELECT *
            FROM calls
            JOIN best_npi
            on calls.from_npi=best_npi.npi
            JOIN best_npi AS b1
            on calls.to_npi=b1.npi
            WHERE transaction_count>49
            AND average_day_wait<100
            AND average_day_wait>0
            '''
with sqlite3.connect('data/hop_team.sqlite') as db:
    full = pd.read_sql(query, db)
    
    

In [4]:
full.shape

(852201, 60)

In [5]:
full.info

<bound method DataFrame.info of           from_npi      to_npi  patient_count  transaction_count  \
0       1841293891  1245290857            176                231   
1       1841293891  1245437060             44                 50   
2       1841293891  1306061601             67                 76   
3       1841293891  1356633564             56                 66   
4       1841293891  1457302010            233                366   
...            ...         ...            ...                ...   
852196  1275001851  1184610859             62                 62   
852197  1275001851  1275531956            130                130   
852198  1275001851  1366440570             74                 74   
852199  1275001851  1710919980            108                108   
852200  1275001851  1972648319             84                 84   

        average_day_wait  std_day_wait         npi  entity_type_code  \
0                 28.857        60.036  1841293891               1.0   
1      

In [6]:
list(full)

['from_npi',
 'to_npi',
 'patient_count',
 'transaction_count',
 'average_day_wait',
 'std_day_wait',
 'npi',
 'entity_type_code',
 'provider_organization_name_(legal_business_name)',
 'provider_last_name_(legal_name)',
 'provider_first_name',
 'provider_middle_name',
 'provider_name_prefix_text',
 'provider_name_suffix_text',
 'provider_credential_text',
 'provider_other_organization_name',
 'provider_first_line_business_mailing_address',
 'provider_second_line_business_mailing_address',
 'provider_business_mailing_address_city_name',
 'provider_business_mailing_address_state_name',
 'provider_business_mailing_address_postal_code',
 'facility_consolidation',
 'NPI:1',
 'taxonomy_switch',
 'taxonomy_code',
 'code',
 'grouping',
 'classification',
 'specialization',
 'definition',
 'notes',
 'display_name',
 'section',
 'npi',
 'entity_type_code',
 'provider_organization_name_(legal_business_name)',
 'provider_last_name_(legal_name)',
 'provider_first_name',
 'provider_middle_name',
 'p

In [7]:
last_col= full.pop('to_npi')

In [8]:
full.insert(loc=31, column= 'to_npi', value= last_col)

In [9]:
full.pop('npi')

Unnamed: 0,npi,npi.1
0,1841293891,1245290857
1,1841293891,1245437060
2,1841293891,1306061601
3,1841293891,1356633564
4,1841293891,1457302010
...,...,...
852196,1275001851,1184610859
852197,1275001851,1275531956
852198,1275001851,1366440570
852199,1275001851,1710919980


In [10]:
full.pop('NPI:1')

Unnamed: 0,NPI:1,NPI:1.1
0,1841293891,1245290857
1,1841293891,1245437060
2,1841293891,1306061601
3,1841293891,1356633564
4,1841293891,1457302010
...,...,...
852196,1275001851,1184610859
852197,1275001851,1275531956
852198,1275001851,1366440570
852199,1275001851,1710919980


In [11]:
full.nunique()

from_npi                                            25307
patient_count                                        4433
transaction_count                                    5858
average_day_wait                                    96768
std_day_wait                                        91994
entity_type_code                                        2
provider_organization_name_(legal_business_name)     4613
provider_last_name_(legal_name)                      9294
provider_first_name                                  3859
provider_middle_name                                 2711
provider_name_prefix_text                               6
provider_name_suffix_text                               6
provider_credential_text                              719
provider_other_organization_name                     2625
provider_first_line_business_mailing_address         7915
provider_second_line_business_mailing_address        1593
provider_business_mailing_address_city_name           348
provider_busin

In [17]:
full.columns=['from_npi',
 'patient_count',
 'transaction_count',
 'average_day_wait',
 'std_day_wait',
 'entity_type_code_1',
 'provider_organization_name_(legal_business_name)_1',
 'provider_last_name_(legal_name)_1',
 'provider_first_name_1',
 'provider_middle_name_1',
 'provider_name_prefix_text_1',
 'provider_name_suffix_text_1',
 'provider_credential_text_1',
 'provider_other_organization_name_1',
 'provider_first_line_business_mailing_address_1',
 'provider_second_line_business_mailing_address_1',
 'provider_business_mailing_address_city_name_1',
 'provider_business_mailing_address_state_name_1',
 'provider_business_mailing_address_postal_code_1',
'facility_consolidation_1',
 'taxonomy_switch_1',
 'taxonomy_code_1',
 'code_1',
 'grouping_1',
 'classification_1',
 'specialization_1',
 'definition_1',
 'notes_1',
 'display_name_1',
 'section_1',
 'to_npi',
 'entity_type_code_2',
 'provider_organization_name_(legal_business_name)_2',
 'provider_last_name_(legal_name)_2',
 'provider_first_name_2',
 'provider_middle_name_2',
 'provider_name_prefix_text_2',
 'provider_name_suffix_text_2',
 'provider_credential_text_2',
 'provider_other_organization_name_2',
 'provider_first_line_business_mailing_address_2',
 'provider_second_line_business_mailing_address_2',
 'provider_business_mailing_address_city_name_2',
 'provider_business_mailing_address_state_name_2',
 'provider_business_mailing_address_postal_code_2',
 'facility_consolidation_2',
 'taxonomy_switch_2',
 'taxonomy_code_2',
 'code_2',
 'grouping_2',
 'classification_2',
 'specialization_2',
 'definition_2',
 'notes_2',
 'display_name_2',
 'section_2']

In [18]:
full

Unnamed: 0,from_npi,patient_count,transaction_count,average_day_wait,std_day_wait,entity_type_code_1,provider_organization_name_(legal_business_name)_1,provider_last_name_(legal_name)_1,provider_first_name_1,provider_middle_name_1,provider_name_prefix_text_1,provider_name_suffix_text_1,provider_credential_text_1,provider_other_organization_name_1,provider_first_line_business_mailing_address_1,provider_second_line_business_mailing_address_1,provider_business_mailing_address_city_name_1,provider_business_mailing_address_state_name_1,provider_business_mailing_address_postal_code_1,facility_consolidation_1,taxonomy_switch_1,taxonomy_code_1,code_1,grouping_1,classification_1,specialization_1,definition_1,notes_1,display_name_1,section_1,to_npi,entity_type_code_2,provider_organization_name_(legal_business_name)_2,provider_last_name_(legal_name)_2,provider_first_name_2,provider_middle_name_2,provider_name_prefix_text_2,provider_name_suffix_text_2,provider_credential_text_2,provider_other_organization_name_2,provider_first_line_business_mailing_address_2,provider_second_line_business_mailing_address_2,provider_business_mailing_address_city_name_2,provider_business_mailing_address_state_name_2,provider_business_mailing_address_postal_code_2,facility_consolidation_2,taxonomy_switch_2,taxonomy_code_2,code_2,grouping_2,classification_2,specialization_2,definition_2,notes_2,display_name_2,section_2
0,1841293891,176,231,28.857,60.036,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1245290857,Individual,2.0,RADIOLOGY IMAGING ASSOCIATES OF OAK RIDGE PC,,,,,,,RADIOLOGY IMAGING ASSOCIATES OF OAK RIDGE,601 DODDS AVE,,CHATTANOOGA,TN,374043911.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,Individual
1,1841293891,44,50,35.260,60.604,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1245437060,Individual,1.0,,MONAZAM TAVALLAEE,MEHRAN,,,,M.D.,,49 CLEVELAND ST,SUITE 350,CROSSVILLE,TN,385559716.0,-,Y,207R00000X,207R00000X,Allopathic & Osteopathic Physicians,Internal Medicine,,"A physician who provides long-term, comprehens...","Source: American Board of Medical Specialties,...",Internal Medicine Physician,Individual
2,1841293891,67,76,53.184,83.149,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1306061601,Individual,1.0,,LEMOND,THOMAS,CHARLES,DR.,,M.D.,,990 OAK RIDGE TPKE,,OAK RIDGE,TN,378306976.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,Individual
3,1841293891,56,66,61.894,81.764,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1356633564,Individual,1.0,,LUTTRELL,LINDSAY,GEORGE,DR.,,M.D.,,2508 WILD FERN LN,,KNOXVILLE,TN,379313359.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,Individual
4,1841293891,233,366,3.101,19.513,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1457302010,Individual,2.0,"COVENANT MEDICAL GROUP, INC.",,,,,,,,1400 CENTERPOINT BLVD,"BLDG A, SUITE 202",KNOXVILLE,TN,379322146.0,-,Y,207Q00000X,207Q00000X,Allopathic & Osteopathic Physicians,Family Medicine,,Family Medicine is the medical specialty which...,Source: American Board of Family Medicine [1/...,Family Medicine Physician,Individual
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
852196,1275001851,62,62,7.435,4.151,2.0,CQUENTIA ARKANSAS LAB LLC,,,,,,,,3742 TYNDALE DR,,MEMPHIS,TN,381258500.0,-,Y,291U00000X,291U00000X,Laboratories,Clinical Medical Laboratory,,(1) A clinical laboratory is a facility for th...,"Source: (1) Code of Federal Regulations #42, P...",Clinical Medical Laboratory,1184610859,Non-Individual,2.0,"UPPER CUMBERLAND ORTHOPEDIC SURGERY, PC",,,,,,,,105 S. WILLOW AVE,,COOKEVILLE,TN,38501.0,-,Y,261QM1300X,261QM1300X,Ambulatory Health Care Facilities,Clinic/Center,Multi-Specialty,Definition to come...,,Multi-Specialty Clinic/Center,Non-Individual
852197,1275001851,130,130,0.208,1.186,2.0,CQUENTIA ARKANSAS LAB LLC,,,,,,,,3742 TYNDALE DR,,MEMPHIS,TN,381258500.0,-,Y,291U00000X,291U00000X,Laboratories,Clinical Medical Laboratory,,(1) A clinical laboratory is a facility for th...,"Source: (1) Code of Federal Regulations #42, P...",Clinical Medical Laboratory,1275531956,Non-Individual,2.0,COOKEVILLE REGIONAL MEDICAL CENTER,,,,,,,,1 MEDICAL CENTER BLVD,,COOKEVILLE,TN,385011760.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual
852198,1275001851,74,74,8.568,4.991,2.0,CQUENTIA ARKANSAS LAB LLC,,,,,,,,3742 TYNDALE DR,,MEMPHIS,TN,381258500.0,-,Y,291U00000X,291U00000X,Laboratories,Clinical Medical Laboratory,,(1) A clinical laboratory is a facility for th...,"Source: (1) Code of Federal Regulations #42, P...",Clinical Medical Laboratory,1366440570,Non-Individual,2.0,COMMUNITY PATHOLOGY LABORATORY LLC,,,,,,,COOKEVILLE PATHOLOGY LAB,115 N PEACHTREE AVE,,COOKEVILLE,TN,385012546.0,-,Y,174400000X,174400000X,Other Service Providers,Specialist,,An individual educated and trained in an appli...,Source: Expanded from Webster's II New Riversi...,Specialist,Individual
852199,1275001851,108,108,8.019,3.045,2.0,CQUENTIA ARKANSAS LAB LLC,,,,,,,,3742 TYNDALE DR,,MEMPHIS,TN,381258500.0,-,Y,291U00000X,291U00000X,Laboratories,Clinical Medical Laboratory,,(1) A clinical laboratory is a facility for th...,"Source: (1) Code of Federal Regulations #42, P...",Clinical Medical Laboratory,1710919980,Non-Individual,2.0,"UPPER CUMBERLAND ANESTHESIA ASSOCIATES, PC",,,,,,,,PO BOX 280,,COOKEVILLE,TN,385030280.0,-,Y,207LP2900X,207LP2900X,Allopathic & Osteopathic Physicians,Anesthesiology,Pain Medicine,An anesthesiologist who provides a high level ...,"Source: American Board of Medical Specialties,...",Pain Medicine (Anesthesiology) Physician,Individual


In [19]:
full_2=full[full['entity_type_code_1']==1.0]

In [20]:
full_2=full_2[full_2['entity_type_code_2']==2.0]

In [64]:
full_2

Unnamed: 0,from_npi,patient_count,transaction_count,average_day_wait,std_day_wait,entity_type_code_1,provider_organization_name_(legal_business_name)_1,provider_last_name_(legal_name)_1,provider_first_name_1,provider_middle_name_1,provider_name_prefix_text_1,provider_name_suffix_text_1,provider_credential_text_1,provider_other_organization_name_1,provider_first_line_business_mailing_address_1,provider_second_line_business_mailing_address_1,provider_business_mailing_address_city_name_1,provider_business_mailing_address_state_name_1,provider_business_mailing_address_postal_code_1,facility_consolidation_1,taxonomy_switch_1,taxonomy_code_1,code_1,grouping_1,classification_1,specialization_1,definition_1,notes_1,display_name_1,section_1,to_npi,entity_type_code_2,provider_organization_name_(legal_business_name)_2,provider_last_name_(legal_name)_2,provider_first_name_2,provider_middle_name_2,provider_name_prefix_text_2,provider_name_suffix_text_2,provider_credential_text_2,provider_other_organization_name_2,provider_first_line_business_mailing_address_2,provider_second_line_business_mailing_address_2,provider_business_mailing_address_city_name_2,provider_business_mailing_address_state_name_2,provider_business_mailing_address_postal_code_2,facility_consolidation_2,taxonomy_switch_2,taxonomy_code_2,code_2,grouping_2,classification_2,specialization_2,definition_2,notes_2,display_name_2,section_2,full_addy_1,full_addy_2,from_npi_pt_count,from_npi_transaction_count,to_npi_pt_count,to_npi_transaction_count,from_facility_pt_count,from_facility_transaction_count,to_facility_pt_count,to_facility_transaction_count
0,1841293891,176,231,28.857,60.036,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1245290857,Individual,2.0,RADIOLOGY IMAGING ASSOCIATES OF OAK RIDGE PC,,,,,,,RADIOLOGY IMAGING ASSOCIATES OF OAK RIDGE,601 DODDS AVE,,CHATTANOOGA,TN,374043911.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,Individual,"49 CLEVELAND ST 310, CROSSVILLE","601 DODDS AVE, CHATTANOOGA",766,1130,36666932,52211903,766,1130,385028,489261
4,1841293891,233,366,3.101,19.513,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1457302010,Individual,2.0,"COVENANT MEDICAL GROUP, INC.",,,,,,,,1400 CENTERPOINT BLVD,"BLDG A, SUITE 202",KNOXVILLE,TN,379322146.0,-,Y,207Q00000X,207Q00000X,Allopathic & Osteopathic Physicians,Family Medicine,,Family Medicine is the medical specialty which...,Source: American Board of Family Medicine [1/...,Family Medicine Physician,Individual,"49 CLEVELAND ST 310, CROSSVILLE","1400 CENTERPOINT BLVD, KNOXVILLE",766,1130,36666932,52211903,766,1130,322519,477249
6,1841293891,63,80,32.675,59.438,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1518980499,Individual,2.0,"BUCKEYE HOME HEALTH CENTER, INC.",,,,,,,,PO BOX 1197,,JAMESTOWN,TN,38556.0,-,Y,332B00000X,332B00000X,Suppliers,Durable Medical Equipment & Medical Supplies,,A supplier of medical equipment such as respir...,,Durable Medical Equipment & Medical Supplies,Non-Individual,"49 CLEVELAND ST 310, CROSSVILLE","PO BOX 1197, JAMESTOWN",766,1130,36666932,52211903,766,1130,45187,74204
7,1841293891,72,89,37.022,56.687,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1538252010,Individual,2.0,"CUMBERLAND HEART CLINIC, PLLC",,,,,,,,49 CLEVELAND ST.,STE. 250,CROSSVILLE,TN,38555.0,-,Y,207RC0000X,207RC0000X,Allopathic & Osteopathic Physicians,Internal Medicine,Cardiovascular Disease,An internist who specializes in diseases of th...,Source: American Osteopathic Board of Internal...,Cardiovascular Disease Physician,Individual,"49 CLEVELAND ST 310, CROSSVILLE","49 CLEVELAND ST., CROSSVILLE",766,1130,36666932,52211903,766,1130,14271,16772
14,1841293891,222,364,6.745,28.678,1.0,,GIBBS,ELMER,RICKEY,DR.,,M.D.,,49 CLEVELAND ST 310,,CROSSVILLE,TN,385552854.0,-,Y,208600000X,208600000X,Allopathic & Osteopathic Physicians,Surgery,,A general surgeon has expertise related to the...,"Source: American Board of Medical Specialties,...",Surgery Physician,1871596403,Individual,2.0,"CUMBERLAND MEDICAL CENTER, INC.",,,,,,,CUMBERLAND MEDICAL CENTER,421 S MAIN ST,,CROSSVILLE,TN,385555048.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual,"49 CLEVELAND ST 310, CROSSVILLE","421 S MAIN ST, CROSSVILLE",766,1130,36666932,52211903,766,1130,74651,112620
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
852183,1407336548,57,66,1.273,8.861,1.0,,OGLE,CANDICE,M,,,,,30 BURTON HILLS BLVD,STE 175,NASHVILLE,TN,372156403.0,-,Y,363L00000X,363L00000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,,(1) A registered nurse provider with a graduat...,"Source: (1) American Nurses' Association, Amer...",Nurse Practitioner,1578886610,Individual,2.0,"UNIVERSITY HEALTH SYSTEM, INC",,,,,,,UT FAMILY PHYSICIANS CLINTON,PO BOX 415000-MSC8162,,NASHVILLE,TN,372418162.0,-,Y,207Q00000X,207Q00000X,Allopathic & Osteopathic Physicians,Family Medicine,,Family Medicine is the medical specialty which...,Source: American Board of Family Medicine [1/...,Family Medicine Physician,Individual,"30 BURTON HILLS BLVD, NASHVILLE","PO BOX 415000-MSC8162, NASHVILLE",57,66,36666932,52211903,18782,25613,427,1147
852184,1063992097,38,60,0.017,0.129,1.0,,WOOD,SAMUEL,LAWRENCE,,,FNP-BC,,215 S MOLLY BRIGHT RD,,KNOXVILLE,TN,379244112.0,-,Y,363LF0000X,363LF0000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,Family,Definition to come...,,Family Nurse Practitioner,1184610248,Individual,2.0,"HEALTHSTAR PHYSICIANS, P.C.",,,,,,,,420 W MORRIS BLVD STE 400A,,MORRISTOWN,TN,378132262.0,-,Y,207Q00000X,207Q00000X,Allopathic & Osteopathic Physicians,Family Medicine,,Family Medicine is the medical specialty which...,Source: American Board of Family Medicine [1/...,Family Medicine Physician,Individual,"215 S MOLLY BRIGHT RD, KNOXVILLE","420 W MORRIS BLVD STE 400A, MORRISTOWN",38,60,36666932,52211903,38,60,99787,181126
852186,1962983502,49,66,18.879,22.422,1.0,,SMITH,ERIC,,,,PT,,675 S JEFFERSON AVE STE C,,COOKEVILLE,TN,385010949.0,-,Y,225100000X,225100000X,"Respiratory, Developmental, Rehabilitative and...",Physical Therapist,,Physical therapists (PTs) are licensed health ...,Source: American Physical Therapy Association ...,Physical Therapist,1275531956,Individual,2.0,COOKEVILLE REGIONAL MEDICAL CENTER,,,,,,,,1 MEDICAL CENTER BLVD,,COOKEVILLE,TN,385011760.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual,"675 S JEFFERSON AVE STE C, COOKEVILLE","1 MEDICAL CENTER BLVD, COOKEVILLE",49,66,36666932,52211903,690,1110,144836,225944
852191,1114409273,33,53,0.113,0.824,1.0,,SHANNON,DOMINIK,ALAN,,,"PT, DPT",,6397 LEE HWY STE 300,,CHATTANOOGA,TN,374212564.0,-,Y,225100000X,225100000X,"Respiratory, Developmental, Rehabilitative and...",Physical Therapist,,Physical therapists (PTs) are licensed health ...,Source: American Physical Therapy Association ...,Physical Therapist,1780636068,Individual,2.0,"INDEPENDENT PHYSICAL THERAPY OF GEORGIA, LLC",,,,,,,BENCHMARK PHYSICAL THERAPY,6397 LEE HWY STE 300,,CHATTANOOGA,TN,374212564.0,-,Y,225100000X,225100000X,"Respiratory, Developmental, Rehabilitative and...",Physical Therapist,,Physical therapists (PTs) are licensed health ...,Source: American Physical Therapy Association ...,Physical Therapist,Individual,"6397 LEE HWY STE 300, CHATTANOOGA","6397 LEE HWY STE 300, CHATTANOOGA",33,53,36666932,52211903,2729,13233,21493,47630


In [22]:
# 1.  using full_2 determine who is sending the most pts and initiating the most transactions
### solve: sum of patient_count grouped by from_npi and sum of transaction_count  grouped by from_npi
###### visualization: could have a bar graph with all NPIs, but that will be too much information, maybe a stripped down with
#####                 most, least and median NPI and most, least and median facility overall, maybe  a histogram to show trends
#####                 super_extra_credit: r_shiny app that allows you to use drop down to visualize by NPI or facility,and
#####                 filter by specialty, and uses specialty to look at wait-time.  Further points if there can be a slide 
#####                 with the Neo4J stuff, and one more that        

# 2.  using full_2 determine who is receiving the most pts and the most transactions
### solve: sum of patient_count grouped by to_npi and sum of transaction_count  grouped by to_npi
###### visualization: see above


# 3.  use this information to determine which facility gets and receives the most pts and transactions
### solve: group previous info by facility??? make sure that you have consolidated the facilites for accuracy.  May try a string
###        like "%rough_hospital address%" query in sql and add a "renamed_facility_address" column.
###        ~~~on second thought, this would require doing that for every facility, might need fuzzy naming ~~~

# 4.  ***The purpose of the next questions to to see where Vandy is doing well and where they could improve***
#     Use this information to determine which doctors refer to Vanderbilt most (top 5, and top 5 not assocaited with Vanderbilt), 
#     which refer to Vanderbilt least (again, top 5, and top 5 not assocaited with Vanderbilt) as well as (4b) the facilities and 
#     specialites that refer to Vandy the most and least. 

# 5.  Determine doctor's patient caseload as a metric for growth (ei: look at doctors, grouped by speciality to determine which
#     ones have the most and least pts~~~(may not actually work because these are referrals, not total pts)~~~. Use that number 
#     to find out how what a facilities pt.per.physician ratio is in total and per speciality.  This could theorectically also 
#     be a shiny app.)


In [23]:
# (1)group by from_npi summing the patient_count and then sorting the values
pt_count_by_from_npi= full_2.groupby(['from_npi'])['patient_count'].sum().reset_index()
pt_count_by_from_npi. sort_values('patient_count', ascending=False)
#these are the npi's with the 5 most and least pt count

Unnamed: 0,from_npi,patient_count
1725,1093753303,646023
13238,1710915061,117275
12660,1689673048,87477
11257,1609848563,75274
162,1003921404,70078
...,...,...
521,1023503612,12
4617,1255309381,12
6474,1356319198,12
17818,1962411934,11


In [24]:
# (1) group by from_npi summing the transaction_count and then sorting the values
transaction_count_by_from_npi= full_2.groupby(['from_npi'])['transaction_count'].sum().reset_index()
transaction_count_by_from_npi. sort_values('transaction_count', ascending=False)
#these are the npi's with the 5 most and least transaction count

Unnamed: 0,from_npi,transaction_count
1725,1093753303,978213
13238,1710915061,156297
12660,1689673048,118935
2841,1154356764,82001
6912,1376658781,79237
...,...,...
15971,1861431884,50
5966,1326054446,50
10648,1578566519,50
8920,1487189197,50


In [25]:
# (2) group by to_npi summing the patient_count and then sorting the values
pt_count_by_to_npi= full_2.groupby(['to_npi'])['patient_count'].sum().reset_index()
pt_count_by_to_npi. sort_values('patient_count', ascending=False)
#these are the npi's with the 5 most and least pt count

Unnamed: 0,to_npi,patient_count
0,Individual,36666932
1,Non-Individual,1459


In [26]:
# (2) group by to_npi summing the transaction_count and then sorting the values
transaction_count_by_to_npi= full_2.groupby(['to_npi'])['transaction_count'].sum().reset_index()
transaction_count_by_to_npi. sort_values('transaction_count', ascending=False)
#these are the npi's with the 5 most and least transaction count

Unnamed: 0,to_npi,transaction_count
0,Individual,52211903
1,Non-Individual,1654


In [27]:
full_2['full_addy_1']= full_2.provider_first_line_business_mailing_address_1.map(str) +', ' + full_2.provider_business_mailing_address_city_name_1

In [28]:
full_2['full_addy_2']= full_2.provider_first_line_business_mailing_address_2.map(str) +', ' + full_2.provider_business_mailing_address_city_name_2

In [29]:
full_2['from_npi_pt_count']= full_2.groupby(['from_npi'])['patient_count'].transform(np.sum)

In [30]:
full_2['from_npi_transaction_count']= full_2.groupby(['from_npi'])['transaction_count'].transform(np.sum)

In [31]:
full_2['to_npi_pt_count']= full_2.groupby(['to_npi'])['patient_count'].transform(np.sum)

In [34]:
full_2['to_npi_transaction_count']= full_2.groupby(['to_npi'])['transaction_count'].transform(np.sum)

In [35]:
full_2['provider_first_line_business_mailing_address_1'].nunique()

6083

In [36]:
unique_addy=pd.DataFrame((full_2['provider_first_line_business_mailing_address_1'].unique()))

In [37]:
unique_addy

Unnamed: 0,0
0,49 CLEVELAND ST 310
1,PO BOX 9
2,PO BOX 440100
3,PO BOX 778
4,127 CRESTVIEW PARK DR
...,...
6078,4405 WASHINGTON CT
6079,PO BOX 750
6080,147 NORTH STAR DRIVE
6081,700 W FOREST AVE STE 200


In [38]:
full_2[full_2['provider_first_line_business_mailing_address_1']=='PO BOX 9']

Unnamed: 0,from_npi,patient_count,transaction_count,average_day_wait,std_day_wait,entity_type_code_1,provider_organization_name_(legal_business_name)_1,provider_last_name_(legal_name)_1,provider_first_name_1,provider_middle_name_1,provider_name_prefix_text_1,provider_name_suffix_text_1,provider_credential_text_1,provider_other_organization_name_1,provider_first_line_business_mailing_address_1,provider_second_line_business_mailing_address_1,provider_business_mailing_address_city_name_1,provider_business_mailing_address_state_name_1,provider_business_mailing_address_postal_code_1,facility_consolidation_1,taxonomy_switch_1,taxonomy_code_1,code_1,grouping_1,classification_1,specialization_1,definition_1,notes_1,display_name_1,section_1,to_npi,entity_type_code_2,provider_organization_name_(legal_business_name)_2,provider_last_name_(legal_name)_2,provider_first_name_2,provider_middle_name_2,provider_name_prefix_text_2,provider_name_suffix_text_2,provider_credential_text_2,provider_other_organization_name_2,provider_first_line_business_mailing_address_2,provider_second_line_business_mailing_address_2,provider_business_mailing_address_city_name_2,provider_business_mailing_address_state_name_2,provider_business_mailing_address_postal_code_2,facility_consolidation_2,taxonomy_switch_2,taxonomy_code_2,code_2,grouping_2,classification_2,specialization_2,definition_2,notes_2,display_name_2,section_2,full_addy_1,full_addy_2,from_npi_pt_count,from_npi_transaction_count,to_npi_pt_count,to_npi_transaction_count
15,1659374601,60,65,21.646,29.540,1.0,,OBERDICK,WENDY,TIPTON,,,MD,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,207Q00000X,207Q00000X,Allopathic & Osteopathic Physicians,Family Medicine,,Family Medicine is the medical specialty which...,Source: American Board of Family Medicine [1/...,Family Medicine Physician,1841638277,Individual,2.0,BTDI JV LLP,,,,,,,TOUCHSTONE MEDICAL IMAGING AT RED OAK,1431 PERRONE WAY,,FRANKLIN,TN,370694243.0,-,Y,293D00000X,293D00000X,Laboratories,Physiological Laboratory,,A laboratory that operates independently of a ...,Source: Paraphrased from the Medicare Carrier ...,Physiological Laboratory,Non-Individual,"PO BOX 9, KINGSPORT","1431 PERRONE WAY, FRANKLIN",60,65,36666932,52211903
694,1255334298,48,52,89.788,88.380,1.0,,HUNT,JEFFREY,,DR.,,MD,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,207Y00000X,207Y00000X,Allopathic & Osteopathic Physicians,Otolaryngology,,An otolaryngologist-head and neck surgeon prov...,"Source: American Board of Medical Specialties,...",Otolaryngology Physician,1003904095,Individual,2.0,WPS PROVIDERS INC,,,,,,,,105 W STONE DR,SUITE 6A,KINGSPORT,TN,376603365.0,-,Y,208D00000X,208D00000X,Allopathic & Osteopathic Physicians,General Practice,,Definition to come...,,General Practice Physician,Individual,"PO BOX 9, KINGSPORT","105 W STONE DR, KINGSPORT",1338,2169,36666932,52211903
695,1255334298,48,51,79.725,78.437,1.0,,HUNT,JEFFREY,,DR.,,MD,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,207Y00000X,207Y00000X,Allopathic & Osteopathic Physicians,Otolaryngology,,An otolaryngologist-head and neck surgeon prov...,"Source: American Board of Medical Specialties,...",Otolaryngology Physician,1093762759,Individual,2.0,MOUNTAIN EMPIRE RADIOLOGY INC PC,,,,,,,,1301 SUNSET DR,STE 3,JOHNSON CITY,TN,376047906.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,Individual,"PO BOX 9, KINGSPORT","1301 SUNSET DR, JOHNSON CITY",1338,2169,36666932,52211903
696,1255334298,43,52,64.231,81.937,1.0,,HUNT,JEFFREY,,DR.,,MD,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,207Y00000X,207Y00000X,Allopathic & Osteopathic Physicians,Otolaryngology,,An otolaryngologist-head and neck surgeon prov...,"Source: American Board of Medical Specialties,...",Otolaryngology Physician,1124058615,Individual,2.0,WELLMONT HEALTH SYSTEM,,,,,,,BRISTOL REGIONAL MEDICAL CENTER,311 PRINCETON RD STE 1,,JOHNSON CITY,TN,376012026.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual,"PO BOX 9, KINGSPORT","311 PRINCETON RD STE 1, JOHNSON CITY",1338,2169,36666932,52211903
697,1255334298,30,52,39.346,55.256,1.0,,HUNT,JEFFREY,,DR.,,MD,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,207Y00000X,207Y00000X,Allopathic & Osteopathic Physicians,Otolaryngology,,An otolaryngologist-head and neck surgeon prov...,"Source: American Board of Medical Specialties,...",Otolaryngology Physician,1174808216,Individual,2.0,WELLMONT MEDICAL ASSOCIATES INC,,,,,,,BALLAD HEALTH MEDICAL ASSOCIATES,2020 BROOKSIDE DR,,KINGSPORT,TN,376604633.0,-,Y,207Q00000X,207Q00000X,Allopathic & Osteopathic Physicians,Family Medicine,,Family Medicine is the medical specialty which...,Source: American Board of Family Medicine [1/...,Family Medicine Physician,Individual,"PO BOX 9, KINGSPORT","2020 BROOKSIDE DR, KINGSPORT",1338,2169,36666932,52211903
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
831500,1164884938,45,60,40.800,56.470,1.0,,VARNEY,HEATHER,,,,NP,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,363LF0000X,363LF0000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,Family,Definition to come...,,Family Nurse Practitioner,1992813240,Individual,2.0,MOUNTAIN STATES HEALTH ALLIANCE,,,,,,,INDIAN PATH COMMUNITY HOSPITAL,311 PRINCETON RD STE 1,,JOHNSON CITY,TN,376012026.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual,"PO BOX 9, KINGSPORT","311 PRINCETON RD STE 1, JOHNSON CITY",570,1194,36666932,52211903
839374,1831633528,54,55,74.582,75.945,1.0,,TONEY,STEPHANIE,E,MRS.,,NP,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,363LF0000X,363LF0000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,Family,Definition to come...,,Family Nurse Practitioner,1376575035,Individual,2.0,WELLMONT CARDIOLOGY SERVICES,,,,,,,,2050 MEADOWVIEW PKWY,,KINGSPORT,TN,376607475.0,-,Y,207RC0000X,207RC0000X,Allopathic & Osteopathic Physicians,Internal Medicine,Cardiovascular Disease,An internist who specializes in diseases of th...,Source: American Osteopathic Board of Internal...,Cardiovascular Disease Physician,Individual,"PO BOX 9, KINGSPORT","2050 MEADOWVIEW PKWY, KINGSPORT",353,367,36666932,52211903
839375,1831633528,50,52,46.635,66.298,1.0,,TONEY,STEPHANIE,E,MRS.,,NP,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,363LF0000X,363LF0000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,Family,Definition to come...,,Family Nurse Practitioner,1619088697,Individual,2.0,"ASSOCIATION OF UNIVERSITY RADIOLOGISTS, PC",,,,,,,,2240 SUTHERLAND AVE STE 107,,KNOXVILLE,TN,379192333.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,Individual,"PO BOX 9, KINGSPORT","2240 SUTHERLAND AVE STE 107, KNOXVILLE",353,367,36666932,52211903
839376,1831633528,195,206,0.073,0.777,1.0,,TONEY,STEPHANIE,E,MRS.,,NP,,PO BOX 9,,KINGSPORT,TN,376620009.0,-,Y,363LF0000X,363LF0000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,Family,Definition to come...,,Family Nurse Practitioner,1780986257,Individual,2.0,WELLMONT MEDICAL ASSOCIATES INC,,,,,,,BALLAD HEALTH MEDICAL ASSOCIATES,2020 BROOKSIDE DR,,KINGSPORT,TN,376604633.0,-,Y,207RP1001X,207RP1001X,Allopathic & Osteopathic Physicians,Internal Medicine,Pulmonary Disease,An internist who treats diseases of the lungs ...,"Source: American Board of Medical Specialties,...",Pulmonary Disease Physician,Individual,"PO BOX 9, KINGSPORT","2020 BROOKSIDE DR, KINGSPORT",353,367,36666932,52211903


In [39]:
# (3a)group by full_addy_1 summing the patient_count and then sorting the values
pt_count_by_full_addy_1= full_2.groupby(['full_addy_1'])['patient_count'].sum().reset_index()
pt_count_by_full_addy_1. sort_values('patient_count', ascending=False)
#these are the facilities's with the 5 most and least pt count

Unnamed: 0,full_addy_1,patient_count
1952,"210 25TH AVE N STE 1204, NASHVILLE",991514
3820,"5301 VIRGINIA WAY, BRENTWOOD",923002
2736,"3024 BUSINESS PARK CIR, GOODLETTSVILLE",876060
2365,"2501 CITICO AVE, CHATTANOOGA",549853
5592,"PO BOX 2121, MEMPHIS",505969
...,...,...
2552,"28 MIDWAY STREET, BRISTOL",13
5016,"9051 EXECUTIVE PARK DR STE 500, KNOXVILLE",13
5222,"979 E 3RD ST STE C725, CHATTANOOGA",13
2455,"2611 SALEM CREEK DR, MURFREESBORO",12


In [40]:
full_2['from_facility_pt_count']= full_2.groupby(['full_addy_1'])['patient_count'].transform(np.sum)

In [41]:
full_2['from_facility_transaction_count']= full_2.groupby(['full_addy_1'])['transaction_count'].transform(np.sum)

In [42]:
full_2['to_facility_pt_count']= full_2.groupby(['full_addy_2'])['patient_count'].transform(np.sum)

In [43]:
full_2['to_facility_transaction_count']= full_2.groupby(['full_addy_2'])['transaction_count'].transform(np.sum)

In [44]:
full_2[full_2['full_addy_1']=='210 25TH AVE N STE 1204, NASHVILLE']

Unnamed: 0,from_npi,patient_count,transaction_count,average_day_wait,std_day_wait,entity_type_code_1,provider_organization_name_(legal_business_name)_1,provider_last_name_(legal_name)_1,provider_first_name_1,provider_middle_name_1,provider_name_prefix_text_1,provider_name_suffix_text_1,provider_credential_text_1,provider_other_organization_name_1,provider_first_line_business_mailing_address_1,provider_second_line_business_mailing_address_1,provider_business_mailing_address_city_name_1,provider_business_mailing_address_state_name_1,provider_business_mailing_address_postal_code_1,facility_consolidation_1,taxonomy_switch_1,taxonomy_code_1,code_1,grouping_1,classification_1,specialization_1,definition_1,notes_1,display_name_1,section_1,to_npi,entity_type_code_2,provider_organization_name_(legal_business_name)_2,provider_last_name_(legal_name)_2,provider_first_name_2,provider_middle_name_2,provider_name_prefix_text_2,provider_name_suffix_text_2,provider_credential_text_2,provider_other_organization_name_2,provider_first_line_business_mailing_address_2,provider_second_line_business_mailing_address_2,provider_business_mailing_address_city_name_2,provider_business_mailing_address_state_name_2,provider_business_mailing_address_postal_code_2,facility_consolidation_2,taxonomy_switch_2,taxonomy_code_2,code_2,grouping_2,classification_2,specialization_2,definition_2,notes_2,display_name_2,section_2,full_addy_1,full_addy_2,from_npi_pt_count,from_npi_transaction_count,to_npi_pt_count,to_npi_transaction_count,from_facility_pt_count,from_facility_transaction_count,to_facility_pt_count,to_facility_transaction_count
136442,1013991850,58,59,46.305,82.347,1.0,,NG,CHRISTOPHER,C,DR.,,MD,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,1003230236,Individual,2.0,"APP OF TENNESSEE ED, PLLC",,,,,,,,PO BOX 31957,,CLARKSVILLE,TN,370400033.0,-,Y,207P00000X,207P00000X,Allopathic & Osteopathic Physicians,Emergency Medicine,,An emergency physician focuses on the immediat...,"Source: American Board of Medical Specialties,...",Emergency Medicine Physician,Individual,"210 25TH AVE N STE 1204, NASHVILLE","PO BOX 31957, CLARKSVILLE",15101,15710,36666932,52211903,991514,1062764,209804,243135
136443,1013991850,496,499,57.595,65.541,1.0,,NG,CHRISTOPHER,C,DR.,,MD,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,1003863580,Individual,2.0,"ASSOCIATED PATHOLOGISTS, LLC",,,,,,,ASSOCIATED PATHOLOGISTS LLC DBA PATHGROUP,5301 VIRGINIA WAY,SUITE 300,BRENTWOOD,TN,370277542.0,-,Y,207ZP0102X,207ZP0102X,Allopathic & Osteopathic Physicians,Pathology,Anatomic Pathology & Clinical Pathology,A pathologist deals with the causes and nature...,"Source: American Board of Medical Specialties,...",Anatomic Pathology & Clinical Pathology Physician,Individual,"210 25TH AVE N STE 1204, NASHVILLE","5301 VIRGINIA WAY, BRENTWOOD",15101,15710,36666932,52211903,991514,1062764,1894619,2431116
136444,1013991850,642,665,22.771,49.368,1.0,,NG,CHRISTOPHER,C,DR.,,MD,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,1023055126,Individual,2.0,"HCA HEALTH SERVICES OF TENNESSEE, INC.",,,,,,,TRISTAR CENTENNIAL MEDICAL CENTER,2300 PATTERSON ST,,NASHVILLE,TN,372031538.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual,"210 25TH AVE N STE 1204, NASHVILLE","2300 PATTERSON ST, NASHVILLE",15101,15710,36666932,52211903,991514,1062764,209435,308261
136445,1013991850,67,76,12.947,35.635,1.0,,NG,CHRISTOPHER,C,DR.,,MD,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,1023066149,Individual,2.0,TENNESSEE ONCOLOGY PLLC,,,,,,,,PO BOX 440100,,NASHVILLE,TN,372440100.0,-,Y,207RH0003X,207RH0003X,Allopathic & Osteopathic Physicians,Internal Medicine,Hematology & Oncology,An internist doctor of osteopathy that special...,Source: American Osteopathic Board of Internal...,Hematology & Oncology Physician,Individual,"210 25TH AVE N STE 1204, NASHVILLE","PO BOX 440100, NASHVILLE",15101,15710,36666932,52211903,991514,1062764,481870,947137
136447,1013991850,81,81,32.914,52.004,1.0,,NG,CHRISTOPHER,C,DR.,,MD,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,2085R0202X,2085R0202X,Allopathic & Osteopathic Physicians,Radiology,Diagnostic Radiology,"A radiologist who utilizes x-ray, radionuclide...","Source: American Board of Medical Specialties,...",Diagnostic Radiology Physician,1033154786,Individual,2.0,"SKYLINE NEUROSCIENCE ASSOCIATES, LLC",,,,,,,WAUKEGAN CLINIC CORPORATION,2000 HEALTH PARK DR,,BRENTWOOD,TN,370274525.0,-,Y,2084N0400X,2084N0400X,Allopathic & Osteopathic Physicians,Psychiatry & Neurology,Neurology,A Neurologist specializes in the diagnosis and...,Source: The American Board of Psychiatry and ...,Neurology Physician,Individual,"210 25TH AVE N STE 1204, NASHVILLE","2000 HEALTH PARK DR, BRENTWOOD",15101,15710,36666932,52211903,991514,1062764,343346,459631
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
830717,1265892723,56,58,25.810,48.029,1.0,,EVANS,THOMAS,KERRY,,,AGACNP-BC,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,363L00000X,363L00000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,,(1) A registered nurse provider with a graduat...,"Source: (1) American Nurses' Association, Amer...",Nurse Practitioner,1003863580,Individual,2.0,"ASSOCIATED PATHOLOGISTS, LLC",,,,,,,ASSOCIATED PATHOLOGISTS LLC DBA PATHGROUP,5301 VIRGINIA WAY,SUITE 300,BRENTWOOD,TN,370277542.0,-,Y,207ZP0102X,207ZP0102X,Allopathic & Osteopathic Physicians,Pathology,Anatomic Pathology & Clinical Pathology,A pathologist deals with the causes and nature...,"Source: American Board of Medical Specialties,...",Anatomic Pathology & Clinical Pathology Physician,Individual,"210 25TH AVE N STE 1204, NASHVILLE","5301 VIRGINIA WAY, BRENTWOOD",300,329,36666932,52211903,991514,1062764,1894619,2431116
830718,1265892723,52,53,7.113,23.511,1.0,,EVANS,THOMAS,KERRY,,,AGACNP-BC,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,363L00000X,363L00000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,,(1) A registered nurse provider with a graduat...,"Source: (1) American Nurses' Association, Amer...",Nurse Practitioner,1023055126,Individual,2.0,"HCA HEALTH SERVICES OF TENNESSEE, INC.",,,,,,,TRISTAR CENTENNIAL MEDICAL CENTER,2300 PATTERSON ST,,NASHVILLE,TN,372031538.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual,"210 25TH AVE N STE 1204, NASHVILLE","2300 PATTERSON ST, NASHVILLE",300,329,36666932,52211903,991514,1062764,209435,308261
830719,1265892723,65,66,29.394,51.387,1.0,,EVANS,THOMAS,KERRY,,,AGACNP-BC,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,363L00000X,363L00000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,,(1) A registered nurse provider with a graduat...,"Source: (1) American Nurses' Association, Amer...",Nurse Practitioner,1245393057,Individual,2.0,CENTENNIAL HEART LLC,,,,,,,,2000 HEALTH PARK DR,,BRENTWOOD,TN,370274525.0,-,Y,174400000X,174400000X,Other Service Providers,Specialist,,An individual educated and trained in an appli...,Source: Expanded from Webster's II New Riversi...,Specialist,Individual,"210 25TH AVE N STE 1204, NASHVILLE","2000 HEALTH PARK DR, BRENTWOOD",300,329,36666932,52211903,991514,1062764,343346,459631
830720,1265892723,77,94,4.404,25.037,1.0,,EVANS,THOMAS,KERRY,,,AGACNP-BC,,210 25TH AVE N STE 1204,,NASHVILLE,TN,372031620.0,-,Y,363L00000X,363L00000X,Physician Assistants & Advanced Practice Nursi...,Nurse Practitioner,,(1) A registered nurse provider with a graduat...,"Source: (1) American Nurses' Association, Amer...",Nurse Practitioner,1295780476,Individual,2.0,HTI MEMORIAL HOSPITAL CORPORATION,,,,,,,TRISTAR SKYLINE MEDICAL CENTER,3441 DICKERSON PIKE,,NASHVILLE,TN,372072539.0,-,Y,282N00000X,282N00000X,Hospitals,General Acute Care Hospital,,An acute general hospital is an institution wh...,,General Acute Care Hospital,Non-Individual,"210 25TH AVE N STE 1204, NASHVILLE","3441 DICKERSON PIKE, NASHVILLE",300,329,36666932,52211903,991514,1062764,73652,104016


In [51]:
# all of the times Vanderbilt was referred TO
full_2_Vandy= full_2[full_2['facility_consolidation_2']=='Vanderbilt']

In [58]:
# (4)group by from_npi summing the patient_count and then sorting the values for Vanderbilt referals
vandy_pt_count_by_from_npi= full_2_Vandy.groupby(['from_npi'])['patient_count'].sum().reset_index()
vandy_pt_count_by_from_npi. sort_values('patient_count', ascending=False)
#these are the npi's with the 5 most and least pt count referred to Vanderbilt

Unnamed: 0,from_npi,patient_count
391,1093753303,13363
1441,1316983695,8847
3356,1740377845,8838
166,1043302466,8219
955,1215966726,7222
...,...,...
1931,1427045830,17
616,1144228107,17
2533,1558515437,14
1543,1346312477,13


In [59]:
# (4)group by from_npi summing the transaction_count and then sorting the values for Vanderbilt referals
vandy_transaction_count_by_from_npi= full_2_Vandy.groupby(['from_npi'])['transaction_count'].sum().reset_index()
vandy_transaction_count_by_from_npi. sort_values('transaction_count', ascending=False)
#these are the npi's with the 5 most and least transaction count referred to Vanderbilt

Unnamed: 0,from_npi,transaction_count
391,1093753303,17194
741,1174517593,13187
1441,1316983695,11324
3356,1740377845,10680
171,1043394166,9887
...,...,...
2452,1548249188,50
3666,1811045966,50
2134,1467704643,50
1427,1316927999,50


In [60]:
# (4b)group by full address summing the patient_count and then sorting the values for Vanderbilt referals. can use this to find 
# out the facilities by address
vandy_pt_count_by_full_addy_1= full_2_Vandy.groupby(['full_addy_1'])['patient_count'].sum().reset_index()
vandy_pt_count_by_full_addy_1. sort_values('patient_count', ascending=False)
#these are the facilities's with the 5 most and least pt count referred to Vanderbilt

Unnamed: 0,full_addy_1,patient_count
812,"3601 TVC, NASHVILLE",298918
1120,"719 THOMPSON LN STE 30330, NASHVILLE",185903
810,"3601 THE VANDERBILT CLINIC, NASHVILLE",72718
694,"3024 BUSINESS PARK CIR, GOODLETTSVILLE",56760
1122,"719 THOMPSON LN, NASHVILLE",45120
...,...,...
776,"342 FREY ST, ASHLAND CITY",21
189,"1233 17TH AVE S, NASHVILLE",20
576,"2300 21ST AVE S, NASHVILLE",17
771,"3401 W END AVE, NASHVILLE",14


In [61]:
# (4b)group by full_addy_1 summing the transaction_count and then sorting the values for Vanderbilt referals. can use this to find 
# out the facilities by address
vandy_transaction_count_by_full_addy_1= full_2_Vandy.groupby(['full_addy_1'])['transaction_count'].sum().reset_index()
vandy_transaction_count_by_full_addy_1. sort_values('transaction_count', ascending=False)
#these are the facilities's with the 5 most and least transaction count referred to Vanderbilt

Unnamed: 0,full_addy_1,transaction_count
812,"3601 TVC, NASHVILLE",455501
1120,"719 THOMPSON LN STE 30330, NASHVILLE",294053
810,"3601 THE VANDERBILT CLINIC, NASHVILLE",120540
694,"3024 BUSINESS PARK CIR, GOODLETTSVILLE",61875
1122,"719 THOMPSON LN, NASHVILLE",60829
...,...,...
690,"301 W MAIN ST, WAVERLY",50
584,"233 JACKSON MEADOWS DR, HERMITAGE",50
189,"1233 17TH AVE S, NASHVILLE",50
633,"270 E COURT AVE, SELMER",50


In [59]:
# (4)group by from_npi summing the transaction_count and then sorting the values for Vanderbilt referals
vandy_transaction_count_by_from_npi= full_2_Vandy.groupby(['from_npi'])['transaction_count'].sum().reset_index()
vandy_transaction_count_by_from_npi. sort_values('transaction_count', ascending=False)
#these are the npi's with the 5 most and least transaction count referred to Vanderbilt

Unnamed: 0,from_npi,transaction_count
391,1093753303,17194
741,1174517593,13187
1441,1316983695,11324
3356,1740377845,10680
171,1043394166,9887
...,...,...
2452,1548249188,50
3666,1811045966,50
2134,1467704643,50
1427,1316927999,50


In [65]:
# (4b)group by display_name_1 summing the patient_count and then sorting the values for Vanderbilt referals.
vandy_pt_count_by_full_specialization_1= full_2_Vandy.groupby(['display_name_1'])['patient_count'].sum().reset_index()
vandy_pt_count_by_full_specialization_1. sort_values('patient_count', ascending=False)
#these are all the specializations referred to Vanderbilt

Unnamed: 0,display_name_1,patient_count
41,Diagnostic Radiology Physician,273518
21,Cardiovascular Disease Physician,155715
72,Internal Medicine Physician,94439
46,Family Medicine Physician,49751
43,Emergency Medicine Physician,48971
47,Family Nurse Practitioner,48033
94,Ophthalmology Physician,44886
14,Anatomic Pathology & Clinical Pathology Physician,44488
16,Anesthesiology Physician,26213
52,Gastroenterology Physician,24820


In [66]:
# (4b)group by display_name_1 summing the transaction_count and then sorting the values for Vanderbilt referals.
vandy_transaction_count_by_specialization_1= full_2_Vandy.groupby(['display_name_1'])['transaction_count'].sum().reset_index()
vandy_transaction_count_by_specialization_1. sort_values('transaction_count', ascending=False)
#these are all the specializations referred to Vanderbilt

Unnamed: 0,display_name_1,transaction_count
41,Diagnostic Radiology Physician,297039
21,Cardiovascular Disease Physician,216455
72,Internal Medicine Physician,161372
46,Family Medicine Physician,76037
94,Ophthalmology Physician,67601
47,Family Nurse Practitioner,65554
63,Hematology & Oncology Physician,60565
43,Emergency Medicine Physician,54441
14,Anatomic Pathology & Clinical Pathology Physician,50340
79,Nephrology Physician,49274
