In [2]:
import pandas as pd
import boto3
import io
from pathlib import Path

# S3 configuration.
# The object key is the shared prefix followed by the partition-specific path
# of the fact table (the path already carries its leading "/").
s3_bucket = "commercial-rates"  # or use os.getenv('S3_BUCKET')
s3_prefix = "commercial_rates"  # or use os.getenv('S3_PREFIX')
specific_fact_table = "/service_code=0240U/data.parquet"
s3_key = f"{s3_prefix}{specific_fact_table}"

# Initialize S3 client
s3_client = boto3.client('s3')

# Only the fetch/parse step is guarded: the reporting below cannot fail "from S3",
# so it should not be reported under that message.
try:
    # Get object from S3
    response = s3_client.get_object(Bucket=s3_bucket, Key=s3_key)

    # Read parquet directly from memory buffer (the whole object body is read
    # into memory before parsing).
    df = pd.read_parquet(io.BytesIO(response['Body'].read()))
except Exception as e:
    print(f"Error loading from S3: {str(e)}")
    # Re-raise so the notebook stops here instead of letting later cells run
    # against an undefined (or stale, from an earlier run) `df`.
    raise

# Basic info
print(f"Shape: {df.shape}")
print(f"Columns: {list(df.columns)}")
print(f"Memory usage: {df.memory_usage(deep=True).sum() / 1024 / 1024:.1f} MB")
print(f"Successfully loaded from s3://{s3_bucket}/{s3_key}")

# Show first few rows. An explicit display() is required: a bare `df.head()`
# is only rendered when it is the last top-level expression of the cell.
display(df.head())

Shape: (2105, 16)
Columns: ['service_code', 'CBSA Title', 'nppes_primary_specialty', 'Metropolitan Division Title', 'negotiated_rate', 'payer_name', 'tin', 'npi', 'nppes_provider_name', 'nppes_address_street', 'nppes_address_city', 'nppes_address_state', 'nppes_address_zip', 'billing_class', 'service_description', 'Metropolitan/Micropolitan Statistical Area']
Memory usage: 1.1 MB
Successfully loaded from s3://commercial-rates/commercial_rates/service_code=0240U/data.parquet


In [3]:
# Render the DataFrame `df` assigned by the S3 load cell using the notebook's
# rich display. The captured output below shows only the leading and trailing
# rows, with a "..." row standing in for the elided middle.
display(df)

Unnamed: 0,service_code,CBSA Title,nppes_primary_specialty,Metropolitan Division Title,negotiated_rate,payer_name,tin,npi,nppes_provider_name,nppes_address_street,nppes_address_city,nppes_address_state,nppes_address_zip,billing_class,service_description,Metropolitan/Micropolitan Statistical Area
0,0240U,"New York-Newark-Jersey City, NY-NJ","Nurse Practitioner, Pediatrics","Lakewood-New Brunswick, NJ",121.23,Centene_Fidelis,133544120.0,1598363459,"{'first': 'KRISTIN', 'last': 'GULLO', 'middle'...",225 COMMUNITY DR,GREAT NECK,NY,110215503,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
1,0240U,"New York-Newark-Jersey City, NY-NJ","Nurse Practitioner, Pediatrics","Lakewood-New Brunswick, NJ",121.23,Centene_Fidelis,133544120.0,1598363459,"{'first': 'KRISTIN', 'last': 'GULLO', 'middle'...",225 COMMUNITY DR,GREAT NECK,NY,110215503,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
2,0240U,"New York-Newark-Jersey City, NY-NJ","Nurse Practitioner, Pediatrics","Lakewood-New Brunswick, NJ",121.23,Centene_Fidelis,133544120.0,1598363459,"{'first': 'KRISTIN', 'last': 'GULLO', 'middle'...",225 COMMUNITY DR,GREAT NECK,NY,110215503,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
3,0240U,"New York-Newark-Jersey City, NY-NJ","Nurse Practitioner, Pediatrics","Lakewood-New Brunswick, NJ",121.23,Centene_Fidelis,133544120.0,1598363459,"{'first': 'KRISTIN', 'last': 'GULLO', 'middle'...",225 COMMUNITY DR,GREAT NECK,NY,110215503,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
4,0240U,"New York-Newark-Jersey City, NY-NJ","Nurse Practitioner, Pediatrics","Nassau County-Suffolk County, NY",121.23,Centene_Fidelis,133544120.0,1598363459,"{'first': 'KRISTIN', 'last': 'GULLO', 'middle'...",225 COMMUNITY DR,GREAT NECK,NY,110215503,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
2100,0240U,"New York-Newark-Jersey City, NY-NJ",Allergy & Immunology,"New York-Jersey City-White Plains, NY-NJ",121.23,Centene_Fidelis,133544120.0,1588669519,"{'first': 'ROBERT', 'last': 'CORRIEL', 'middle...",1129 NORTHERN BLVD,MANHASSET,NY,110303022,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
2101,0240U,"New York-Newark-Jersey City, NY-NJ",Allergy & Immunology,"New York-Jersey City-White Plains, NY-NJ",121.23,Centene_Fidelis,133544120.0,1588669519,"{'first': 'ROBERT', 'last': 'CORRIEL', 'middle...",1129 NORTHERN BLVD,MANHASSET,NY,110303022,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
2102,0240U,"New York-Newark-Jersey City, NY-NJ",Allergy & Immunology,"New York-Jersey City-White Plains, NY-NJ",121.23,Centene_Fidelis,133544120.0,1588669519,"{'first': 'ROBERT', 'last': 'CORRIEL', 'middle...",1129 NORTHERN BLVD,MANHASSET,NY,110303022,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
2103,0240U,"New York-Newark-Jersey City, NY-NJ",Allergy & Immunology,"New York-Jersey City-White Plains, NY-NJ",121.23,Centene_Fidelis,133544120.0,1588669519,"{'first': 'ROBERT', 'last': 'CORRIEL', 'middle...",1129 NORTHERN BLVD,MANHASSET,NY,110303022,professional,NFCT DS RNA 3 TARGETS UPPER RESPIRATORY SPECIMEN,Metropolitan Statistical Area
