## Setting up 3 dataframes: LA County Hazard Data, FEMA data, and FEMA Shapefile data

In [68]:
import pandas as pd


In [67]:
from google.colab import drive

drive.mount('/content/drive') # allow access to Drive

Drive already mounted at /content/drive; to attempt to forcibly remount, call drive.mount("/content/drive", force_remount=True).


In [69]:
import os
import geopandas as gpd


# list files and directories in your Google Drive root
# os.listdir('/content/drive/My Drive/BTTAI Group 46 - PREPARED/')
os.listdir('/content/drive/My Drive/Break Through Tech AI @ MIT/AI Studio Project/BTTAI Group 46 - PREPARED/') # my root

shapefile_path = ('/content/drive/My Drive/BTTAI Group 46 - PREPARED/NRI_Shapefile_CensusTracts.zip') # general path
shapefile_path = ('/content/drive/My Drive/Break Through Tech AI @ MIT/AI Studio Project/BTTAI Group 46 - PREPARED/NRI_Shapefile_CensusTracts.zip') # my path
gdf = gpd.read_file(shapefile_path)


In [None]:
import gspread
from gspread_dataframe import get_as_dataframe, set_with_dataframe

from google.colab import auth
from google.auth import default

#authenticate and create a client to interact with Google Sheets
auth.authenticate_user()
creds, _ = default()
gc = gspread.authorize(creds)

In [70]:
la_data_sheet = gc.open('Los Angeles Hazard Data')
fema_data_sheet = gc.open('cleaned_NRI_Table_CensusTracts_California')
worksheet = fema_data_sheet.sheet1  # Access the first sheet

# Convert the worksheet to a pandas DataFrame
fema_data_df = get_as_dataframe(worksheet)
print(fema_data_df.head())

     OID_        NRI_ID       STATE STATEABBRV  STATEFIPS   COUNTY COUNTYTYPE  \
0  4201.0  T06001400100  California         CA        6.0  Alameda     County   
1  4202.0  T06001400200  California         CA        6.0  Alameda     County   
2  4203.0  T06001400300  California         CA        6.0  Alameda     County   
3  4204.0  T06001400400  California         CA        6.0  Alameda     County   
4  4205.0  T06001400500  California         CA        6.0  Alameda     County   

   COUNTYFIPS  STCOFIPS     TRACT  ...  WNTW_ALRB  WNTW_ALRP  WNTW_ALRA  \
0         1.0    6001.0  400100.0  ...        0.0        0.0        0.0   
1         1.0    6001.0  400200.0  ...        0.0        0.0        0.0   
2         1.0    6001.0  400300.0  ...        0.0        0.0        0.0   
3         1.0    6001.0  400400.0  ...        0.0        0.0        0.0   
4         1.0    6001.0  400500.0  ...        0.0        0.0        0.0   

   WNTW_ALR_NPCTL  WNTW_RISKV  WNTW_RISKS  WNTW_RISKR     NRI_

In [None]:
tabs = la_data_sheet.worksheets() #list of all sheet names aka tabs in the la hazard data
la_data_df = {}
for tab in tabs:
  la_data_df[tab.title] = get_as_dataframe(tab)
  print(tab.title)

Sheet1
Wildfire_RCP45
Historic_Earthquakes
Tsunami_Tide_Gauges
Extreme_Heat
Los_Angeles_County_CVA_Social_Sensitivity_Index
Extreme_Precipitation_Low_Emissions_RCP45
LACoFD_Historic_Fire_Perimeters_(Feature_Layer)
LACoFD_Fire_Hazard_Severity_Zones_%E2%80%93_SRA_(Feature_Layer)
Social_Vulnerability_Index_2020_3398216233094230935
EJSM_Scores
Wildfire_RCP_8.5
LACoFD_Fire_Hazard_Severity_Zones_%E2%80%93_LRA_(Feature_Layer)
Extreme_Precipitation_Low_Emissions_RCP_8.5
Extreme_Heat_Low_Emissions_RCP_45


In [None]:
fema_data_df.columns

Index(['OID_', 'NRI_ID', 'STATE', 'STATEABBRV', 'STATEFIPS', 'COUNTY',
       'COUNTYTYPE', 'COUNTYFIPS', 'STCOFIPS', 'TRACT',
       ...
       'WNTW_ALRB', 'WNTW_ALRP', 'WNTW_ALRA', 'WNTW_ALR_NPCTL', 'WNTW_RISKV',
       'WNTW_RISKS', 'WNTW_RISKR', 'NRI_VER', 'Unnamed: 445', 'Unnamed: 446'],
      dtype='object', length=447)

## Renaming columns across FEMA data and LA Hazard data


In [71]:
# Renaming the census tract column in FEMA data and columns in LA Hazard data for consistency
fema_data_df.rename(columns={'TRACT': 'Census Tract'}, inplace = True)
la_data_df['Los_Angeles_County_CVA_Social_Sensitivity_Index'].rename(columns={'Census_Tract': 'Census Tract'}, inplace = True)
la_data_df['Social_Vulnerability_Index_2020_3398216233094230935'].rename(columns={'Tract 2020': 'Census Tract'}, inplace = True)
la_data_df['EJSM_Scores'].rename(columns={'Tract_1': 'Census Tract'}, inplace = True)

In [72]:
fema_data_df= fema_data_df[fema_data_df['COUNTY'] == 'Los Angeles'] #only keeping LA data

In [73]:
# Renaming other columns in FEMA data for clarity
fema_data_df.rename(columns={'POPULATION': 'Population'}, inplace = True)
fema_data_df.rename(columns={'SOVI_SCORE': 'Social Vulnerability Index'}, inplace = True)


## Creating sentences from FEMA data

In [76]:
# Process FEMA dataset to create sentences
def create_sentence(row):
  # including certain rows from the FEMA dataset
    census_tract = row['Census Tract']
    population = row['Population']
    svi = row['Social Vulnerability Index']
    fips = row['TRACTFIPS']
    county = row['COUNTY']
    risk_value = row['RISK_VALUE']


    return (
        f"In Census Tract {census_tract} (FIPS {fips}), located in {county}, the total population is {population}, "
        f"with a risk value of {risk_value} and a Social Vulnerability Index score of {svi}."
    )
# Create the sentences
fema_data_df['sentence'] = fema_data_df.apply(create_sentence, axis=1)
fema_data_df['sentence']

Unnamed: 0,sentence
1377,"In Census Tract 101110.0 (FIPS 6037101110.0), ..."
1378,"In Census Tract 101122.0 (FIPS 6037101122.0), ..."
1379,"In Census Tract 101220.0 (FIPS 6037101220.0), ..."
1380,"In Census Tract 101221.0 (FIPS 6037101221.0), ..."
1381,"In Census Tract 101222.0 (FIPS 6037101222.0), ..."
...,...
3867,"In Census Tract 980035.0 (FIPS 6037980035.0), ..."
3868,"In Census Tract 980036.0 (FIPS 6037980036.0), ..."
3869,"In Census Tract 980037.0 (FIPS 6037980037.0), ..."
3870,"In Census Tract 980038.0 (FIPS 6037980038.0), ..."


## Standardizing census tract format across FEMA and La Hazard data


In [77]:
fema_data_df['Census Tract'] = fema_data_df['Census Tract'].astype(str)

# Convert 'Census Tract' to string in LA hazard data
la_data_df['Los_Angeles_County_CVA_Social_Sensitivity_Index']['Census Tract'] = la_data_df['Los_Angeles_County_CVA_Social_Sensitivity_Index']['Census Tract'].astype(str)
social_vulnerability = la_data_df['Social_Vulnerability_Index_2020_3398216233094230935']
social_vulnerability['Census Tract'] = social_vulnerability['Census Tract'].astype(str)
ejsm_scores = la_data_df['EJSM_Scores']
ejsm_scores['Census Tract'] = ejsm_scores['Census Tract'].astype(str)

In [78]:
la_data_df['Los_Angeles_County_CVA_Social_Sensitivity_Index']['Census Tract'] = la_data_df['Los_Angeles_County_CVA_Social_Sensitivity_Index']['Census Tract'].str.replace('Census Tract ', '')

#extracting last 6 digits of EJSM scores
la_data_df['EJSM_Scores']['Census Tract'] = la_data_df['EJSM_Scores']['Census Tract'].str[-6:]

In [79]:
# removing decimals from any columns that have it
for tab_name, df in la_data_df.items():
  if 'Census Tract' in df.columns:
    df['Census Tract'] = df['Census Tract'].astype(str).str.replace('.', '').str[:6].str.zfill(6)

In [82]:
#confirming tabs and printing column info for LA County Hazard data
for tab_name, df in la_data_df.items():
  print(f"Tab Name: {tab_name}")
  print(df.columns)
  # print(df.head())

Tab Name: Sheet1
Index(['Unnamed: 0', 'Unnamed: 1', 'Unnamed: 2', 'Unnamed: 3', 'Unnamed: 4',
       'Unnamed: 5', 'Unnamed: 6', 'Unnamed: 7', 'Unnamed: 8', 'Unnamed: 9',
       'Unnamed: 10', 'Unnamed: 11', 'Unnamed: 12', 'Unnamed: 13',
       'Unnamed: 14', 'Unnamed: 15', 'Unnamed: 16', 'Unnamed: 17',
       'Unnamed: 18', 'Unnamed: 19', 'Unnamed: 20', 'Unnamed: 21',
       'Unnamed: 22', 'Unnamed: 23', 'Unnamed: 24', 'Unnamed: 25'],
      dtype='object')
Tab Name: Wildfire_RCP45
Index(['OBJECTID', 'Geo_UID', 'Grid_Num', 'longitude', 'latitude', 'Baseline',
       'F_2050', 'F_2080', 'Shape_Length', 'Shape_Area', 'Mid_Cent',
       'Late_Cent', 'Shape__Area', 'Shape__Length', 'sentence'],
      dtype='object')
Tab Name: Historic_Earthquakes
Index(['X', 'Y', 'OBJECTID', 'source', 'ext_id', 'cat1', 'cat2', 'org_name',
       'Name', 'info2', 'post_id', 'link', 'use_type', 'latitude', 'longitude',
       'date_updated', 'POINT_X', 'POINT_Y', 'sentence'],
      dtype='object')
Tab Name: 

## Merging FEMA data and LA Hazard data on census tract

In [117]:
# # Merging the FEMA Data with LA Hazard Data (matching 'Census Tract')

# merged_data = pd.merge(la_data_df['Sheet1'], fema_data_df[['Census Tract', 'sentence']],
#                        on='Census Tract', how='left')

# Merging la and fema data on census tract

for tab in tabs:

    # Check if the 'Census Tract' column exists in the current tab
    if 'Census Tract' in la_data_df[tab.title].columns:

        # Merge based on Census Tract column
        merged_data = pd.merge(fema_data_df, la_data_df[tab.title], on='Census Tract', how='left')
        print(f"Merged data for tab: {tab.title}")
        print(merged_data.head())
    else:
        print(f"No Census Tract column found in tab: {tab.title}")


No Census Tract column found in tab: Sheet1
No Census Tract column found in tab: Wildfire_RCP45
No Census Tract column found in tab: Historic_Earthquakes
No Census Tract column found in tab: Tsunami_Tide_Gauges
No Census Tract column found in tab: Extreme_Heat
Merged data for tab: Los_Angeles_County_CVA_Social_Sensitivity_Index
     OID_        NRI_ID       STATE STATEABBRV  STATEFIPS       COUNTY  \
0  5578.0  T06037101110  California         CA        6.0  Los Angeles   
1  5579.0  T06037101122  California         CA        6.0  Los Angeles   
2  5580.0  T06037101220  California         CA        6.0  Los Angeles   
3  5581.0  T06037101221  California         CA        6.0  Los Angeles   
4  5582.0  T06037101222  California         CA        6.0  Los Angeles   

  COUNTYTYPE  COUNTYFIPS  STCOFIPS Census Tract     TRACTFIPS  Population_x  \
0     County        37.0    6037.0     101110.0  6.037101e+09        4926.0   
1     County        37.0    6037.0     101122.0  6.037101e+09      

## Generating more sentences from FEMA Shapefile data

---



In [118]:
gdf.rename(columns={'TRACT': 'Census Tract'}, inplace = True) #renaming gdf column to "Census Tract"
la_gdf = gdf[gdf['COUNTY'] == 'Los Angeles'] #only keeping LA data
# print(la_gdf.head())
print(la_gdf.columns)

KeyError: 'COUNTY'

In [119]:
# # Converting whole geodataframe to string
# la_gdf_string = la_gdf.to_string()
# print(la_gdf)

In [120]:
# Adjust display width to show all columns
pd.set_option('display.max_columns', None)

# Print all column names
print(la_gdf.columns.tolist())

['NRI_ID', 'STATE', 'STATEABBRV', 'STATEFIPS', 'COUNTY', 'COUNTYTYPE', 'COUNTYFIPS', 'STCOFIPS', 'Census Tract', 'TRACTFIPS', 'Population', 'BUILDVALUE', 'AGRIVALUE', 'AREA', 'RISK_VALUE', 'RISK_SCORE', 'RISK_RATNG', 'RISK_SPCTL', 'EAL_SCORE', 'EAL_RATNG', 'EAL_SPCTL', 'EAL_VALT', 'EAL_VALB', 'EAL_VALP', 'EAL_VALPE', 'EAL_VALA', 'ALR_VALB', 'ALR_VALP', 'ALR_VALA', 'ALR_NPCTL', 'ALR_VRA_NP', 'Social Vulnerability Index', 'SOVI_RATNG', 'SOVI_SPCTL', 'RESL_SCORE', 'RESL_RATNG', 'RESL_SPCTL', 'RESL_VALUE', 'CRF_VALUE', 'AVLN_EVNTS', 'AVLN_AFREQ', 'AVLN_EXP_A', 'AVLN_EXPB', 'AVLN_EXPP', 'AVLN_EXPPE', 'AVLN_EXPT', 'AVLN_HLRB', 'AVLN_HLRP', 'AVLN_HLRR', 'AVLN_EALB', 'AVLN_EALP', 'AVLN_EALPE', 'AVLN_EALT', 'AVLN_EALS', 'AVLN_EALR', 'AVLN_ALRB', 'AVLN_ALRP', 'AVLN_ALR_N', 'AVLN_RISKV', 'AVLN_RISKS', 'AVLN_RISKR', 'CFLD_EVNTS', 'CFLD_AFREQ', 'CFLD_EXP_A', 'CFLD_EXPB', 'CFLD_EXPP', 'CFLD_EXPPE', 'CFLD_EXPT', 'CFLD_HLRB', 'CFLD_HLRP', 'CFLD_HLRR', 'CFLD_EALB', 'CFLD_EALP', 'CFLD_EALPE', 'CFLD_EALT

In [121]:
#filtering out tabs with lat and long in LA Hazard data
tabs_with_latlong = []
for tab in tabs:
  if 'latitude' in la_data_df[tab.title].columns and 'longitude' in la_data_df[tab.title].columns:
    tabs_with_latlong.append(tab.title)
print(tabs_with_latlong)

['Wildfire_RCP45', 'Historic_Earthquakes', 'Tsunami_Tide_Gauges', 'Extreme_Heat', 'Extreme_Precipitation_Low_Emissions_RCP45', 'Wildfire_RCP_8.5', 'Extreme_Precipitation_Low_Emissions_RCP_8.5', 'Extreme_Heat_Low_Emissions_RCP_45']


In [122]:
#List to store merged data
all_merged_data = []

In [123]:
for tab_title in tabs_with_latlong:
  df = la_data_df[tab_title]
  #convert lat/long to geometry
  gdf = gpd.GeoDataFrame(df, geometry=gpd.points_from_xy(df['longitude'], df['latitude']))
  #spatial join with LA county shapefile
  gdf = gpd.sjoin(gdf, la_gdf[['Census Tract', 'geometry']], how='left', predicate='within')
  all_merged_data.append(merged_data)

  print(f"Merged data for tab with lat/long: {tab_title}")
  print(gdf.head())

Merged data for tab with lat/long: Wildfire_RCP45
   OBJECTID           Geo_UID  Grid_Num  longitude  latitude  Baseline  \
0         1    32.75-118.4375     17562  -118.4375   32.7500    2.9133   
1         2   32.8125-118.375     17742  -118.3750   32.8125    4.2058   
2         3  32.8125-118.4375     17563  -118.4375   32.8125   19.1550   
3         4     32.8125-118.5     17384  -118.5000   32.8125   12.5058   
4         5  32.8125-118.5625     17205  -118.5625   32.8125    2.8242   

   F_2050  F_2080  Shape_Length    Shape_Area  Mid_Cent  Late_Cent  \
0   -1.34   -1.97      0.110417  3.124653e-04     1.573      0.943   
1   -1.87   -2.67      0.121772  5.804570e-04     2.336      1.536   
2   -6.92  -10.60      0.225823  3.189656e-03    12.235      8.555   
3   -4.22   -6.74      0.218413  2.354185e-03     8.286      5.766   
4   -1.05   -1.66      0.005118  9.255045e-07     1.774      1.164   

    Shape__Area  Shape__Length  \
0  4.606830e+06   12910.061310   
1  8.559597e+06 

Use `to_crs()` to reproject one of the input geometries to match the CRS of the other.

Left CRS: None
Right CRS: EPSG:3857

  gdf = gpd.sjoin(gdf, la_gdf[['Census Tract', 'geometry']], how='left', predicate='within')
Use `to_crs()` to reproject one of the input geometries to match the CRS of the other.

Left CRS: None
Right CRS: EPSG:3857

  gdf = gpd.sjoin(gdf, la_gdf[['Census Tract', 'geometry']], how='left', predicate='within')
Use `to_crs()` to reproject one of the input geometries to match the CRS of the other.

Left CRS: None
Right CRS: EPSG:3857

  gdf = gpd.sjoin(gdf, la_gdf[['Census Tract', 'geometry']], how='left', predicate='within')
Use `to_crs()` to reproject one of the input geometries to match the CRS of the other.

Left CRS: None
Right CRS: EPSG:3857

  gdf = gpd.sjoin(gdf, la_gdf[['Census Tract', 'geometry']], how='left', predicate='within')
Use `to_crs()` to reproject one of the input geometries to match the CRS of the other.

Left CRS: None
Right CRS: EPSG:3857

  g

## Generating sentences from FEMA shapefile data, also includes latitude and longitude

In [91]:
# Save GeoDataFrame to CSV
la_gdf.to_csv('la_gdf.csv', index=False)

# Download the CSV
from google.colab import files
files.download('la_gdf.csv')

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

In [124]:
# Renaming columns in FEMA shapefile data for clarity
la_gdf.rename(columns={'POPULATION': 'Population'}, inplace = True)
la_gdf.rename(columns={'SOVI_SCORE': 'Social Vulnerability Index'}, inplace = True)

In [125]:
# Making sentences from FEMA shapefile data
# Process FEMA dataset to create sentences
# def create_sentence(row):
#   # including certain rows from the FEMA dataset
#     census_tract = row['Census Tract']
#     population = row['Population']
#     svi = row['Social Vulnerability Index']
#     fips = row['TRACTFIPS']
#     county = row['COUNTY']
#     risk_value = row['RISK_VALUE']


#     return (
#         f"In Census Tract {census_tract} (FIPS {fips}), located in {county}, the total population is {population}, "
#         f"with a risk value of {risk_value} and a Social Vulnerability Index score of {svi}."
#     )
# Create the sentences
la_gdf['sentence'] = la_gdf.apply(create_sentence, axis=1)
la_gdf['sentence']

Unnamed: 0,sentence
5577,"In Census Tract 101110 (FIPS 06037101110), loc..."
5578,"In Census Tract 101122 (FIPS 06037101122), loc..."
5579,"In Census Tract 101220 (FIPS 06037101220), loc..."
5580,"In Census Tract 101221 (FIPS 06037101221), loc..."
5581,"In Census Tract 101222 (FIPS 06037101222), loc..."
...,...
8067,"In Census Tract 980035 (FIPS 06037980035), loc..."
8068,"In Census Tract 980036 (FIPS 06037980036), loc..."
8069,"In Census Tract 980037 (FIPS 06037980037), loc..."
8070,"In Census Tract 980038 (FIPS 06037980038), loc..."


In [126]:
#merging la data with la county shapefile on census tract
for tab in tabs:

    # Check if the 'Census Tract' column exists in the current tab
    if 'Census Tract' in la_data_df[tab.title].columns:

        # Merge based on Census Tract column
        merged_data2 = pd.merge(la_data_df[tab.title], la_gdf[['Census Tract', 'geometry']], on='Census Tract', how='left')

        print(f"Merged data for tab: {tab.title}")
        # print(merged_data2.head())

        all_merged_data.append(merged_data2)
    else:
        print(f"No Census Tract column found in tab: {tab.title}")

No Census Tract column found in tab: Sheet1
No Census Tract column found in tab: Wildfire_RCP45
No Census Tract column found in tab: Historic_Earthquakes
No Census Tract column found in tab: Tsunami_Tide_Gauges
No Census Tract column found in tab: Extreme_Heat
Merged data for tab: Los_Angeles_County_CVA_Social_Sensitivity_Index
No Census Tract column found in tab: Extreme_Precipitation_Low_Emissions_RCP45
No Census Tract column found in tab: LACoFD_Historic_Fire_Perimeters_(Feature_Layer)
No Census Tract column found in tab: LACoFD_Fire_Hazard_Severity_Zones_%E2%80%93_SRA_(Feature_Layer)
Merged data for tab: Social_Vulnerability_Index_2020_3398216233094230935
Merged data for tab: EJSM_Scores
No Census Tract column found in tab: Wildfire_RCP_8.5
No Census Tract column found in tab: LACoFD_Fire_Hazard_Severity_Zones_%E2%80%93_LRA_(Feature_Layer)
No Census Tract column found in tab: Extreme_Precipitation_Low_Emissions_RCP_8.5
No Census Tract column found in tab: Extreme_Heat_Low_Emissions

In [127]:
all_merged_data

[        OID_        NRI_ID       STATE STATEABBRV  STATEFIPS       COUNTY  \
 0     5578.0  T06037101110  California         CA        6.0  Los Angeles   
 1     5579.0  T06037101122  California         CA        6.0  Los Angeles   
 2     5580.0  T06037101220  California         CA        6.0  Los Angeles   
 3     5581.0  T06037101221  California         CA        6.0  Los Angeles   
 4     5582.0  T06037101222  California         CA        6.0  Los Angeles   
 ...      ...           ...         ...        ...        ...          ...   
 2490  8068.0  T06037980035  California         CA        6.0  Los Angeles   
 2491  8069.0  T06037980036  California         CA        6.0  Los Angeles   
 2492  8070.0  T06037980037  California         CA        6.0  Los Angeles   
 2493  8071.0  T06037980038  California         CA        6.0  Los Angeles   
 2494  8072.0  T06037980039  California         CA        6.0  Los Angeles   
 
      COUNTYTYPE  COUNTYFIPS  STCOFIPS Census Tract     TRACTF

In [128]:
print(type(all_merged_data))  # Check if it's a list
# print(len(all_merged_data))  # See how many items are in the list
# print(all_merged_data[0])  # Check the structure of the first item

<class 'list'>


In [129]:
# df_cleaned = all_merged_data.drop(columns='geometry', errors='ignore')  # Drop geometry column if you don't need it

AttributeError: 'list' object has no attribute 'drop'

In [130]:
#combining merged data from both methods
final_merged_data = pd.concat(all_merged_data, ignore_index=True)
print(final_merged_data.columns)
final_merged_data.head()


Index(['OID_', 'NRI_ID', 'STATE', 'STATEABBRV', 'STATEFIPS', 'COUNTY',
       'COUNTYTYPE', 'COUNTYFIPS', 'STCOFIPS', 'Census Tract',
       ...
       'Sum of series for Household Characteristics theme',
       'Percentile ranking for Household Characteristics theme summary',
       'Sum of series for Racial and Ethnic Minority Status theme',
       'Percentile ranking for Racial and Ethnic Minority Status theme',
       'Sum of series for Housing Type/ Transportation theme',
       'Percentile ranking for Housing Type/ Transportation theme',
       'Sum of Series Themes', 'Overall Percentile Ranking', 'ObjectID',
       'Level of Vulnerability'],
      dtype='object', length=524)


Unnamed: 0,OID_,NRI_ID,STATE,STATEABBRV,STATEFIPS,COUNTY,COUNTYTYPE,COUNTYFIPS,STCOFIPS,Census Tract,TRACTFIPS,Population,BUILDVALUE,AGRIVALUE,AREA,RISK_VALUE,RISK_SCORE,RISK_RATNG,RISK_SPCTL,EAL_SCORE,EAL_RATNG,EAL_SPCTL,EAL_VALT,EAL_VALB,EAL_VALP,EAL_VALPE,EAL_VALA,ALR_VALB,ALR_VALP,ALR_VALA,ALR_NPCTL,ALR_VRA_NPCTL,Social Vulnerability Index,SOVI_RATNG,SOVI_SPCTL,RESL_SCORE,RESL_RATNG,RESL_SPCTL,RESL_VALUE,CRF_VALUE,AVLN_EVNTS,AVLN_AFREQ,AVLN_EXP_AREA,AVLN_EXPB,AVLN_EXPP,AVLN_EXPPE,AVLN_EXPT,AVLN_HLRB,AVLN_HLRP,AVLN_HLRR,AVLN_EALB,AVLN_EALP,AVLN_EALPE,AVLN_EALT,AVLN_EALS,AVLN_EALR,AVLN_ALRB,AVLN_ALRP,AVLN_ALR_NPCTL,AVLN_RISKV,AVLN_RISKS,AVLN_RISKR,CFLD_AFREQ,CFLD_EXP_AREA,CFLD_EXPB,CFLD_EXPP,CFLD_EXPPE,CFLD_EXPT,CFLD_HLRB,CFLD_HLRP,CFLD_HLRR,CFLD_EALB,CFLD_EALP,CFLD_EALPE,CFLD_EALT,CFLD_EALS,CFLD_EALR,CFLD_ALRB,CFLD_ALRP,CFLD_ALR_NPCTL,CFLD_RISKV,CFLD_RISKS,CFLD_RISKR,CWAV_EVNTS,CWAV_AFREQ,CWAV_EXP_AREA,CWAV_EXPB,CWAV_EXPP,CWAV_EXPPE,CWAV_EXPA,CWAV_EXPT,CWAV_HLRB,CWAV_HLRP,CWAV_HLRA,CWAV_HLRR,CWAV_EALB,CWAV_EALP,CWAV_EALPE,CWAV_EALA,CWAV_EALT,CWAV_EALS,CWAV_EALR,CWAV_ALRB,CWAV_ALRP,CWAV_ALRA,CWAV_ALR_NPCTL,CWAV_RISKV,CWAV_RISKS,CWAV_RISKR,DRGT_EVNTS,DRGT_AFREQ,DRGT_EXP_AREA,DRGT_EXPA,DRGT_EXPT,DRGT_HLRA,DRGT_HLRR,DRGT_EALA,DRGT_EALT,DRGT_EALS,DRGT_EALR,DRGT_ALRA,DRGT_ALR_NPCTL,DRGT_RISKV,DRGT_RISKS,DRGT_RISKR,ERQK_AFREQ,ERQK_EXP_AREA,ERQK_EXPB,ERQK_EXPP,ERQK_EXPPE,ERQK_EXPT,ERQK_HLRB,ERQK_HLRP,ERQK_HLRR,ERQK_EALB,ERQK_EALP,ERQK_EALPE,ERQK_EALT,ERQK_EALS,ERQK_EALR,ERQK_ALRB,ERQK_ALRP,ERQK_ALR_NPCTL,ERQK_RISKV,ERQK_RISKS,ERQK_RISKR,HAIL_EVNTS,HAIL_AFREQ,HAIL_EXP_AREA,HAIL_EXPB,HAIL_EXPP,HAIL_EXPPE,HAIL_EXPA,HAIL_EXPT,HAIL_HLRB,HAIL_HLRP,HAIL_HLRA,HAIL_HLRR,HAIL_EALB,HAIL_EALP,HAIL_EALPE,HAIL_EALA,HAIL_EALT,HAIL_EALS,HAIL_EALR,HAIL_ALRB,HAIL_ALRP,HAIL_ALRA,HAIL_ALR_NPCTL,HAIL_RISKV,HAIL_RISKS,HAIL_RISKR,HWAV_EVNTS,HWAV_AFREQ,HWAV_EXP_AREA,HWAV_EXPB,HWAV_EXPP,HWAV_EXPPE,HWAV_EXPA,HWAV_EXPT,HWAV_HLRB,HWAV_HLRP,HWAV_HLRA,HWAV_HLRR,HWAV_EALB,HWAV_EALP,HWAV_EALPE,HWAV_EALA,HWAV_EALT,HWAV_EALS,HWAV_EALR,HWAV_ALRB,HWAV_ALRP,HWAV_ALRA,HWAV_ALR_NPCTL,HWAV_RISKV,HWAV_RISKS,HWAV_RISKR,HRCN_EVNTS,HRCN_AFREQ,HRCN_EXP_AREA,HRCN_EXPB,HRCN_EXPP,HRCN_EXPPE,HRCN_EXPA,HRCN_EXPT,HRCN_HLRB,HRCN_HLRP,HRCN_HLRA,HRCN_HLRR,HRCN_EALB,HRCN_EALP,HRCN_EALPE,HRCN_EALA,HRCN_EALT,HRCN_EALS,HRCN_EALR,HRCN_ALRB,HRCN_ALRP,HRCN_ALRA,HRCN_ALR_NPCTL,HRCN_RISKV,HRCN_RISKS,HRCN_RISKR,ISTM_HLRR,ISTM_EALR,ISTM_RISKR,LNDS_EVNTS,LNDS_AFREQ,LNDS_EXP_AREA,LNDS_EXPB,LNDS_EXPP,LNDS_EXPPE,LNDS_EXPT,LNDS_HLRB,LNDS_HLRP,LNDS_HLRR,LNDS_EALB,LNDS_EALP,LNDS_EALPE,LNDS_EALT,LNDS_EALS,LNDS_EALR,LNDS_ALRB,LNDS_ALRP,LNDS_ALR_NPCTL,LNDS_RISKV,LNDS_RISKS,LNDS_RISKR,LTNG_EVNTS,LTNG_AFREQ,LTNG_EXP_AREA,LTNG_EXPB,LTNG_EXPP,LTNG_EXPPE,LTNG_EXPT,LTNG_HLRB,LTNG_HLRP,LTNG_HLRR,LTNG_EALB,LTNG_EALP,LTNG_EALPE,LTNG_EALT,LTNG_EALS,LTNG_EALR,LTNG_ALRB,LTNG_ALRP,LTNG_ALR_NPCTL,LTNG_RISKV,LTNG_RISKS,LTNG_RISKR,RFLD_EVNTS,RFLD_AFREQ,RFLD_EXP_AREA,RFLD_EXPB,RFLD_EXPP,RFLD_EXPPE,RFLD_EXPA,RFLD_EXPT,RFLD_HLRB,RFLD_HLRP,RFLD_HLRA,RFLD_HLRR,RFLD_EALB,RFLD_EALP,RFLD_EALPE,RFLD_EALA,RFLD_EALT,RFLD_EALS,RFLD_EALR,RFLD_ALRB,RFLD_ALRP,RFLD_ALRA,RFLD_ALR_NPCTL,RFLD_RISKV,RFLD_RISKS,RFLD_RISKR,SWND_EVNTS,SWND_AFREQ,SWND_EXP_AREA,SWND_EXPB,SWND_EXPP,SWND_EXPPE,SWND_EXPA,SWND_EXPT,SWND_HLRB,SWND_HLRP,SWND_HLRA,SWND_HLRR,SWND_EALB,SWND_EALP,SWND_EALPE,SWND_EALA,SWND_EALT,SWND_EALS,SWND_EALR,SWND_ALRB,SWND_ALRP,SWND_ALRA,SWND_ALR_NPCTL,SWND_RISKV,SWND_RISKS,SWND_RISKR,TRND_EVNTS,TRND_AFREQ,TRND_EXP_AREA,TRND_EXPB,TRND_EXPP,TRND_EXPPE,TRND_EXPA,TRND_EXPT,TRND_HLRB,TRND_HLRP,TRND_HLRA,TRND_HLRR,TRND_EALB,TRND_EALP,TRND_EALPE,TRND_EALA,TRND_EALT,TRND_EALS,TRND_EALR,TRND_ALRB,TRND_ALRP,TRND_ALRA,TRND_ALR_NPCTL,TRND_RISKV,TRND_RISKS,TRND_RISKR,TSUN_EVNTS,TSUN_AFREQ,TSUN_EXP_AREA,TSUN_EXPB,TSUN_EXPP,TSUN_EXPPE,TSUN_EXPT,TSUN_HLRB,TSUN_HLRP,TSUN_HLRR,TSUN_EALB,TSUN_EALP,TSUN_EALPE,TSUN_EALT,TSUN_EALS,TSUN_EALR,TSUN_ALRB,TSUN_ALRP,TSUN_ALR_NPCTL,TSUN_RISKV,TSUN_RISKS,TSUN_RISKR,VLCN_EVNTS,VLCN_AFREQ,VLCN_EXP_AREA,VLCN_EXPB,VLCN_EXPP,VLCN_EXPPE,VLCN_EXPT,VLCN_HLRB,VLCN_HLRP,VLCN_HLRR,VLCN_EALB,VLCN_EALP,VLCN_EALPE,VLCN_EALT,VLCN_EALS,VLCN_EALR,VLCN_ALRB,VLCN_ALRP,VLCN_ALR_NPCTL,VLCN_RISKV,VLCN_RISKS,VLCN_RISKR,WFIR_AFREQ,WFIR_EXP_AREA,WFIR_EXPB,WFIR_EXPP,WFIR_EXPPE,WFIR_EXPA,WFIR_EXPT,WFIR_HLRB,WFIR_HLRP,WFIR_HLRA,WFIR_HLRR,WFIR_EALB,WFIR_EALP,WFIR_EALPE,WFIR_EALA,WFIR_EALT,WFIR_EALS,WFIR_EALR,WFIR_ALRB,WFIR_ALRP,WFIR_ALRA,WFIR_ALR_NPCTL,WFIR_RISKV,WFIR_RISKS,WFIR_RISKR,WNTW_EVNTS,WNTW_AFREQ,WNTW_EXP_AREA,WNTW_EXPB,WNTW_EXPP,WNTW_EXPPE,WNTW_EXPA,WNTW_EXPT,WNTW_HLRB,WNTW_HLRP,WNTW_HLRA,WNTW_HLRR,WNTW_EALB,WNTW_EALP,WNTW_EALPE,WNTW_EALA,WNTW_EALT,WNTW_EALS,WNTW_EALR,WNTW_ALRB,WNTW_ALRP,WNTW_ALRA,WNTW_ALR_NPCTL,WNTW_RISKV,WNTW_RISKS,WNTW_RISKR,NRI_VER,Unnamed: 445,Unnamed: 446,sentence_x,OBJECTID,CIscore,HazScore,HealthScore,SVscore,CCVscore,Shape__Area,Shape__Length,sentence_y,County,CSA_Type,CSA_Label,DRP_Planning_Area,DPH_Service_Planning_Area,City_of_Los_Angeles_CPA,Children,Older_Adults,Older_Adults_Living_Alone,Limited_English,No_High_School_Diploma,Female,Female_Householder,Asthma,Cardiovascular_Disease,Disability,No_Health_Insurance,Living_in_Group_Quarters,Mobile_Homes,Rent_Burden,Renters,Median_Income,Poverty,Households_Without_Vehicle_Acce,Transit_Access,Outdoor_Workers,Unemployed,Foreign_Born,Library_Access,No_Internet_Subscription,Voter_Turnout_Rate,Hispanic_Latinx,White,Black,Native_Tribal,Asian,NHOPI,Other_Race,Two_or_More_Races,SoVI_Score,SoVI_Thirds,ObjectId,sentence,geometry,OBJECTID_1,Tract Label,FIPS,Location,Area in Square Miles,"Population estimate, 2016-2020 ACS","Population estimate MOE, 2016-2020 ACS","Housing units estimate, 2016-2020 ACS","Housing units estimate MOE, 2016-2020 ACS","Households estimate, 2016-2020 ACS","Households estimate MOE, 2016-2020 ACS",Sum of series for Socioeconomic Status theme,Percentile ranking for Socioeconomic Status theme summary,Sum of series for Household Characteristics theme,Percentile ranking for Household Characteristics theme summary,Sum of series for Racial and Ethnic Minority Status theme,Percentile ranking for Racial and Ethnic Minority Status theme,Sum of series for Housing Type/ Transportation theme,Percentile ranking for Housing Type/ Transportation theme,Sum of Series Themes,Overall Percentile Ranking,ObjectID,Level of Vulnerability
0,5578.0,T06037101110,California,CA,6.0,Los Angeles,County,37.0,6037.0,101110.0,6037101000.0,4926.0,477686853.0,0.0,0.445536,842402.7,65.487799,Relatively Moderate,27.498353,54.422576,Relatively Low,20.645728,551018.3,403242.8,0.012739,147775.504916,0.0,0.000844,3e-06,0.0,55.882284,64.750511,81.389999,Very High,0.713046,15.44,Very Low,0.477817,2.471082,1.528811,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,2.7e-05,3.618018e-07,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.445536,0.0,0.0,0.0,0.0,0.0,1.186214e-07,8.7618e-08,0.01238,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,1659.0,75.409091,0.445536,0.0,0.0,1.2e-05,No Rating,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,No Rating,0.009149,0.445536,477679000.0,4926.0,57141600000.0,57619280000.0,0.091516,0.000269,Relatively Low,399951.6,0.012112,140495.309891,540446.909891,87.479155,Relatively Moderate,0.000837,2e-06,88.231909,826240.975554,89.82424,Relatively High,4.0,0.090975,0.445536,477686853.0,4926.0,57141600000.0,0.0,57619290000.0,1.581831e-07,4.956726e-09,7e-06,Very Low,6.87427,2e-06,25.767398,0.0,32.641668,7.541647,Very Low,1.439075e-08,4.50939e-10,0.0,4.97878,49.902929,9.486039,Very Low,79.987853,4.952813,0.445536,477686853.0,4926.0,57141600000.0,0.0,57619290000.0,6.53204e-10,1.4959e-08,4.6e-05,Very Low,1.532033,0.000364,4218.559621,0.0,4220.091653,39.399206,Relatively Low,3.20719e-09,7.382642e-08,0.0,32.637339,6451.720938,43.973267,Relatively Low,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,Not Applicable,Not Applicable,Not Applicable,0.0,0.01,0.130187,220103800.0,1763.055221,20451440000.0,20671540000.0,4.8e-05,9.928904e-08,Very Low,104.573712,1.750521e-06,20.306039,124.879751,45.893583,Relatively Low,2.189169e-07,3.55363e-10,45.878263,190.91749,47.748317,Relatively Low,34.0,1.545453,0.445536,477686853.0,4926.0,57141600000.0,57619290000.0,8.817994e-09,6.342172e-09,Relatively Moderate,6.509815,4.8e-05,560.074446,566.584261,11.972784,Very Low,1.362779e-08,9.801518e-09,8.575604,866.200035,14.160278,Very Low,106.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2e-06,8.6913e-07,0.003637,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,6.0,0.154109,0.445536,477686853.0,4926.0,57141600000.0,0.0,57619290000.0,7.585231e-09,2.891832e-08,1e-06,Very Low,0.558394,2.2e-05,254.656242,0.0,255.214637,11.555237,Very Low,1.168955e-09,4.456582e-09,0.0,8.810148,390.174847,12.263949,Very Low,0.0,6.1e-05,0.445536,477686853.0,4926.0,57141600000.0,0.0,57619290000.0,0.108624,0.000567,0.0,Relatively Moderate,3169.694052,0.00017,1977.597367,0.0,5147.291419,15.652297,Very Low,7e-06,3.460872e-08,0.0,13.496197,7869.233787,18.861485,Very Low,0.0,0.004501,0.0,0.0,0.0,0.0,0.0,1.3e-05,3e-06,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4,2e-05,6.595474e-07,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,11.927087,0.73852,0.445536,38085550.0,513.860162,5960778000.0,0.0,5998863000.0,6.416375e-09,6.173231e-09,2e-12,Relatively Low,1.474382,1.9e-05,223.233913,0.0,224.708295,27.768514,Relatively Low,3.086504e-09,3.906679e-09,0.0,22.327783,343.536428,29.21681,Relatively Low,March 2023,,,"In Census Tract 101110.0 (FIPS 6037101110.0), ...",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
1,5579.0,T06037101122,California,CA,6.0,Los Angeles,County,37.0,6037.0,101122.0,6037101000.0,3728.0,508893146.0,0.0,1.031178,1324088.0,78.244066,Relatively Moderate,46.299143,81.71548,Relatively Moderate,56.731825,1318930.0,1246571.0,0.006238,72359.272326,0.0,0.00245,2e-06,0.0,87.796228,82.897303,31.83,Relatively Low,0.224797,15.44,Very Low,0.477817,2.471082,1.003911,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,2.7e-05,3.618018e-07,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,1.031178,0.0,0.0,0.0,0.0,0.0,1.186214e-07,8.7618e-08,0.01238,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,1659.0,75.409091,1.031178,0.0,0.0,1.2e-05,No Rating,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,No Rating,0.009166,1.031178,508887000.0,3728.0,43244800000.0,43753690000.0,0.078247,0.000157,Relatively Low,364990.3,0.00537,62293.049445,427283.349445,85.954858,Relatively Moderate,0.000717,1e-06,87.226672,428954.462474,85.785806,Relatively Moderate,4.0,0.090975,1.031178,508893146.0,3728.0,43244800000.0,0.0,43753690000.0,1.581831e-07,4.956726e-09,7e-06,Very Low,7.323352,2e-06,19.500783,0.0,26.824136,5.929862,Very Low,1.439075e-08,4.50939e-10,0.0,5.585403,26.929045,4.687723,Very Low,85.035807,5.265375,1.031178,508893146.0,3728.0,43244800000.0,0.0,43753690000.0,6.53204e-10,1.4959e-08,4.6e-05,Very Low,1.711101,0.000291,3379.949341,0.0,3381.660442,36.012401,Relatively Low,3.362397e-09,7.815852e-08,0.0,33.403011,3394.886179,34.23988,Relatively Low,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,Not Applicable,Not Applicable,Not Applicable,0.0,0.01,0.203075,161329200.0,1109.476338,12869930000.0,13031250000.0,4.8e-05,9.928904e-08,Very Low,76.649231,1.101588e-06,12.778425,89.427656,44.533616,Relatively Low,1.506195e-07,2.9549e-10,44.442873,89.777409,44.353215,Relatively Low,34.0,1.525514,1.031178,508893146.0,3728.0,43244800000.0,43753690000.0,8.817994e-09,6.342172e-09,Relatively Moderate,7.000824,3.7e-05,428.228967,435.229791,10.035817,Very Low,1.375696e-08,9.902438e-09,8.621123,436.931983,8.632008,Very Low,106.0,4.416667,0.003524,3085253.0,24.063213,279133300.0,0.0,282218500.0,2e-06,8.6913e-07,0.003637,Very Low,23.435027,9.2e-05,1071.497046,0.0,1094.932073,34.05712,Very Low,4.605098e-08,2.477748e-08,0.0,34.382413,1099.214372,33.669077,Very Low,6.0,0.154109,1.031178,508893146.0,3728.0,43244800000.0,0.0,43753690000.0,7.585231e-09,2.891832e-08,1e-06,Very Low,0.594873,1.7e-05,192.72401,0.0,193.318883,9.292155,Very Low,1.168955e-09,4.456582e-09,0.0,9.310965,194.074956,7.255149,Very Low,0.0,0.000116,1.031178,508893146.0,3728.0,43244800000.0,0.0,43753690000.0,0.057217,0.000298,0.0,Relatively Low,3376.763601,0.000129,1496.646972,0.0,4873.410573,14.731781,Very Low,7e-06,3.460872e-08,0.0,14.380268,4892.470571,11.589687,Very Low,0.0,0.004501,0.0,0.0,0.0,0.0,0.0,1.3e-05,3e-06,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.020202,0.114187,105860400.0,602.144419,6984875000.0,0.0,7090736000.0,0.4,2e-05,6.595474e-07,Relatively Low,878080.786815,0.000244,2832.00094,0.0,880912.787756,99.040348,Relatively High,0.001725,6.548766e-08,0.0,99.418501,884358.053853,98.967797,Relatively High,42.214675,2.613912,1.031178,150539600.0,1346.0,15613600000.0,0.0,15764140000.0,6.416375e-09,6.173231e-09,2e-12,Relatively Low,6.226551,5.5e-05,632.896397,0.0,639.122947,37.9806,Relatively Low,1.223548e-08,1.46352e-08,0.0,33.75414,641.622569,35.936831,Relatively Low,March 2023,,,"In Census Tract 101122.0 (FIPS 6037101122.0), ...",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
2,5580.0,T06037101220,California,CA,6.0,Los Angeles,County,37.0,6037.0,101220.0,6037101000.0,3344.0,308118718.0,0.0,0.272566,581682.9,53.225039,Relatively Low,17.153525,38.907156,Relatively Low,11.519877,369812.4,275711.8,0.008112,94100.638654,0.0,0.000895,2e-06,0.0,56.918054,66.247681,84.129997,Very High,0.74709,15.44,Very Low,0.477817,2.471082,1.572913,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,2.7e-05,3.618018e-07,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.272565,0.0,0.0,0.0,0.0,0.0,1.186214e-07,8.7618e-08,0.01238,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,1659.0,75.409091,0.272565,0.0,0.0,1.2e-05,No Rating,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,No Rating,0.009149,0.272565,308109000.0,3344.0,38790400000.0,39098510000.0,0.097079,0.000251,Relatively Low,273654.3,0.007665,88918.334899,362572.634899,84.917913,Relatively Moderate,0.000888,2e-06,88.66759,570295.315686,87.476811,Relatively Moderate,4.0,0.090975,0.272565,308118718.0,3344.0,38790400000.0,0.0,39098520000.0,1.581831e-07,4.956726e-09,7e-06,Very Low,4.434058,2e-06,17.492119,0.0,21.926177,4.476787,Very Low,1.439075e-08,4.50939e-10,0.0,4.984658,34.487976,6.417971,Very Low,82.982682,5.138259,0.272565,308118718.0,3344.0,38790400000.0,0.0,39098520000.0,6.53204e-10,1.4959e-08,4.6e-05,Very Low,1.005705,0.000251,2908.978579,0.0,2909.984284,33.950255,Relatively Low,3.264017e-09,7.499223e-08,0.0,32.840501,4577.152952,38.55777,Relatively Low,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,Not Applicable,Not Applicable,Not Applicable,0.0,0.01,0.0,0.0,0.0,0.0,0.0,4.8e-05,9.928904e-08,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,45.0,2.007354,0.272565,308118718.0,3344.0,38790400000.0,39098520000.0,8.817994e-09,6.342172e-09,Relatively Moderate,5.180299,4.1e-05,477.021292,482.201592,10.777303,Very Low,1.681267e-08,1.229741e-08,9.945976,758.461291,12.924054,Very Low,106.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2e-06,8.6913e-07,0.003637,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,6.0,0.15411,0.272565,308118718.0,3344.0,38790400000.0,0.0,39098520000.0,7.585231e-09,2.891832e-08,1e-06,Very Low,0.360177,1.5e-05,172.87261,0.0,173.232786,8.537403,Very Low,1.168955e-09,4.456582e-09,0.0,8.813675,272.480152,9.453931,Very Low,0.0,4.5e-05,0.272566,308118718.0,3344.0,38790400000.0,0.0,39098520000.0,0.147727,0.00077,0.0,Relatively Moderate,2044.523649,0.000116,1342.48591,0.0,3387.009559,9.842348,Very Low,7e-06,3.460872e-08,0.0,13.370405,5327.472346,12.789564,Very Low,0.0,0.004501,0.0,0.0,0.0,0.0,0.0,1.3e-05,3e-06,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4,2e-05,6.595474e-07,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,29.896199,1.851162,0.272565,81469760.0,1013.781709,11759870000.0,0.0,11841340000.0,6.416375e-09,6.173231e-09,2e-12,Relatively Low,1.982649,2.3e-05,263.453244,0.0,265.435893,28.988656,Relatively Low,6.434692e-09,6.791712e-09,0.0,25.812058,417.507643,31.113542,Relatively Low,March 2023,,,"In Census Tract 101220.0 (FIPS 6037101220.0), ...",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
3,5581.0,T06037101221,California,CA,6.0,Los Angeles,County,37.0,6037.0,101221.0,6037101000.0,3444.0,293556702.0,0.0,0.138129,630193.7,56.060029,Relatively Low,19.075335,37.078704,Relatively Low,10.586427,352790.7,251830.6,0.008703,100960.095979,0.0,0.000858,3e-06,0.0,55.12131,68.36441,94.910004,Very High,0.908961,15.44,Very Low,0.477817,2.471082,1.786311,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,2.7e-05,3.618018e-07,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.138129,0.0,0.0,0.0,0.0,0.0,1.186214e-07,8.7618e-08,0.01238,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,1659.0,75.409091,0.138129,0.0,0.0,1.2e-05,No Rating,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,No Rating,0.009149,0.138129,293548000.0,3444.0,39950400000.0,40243950000.0,0.093025,0.000263,Relatively Low,249836.2,0.008284,96093.187933,345929.387933,84.614933,Relatively Moderate,0.000851,2e-06,88.224863,617937.316447,87.938211,Relatively Moderate,4.0,0.090976,0.138129,293556702.0,3444.0,39950400000.0,0.0,40243960000.0,1.581831e-07,4.956726e-09,7e-06,Very Low,4.2245,2e-06,18.015209,0.0,22.239709,4.572013,Very Low,1.439075e-08,4.50939e-10,0.0,4.320429,39.727027,7.533416,Very Low,78.0,4.829741,0.138129,293556702.0,3444.0,39950400000.0,0.0,40243960000.0,6.53204e-10,1.4959e-08,4.6e-05,Very Low,0.926111,0.000249,2886.328462,0.0,2887.254574,33.853959,Relatively Low,3.154795e-09,7.22478e-08,0.0,32.373112,5157.533315,40.336774,Relatively Low,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,Not Applicable,Not Applicable,Not Applicable,0.0,0.01,0.04654,77888840.0,895.579021,10388720000.0,10466610000.0,4.8e-05,9.928904e-08,Very Low,37.00583,8.892118e-07,10.314857,47.320687,42.625656,Very Low,1.260602e-07,2.58192e-10,43.577868,84.529442,44.148245,Relatively Low,34.0,1.54546,0.138129,293556702.0,3444.0,39950400000.0,40243960000.0,8.817994e-09,6.342172e-09,Relatively Moderate,4.000533,3.4e-05,391.575253,395.575787,9.391359,Very Low,1.362781e-08,9.801535e-09,8.582791,706.621203,12.292765,Very Low,106.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2e-06,8.6913e-07,0.003637,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,6.0,0.15411,0.138129,293556702.0,3444.0,39950400000.0,0.0,40243960000.0,7.585231e-09,2.891832e-08,1e-06,Very Low,0.343154,1.5e-05,178.042245,0.0,178.385399,8.730205,Very Low,1.168955e-09,4.456582e-09,0.0,9.35799,318.651722,10.587214,Very Low,0.0,4.5e-05,0.138129,293556702.0,3444.0,39950400000.0,0.0,40243960000.0,0.147727,0.00077,0.0,Relatively Moderate,1947.897302,0.000119,1382.63202,0.0,3330.529322,9.663653,Very Low,7e-06,3.460872e-08,0.0,13.592598,5949.359677,14.415164,Very Low,0.0,0.004501,0.0,0.0,0.0,0.0,0.0,1.3e-05,3e-06,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4,2e-05,6.595474e-07,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.138129,0.0,0.0,0.0,0.0,0.0,6.416375e-09,6.173231e-09,2e-12,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,March 2023,,,"In Census Tract 101221.0 (FIPS 6037101221.0), ...",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,
4,5582.0,T06037101222,California,CA,6.0,Los Angeles,County,37.0,6037.0,101222.0,6037101000.0,2808.0,330877313.0,0.0,0.11564,835539.3,65.220235,Relatively Moderate,27.300681,47.198018,Relatively Low,16.242038,455142.5,355166.1,0.008619,99976.409594,0.0,0.001073,3e-06,0.0,64.193109,76.861057,97.32,Very High,0.952888,15.44,Very Low,0.477817,2.471082,1.835775,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,2.7e-05,3.618018e-07,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.11564,0.0,0.0,0.0,0.0,0.0,1.186214e-07,8.7618e-08,0.01238,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,1659.0,75.409091,0.11564,0.0,0.0,1.2e-05,No Rating,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,No Rating,0.009149,0.11564,330868000.0,2808.0,32572800000.0,32903670000.0,0.116598,0.000322,Relatively Low,352954.9,0.008277,96015.959981,448970.859981,86.262536,Relatively Moderate,0.001067,3e-06,90.574723,824209.541966,89.813538,Relatively High,4.0,0.090975,0.11564,330877313.0,2808.0,32572800000.0,0.0,32903680000.0,1.581831e-07,4.956726e-09,7e-06,Very Low,4.761572,1e-06,14.688358,0.0,19.44993,3.713805,Very Low,1.439075e-08,4.50939e-10,0.0,5.469016,35.705698,6.680778,Very Low,78.0,4.829721,0.11564,330877313.0,2808.0,32572800000.0,0.0,32903680000.0,6.53204e-10,1.4959e-08,4.6e-05,Very Low,1.04385,0.000203,2353.313102,0.0,2354.356952,31.24222,Relatively Low,3.154795e-09,7.22478e-08,0.0,32.192263,4322.069956,37.661133,Relatively Low,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,Not Applicable,Not Applicable,Not Applicable,0.0,0.01,0.003118,10461660.0,62.390222,723726600.0,734188200.0,4.8e-05,9.928904e-08,Very Low,4.970449,6.194665e-08,0.718581,5.689031,39.734842,Very Low,1.502203e-08,2.2061e-11,39.928113,10.443781,40.356313,Very Low,34.0,1.545454,0.11564,330877313.0,2808.0,32572800000.0,32903680000.0,8.817994e-09,6.342172e-09,Relatively Moderate,4.509131,2.8e-05,319.263447,323.772578,8.020987,Very Low,1.362781e-08,9.801535e-09,8.576802,594.37365,10.832535,Very Low,106.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,2e-06,8.6913e-07,0.003637,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,6.0,0.154109,0.11564,330877313.0,2808.0,32572800000.0,0.0,32903680000.0,7.585231e-09,2.891832e-08,1e-06,Very Low,0.386781,1.3e-05,145.163363,0.0,145.550144,7.495797,Very Low,1.168955e-09,4.456582e-09,0.0,9.57313,267.197336,9.301717,Very Low,0.0,4.5e-05,0.11564,330877313.0,2808.0,32572800000.0,0.0,32903680000.0,0.147727,0.00077,0.0,Relatively Moderate,2195.538446,9.7e-05,1127.302762,0.0,3322.841208,9.635438,Very Low,7e-06,3.460872e-08,0.0,14.407308,6099.989274,14.775484,Very Low,0.0,0.004501,0.0,0.0,0.0,0.0,0.0,1.3e-05,3e-06,No Rating,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,Not Applicable,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.4,2e-05,6.595474e-07,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,0.0,0.0,0.11564,0.0,0.0,0.0,0.0,0.0,6.416375e-09,6.173231e-09,2e-12,No Rating,0.0,0.0,0.0,0.0,0.0,0.0,No Expected Annual Losses,0.0,0.0,0.0,0.0,0.0,0.0,No Rating,March 2023,,,"In Census Tract 101222.0 (FIPS 6037101222.0), ...",,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,


In [134]:
df_cleaned = final_merged_data.drop(columns='geometry', errors='ignore')  # Drop geometry column if you don't need it


In [135]:
# merging the sentences into a txt file


# taking the "sentence" column and joining all entries into a single text string, with each sentence on a newline
sentences = df_cleaned['sentence'].dropna()  # Remove any missing values
combined_text = "\n".join(sentences)

# saving the combined text into a .txt file
output_file_path = 'merged_sentences.txt'
with open(output_file_path, 'w') as file:
    file.write(combined_text)

# downloading the merged text file
from google.colab import files
files.download(output_file_path)

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>