# American Community Survey (ACS) 5-Year Data

See https://www.census.gov/data/developers/data-sets/acs-5year.html.

In [1]:
# So we can run from within the censusdis project and find the packages we need.
import os
import sys

# The directory to expose is two levels above the current working directory.
# (Previously this was wrapped in a single-argument os.path.join, which is a no-op.)
_project_root = os.path.abspath(
    os.path.join(os.path.curdir, os.path.pardir, os.path.pardir)
)

# Guard the append so that re-running this cell does not pile up duplicate
# entries on sys.path.
if _project_root not in sys.path:
    sys.path.append(_project_root)

In [2]:
import censusdis.data as ced

## ACS 5-Year Detailed Tables

In [3]:
# Query parameters for this section: the ACS 5-Year Detailed Tables, 2019.
YEAR = 2019
DATASET = "acs/acs5"

### What groups are in the dataset?

In [4]:
# List the groups available in DATASET for YEAR, then preview the first rows.
groups = ced.variables.all_groups(DATASET, YEAR)
groups.head()

Unnamed: 0,DATASET,YEAR,GROUP,DESCRIPTION
0,acs/acs5,2019,B01001,SEX BY AGE
1,acs/acs5,2019,B01001A,SEX BY AGE (WHITE ALONE)
2,acs/acs5,2019,B01001B,SEX BY AGE (BLACK OR AFRICAN AMERICAN ALONE)
3,acs/acs5,2019,B01001C,SEX BY AGE (AMERICAN INDIAN AND ALASKA NATIVE ...
4,acs/acs5,2019,B01001D,SEX BY AGE (ASIAN ALONE)


### What variables are in the first group?

In [5]:
# Pick the group code from the first row of the group listing ...
group = groups["GROUP"].iloc[0]

# ... and show the variables that belong to that group.
ced.variables.all_variables(DATASET, YEAR, group)

Unnamed: 0,YEAR,DATASET,GROUP,VARIABLE,LABEL,SUGGESTED_WEIGHT,VALUES
0,2019,acs/acs5,B01001,B01001_001E,Estimate!!Total:,,
1,2019,acs/acs5,B01001,B01001_002E,Estimate!!Total:!!Male:,,
2,2019,acs/acs5,B01001,B01001_003E,Estimate!!Total:!!Male:!!Under 5 years,,
3,2019,acs/acs5,B01001,B01001_004E,Estimate!!Total:!!Male:!!5 to 9 years,,
4,2019,acs/acs5,B01001,B01001_005E,Estimate!!Total:!!Male:!!10 to 14 years,,
5,2019,acs/acs5,B01001,B01001_006E,Estimate!!Total:!!Male:!!15 to 17 years,,
6,2019,acs/acs5,B01001,B01001_007E,Estimate!!Total:!!Male:!!18 and 19 years,,
7,2019,acs/acs5,B01001,B01001_008E,Estimate!!Total:!!Male:!!20 years,,
8,2019,acs/acs5,B01001,B01001_009E,Estimate!!Total:!!Male:!!21 years,,
9,2019,acs/acs5,B01001,B01001_010E,Estimate!!Total:!!Male:!!22 to 24 years,,


In [6]:
# Echo the group code selected above so it appears in the cell output.
group

'B01001'

### What variables in the first group are leaves of the tree?

In [7]:
# Collect the leaf variables of the selected group.
# Per the recorded output, non-leaf entries such as B01001_001E and
# B01001_002E are not part of this result.
leaves = ced.variables.group_leaves(DATASET, YEAR, group)

# Render the result as a single string for display.
str(leaves)

"['B01001_003E', 'B01001_004E', 'B01001_005E', 'B01001_006E', 'B01001_007E', 'B01001_008E', 'B01001_009E', 'B01001_010E', 'B01001_011E', 'B01001_012E', 'B01001_013E', 'B01001_014E', 'B01001_015E', 'B01001_016E', 'B01001_017E', 'B01001_018E', 'B01001_019E', 'B01001_020E', 'B01001_021E', 'B01001_022E', 'B01001_023E', 'B01001_024E', 'B01001_025E', 'B01001_027E', 'B01001_028E', 'B01001_029E', 'B01001_030E', 'B01001_031E', 'B01001_032E', 'B01001_033E', 'B01001_034E', 'B01001_035E', 'B01001_036E', 'B01001_037E', 'B01001_038E', 'B01001_039E', 'B01001_040E', 'B01001_041E', 'B01001_042E', 'B01001_043E', 'B01001_044E', 'B01001_045E', 'B01001_046E', 'B01001_047E', 'B01001_048E', 'B01001_049E']"

### All variables in the first group as a list

In [8]:
# Collect every variable in the selected group (leaves and non-leaves alike,
# judging by the recorded output).
variables = ced.variables.group_variables(DATASET, YEAR, group)

# Render the result as a single string for display.
str(variables)

"['B01001_001E', 'B01001_002E', 'B01001_003E', 'B01001_004E', 'B01001_005E', 'B01001_006E', 'B01001_007E', 'B01001_008E', 'B01001_009E', 'B01001_010E', 'B01001_011E', 'B01001_012E', 'B01001_013E', 'B01001_014E', 'B01001_015E', 'B01001_016E', 'B01001_017E', 'B01001_018E', 'B01001_019E', 'B01001_020E', 'B01001_021E', 'B01001_022E', 'B01001_023E', 'B01001_024E', 'B01001_025E', 'B01001_026E', 'B01001_027E', 'B01001_028E', 'B01001_029E', 'B01001_030E', 'B01001_031E', 'B01001_032E', 'B01001_033E', 'B01001_034E', 'B01001_035E', 'B01001_036E', 'B01001_037E', 'B01001_038E', 'B01001_039E', 'B01001_040E', 'B01001_041E', 'B01001_042E', 'B01001_043E', 'B01001_044E', 'B01001_045E', 'B01001_046E', 'B01001_047E', 'B01001_048E', 'B01001_049E']"

### Download data for the leaf variables

In [9]:
# Download the leaf variables for DATASET/YEAR.
# NOTE(review): state="*" presumably requests every state (the recorded
# preview is keyed by a STATE column) -- confirm against the censusdis docs.
df_data = ced.download(DATASET, YEAR, leaves, state="*")

In [10]:
# Preview the first rows of the downloaded data.
df_data.head()

Unnamed: 0,STATE,B01001_003E,B01001_004E,B01001_005E,B01001_006E,B01001_007E,B01001_008E,B01001_009E,B01001_010E,B01001_011E,...,B01001_040E,B01001_041E,B01001_042E,B01001_043E,B01001_044E,B01001_045E,B01001_046E,B01001_047E,B01001_048E,B01001_049E
0,1,149090,153494,158617,98257,64980,35870,35040,95065,165052,...,166787,174087,69293,96727,59558,83413,113624,82251,59420,56419
1,2,27062,26776,25921,15200,9746,6154,6029,19262,33136,...,22294,24504,9531,11786,6658,9489,11121,5978,4381,3981
2,4,221817,228224,241782,142358,99160,53415,52100,149020,260409,...,214302,222592,89972,131135,85291,121138,166001,121595,77798,78983
3,5,96986,100270,101442,61421,41658,23070,21553,59319,100466,...,96411,100562,40560,56728,35669,49920,69390,49857,35058,37257
4,6,1254607,1257974,1318355,779960,529837,295438,285103,839739,1591508,...,1275929,1264187,490110,668292,409644,556798,729375,518080,382536,451736


## ACS 5-Year Subject Tables

In [11]:
# Query parameters for this section: the ACS 5-Year Subject Tables, 2019.
YEAR = 2019
DATASET = "acs/acs5/subject"

### What groups are in the dataset?

In [12]:
# List the groups available in the subject-table DATASET for YEAR, then
# preview the first rows.
groups = ced.variables.all_groups(DATASET, YEAR)
groups.head()

Unnamed: 0,DATASET,YEAR,GROUP,DESCRIPTION
0,acs/acs5/subject,2019,S0101,AGE AND SEX
1,acs/acs5/subject,2019,S0102,POPULATION 60 YEARS AND OVER IN THE UNITED STATES
2,acs/acs5/subject,2019,S0102PR,POPULATION 60 YEARS AND OVER IN PUERTO RICO
3,acs/acs5/subject,2019,S0103,POPULATION 65 YEARS AND OVER IN THE UNITED STATES
4,acs/acs5/subject,2019,S0103PR,POPULATION 65 YEARS AND OVER IN PUERTO RICO


### What variables are in the first group?

In [13]:
# Pick the group code from the first row of the group listing ...
group = groups["GROUP"].iloc[0]

# ... and show the variables that belong to that group.
ced.variables.all_variables(DATASET, YEAR, group)

Unnamed: 0,YEAR,DATASET,GROUP,VARIABLE,LABEL,SUGGESTED_WEIGHT,VALUES
0,2019,acs/acs5/subject,S0101,S0101_C01_001E,Estimate!!Total!!Total population,,
1,2019,acs/acs5/subject,S0101,S0101_C01_002E,Estimate!!Total!!Total population!!AGE!!Under ...,,
2,2019,acs/acs5/subject,S0101,S0101_C01_003E,Estimate!!Total!!Total population!!AGE!!5 to 9...,,
3,2019,acs/acs5/subject,S0101,S0101_C01_004E,Estimate!!Total!!Total population!!AGE!!10 to ...,,
4,2019,acs/acs5/subject,S0101,S0101_C01_005E,Estimate!!Total!!Total population!!AGE!!15 to ...,,
...,...,...,...,...,...,...,...
223,2019,acs/acs5/subject,S0101,S0101_C06_034E,Estimate!!Percent Female!!Total population!!SU...,,
224,2019,acs/acs5/subject,S0101,S0101_C06_035E,Estimate!!Percent Female!!Total population!!SU...,,
225,2019,acs/acs5/subject,S0101,S0101_C06_036E,Estimate!!Percent Female!!Total population!!SU...,,
226,2019,acs/acs5/subject,S0101,S0101_C06_037E,Estimate!!Percent Female!!Total population!!PE...,,


### What variables are in the first group (as a tree)?

In [14]:
# Display the selected group's variables; the recorded output is an indented
# tree with the variable code in parentheses after each label.
ced.variables.group_tree(DATASET, YEAR, group)

+ Estimate
    + Total
        + Total population (S0101_C01_001E)
            + AGE
                + Under 5 years (S0101_C01_002E)
                + 5 to 9 years (S0101_C01_003E)
                + 10 to 14 years (S0101_C01_004E)
                + 15 to 19 years (S0101_C01_005E)
                + 20 to 24 years (S0101_C01_006E)
                + 25 to 29 years (S0101_C01_007E)
                + 30 to 34 years (S0101_C01_008E)
                + 35 to 39 years (S0101_C01_009E)
                + 40 to 44 years (S0101_C01_010E)
                + 45 to 49 years (S0101_C01_011E)
                + 50 to 54 years (S0101_C01_012E)
                + 55 to 59 years (S0101_C01_013E)
                + 60 to 64 years (S0101_C01_014E)
                + 65 to 69 years (S0101_C01_015E)
                + 70 to 74 years (S0101_C01_016E)
                + 75 to 79 years (S0101_C01_017E)
                + 80 to 84 years (S0101_C01_018E)
                + 85 years and over (S0101_C01_019E)
            + S

### What variables in the first group are leaves of the tree?

In [15]:
# Collect the leaf variables of the selected subject-table group.
leaves = ced.variables.group_leaves(DATASET, YEAR, group)

# Render the result as a single string for display.
str(leaves)

"['S0101_C01_002E', 'S0101_C01_003E', 'S0101_C01_004E', 'S0101_C01_005E', 'S0101_C01_006E', 'S0101_C01_007E', 'S0101_C01_008E', 'S0101_C01_009E', 'S0101_C01_010E', 'S0101_C01_011E', 'S0101_C01_012E', 'S0101_C01_013E', 'S0101_C01_014E', 'S0101_C01_015E', 'S0101_C01_016E', 'S0101_C01_017E', 'S0101_C01_018E', 'S0101_C01_019E', 'S0101_C01_020E', 'S0101_C01_021E', 'S0101_C01_022E', 'S0101_C01_023E', 'S0101_C01_024E', 'S0101_C01_025E', 'S0101_C01_026E', 'S0101_C01_027E', 'S0101_C01_028E', 'S0101_C01_029E', 'S0101_C01_030E', 'S0101_C01_031E', 'S0101_C01_032E', 'S0101_C01_033E', 'S0101_C01_034E', 'S0101_C01_035E', 'S0101_C01_036E', 'S0101_C01_037E', 'S0101_C01_038E', 'S0101_C02_002E', 'S0101_C02_003E', 'S0101_C02_004E', 'S0101_C02_005E', 'S0101_C02_006E', 'S0101_C02_007E', 'S0101_C02_008E', 'S0101_C02_009E', 'S0101_C02_010E', 'S0101_C02_011E', 'S0101_C02_012E', 'S0101_C02_013E', 'S0101_C02_014E', 'S0101_C02_015E', 'S0101_C02_016E', 'S0101_C02_017E', 'S0101_C02_018E', 'S0101_C02_019E', 'S0101_C

### All variables in the first group as a list

In [16]:
# Collect every variable in the selected subject-table group.
variables = ced.variables.group_variables(DATASET, YEAR, group)

# Render the result as a single string for display.
str(variables)

"['S0101_C01_001E', 'S0101_C01_002E', 'S0101_C01_003E', 'S0101_C01_004E', 'S0101_C01_005E', 'S0101_C01_006E', 'S0101_C01_007E', 'S0101_C01_008E', 'S0101_C01_009E', 'S0101_C01_010E', 'S0101_C01_011E', 'S0101_C01_012E', 'S0101_C01_013E', 'S0101_C01_014E', 'S0101_C01_015E', 'S0101_C01_016E', 'S0101_C01_017E', 'S0101_C01_018E', 'S0101_C01_019E', 'S0101_C01_020E', 'S0101_C01_021E', 'S0101_C01_022E', 'S0101_C01_023E', 'S0101_C01_024E', 'S0101_C01_025E', 'S0101_C01_026E', 'S0101_C01_027E', 'S0101_C01_028E', 'S0101_C01_029E', 'S0101_C01_030E', 'S0101_C01_031E', 'S0101_C01_032E', 'S0101_C01_033E', 'S0101_C01_034E', 'S0101_C01_035E', 'S0101_C01_036E', 'S0101_C01_037E', 'S0101_C01_038E', 'S0101_C02_001E', 'S0101_C02_002E', 'S0101_C02_003E', 'S0101_C02_004E', 'S0101_C02_005E', 'S0101_C02_006E', 'S0101_C02_007E', 'S0101_C02_008E', 'S0101_C02_009E', 'S0101_C02_010E', 'S0101_C02_011E', 'S0101_C02_012E', 'S0101_C02_013E', 'S0101_C02_014E', 'S0101_C02_015E', 'S0101_C02_016E', 'S0101_C02_017E', 'S0101_C

### Download data for the leaf variables

In [17]:
# Download the leaf variables for the subject-table DATASET/YEAR.
# This rebinds df_data, replacing the frame downloaded in the previous section.
# NOTE(review): state="*" presumably requests every state -- confirm against
# the censusdis docs.
df_data = ced.download(DATASET, YEAR, leaves, state="*")

In [18]:
# Preview the first rows of the downloaded data.
# NOTE(review): the recorded output shows -888888888 in several trailing
# columns; that looks like a sentinel/annotation code rather than a real
# estimate -- confirm against the Census documentation before using them.
df_data.head()

Unnamed: 0,STATE,S0101_C01_002E,S0101_C01_003E,S0101_C01_004E,S0101_C01_005E,S0101_C01_006E,S0101_C01_007E,S0101_C01_008E,S0101_C01_009E,S0101_C01_010E,...,S0101_C06_029E,S0101_C06_030E,S0101_C06_031E,S0101_C06_032E,S0101_C06_033E,S0101_C06_034E,S0101_C06_035E,S0101_C06_036E,S0101_C06_037E,S0101_C06_038E
0,1,293187,301064,310456,322486,328180,332622,305325,300441,295947,...,21.9,18.1,7.9,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888
1,2,53237,52810,49269,46704,54462,62205,57119,50772,42612,...,15.2,11.8,4.1,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888
2,4,433968,450570,471732,473352,488145,501361,463586,443641,423147,...,22.1,18.4,7.9,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888
3,5,189636,196874,197804,201105,202312,202000,189817,187837,180620,...,21.9,18.1,8.0,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888
4,6,2451528,2468226,2575463,2565170,2751567,3078492,2889372,2681376,2524511,...,18.8,15.4,6.8,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888,-888888888


## ACS 5-Year Data Profiles

In [19]:
# Query parameters for this section: the ACS 5-Year Data Profiles, 2019.
YEAR = 2019
DATASET = "acs/acs5/profile"

### What groups are in the dataset?

In [20]:
# List the groups available in the data-profile DATASET for YEAR, then
# preview the first rows.
groups = ced.variables.all_groups(DATASET, YEAR)
groups.head()

Unnamed: 0,DATASET,YEAR,GROUP,DESCRIPTION
0,acs/acs5/profile,2019,DP02,SELECTED SOCIAL CHARACTERISTICS IN THE UNITED ...
1,acs/acs5/profile,2019,DP02PR,SELECTED SOCIAL CHARACTERISTICS IN PUERTO RICO
2,acs/acs5/profile,2019,DP03,SELECTED ECONOMIC CHARACTERISTICS
3,acs/acs5/profile,2019,DP04,SELECTED HOUSING CHARACTERISTICS
4,acs/acs5/profile,2019,DP05,ACS DEMOGRAPHIC AND HOUSING ESTIMATES


### What variables are in the first group (as a tree)?

In [21]:
# Pick the group code from the first row of the group listing ...
group = groups["GROUP"].iloc[0]

# ... and display that group's variables as a tree.
ced.variables.group_tree(DATASET, YEAR, group)

+ Estimate
    + HOUSEHOLDS BY TYPE
        + Total households (DP02_0001E)
            + Married-couple family (DP02_0002E)
                + With own children of the householder under 18 years (DP02_0003E)
            + Cohabiting couple household (DP02_0004E)
                + With own children of the householder under 18 years (DP02_0005E)
            + Male householder, no spouse/partner present (DP02_0006E)
                + With own children of the householder under 18 years (DP02_0007E)
                + Householder living alone (DP02_0008E)
                    + 65 years and over (DP02_0009E)
            + Female householder, no spouse/partner present (DP02_0010E)
                + With own children of the householder under 18 years (DP02_0011E)
                + Householder living alone (DP02_0012E)
                    + 65 years and over (DP02_0013E)
            + Households with one or more people under 18 years (DP02_0014E)
            + Households with one or more people 

### What variables in the first group are leaves of the tree?

In [22]:
# Collect the leaf variables of the selected data-profile group.
# Per the recorded output, each leaf appears in three variants with the
# suffixes E, PE and PM.
leaves = ced.variables.group_leaves(DATASET, YEAR, group)

# Render the result as a single string for display.
str(leaves)

"['DP02_0003E', 'DP02_0003PE', 'DP02_0003PM', 'DP02_0005E', 'DP02_0005PE', 'DP02_0005PM', 'DP02_0007E', 'DP02_0007PE', 'DP02_0007PM', 'DP02_0009E', 'DP02_0009PE', 'DP02_0009PM', 'DP02_0011E', 'DP02_0011PE', 'DP02_0011PM', 'DP02_0013E', 'DP02_0013PE', 'DP02_0013PM', 'DP02_0014E', 'DP02_0014PE', 'DP02_0014PM', 'DP02_0015E', 'DP02_0015PE', 'DP02_0015PM', 'DP02_0016E', 'DP02_0016PE', 'DP02_0016PM', 'DP02_0017E', 'DP02_0017PE', 'DP02_0017PM', 'DP02_0019E', 'DP02_0019PE', 'DP02_0019PM', 'DP02_0020E', 'DP02_0020PE', 'DP02_0020PM', 'DP02_0021E', 'DP02_0021PE', 'DP02_0021PM', 'DP02_0022E', 'DP02_0022PE', 'DP02_0022PM', 'DP02_0023E', 'DP02_0023PE', 'DP02_0023PM', 'DP02_0024E', 'DP02_0024PE', 'DP02_0024PM', 'DP02_0026E', 'DP02_0026PE', 'DP02_0026PM', 'DP02_0027E', 'DP02_0027PE', 'DP02_0027PM', 'DP02_0028E', 'DP02_0028PE', 'DP02_0028PM', 'DP02_0029E', 'DP02_0029PE', 'DP02_0029PM', 'DP02_0030E', 'DP02_0030PE', 'DP02_0030PM', 'DP02_0032E', 'DP02_0032PE', 'DP02_0032PM', 'DP02_0033E', 'DP02_0033PE', '

### All variables in the first group as a list

In [23]:
# Collect every variable in the selected data-profile group.
variables = ced.variables.group_variables(DATASET, YEAR, group)

# Render the result as a single string for display.
str(variables)

"['DP02_0001E', 'DP02_0001PE', 'DP02_0001PM', 'DP02_0002E', 'DP02_0002PE', 'DP02_0002PM', 'DP02_0003E', 'DP02_0003PE', 'DP02_0003PM', 'DP02_0004E', 'DP02_0004PE', 'DP02_0004PM', 'DP02_0005E', 'DP02_0005PE', 'DP02_0005PM', 'DP02_0006E', 'DP02_0006PE', 'DP02_0006PM', 'DP02_0007E', 'DP02_0007PE', 'DP02_0007PM', 'DP02_0008E', 'DP02_0008PE', 'DP02_0008PM', 'DP02_0009E', 'DP02_0009PE', 'DP02_0009PM', 'DP02_0010E', 'DP02_0010PE', 'DP02_0010PM', 'DP02_0011E', 'DP02_0011PE', 'DP02_0011PM', 'DP02_0012E', 'DP02_0012PE', 'DP02_0012PM', 'DP02_0013E', 'DP02_0013PE', 'DP02_0013PM', 'DP02_0014E', 'DP02_0014PE', 'DP02_0014PM', 'DP02_0015E', 'DP02_0015PE', 'DP02_0015PM', 'DP02_0016E', 'DP02_0016PE', 'DP02_0016PM', 'DP02_0017E', 'DP02_0017PE', 'DP02_0017PM', 'DP02_0018E', 'DP02_0018PE', 'DP02_0018PM', 'DP02_0019E', 'DP02_0019PE', 'DP02_0019PM', 'DP02_0020E', 'DP02_0020PE', 'DP02_0020PM', 'DP02_0021E', 'DP02_0021PE', 'DP02_0021PM', 'DP02_0022E', 'DP02_0022PE', 'DP02_0022PM', 'DP02_0023E', 'DP02_0023PE', '

### Download data for the leaf variables

In [24]:
# Download the leaf variables for the data-profile DATASET/YEAR.
# This rebinds df_data, replacing the frame downloaded in the previous section.
# NOTE(review): state="*" presumably requests every state -- confirm against
# the censusdis docs.
df_data = ced.download(DATASET, YEAR, leaves, state="*")

In [25]:
# Preview the first rows of the downloaded data.
df_data.head()

Unnamed: 0,STATE,DP02_0003E,DP02_0003PE,DP02_0003PM,DP02_0005E,DP02_0005PE,DP02_0005PM,DP02_0007E,DP02_0007PE,DP02_0007PM,...,DP02_0149PM,DP02_0150E,DP02_0150PE,DP02_0150PM,DP02_0152E,DP02_0152PE,DP02_0152PM,DP02_0153E,DP02_0153PE,DP02_0153PM
0,1,313139.0,16.8,0.2,27962.0,1.5,0.1,21350.0,1.1,0.1,...,0.1,10863.0,0.2,0.1,1597441.0,85.5,0.2,1427054.0,76.4,0.3
1,2,54017.0,21.3,0.5,7026.0,2.8,0.2,5114.0,2.0,0.2,...,0.1,1486.0,0.2,0.1,238412.0,94.1,0.3,216709.0,85.5,0.5
2,4,455721.0,17.7,0.2,67207.0,2.6,0.1,37798.0,1.5,0.1,...,0.1,11545.0,0.2,0.1,2357063.0,91.7,0.1,2161674.0,84.1,0.2
3,5,206986.0,17.9,0.2,23363.0,2.0,0.1,15912.0,1.4,0.1,...,0.1,3538.0,0.1,0.1,998207.0,86.2,0.2,845966.0,73.0,0.4
4,6,2801975.0,21.5,0.1,331408.0,2.5,0.1,171733.0,1.3,0.1,...,0.1,89482.0,0.2,0.1,12131484.0,93.0,0.1,11303564.0,86.7,0.1


## ACS 5-Year Comparison Profiles

In [26]:
# Query parameters for this section: the ACS 5-Year Comparison Profiles, 2019.
YEAR = 2019
DATASET = "acs/acs5/cprofile"

### What groups are in the dataset?

In [27]:
# List the groups available in the comparison-profile DATASET for YEAR, then
# preview the first rows.
groups = ced.variables.all_groups(DATASET, YEAR)
groups.head()

Unnamed: 0,DATASET,YEAR,GROUP,DESCRIPTION
0,acs/acs5/cprofile,2019,CP02,COMPARATIVE SOCIAL CHARACTERISTICS IN THE UNIT...
1,acs/acs5/cprofile,2019,CP02PR,COMPARATIVE SOCIAL CHARACTERISTICS IN PUERTO RICO
2,acs/acs5/cprofile,2019,CP03,COMPARATIVE ECONOMIC CHARACTERISTICS
3,acs/acs5/cprofile,2019,CP04,COMPARATIVE HOUSING CHARACTERISTICS
4,acs/acs5/cprofile,2019,CP05,COMPARATIVE DEMOGRAPHIC ESTIMATES


### What variables are in the first group (as a tree)?

In [28]:
# Pick the group code from the first row of the group listing ...
group = groups["GROUP"].iloc[0]

# ... and display that group's variables as a tree.
ced.variables.group_tree(DATASET, YEAR, group)

+ 2010-2014 Estimates
    + HOUSEHOLDS BY TYPE
        + Total households (CP02_2014_001E)
            + Married-couple family (CP02_2014_002E)
                + With own children of the householder under 18 years (CP02_2014_003E)
            + Cohabiting couple household (CP02_2014_004E)
                + With own children of the householder under 18 years (CP02_2014_005E)
            + Male householder, no spouse/partner present (CP02_2014_006E)
                + With own children of the householder under 18 years (CP02_2014_007E)
                + Householder living alone (CP02_2014_008E)
                    + 65 years and over (CP02_2014_009E)
            + Female householder, no spouse/partner present (CP02_2014_010E)
                + With own children of the householder under 18 years (CP02_2014_011E)
                + Householder living alone (CP02_2014_012E)
                    + 65 years and over (CP02_2014_013E)
            + Households with one or more people under 18 years

### What variables in the first group are leaves of the tree?

In [29]:
# Collect the leaf variables of the selected comparison-profile group.
leaves = ced.variables.group_leaves(DATASET, YEAR, group)

# Render the result as a single string for display.
str(leaves)

"['CP02_2014_003E', 'CP02_2014_005E', 'CP02_2014_007E', 'CP02_2014_009E', 'CP02_2014_011E', 'CP02_2014_013E', 'CP02_2014_014E', 'CP02_2014_015E', 'CP02_2014_016E', 'CP02_2014_017E', 'CP02_2014_019E', 'CP02_2014_020E', 'CP02_2014_021E', 'CP02_2014_022E', 'CP02_2014_023E', 'CP02_2014_024E', 'CP02_2014_026E', 'CP02_2014_027E', 'CP02_2014_028E', 'CP02_2014_029E', 'CP02_2014_030E', 'CP02_2014_032E', 'CP02_2014_033E', 'CP02_2014_034E', 'CP02_2014_035E', 'CP02_2014_036E', 'CP02_2014_039E', 'CP02_2014_040E', 'CP02_2014_041E', 'CP02_2014_042E', 'CP02_2014_043E', 'CP02_2014_045E', 'CP02_2014_046E', 'CP02_2014_047E', 'CP02_2014_048E', 'CP02_2014_049E', 'CP02_2014_051E', 'CP02_2014_052E', 'CP02_2014_054E', 'CP02_2014_055E', 'CP02_2014_056E', 'CP02_2014_057E', 'CP02_2014_058E', 'CP02_2014_060E', 'CP02_2014_061E', 'CP02_2014_062E', 'CP02_2014_063E', 'CP02_2014_064E', 'CP02_2014_065E', 'CP02_2014_066E', 'CP02_2014_067E', 'CP02_2014_068E', 'CP02_2014_070E', 'CP02_2014_072E', 'CP02_2014_074E', 'CP02_20

### All variables in the first group as a list

In [30]:
# Collect every variable in the selected comparison-profile group.
variables = ced.variables.group_variables(DATASET, YEAR, group)

# Render the result as a single string for display.
str(variables)

"['CP02_2014_001E', 'CP02_2014_002E', 'CP02_2014_003E', 'CP02_2014_004E', 'CP02_2014_005E', 'CP02_2014_006E', 'CP02_2014_007E', 'CP02_2014_008E', 'CP02_2014_009E', 'CP02_2014_010E', 'CP02_2014_011E', 'CP02_2014_012E', 'CP02_2014_013E', 'CP02_2014_014E', 'CP02_2014_015E', 'CP02_2014_016E', 'CP02_2014_017E', 'CP02_2014_018E', 'CP02_2014_019E', 'CP02_2014_020E', 'CP02_2014_021E', 'CP02_2014_022E', 'CP02_2014_023E', 'CP02_2014_024E', 'CP02_2014_025E', 'CP02_2014_026E', 'CP02_2014_027E', 'CP02_2014_028E', 'CP02_2014_029E', 'CP02_2014_030E', 'CP02_2014_031E', 'CP02_2014_032E', 'CP02_2014_033E', 'CP02_2014_034E', 'CP02_2014_035E', 'CP02_2014_036E', 'CP02_2014_037E', 'CP02_2014_038E', 'CP02_2014_039E', 'CP02_2014_040E', 'CP02_2014_041E', 'CP02_2014_042E', 'CP02_2014_043E', 'CP02_2014_044E', 'CP02_2014_045E', 'CP02_2014_046E', 'CP02_2014_047E', 'CP02_2014_048E', 'CP02_2014_049E', 'CP02_2014_050E', 'CP02_2014_051E', 'CP02_2014_052E', 'CP02_2014_053E', 'CP02_2014_054E', 'CP02_2014_055E', 'CP02_20

### Download data for the leaf variables

In [31]:
# Download the leaf variables for the comparison-profile DATASET/YEAR.
# This rebinds df_data, replacing the frame downloaded in the previous section.
# NOTE(review): state="*" presumably requests every state -- confirm against
# the censusdis docs.
df_data = ced.download(DATASET, YEAR, leaves, state="*")

In [32]:
# Preview the first rows of the downloaded data; per the recorded output the
# columns run from CP02_2014_* through CP02_2019_* variables.
df_data.head()

Unnamed: 0,STATE,CP02_2014_003E,CP02_2014_005E,CP02_2014_007E,CP02_2014_009E,CP02_2014_011E,CP02_2014_013E,CP02_2014_014E,CP02_2014_015E,CP02_2014_016E,...,CP02_2019_143E,CP02_2019_144E,CP02_2019_145E,CP02_2019_146E,CP02_2019_147E,CP02_2019_148E,CP02_2019_149E,CP02_2019_150E,CP02_2019_152E,CP02_2019_153E
0,1,17.5,1.4,1.2,3.0,7.4,7.4,31.8,27.0,2.55,...,1.8,0.0,1.0,0.3,0.1,0.1,0.4,0.2,85.5,76.4
1,2,22.5,3.2,1.9,2.4,5.5,3.6,36.2,17.6,2.79,...,2.3,0.1,0.8,2.0,0.4,0.4,0.8,0.2,94.1,85.5
2,4,18.4,2.7,1.6,3.2,5.8,6.6,32.2,28.2,2.69,...,1.7,0.1,0.7,1.4,0.2,0.2,0.6,0.2,91.7,84.1
3,5,18.2,1.9,1.5,3.1,6.6,7.4,32.1,27.2,2.53,...,1.7,0.0,0.6,0.5,0.2,0.1,0.5,0.1,86.2,73.0
4,6,22.5,2.7,1.4,2.7,5.7,6.0,36.5,25.6,2.95,...,1.2,0.1,0.7,0.9,0.3,0.3,0.4,0.2,93.0,86.7
