In [1]:
# Copyright 2025 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     https://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Analyzing a GEOGRAPHY column with `bigframes.geopandas.GeoSeries`

In [2]:
import bigframes
import bigframes.geopandas
import bigframes.pandas as bpd
# Set the progress-bar display option to None; per the BigQuery DataFrames
# display options this turns query progress bars off, keeping outputs clean.
bpd.options.display.progress_bar = None

### Load the Counties table from the Census Bureau US Boundaries dataset

In [3]:
# Fully qualified ID of the public US counties table used throughout.
COUNTIES_TABLE = "bigquery-public-data.geo_us_boundaries.counties"

# Load the table through BigQuery DataFrames.
df = bpd.read_gbq(COUNTIES_TABLE)



### Create a series from the int_point_geom column

In [4]:
# Select the interior-point geometry column as a series.
point_geom_series = df["int_point_geom"]

## The `GeoSeries` constructor accepts local data or a `bigframes.pandas.Series` object.

### 1. Create a GeoSeries from local data with `peek`

In [5]:
# Preview five rows as local data. Per the `peek` documentation the rows are
# arbitrary, so the exact points shown may differ between runs.
five_geo_points = point_geom_series.peek(n=5)
five_geo_points

37     POINT (-91.19496 39.98605)
406    POINT (-84.86717 33.92103)
926    POINT (-82.47974 35.33641)
940    POINT (-75.50298 39.09709)
996     POINT (-92.56434 39.8298)
Name: int_point_geom, dtype: geometry

### Convert the five geo points to `bigframes.geopandas.GeoSeries`

In [6]:
# Materialize the previewed points as a plain list (so the original row
# labels are dropped) and wrap them in a BigQuery DataFrames GeoSeries.
geo_points = bigframes.geopandas.GeoSeries(list(five_geo_points))
geo_points

0    POINT (-91.19496 39.98605)
1    POINT (-84.86717 33.92103)
2    POINT (-82.47974 35.33641)
3    POINT (-75.50298 39.09709)
4     POINT (-92.56434 39.8298)
dtype: geometry

### Retrieve the x (longitude) and y (latitude) from the GeoSeries with `.x` and `.y`.

#### Note: TypeError is raised if `.x` and `.y` are used with a geometry type other than `Point`.

### `.x`

In [7]:
# Show the x coordinate (longitude) of each point in the GeoSeries.
geo_points.x

0   -91.194961
1   -84.867169
2   -82.479741
3   -75.502982
4    -92.56434
dtype: Float64

### `.y`

In [8]:
# Show the y coordinate (latitude) of each point in the GeoSeries.
geo_points.y

0    39.986053
1     33.92103
2    35.336415
3    39.097088
4    39.829795
dtype: Float64

### 2. Alternatively, use the `.geo` accessor to access GeoSeries methods from a `bigframes.pandas.Series` object.

#### `geo.x`

In [9]:
# Same x lookup through the `.geo` accessor on the original series, without
# first converting it to a GeoSeries.
point_geom_series.geo.x

0    -101.298265
1     -99.111085
2      -66.58687
3    -102.601791
4     -71.578625
5     -88.961529
6     -87.492986
7     -82.422666
8    -100.208166
9     -85.815939
10   -101.681133
11   -119.516659
12    -89.398306
13    -107.78848
14    -91.159306
15   -113.887042
16    -83.470416
17    -98.520146
18    -83.911718
19    -87.321865
20    -91.727626
21    -93.466093
22   -101.143324
23    -78.657634
24    -94.272323
dtype: Float64

#### `geo.y`

In [10]:
# Same y lookup through the `.geo` accessor on the original series, without
# first converting it to a GeoSeries.
point_geom_series.geo.y

0     46.710819
1     29.353661
2     18.211152
3     38.835646
4     41.869768
5     39.860237
6     36.892059
7     38.143642
8     34.524623
9     30.862007
10    40.180165
11    46.228125
12    36.054196
13    38.154731
14    38.761902
15    44.928506
16    30.447232
17    29.448671
18    42.602532
19    34.529776
20    33.957675
21    42.037538
22    29.875285
23    36.299884
24    44.821657
dtype: Float64

## Retrieve the `area` of different geometry shapes.

### 1. Create a geometry collection from local data with `peek`

In [11]:
# Preview five county boundary geometries as local data. Per the `peek`
# documentation the rows are arbitrary, so they may differ between runs.
geom_series = df["county_geom"].peek(n=5)
geom_series

10     POLYGON ((-101.7778 40.34969, -101.77812 40.34...
127    POLYGON ((-89.22333 44.50398, -89.22334 44.499...
253    POLYGON ((-76.69446 37.07288, -76.69515 37.072...
261    POLYGON ((-98.70136 44.45055, -98.70136 44.450...
303    POLYGON ((-85.99565 30.28131, -85.99566 30.280...
Name: county_geom, dtype: geometry

### Convert the geometry collection to `bigframes.geopandas.GeoSeries`

In [12]:
# Materialize the previewed county geometries as a plain list (so the original
# row labels are dropped) and wrap them in a BigQuery DataFrames GeoSeries.
five_geom = bigframes.geopandas.GeoSeries(list(geom_series))
five_geom

0    POLYGON ((-101.7778 40.34969, -101.77812 40.34...
1    POLYGON ((-89.22333 44.50398, -89.22334 44.499...
2    POLYGON ((-76.69446 37.07288, -76.69515 37.072...
3    POLYGON ((-98.70136 44.45055, -98.70136 44.450...
4    POLYGON ((-85.99565 30.28131, -85.99566 30.280...
dtype: geometry

## Note: `bigframes.geopandas.GeoSeries.area` raises NotImplementedError.  

In [13]:
# `GeoSeries.area` is deliberately unsupported and raises NotImplementedError.
# The error is the point of this cell, so catch it and print its message
# instead of letting it halt a "Restart & Run All" of the notebook.
try:
    five_geom.area
except NotImplementedError as exc:
    print(f"{type(exc).__name__}: {exc}")

NotImplementedError: GeoSeries.area is not supported. Use bigframes.bigquery.st_area(series), instead. Share your usecase with the BigQuery DataFrames team at the https://bit.ly/bigframes-feedback survey.You are currently running BigFrames version 1.34.0

## Use `bigframes.bigquery.st_area` to retrieve the `area` in square meters instead. See: https://cloud.google.com/bigquery/docs/reference/standard-sql/geography_functions#st_area

In [14]:
import bigframes.bigquery as bbq

In [15]:
# Compute the area of each geometry with the ST_AREA wrapper; the result is
# in square meters (see the BigQuery ST_AREA reference).
geom_area = bbq.st_area(five_geom)
geom_area

0     2382382043.48891
1     1977633097.26862
2     939388839.499466
3    3269015229.381782
4    2678752241.321673
dtype: Float64