# LIST ALL OBJECTS IN THE BUCKET

In [1]:
from google.cloud import storage


In [8]:
# Name of the Cloud Storage bucket that the listing cells below operate on.
bucket_name = "cgpdata"


In [9]:
def list_blobs(bucket_name):
    """Print the name of every blob stored in the given bucket.

    Args:
        bucket_name: Name of the bucket to enumerate, e.g. "your-bucket-name".

    Returns:
        None. Each blob name is written to standard output on its own line.
    """
    client = storage.Client()

    # Client.list_blobs is only available from package version 1.17.0 onwards.
    # The listing is lazy: no response comes back until the iterator is
    # consumed, which happens in the loop below.
    names = (entry.name for entry in client.list_blobs(bucket_name))
    for name in names:
        print(name)

In [10]:
# Print the name of every blob in the bucket configured above.
list_blobs(bucket_name)

2000-01-SPY_5min_alphavantage.csv
raw/
raw/2000-01-SPY_5min_alphavantage.csv
raw/yf-sp500/
raw/yf_sp500/25-03-SP500/2025-03-06.csv
s&p500_data_20250304.csv


## LIST OBJECTS WITH A PREFIX (i.e. folder name)

In [13]:

def list_blobs_with_prefix(bucket_name, prefix, delimiter=None):
    """Print the names of all blobs in the bucket that begin with the prefix.

    This can be used to list all blobs in a "folder", e.g. "public/".

    The delimiter argument can be used to restrict the results to only the
    "files" in the given "folder". Without the delimiter, the entire tree under
    the prefix is returned. For example, given these blobs:

        a/1.txt
        a/b/2.txt

    If you specify prefix='a/', without a delimiter, you'll get back:

        a/1.txt
        a/b/2.txt

    However, if you specify prefix='a/' and delimiter='/', you'll get back
    only the file directly under 'a/':

        a/1.txt

    As part of the response, you'll also get back a blobs.prefixes entity
    that lists the "subfolders" under `a/`:

        a/b/

    Args:
        bucket_name: Name of the bucket to list.
        prefix: Only blobs whose names start with this string are listed.
        delimiter: Optional separator (typically "/"). When given, only blobs
            directly under the prefix are listed and the "subfolder" prefixes
            are printed afterwards, in sorted order.

    Returns:
        None. A "Blobs:" section, and a "Prefixes:" section when a delimiter
        is given, are written to standard output.
    """

    storage_client = storage.Client()

    # Note: Client.list_blobs requires at least package version 1.17.0.
    blobs = storage_client.list_blobs(bucket_name, prefix=prefix, delimiter=delimiter)

    # Note: The call returns a response only when the iterator is consumed.
    print("Blobs:")
    for blob in blobs:
        print(blob.name)

    if delimiter:
        # Read the prefixes only after the loop above has consumed the
        # iterator. The client library gathers them in a set, so sort them to
        # keep the printed order stable from run to run. The loop variable is
        # deliberately not called `prefix`, to avoid shadowing the parameter.
        print("Prefixes:")
        for subfolder in sorted(blobs.prefixes):
            print(subfolder)


In [15]:
# The trailing slash limits the match to the "raw/" folder. A bare "raw" would
# also match any other object whose name merely starts with those letters.
prefix = "raw/"
list_blobs_with_prefix(bucket_name, prefix)

Blobs:
raw/
raw/2000-01-SPY_5min_alphavantage.csv
raw/yf_sp500/


In [23]:
# List everything under the "raw/yf_sp500/" folder. No delimiter is passed, so
# the entire tree below the prefix is printed, including nested "subfolders".
prefix = "raw/yf_sp500/"
list_blobs_with_prefix(bucket_name, prefix)

Blobs:
raw/yf_sp500/
raw/yf_sp500/25-03-SP500/2025-03-06.csv
raw/yf_sp500/25-03-SP500/placeholder.txt
