# Canonada usage example notebook

Notebooks are a great way to explore and experiment with data. Canonada lets you use all of its catalog and pipeline features in a notebook environment.

In [1]:
import os
import canonada.catalog as catalog

# Import project defined pipelines and systems.
# The working directory is moved one level up before importing `pipelines`
# and `systems` (presumably they live in the notebook's parent directory).
# The starting directory is remembered on the first run so that re-running
# this cell in the same kernel does not climb one more level each time.
if "NOTEBOOK_DIR" not in globals():
    NOTEBOOK_DIR = os.getcwd()
os.chdir(os.path.join(NOTEBOOK_DIR, os.pardir))
import pipelines
import systems

## Let's showcase some of the catalog features

In [2]:
# Show what `catalog.ls()` reports as the available catalog sources
print("Catalog sources:")
source_names = catalog.ls()
print(source_names)

Catalog sources:
['raw_signals', 'stats', 'offset_signals_catalog', 'better_stats']


In [3]:
# Show what `catalog.params()` reports as the available parameters
print("Parameters:")
available_params = catalog.params()
print(available_params)

Parameters:
{'section_1.offset': 5}


In [4]:
# Show what `catalog.credentials()` reports as the available credentials.
# NOTE(review): this prints the returned object verbatim, which may include
# secret values; clear the cell output before sharing the notebook.
print("Credentials:")
available_credentials = catalog.credentials()
print(available_credentials)

Credentials:
{}


In [None]:
# Look up the datahandler registered under the "raw_signals" source
raw_signals_datahandler: catalog.Datahandler = catalog.get("raw_signals")

# Preview the data by iterating the datahandler directly;
# the loop stops right after the row at index 6 has been printed
print("Raw signal data:")
for row_index, signal_row in enumerate(raw_signals_datahandler):
    print(signal_row)
    if row_index >= 6:
        break

## Run the example pipeline system

In [6]:
# Calling a pipeline system runs it; progress is reported through the canonada logger
run_example_system = systems.example_system.example_system
run_example_system()

# Any individual pipeline can be run the same way, by calling it

2024-09-13 21:02:06,221 - canonada: [INFO]: Running pipeline system: 'example_system'
2024-09-13 21:02:06,224 - canonada: [INFO]: Running pipeline: streaming_pipe
2024-09-13 21:02:06,539 - canonada: [INFO]: Pipeline streaming_pipe finished
2024-09-13 21:02:06,587 - canonada: [INFO]: Running pipeline: calculate_better_stats
2024-09-13 21:02:06,713 - canonada: [INFO]: Pipeline calculate_better_stats finished


## Run a pipeline for a single datum (without the catalog)

In [13]:
# Fetch one datum from the datahandler by its key
signal_dict = raw_signals_datahandler["signal_0"]

# Inputs for a one-off run: the datum under the "raw_signals" key, plus an
# explicit value supplied under the "params:section_1.offset" key
single_run_inputs = {
    "raw_signals": signal_dict,
    "params:section_1.offset": 6,
}
streaming_pipe = pipelines.example_pipelines.streaming_pipe
pipeline_output = streaming_pipe.run_once(single_run_inputs)

# The result is indexable by name; list its keys and show the "stats" entry
print("Pipeline output:")
print("Output keys: ", pipeline_output.keys())
print(pipeline_output["stats"])

Pipeline output:
Output keys:  dict_keys(['raw_signals', 'params:section_1.offset', 'offset_signals', 'offset_signals_catalog', 'max_values', 'mean_values', 'stats'])
{'id': '80b57db2-55fb-4194-9c71-4bae5a237222', 'maximum': 5.999204361922914, 'mean': 5.516971098237362}
