In [None]:
from flight_fusion import FlightFusionClient
import numpy as np
import pandas as pd
from pathlib import Path

# Client handle used by every cell below; constructed without arguments.
ffc = FlightFusionClient()

# String path of a "delta" directory under the current working directory.
delta_path = str(Path.cwd().joinpath("delta"))

In [None]:
# Ask the client to drop the table with this name.
# NOTE(review): no cell visible here registers "table-fgh" — confirm this call is still needed.
table_name = "table-fgh"
ffc.drop_table(table_name)

In [None]:
# Seed NumPy's global generator so the random values repeat across runs.
np.random.seed(42)
values = np.random.randn(5, 3)
df = pd.DataFrame(values, columns=["col1", "col2", "col3"])

# Register the 5x3 frame with the client under the name "test_table".
ffc.register_memory_table("test_table", df)

### Data Ingestion

The fusion server supports two ways of ingesting data: registering locally available data as a managed dataset, or registering data that resides in an external system.
Local data is written to the configured object storage and can optionally be versioned; versioned datasets are stored as `Delta` tables.

- `register_memory_table`
- `register_dataset`
- `register_location`


In [None]:
# Build a larger random frame (500000 rows, one column per letter below) and
# hand it to the client as the dataset named "upload".
np.random.seed(42)
column_names = list("qwertzuiopasdfghjkly")  # 20 single-letter column names
values = np.random.randn(500000, len(column_names))
df = pd.DataFrame(values, columns=column_names)
ffc.register_dataset(None, None, "upload", df)

In [None]:
# Write a 500x3 random frame to the location in `delta_path` using overwrite mode.
# NOTE(review): SaveMode is not imported in any cell visible here — confirm it is
# in scope before this cell runs, otherwise the call raises NameError.
np.random.seed(42)
values = np.random.randn(500, 3)
df = pd.DataFrame(values, columns=["col1", "col2", "col3"])
ffc.write_into_delta(None, None, delta_path, SaveMode.SAVE_MODE_OVERWRITE, df)

In [None]:
# Read test_table back through the query interface and convert it to pandas.
query = "SELECT * FROM catalog.schema.test_table"
query_result = ffc.execute_query(query)
table = query_result.to_pandas()

# Display five randomly sampled rows.
table.sample(5)

In [None]:
# Register the parquet file at this path under the name "upload_remote".
remote_path = "test/flight/largish2.parquet"
ffc.register_remote_dataset(None, None, "upload_remote", remote_path)

In [None]:
# Fetch at most 100 rows of upload_remote where column A is positive.
query = "SELECT * FROM catalog.schema.upload_remote WHERE A > 0 LIMIT 100"
remote_rows = ffc.execute_query(query)
remote_rows.to_pandas()

In [None]:
# Run count(l) over the "upload" dataset and show the result as a pandas frame.
query = "SELECT count(l) FROM catalog.schema.upload"
upload_count = ffc.execute_query(query)
upload_count.to_pandas()

In [None]:
# List the rows of information_schema.columns as a pandas frame.
query = "select * from information_schema.columns"
schema_columns = ffc.execute_query(query)
schema_columns.to_pandas()

In [None]:
# `table` is the pandas DataFrame produced by the earlier `.to_pandas()` call, so a
# column is selected by indexing. The previous `table.column("x_axis").to_pandas()`
# used an accessor that pandas DataFrames do not provide, and "x_axis" is not one of
# the columns registered for test_table (col1, col2, col3).
# NOTE(review): "col1" is a stand-in for the intended column — confirm.
arr = table["col1"]
arr