# Connect to Dremio (use this as a template)

You'll need to enter your credentials. They will not be stored.

In [None]:
################################################
#              Connect to Dremio               #
################################################
# Don't edit this
from os import getenv
from getpass import getpass
import pyodbc
import pandas as pd

# Dremio endpoint settings; the ODBC driver is read from DREMIO_DRIVER.
dremio_host = 'dremio-client.dremio.svc.cluster.local'
dremio_port = 31010
dremio_driver = getenv('DREMIO_DRIVER')
if not dremio_driver:
    # Fail early with a clear message instead of handing "Driver=None" to ODBC.
    raise RuntimeError(
        "The DREMIO_DRIVER environment variable is not set; "
        "cannot select the Dremio ODBC driver."
    )

# Build the ODBC connection string. The credentials are prompted for inline
# so they are never bound to a notebook-level variable.
cnxn = pyodbc.connect(
    ';'.join([
        f"Driver={dremio_driver}",
        # No trailing ';' here: join() already supplies the separators, and an
        # extra one would produce an empty ";;" segment in the string.
        "ConnectionType=Direct",
        f"HOST={dremio_host}",
        f"PORT={dremio_port}",
        "AuthenticationType=Plain",
        f"UID={getpass('Dremio Username: ')}",
        f"PWD={getpass('Dremio Password: ')}",
    ]),
    autocommit=True,
)

print("Connected.")

## An overview of what's available

In [None]:
# Preview up to five rows of INFORMATION_SCHEMA.CATALOGS.
print("Catalogs:")
sql = "SELECT * FROM INFORMATION_SCHEMA.CATALOGS LIMIT 5"
pd.read_sql(sql=sql, con=cnxn)

In [None]:
# Preview up to five rows of INFORMATION_SCHEMA."TABLES" (the name is quoted in the query).
print("Tables:")
sql = 'SELECT * FROM INFORMATION_SCHEMA."TABLES" LIMIT 5'
pd.read_sql(sql=sql, con=cnxn)

In [None]:
# Preview up to five rows of INFORMATION_SCHEMA.COLUMNS.
print("Columns:")
sql = "SELECT * FROM INFORMATION_SCHEMA.COLUMNS LIMIT 5"
pd.read_sql(sql=sql, con=cnxn)

In [None]:
# For more commands, see the SQL Reference
# https://docs.dremio.com/sql-reference/

################################################
#           End of Connect to Dremio           #
################################################

# Get started with your analysis!

In [None]:
# Query the metadata file and keep the result in a variable: a bare expression
# in the middle of a cell is neither displayed nor stored, so the query would
# otherwise be wasted.
sql = '''SELECT * FROM dremiosharedstorage.shared."12100121_Metadata.csv" '''
metadata_df = pd.read_sql(sql, cnxn)

# Load the first ten rows of the data file for the analysis cells below.
sql = '''SELECT * FROM dremiosharedstorage.shared."12100121.csv" LIMIT 10'''
df = pd.read_sql(sql, cnxn)

In [None]:
# Bare expression as the last line of a notebook cell: shows the loaded rows.
df

In [None]:
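# Optional: if the first row of the result holds the column names, uncomment
# the next line to promote that row to the header and drop it from the data.
# df = df.rename(columns=df.iloc[0]).drop(df.index[0])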

In [None]:
import numpy as np

In [None]:
# Convert the VALUE column to a numeric dtype; keep the converted series both
# as `values` and as the column stored in the frame.
values = df["VALUE"] = pd.to_numeric(df["VALUE"])

In [None]:
# Standard deviation of the numeric VALUE series.
values.std()

In [None]:
# Arithmetic mean of the numeric VALUE series.
values.mean()

In [None]:
# Plot histograms for the frame's columns via the bound DataFrame method.
df.hist()

In [None]:
# Show the converted VALUE series.
values