Reference: Databricks Utilities (`dbutils`) documentation — https://learn.microsoft.com/en-us/azure/databricks/dev-tools/databricks-utils

In [0]:
# List the available dbutils utilities with a short description of each.
dbutils.help()


# Data utility (dbutils.data)

In [0]:
import pandas as pd
from ydata_profiling import ProfileReport

# Load the diamonds sample dataset into a pandas DataFrame for profiling.
# (A stray, indented `@nb.jit` decorator used to follow this statement; it
# decorated nothing and `nb` was never imported, so the cell could not run.)
data = pd.read_csv('/databricks-datasets/Rdatasets/data-001/csv/ggplot2/diamonds.csv')


In [0]:
# Build a ydata-profiling report object for the `data` DataFrame.
profile = ProfileReport(data, title="Profiling Report")

In [0]:
# Last expression in the cell, so the notebook displays the report.
profile



In [0]:
# Read the diamonds sample CSV into a Spark DataFrame (first row is the
# header, column types are inferred), then show summary statistics for it.
df = spark.read.csv(
    '/databricks-datasets/Rdatasets/data-001/csv/ggplot2/diamonds.csv',
    header=True,
    inferSchema=True,
)
dbutils.data.summarize(df)

In [0]:
%scala
// Read the diamonds sample CSV (header row, inferred column types) and
// show summary statistics for the resulting DataFrame.
val df = spark.read
  .option("header", "true")
  .option("inferSchema", "true")
  .csv("/databricks-datasets/Rdatasets/data-001/csv/ggplot2/diamonds.csv")
dbutils.data.summarize(df)

# File system utility (dbutils.fs)

Commands: cp, head, ls, mkdirs, mount, mounts, mv, put, refreshMounts, rm, unmount, updateMount

In [0]:
# List the entries of this DBFS directory; the result is a list of FileInfo
# objects (path, name, size, modificationTime).
out = dbutils.fs.ls("dbfs:/mnt/dbacademy-users/olonok@hotmail.com/large-language-models/")

In [0]:
# Display the directory listing captured in `out`.
out

[FileInfo(path='dbfs:/mnt/dbacademy-users/olonok@hotmail.com/large-language-models/datasets/', name='datasets/', size=0, modificationTime=1717701453000),
 FileInfo(path='dbfs:/mnt/dbacademy-users/olonok@hotmail.com/large-language-models/working/', name='working/', size=0, modificationTime=1718464728000),
 FileInfo(path='dbfs:/mnt/dbacademy-users/olonok@hotmail.com/large-language-models/working-testing-files/', name='working-testing-files/', size=0, modificationTime=1717701778000)]

In [0]:
# Full DBFS path of the second entry in the listing.
out[1].path

'dbfs:/mnt/dbacademy-users/olonok@hotmail.com/large-language-models/working/'

In [0]:
# Show the help text for the `ls` command of the file system utility.
dbutils.fs.help("ls")

In [0]:
# Shell escape: list the root of the local filesystem (not a DBFS path).
! ls /

BUILD.bazel  boot		  dev	lib32	     media  root  sys	var
Volumes      databricks		  etc	lib64	     mnt    run   tmp
Workspace    databricks-datasets  home	libx32	     opt    sbin  ttyd
bin	     dbfs		  lib	local_disk0  proc   srv   usr


In [0]:
# List the entries directly under the DBFS /mnt directory.
dbutils.fs.ls("dbfs:/mnt")

[FileInfo(path='dbfs:/mnt/dbacademy-datasets/', name='dbacademy-datasets/', size=0, modificationTime=1717699479000),
 FileInfo(path='dbfs:/mnt/dbacademy-users/', name='dbacademy-users/', size=0, modificationTime=1717699479000),
 FileInfo(path='dbfs:/mnt/tmp/', name='tmp/', size=0, modificationTime=1718291806000)]

# Jobs utility (dbutils.jobs)
Commands (`taskValues` subutility): get, set

In [0]:
# Publish a task value named "loss" so that downstream tasks of the same job
# run can read it with taskValues.get.
# NOTE(review): per the Databricks docs this is a no-op when the notebook is
# run interactively rather than as a job task — confirm.
dbutils.jobs.taskValues.set(
    key="loss",
    value=5,
)

In [0]:
# Read the "loss" task value set by the task whose key is "execution".
# `default` is returned when the key cannot be found; `debugValue` is
# returned when the notebook runs outside of a job (as in the output below).
dbutils.jobs.taskValues.get(
    taskKey="execution",
    key="loss",
    default=6,
    debugValue=42,
)

42

# Notebook utility (dbutils.notebook)
Commands: exit, run

In [0]:
# Run the "execution" notebook and pass it the `name` and `city` arguments.
# The cell evaluates to the string returned by that notebook.
dbutils.notebook.run(
    "/Workspace/Users/olonok@hotmail.com/execution",
    600,  # timeout in seconds
    {"name": "kevin lebron", "city": "Paris"},
)

'kevin lebron lives in Paris'

# Secrets utility (dbutils.secrets)

In [0]:
# List the available secret scopes.
dbutils.secrets.listScopes()

[SecretScope(name='databricks-azure'),
 SecretScope(name='local-scope'),
 SecretScope(name='test-dev'),
 SecretScope(name='test-dev-2'),
 SecretScope(name='test-dev-3'),
 SecretScope(name='test-scope-test2'),
 SecretScope(name='test-scope-test3')]

In [0]:
# Fetch the HF_TOKEN secret from the "test-dev" scope. The value shown in the
# cell output is redacted.
dbutils.secrets.get(scope= "test-dev", key = "HF_TOKEN")

'[REDACTED]'

In [0]:
# List the metadata (key names only, no values) of the secrets stored in the
# "databricks-azure" scope.
dbutils.secrets.list(scope="databricks-azure")

[SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-8CfSLrz1ASCMGCrNI9dkPbzl7M9sUi5U7O1cFmiieeI'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-bUt1Qdglk0S06U-nyiMMxO0TYuuwYoVIq37OcgcL6TA'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-e6UfIDBVevZNE5bSaGApCGxWAAn4rivk3P1kF4cJ19I'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-gKj5vnGDg3hwYjM4VcUgcyGehfv8zbADO6Zy9tMRbTQ'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-lvgq7p7B8u3qytG65UC-zu99URLrd-jPbeQaMCj2tS4'),
 SecretMetadata(key='OPENAIAPIKEY'),
 SecretMetadata(key='test-local'),
 SecretMetadata(key='test-local-2'),
 SecretMetadata(key='test3')]

In [0]:
# List the metadata (key names only, no values) of the secrets stored in the
# "test-scope-test3" scope.
dbutils.secrets.list(scope="test-scope-test3")

[SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-8CfSLrz1ASCMGCrNI9dkPbzl7M9sUi5U7O1cFmiieeI'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-bUt1Qdglk0S06U-nyiMMxO0TYuuwYoVIq37OcgcL6TA'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-e6UfIDBVevZNE5bSaGApCGxWAAn4rivk3P1kF4cJ19I'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-gKj5vnGDg3hwYjM4VcUgcyGehfv8zbADO6Zy9tMRbTQ'),
 SecretMetadata(key='cd2e4b76-c4bf-4826-bdd3-addc6c4f7cee-lvgq7p7B8u3qytG65UC-zu99URLrd-jPbeQaMCj2tS4'),
 SecretMetadata(key='OPENAIAPIKEY'),
 SecretMetadata(key='test-local'),
 SecretMetadata(key='test-local-2'),
 SecretMetadata(key='test3')]

In [0]:
# Fetch the OPENAIAPIKEY secret from the "test-scope-test3" scope. The value
# shown in the cell output is redacted.
dbutils.secrets.get(scope= "test-scope-test3", key = "OPENAIAPIKEY")

'[REDACTED]'

In [0]:
# Create a multiselect input widget named "multi" with four choices,
# pre-selecting "uno".
dbutils.widgets.multiselect(
    "multi",
    defaultValue="uno",
    choices=["uno", "dos", "tres", "cuatro"],
)