/
databricks_new_cluster_job.json
62 lines (62 loc) · 1.87 KB
/
databricks_new_cluster_job.json
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
{
  "name": "Item_Table_Create",
  "new_cluster": {
    "spark_version": "5.0.x-ml-scala2.11",
    "node_type_id": "Standard_DS3_v2",
    "spark_conf": {
      "spark.databricks.cluster.profile": "serverless",
      "spark.databricks.repl.allowedLanguages": "sql,python,r",
      "spark.databricks.delta.preview.enabled": true,
      "spark.sql.crossJoin.enabled": true,
      "spark.driver.maxResultSize": "20g",
      "spark.network.timeout": 2000,
      "spark.databricks.service.server.enabled": true,
      "spark.databricks.service.port": 8787,
      "spark.sql.execution.arrow.enabled": true
    },
    "init_scripts": [
      {
        "dbfs": {
          "destination": "dbfs:/databricks/rstudio/cluster-init1a.sh"
        }
      }
    ],
    "cluster_log_conf": {
      "dbfs": {
        "destination": "dbfs:/cluster-logs"
      }
    },
    "num_workers": 2
  },
  "libraries": [
    {
      "pypi": {
        "package": "datacompy"
      }
    },
    {
      "cran": {
        "package": "xgboost",
        "repo": "https://cran.us.r-project.org"
      }
    },
    {
      "maven": {
        "coordinates": "com.microsoft.sqlserver:mssql-jdbc:6.5.3.jre8-preview"
      }
    }
  ],
  "email_notifications": {
    "on_start": ["charlesc@wpress.com"],
    "on_success": ["charlesc@wpress.com"],
    "on_failure": ["charlesc@wpress.com"]
  },
  "timeout_seconds": 3600,
  "max_retries": 1,
  "notebook_task": {
    "_comment": "path param||notebook_path||notebooks/python_notebook",
    "notebook_path": "/notebooks/jobs_demo",
    "base_parameters": {
      "argument1": "value 1",
      "argument2": "value 2"
    }
  }
}