Connection

Configuration

| NAME | TYPE | DESCRIPTION | REQUIRED | READONLY |
| --- | --- | --- | --- | --- |
| server_hostname | string | | true | false |
| port | integer | | true | false |
| access_token | string | | true | false |
| http_path | string | | true | false |
| cloud_provider | string | Accepted Values: aws, azure | false | false |
| auth_mode | string | How to authenticate with AWS. Defaults to Access Key and Secret. Accepted Values: access_key_and_secret, iam_role | true | false |
| iam_role_arn | string | (required if auth_mode is “iam_role”) | false | false |
| storage_credential_name | string | | false | false |
| external_id | string | External ID for the IAM role | false | false |
| aws_access_key_id | string | See https://docs.polytomic.com/docs/databricks-connections#writing-to-databricks (required if auth_mode is “access_key_and_secret”) | false | false |
| aws_secret_access_key | string | (required if auth_mode is “access_key_and_secret”) | false | false |
| aws_user | string | | false | false |
| s3_bucket_name | string | Name of bucket used for staging data load files (required if cloud_provider is “aws”) | false | false |
| s3_bucket_region | string | (required if cloud_provider is “aws”) | false | false |
| azure_account_name | string | The account name of the storage account (required if cloud_provider is “azure”) | false | false |
| azure_access_key | string | The access key associated with this storage account (required if cloud_provider is “azure”) | false | false |
| container_name | string | The container which we will stage files in (required if cloud_provider is “azure”) | false | false |
| unity_catalog_enabled | boolean | | false | false |
| enable_delta_uniform | boolean | | false | false |
| enforce_query_limit | boolean | | false | false |
| concurrent_queries | integer | | false | false |
| set_retention_properties | boolean | | false | false |
| log_file_retention_days | integer | | false | false |
| deleted_file_retention_days | integer | | false | false |

Example

```json
{
  "name": "databricks connection",
  "type": "databricks",
  "configuration": {
    "access_token": "isoz8af6zvp8067gu68gvrp0oftevn",
    "auth_mode": "access_key_and_secret",
    "aws_access_key_id": "AKIAIOSFODNN7EXAMPLE",
    "aws_secret_access_key": "wJalrXUtnFEMI/K7MDENG/bPxRfiCYEXAMPLEKEY",
    "aws_user": "",
    "azure_access_key": "abcdefghijklmnopqrstuvwxyz0123456789/+ABCDEabcdefghijklmnopqrstuvwxyz0123456789/+ABCDE==",
    "azure_account_name": "account",
    "cloud_provider": "aws",
    "concurrent_queries": 0,
    "container_name": "container",
    "deleted_file_retention_days": 0,
    "enable_delta_uniform": false,
    "enforce_query_limit": false,
    "external_id": "",
    "http_path": "/sql",
    "iam_role_arn": "",
    "log_file_retention_days": 0,
    "port": 443,
    "s3_bucket_name": "s3://polytomic-databricks-results/customer-dataset",
    "s3_bucket_region": "",
    "server_hostname": "dbc-1234dsafas-d0001.cloud.databricks.com",
    "set_retention_properties": false,
    "storage_credential_name": "",
    "unity_catalog_enabled": false
  }
}
```

Model Sync

Source

Configuration

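| NAME | TYPE | DESCRIPTION | REQUIRED | READONLY |
| --- | --- | --- | --- | --- |
| catalog | string | Catalog | false | false |
| schema | string | Schema | false | false |
| table | string | Table | false | false |
| query | string | Query | false | false |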

Example

```
{
  ...
  "configuration": {
    "catalog": "samples",
    "query": "SELECT * FROM samples.nyctaxi.trips",
    "schema": "nyctaxi",
    "table": "trips"
  }
}
```

Target

Configuration

| NAME | TYPE | DESCRIPTION | REQUIRED | READONLY |
| --- | --- | --- | --- | --- |
| preserve_table_on_resync | boolean | Preserve destination table when resyncing | false | false |
| write_record_timestamps | boolean | Write row timestamp metadata | false | false |
| created_column | string | ‘Created at’ timestamp column | false | false |
| updated_column | string | ‘Updated at’ timestamp column | false | false |

Example

```
{
  ...
  "target": {
    "configuration": {
      "created_column": "",
      "preserve_table_on_resync": false,
      "updated_column": "",
      "write_record_timestamps": false
    }
  }
}
```

Bulk Sync

Destination

Configuration

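| NAME | TYPE | DESCRIPTION | REQUIRED | READONLY |
| --- | --- | --- | --- | --- |
| advanced | object | | false | false |
| catalog | string | Catalog | false | false |
| schema | string | Output schema | false | false |
| mirror_schemas | boolean | Mirror schemas | false | false |
| external_location_name | string | External location | false | false |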

Example

```
{
  ...
  "destination_configuration": {
    "advanced": {
      "deleted_file_retention_days": 0,
      "hard_deletes": false,
      "log_file_retention_days": 0,
      "set_retention_properties": false,
      "table_prefix": "",
      "truncate_existing": false
    },
    "catalog": "samples",
    "external_location_name": "",
    "mirror_schemas": false,
    "schema": "nyctaxi"
  }
}
```

Type handling

Destination types

| POLYTOMIC TYPE | DATABRICKS TYPE |
| --- | --- |
| array<> | ARRAY<> |
| bigint | BIGINT |
| boolean | BOOLEAN |
| date | DATE |
| datetime | TIMESTAMP |
| decimal(precision, scale) | DECIMAL(precision,scale) |
| double | DOUBLE |
| int | INT |
| json | STRING |
| jsonarray | STRING |
| number | DECIMAL(38,18) |
| object{} | STRUCT<> |
| single | FLOAT |
| smallint | SMALLINT |
| string | STRING |
| time | TIMESTAMP |

Source types

| DATABRICKS TYPE | POLYTOMIC TYPE |
| --- | --- |
| ARRAY<> | array<> |
| BIGINT | bigint |
| DATE | date |
| DECIMAL(precision, scale) | decimal(precision, scale) |
| DOUBLE | double |
| FLOAT | single |
| INT | int |
| INTERVAL | string |
| MAP<> | object{} |
| SMALLINT | smallint |
| STRUCT<> | object{} |
| TIMESTAMP | datetime |
| TIMESTAMP_NTZ | datetime |
| TINYINT | smallint |
| VARCHAR | string |