Monitoring the Execution of Transformation Jobs
Defining a Job through the Data Product Builder
Low-code pipeline builder
{
"config": {
"docker_tag": "0.1.10",
"executor_core_request": "800m",
"executor_core_limit": "1500m",
"executor_instances": 1,
"min_executor_instances": 1,
"max_executor_instances": 1,
"executor_memory": "5120m",
"driver_core_request": "0.3",
"driver_core_limit": "800m",
"driver_memory": "2048m"
},
"inputs": {
"input_26e5351b_dab2_4e3d_979b_6e7936d5143b": {
"input_type": "data_object",
"identifier": "26e5351b-dab2-4e3d-979b-6e7936d5143b",
"preview_limit": 10
}
},
"transformations": [
{
"transform": "cast",
"input": "input_26e5351b_dab2_4e3d_979b_6e7936d5143b",
"output": "shipments_casted",
"changes": [
{
"column": "shipment_id",
"data_type": "integer",
"kwargs": {}
},
{
"column": "route_id",
"data_type": "integer",
"kwargs": {}
},
{
"column": "carrier_id",
"data_type": "integer",
"kwargs": {}
},
{
"column": "shipment_date",
"data_type": "timestamp",
"kwargs": {}
},
{
"column": "expected_delivery_date",
"data_type": "timestamp",
"kwargs": {}
},
{
"column": "actual_delivery_date",
"data_type": "timestamp",
"kwargs": {}
},
{
"column": "weight",
"data_type": "double",
"kwargs": {}
},
{
"column": "volume",
"data_type": "double",
"kwargs": {}
},
{
"column": "priority",
"data_type": "integer",
"kwargs": {}
},
{
"column": "cost",
"data_type": "double",
"kwargs": {}
}
]
},
{
"transform": "select_columns",
"input": "shipments_casted",
"output": "shipments_final",
"columns": [
"shipment_id",
"route_id",
"carrier_id",
"shipment_date",
"expected_delivery_date",
"actual_delivery_date",
"origin",
"destination",
"weight",
"volume",
"status",
"delay_reason",
"priority",
"cost"
]
}
],
"finalisers": {
"input": "shipments_final",
"enable_quality": true,
"write_config": {
"mode": "overwrite"
},
"enable_profiling": true,
"enable_classification": false
},
"preview": false
}
Custom script pipeline builder
Monitoring the compute jobs
Common Issues
Last updated