Hi,
I just started using Druid.
I currently have the following datasource, which is created using Kafka ingestion. I want to create another datasource from it by extracting a subset of the data points from the original, but the task is failing without any details.
Please help me figure out what could be wrong. The total data is less than 200 MB. Thanks.
Here is the original datasource:
{
  "type": "kafka",
  "spec": {
    "dataSchema": {
      "dataSource": "OrigDataSrc",
      "timestampSpec": {
        "column": "timestamp",
        "format": "iso"
      },
      "dimensionsSpec": {
        "dimensions": [
          "org_id",
          "user_id",
          "login_id"
        ]
      },
      "granularitySpec": {
        "type": "uniform",
        "segmentGranularity": "HOUR",
        "queryGranularity": "NONE",
        "rollup": false
      }
    },
    "ioConfig": {
      "type": "kafka",
      "topic": "DemDataXfrm.ProbeData",
      "inputFormat": {
        "type": "json"
      },
      "consumerProperties": {
        "bootstrap.servers": "kafka:9092"
      },
      "useEarliestOffset": true
    },
    "tuningConfig": {
      "type": "kafka"
    }
  }
}
Task JSON:
{
  "type": "index_parallel",
  "spec": {
    "dataSchema": {
      "dataSource": "DerivedDataSrc1",
      "timestampSpec": {
        "column": "__time",
        "format": "auto"
      },
      "dimensionsSpec": {
        "dimensions": [
          "org_id",
          "user_id",
          "login_id"
        ]
      },
      "granularitySpec": {
        "type": "uniform",
        "segmentGranularity": "HOUR",
        "queryGranularity": "NONE",
        "rollup": false
      }
    },
    "ioConfig": {
      "type": "index_parallel",
      "inputSource": {
        "type": "druid",
        "dataSource": "OrigDataSrc",
        "interval": "2021-10-07/P2D"
      }
    }
  }
}