kauts shukla
05/02/2021, 11:12 AMselect userid,eventlabel,sessionid, MIN(timestampist) as mint, MAX(timestampist) as maxt, (MAX(timestampist) - MIN(timestampist)) as diff_time from default.click_stream where eventlabel !='null' and timestampist between 1615833000000 and 1616225312000 group by userid,eventlabel,sessionid
Mayank
kauts shukla
05/02/2021, 1:31 PMkauts shukla
05/02/2021, 1:37 PMkauts shukla
05/02/2021, 1:42 PMselect userid,eventlabel, MIN(timestampist) as mint, MAX(timestampist) as maxt, (MAX(timestampist) - MIN(timestampist)) as diff_time from click_stream where timestampist between 1612264456000 and 1619962345000 group by userid,eventlabel. This query is taking 60 seconds; numDocsScanned is 221866025.
Mayank
kauts shukla
05/02/2021, 3:46 PM{
"tableName": "click_stream_REALTIME",
"tableType": "REALTIME",
"segmentsConfig": {
"segmentAssignmentStrategy": "BalanceNumSegmentAssignmentStrategy",
"timeColumnName": "created_at",
"retentionTimeUnit": "DAYS",
"retentionTimeValue": "90",
"segmentPushType": "APPEND",
"timeType": "DAYS",
"replication": "1",
"replicasPerPartition": "1",
"schemaName": "click_stream"
},
"tenants": {
"broker": "DefaultTenant",
"server": "DefaultTenant"
},
"tableIndexConfig": {
"autoGeneratedInvertedIndex": true,
"loadMode": "MMAP",
"streamConfigs": {
"streamType": "kafka",
"stream.kafka.consumer.type": "simple",
"stream.kafka.topic.name": "vedantu.dp.click_stream.click_stream",
"stream.kafka.decoder.class.name": "org.apache.pinot.plugin.stream.kafka.KafkaJSONMessageDecoder",
"stream.kafka.consumer.factory.class.name": "org.apache.pinot.plugin.stream.kafka20.KafkaConsumerFactory",
"stream.kafka.hlc.zk.connect.string": "zk1:2181/kafka",
"stream.kafka.zk.broker.url": "zk1:2181/kafka",
"stream.kafka.broker.list": "kafka01:9092",
"realtime.segment.flush.threshold.time": "3600000",
"realtime.segment.flush.threshold.size": "50000",
"stream.kafka.consumer.prop.auto.offset.reset": "smallest"
},
"aggregateMetrics": false,
"enableDefaultStarTree": false,
"enableDynamicStarTreeCreation": false,
"nullHandlingEnabled": true,
"createInvertedIndexDuringSegmentGeneration": false,
"starTreeIndexConfigs": [
{
"dimensionsSplitOrder": [
"eventcategory",
"eventlabel",
"userid",
"sessionid"
],
"skipStarNodeCreationForDimensions": [],
"functionColumnPairs": [
"MIN__timestampist",
"MAX__timestampist"
]
}
],
"rangeIndexColumns": [
"timestampist",
"created_at"
]
},
"metadata": {
"customConfigs": {}
},
"routing": {
"instanceSelectorType": "replicaGroup"
},
"isDimTable": false
}
kauts shukla
05/02/2021, 3:47 PMMayank
Mayank
kauts shukla
05/02/2021, 3:48 PMMayank
kauts shukla
05/02/2021, 3:50 PMselect userid,eventlabel,sessionid, MIN(timestampist) as mint, MAX(timestampist) as maxt, (MAX(timestampist) - MIN(timestampist)) as diff_time from default.click_stream where sessionid !='null' and timestampist between 1615833000000 and 1616225312000 group by userid,eventlabel,sessionid
kauts shukla
05/02/2021, 3:50 PMMayank
kauts shukla
05/02/2021, 3:51 PMMayank
Mayank
Mayank
kauts shukla
05/02/2021, 3:52 PMkauts shukla
05/02/2021, 3:53 PM"dateTimeFieldSpecs": [
{
"name": "created_at",
"dataType": "LONG",
"format": "1:MILLISECONDS:EPOCH",
"granularity": "1:DAY"
}
]
kauts shukla
05/02/2021, 3:53 PMMayank
kauts shukla
05/02/2021, 3:54 PMkauts shukla
05/02/2021, 3:54 PMMayank
Mayank
kauts shukla
05/02/2021, 4:02 PMkauts shukla
05/02/2021, 4:10 PMSUM
on “aggregateMetrics”: true, which we aren’t using as part of the query. Now my queries never respond within 60 seconds with the new table definition that has the star-tree index.