Mayank
luanmorenomaciel
01/20/2021, 10:54 PM
{
"user_id": 17611,
"uuid": "469fe40e-84cf-482c-ba73-fe722596f7bc",
"first_name": "Christina",
"last_name": "Jones",
"date_birth": "1954-03-09",
"city": "Thomastown",
"country": "Honduras",
"company_name": "Nelson, Kline and Munoz",
"job": "Drilling engineer",
"phone_number": "<tel:331.851.7563|331.851.7563>",
"last_access_time": "1994-04-08T07:32:19",
"time_zone": "America/Montevideo",
"dt_current_timestamp": "2021-01-20 12:05:53.219255"
}
schema definition
{
"schemaName": "sch_users_json",
"dimensionFieldSpecs": [
{
"name": "user_id",
"dataType": "INT"
},
{
"name": "uuid",
"dataType": "STRING",
"singleValueField": false
},
{
"name": "first_name",
"dataType": "STRING"
},
{
"name": "last_name",
"dataType": "STRING"
},
{
"name": "date_birth",
"dataType": "STRING"
},
{
"name": "city",
"dataType": "STRING"
},
{
"name": "country",
"dataType": "STRING",
"singleValueField": false
},
{
"name": "phone_number",
"dataType": "STRING",
"singleValueField": false
},
{
"name": "last_access_time",
"dataType": "STRING",
"singleValueField": false
},
{
"name": "time_zone",
"dataType": "STRING",
"singleValueField": false
}
],
"timeFieldSpec": {
"incomingGranularitySpec": {
"timeType": "MILLISECONDS",
"timeFormat": "EPOCH",
"dataType": "LONG",
"name": "dt_current_timestamp"
}
}
}
task creation
luanmorenomaciel
01/20/2021, 10:54 PM
{
"tableName": "realtime_users_json_events",
"tableType": "REALTIME",
"segmentsConfig": {
"timeColumnName": "mergedTimeMillis",
"timeType": "MILLISECONDS",
"retentionTimeUnit": "DAYS",
"retentionTimeValue": "60",
"schemaName": "sch_users_json",
"replication": "1",
"replicasPerPartition": "1"
},
"tenants": {},
"tableIndexConfig": {
"loadMode": "MMAP",
"invertedIndexColumns": [
"city",
"country"
],
"streamConfigs": {
"streamType": "kafka",
"stream.kafka.consumer.type": "lowlevel",
"stream.kafka.topic.name": "src-app-users-json",
"stream.kafka.decoder.class.name": "org.apache.pinot.plugin.stream.kafka.KafkaJSONMessageDecoder",
"stream.kafka.consumer.factory.class.name": "org.apache.pinot.plugin.stream.kafka20.KafkaConsumerFactory",
"stream.kafka.broker.list": "127.0.0.1:9094",
"realtime.segment.flush.threshold.time": "3600000",
"realtime.segment.flush.threshold.size": "50000",
"stream.kafka.consumer.prop.auto.offset.reset": "smallest"
}
},
"metadata": {
"customConfigs": {}
}
}
I'm connecting to pinot-controller and executing the following command, but not getting any results
root@pinot-controller-0:/opt/pinot# bin/pinot-admin.sh AddTable \
> -schemaFile /opt/pinot/sch_users_json.json \
> -tableConfigFile /opt/pinot/realtime_users_json_events.json \
> -exec
root@pinot-controller-0:/opt/pinot#
Neha Pawar
Neha Pawar
luanmorenomaciel
01/20/2021, 11:02 PMluanmorenomaciel
01/20/2021, 11:02 PMluanmorenomaciel
01/20/2021, 11:03 PM
2021/01/20 22:51:03.534 INFO [PinotTableRestletResource] [grizzly-http-server-0] Cannot find valid fieldSpec for timeColumn: mergedTimeMillis from the table config: realtime_users_json_events_REALTIME, in the schema: sch_users_json exception: Cannot find valid fieldSpec for timeColumn: mergedTimeMillis from the table config: realtime_users_json_events_REALTIME, in the schema: sch_users_json
luanmorenomaciel
01/20/2021, 11:04 PMluanmorenomaciel
01/20/2021, 11:08 PM
{
"schemaName": "sch_users_json",
"dimensionFieldSpecs": [
{
"name": "user_id",
"dataType": "LONG"
},
{
"name": "uuid",
"dataType": "STRING"
},
{
"name": "first_name",
"dataType": "STRING"
},
{
"name": "last_name",
"dataType": "STRING"
},
{
"name": "date_birth",
"dataType": "STRING"
},
{
"name": "city",
"dataType": "STRING"
},
{
"name": "country",
"dataType": "STRING"
},
{
"name": "phone_number",
"dataType": "STRING"
},
{
"name": "last_access_time",
"dataType": "STRING"
},
{
"name": "time_zone",
"dataType": "STRING"
}
],
"dateTimeFieldSpec": {
"incomingGranularitySpec": {
"name": "dt_current_timestamp",
"dataType": "STRING",
"format": "SIMPLE_DATE_FORMAT"
}
}
}
Neha Pawar
luanmorenomaciel
01/20/2021, 11:10 PMNeha Pawar
"dateTimeFieldSpecs": [
{
"name": "millisSinceEpoch",
"dataType": "LONG",
"format": "1:MILLISECONDS:EPOCH",
"granularity": "15:MINUTES"
},
{
"name": "hoursSinceEpoch",
"dataType": "INT",
"format": "1:HOURS:EPOCH",
"granularity": "1:HOURS"
},
{
"name": "dateString",
"dataType": "STRING",
"format": "1:DAYS:SIMPLE_DATE_FORMAT:yyyy-MM-dd",
"granularity": "1:DAYS"
}
]
Neha Pawar
Neha Pawar
luanmorenomaciel
01/20/2021, 11:12 PM
"dateTimeFieldSpecs": [{
"name": "dt_current_timestamp",
"dataType": "STRING",
"format": "1:DAYS:SIMPLE_DATE_FORMAT:yyyy-MM-dd",
"granularity": "1:DAYS"
}]
Neha Pawar
Neha Pawar
2021-01-20 12:05:53.219255
Neha Pawar
Neha Pawar
luanmorenomaciel
01/20/2021, 11:14 PMluanmorenomaciel
01/20/2021, 11:14 PMNeha Pawar
2021-01-20 12:05:53.219255
and Pinot will try to match it with just yyyy-MM-dd
luanmorenomaciel
01/20/2021, 11:16 PMNeha Pawar
Neha Pawar
luanmorenomaciel
01/20/2021, 11:18 PM
2021/01/20 23:17:37.817 WARN [PartitionCountFetcher] [grizzly-http-server-1] Could not get partition count for topic src-app-users-json
org.apache.kafka.common.errors.TimeoutException: Timeout expired while fetching topic metadata
2021/01/20 23:17:37.818 ERROR [PinotTableIdealStateBuilder] [grizzly-http-server-1] Could not get partition count for src-app-users-json
org.apache.kafka.common.errors.TimeoutException: Timeout expired while fetching topic metadata
2021/01/20 23:17:37.818 ERROR [PinotTableRestletResource] [grizzly-http-server-1] org.apache.kafka.common.errors.TimeoutException: Timeout expired while fetching topic metadata
java.lang.RuntimeException: org.apache.kafka.common.errors.TimeoutException: Timeout expired while fetching topic metadata
Neha Pawar
Neha Pawar
luanmorenomaciel
01/20/2021, 11:20 PM