Playsted
12/12/2020, 5:04 PMKishore G
Playsted
12/12/2020, 5:08 PMKishore G
The next time I run an ingestion job for the table unrelated to the deleted segments, it re-adds them to the table. Is this expected? Am I missing something?
This is not expected. Can you show the segments list and the ingestion job spec?
Playsted
12/12/2020, 5:11 PM
executionFrameworkSpec:
  name: 'standalone'
  segmentGenerationJobRunnerClassName: 'org.apache.pinot.plugin.ingestion.batch.standalone.SegmentGenerationJobRunner'
  segmentUriPushJobRunnerClassName: 'org.apache.pinot.plugin.ingestion.batch.standalone.SegmentUriPushJobRunner'
jobType: SegmentCreationAndUriPush
inputDirURI: 's3://pinot-io/dotnet'
includeFileNamePattern: 'glob:**/*.parquet'
outputDirURI: 's3://pinot-io/segments'
segmentCreationJobParallelism: 4
overwriteOutput: true
pinotFSSpecs:
  - scheme: s3
    className: org.apache.pinot.plugin.filesystem.S3PinotFS
    configs:
      region: 'us-east-1'
      endpoint: 'http://pinot-minio:9090'
      accessKey: 'pinot'
      secretKey: 'pinot!!!'
recordReaderSpec:
  dataFormat: 'parquet'
  className: 'org.apache.pinot.plugin.inputformat.parquet.ParquetRecordReader'
tableSpec:
  tableName: 'mm'
  schemaURI: 'http://pinot-controller:9000/tables/mm/schema'
  tableConfigURI: 'http://pinot-controller:9000/tables/mm'
pinotClusterSpecs:
  - controllerURI: 'http://pinot-controller:9000'
pushJobSpec:
  pushAttempts: 2
  pushRetryIntervalMillis: 1000
segmentNameGeneratorSpec:
  type: normalizedDate
  configs:
    segment.name.prefix: 'mm_batch_test'
Playsted
12/12/2020, 5:12 PM
{
"id": "mm_OFFLINE",
"simpleFields": {
"BATCH_MESSAGE_MODE": "false",
"IDEAL_STATE_MODE": "CUSTOMIZED",
"INSTANCE_GROUP_TAG": "mm_OFFLINE",
"MAX_PARTITIONS_PER_INSTANCE": "1",
"NUM_PARTITIONS": "3",
"REBALANCE_MODE": "CUSTOMIZED",
"REPLICAS": "1",
"STATE_MODEL_DEF_REF": "SegmentOnlineOfflineStateModel",
"STATE_MODEL_FACTORY_NAME": "DEFAULT"
},
"mapFields": {
"mm_batch_test_2020-11-19_2020-11-19_0": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch_test_2020-11-19_2020-11-19_1": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch_test_2020-11-19_2020-11-19_2": {
"Server_172.20.0.6_8098": "ONLINE"
}
},
"listFields": {}
}
Playsted
12/12/2020, 5:14 PMPlaysted
12/12/2020, 5:14 PM
{
"id": "mm_OFFLINE",
"simpleFields": {
"BATCH_MESSAGE_MODE": "false",
"IDEAL_STATE_MODE": "CUSTOMIZED",
"INSTANCE_GROUP_TAG": "mm_OFFLINE",
"MAX_PARTITIONS_PER_INSTANCE": "1",
"NUM_PARTITIONS": "7",
"REBALANCE_MODE": "CUSTOMIZED",
"REPLICAS": "1",
"STATE_MODEL_DEF_REF": "SegmentOnlineOfflineStateModel",
"STATE_MODEL_FACTORY_NAME": "DEFAULT"
},
"mapFields": {
"mm_batch1_test_2020-11-19_2020-11-19_0": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch1_test_2020-11-19_2020-11-19_1": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch2_test_2020-11-19_2020-11-19_0": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch2_test_2020-11-19_2020-11-19_1": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch_test_2020-11-19_2020-11-19_0": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch_test_2020-11-19_2020-11-19_1": {
"Server_172.20.0.6_8098": "ONLINE"
},
"mm_batch_test_2020-11-19_2020-11-19_2": {
"Server_172.20.0.6_8098": "ONLINE"
}
},
"listFields": {}
}
Playsted
12/12/2020, 5:14 PMPlaysted
12/12/2020, 5:15 PMKishore G
Playsted
12/12/2020, 5:20 PMPlaysted
12/12/2020, 5:20 PMKishore G
Kishore G
Kishore G
Playsted
12/12/2020, 5:24 PMPlaysted
12/12/2020, 5:24 PMSubbu Subramaniam
12/12/2020, 11:52 PMPlaysted
12/12/2020, 11:54 PMSubbu Subramaniam
12/13/2020, 1:37 AM Deleted_Segments/tableName