csdavidc opened a new issue, #15043: URL: https://github.com/apache/pinot/issues/15043
I'm running Pinot in a Docker container. I created a realtime table with the following configuration: ``` json { "REALTIME": { "tableName": "sso_REALTIME", "tableType": "REALTIME", "segmentsConfig": { "schemaName": "sso", "replication": "1", "retentionTimeUnit": "DAYS", "retentionTimeValue": "90", "replicasPerPartition": "1", "timeColumnName": "daysSinceEpoch", "minimizeDataMovement": false }, "tenants": { "broker": "DefaultTenant", "server": "DefaultTenant", "tagOverrideConfig": {} }, "tableIndexConfig": { "invertedIndexColumns": [], "rangeIndexColumns": [], "rangeIndexVersion": 2, "autoGeneratedInvertedIndex": false, "createInvertedIndexDuringSegmentGeneration": false, "sortedColumn": [], "bloomFilterColumns": [], "loadMode": "MMAP", "streamConfigs": { "streamType": "kafka", "stream.kafka.topic.name": "topic", "stream.kafka.broker.list": "localhost:9200", "stream.kafka.consumer.type": "lowlevel", "stream.kafka.consumer.prop.auto.offset.reset": "smallest", "stream.kafka.consumer.factory.class.name": "org.apache.pinot.plugin.stream.kafka20.KafkaConsumerFactory", "stream.kafka.decoder.class.name": "org.apache.pinot.plugin.inputformat.protobuf.ProtoBufMessageDecoder", "realtime.segment.flush.threshold.rows": "0", "realtime.segment.flush.threshold.segment.rows": "0", "realtime.segment.flush.threshold.time": "24h", "realtime.segment.flush.threshold.segment.size": "100M", "stream.kafka.decoder.prop.protoClassName": "Events", "stream.kafka.decoder.prop.descriptorFile": "file:///opt/pinot/kafka/sample.desc" }, "noDictionaryColumns": [ "events_count" ], "onHeapDictionaryColumns": [], "varLengthDictionaryColumns": [], "enableDefaultStarTree": false, "enableDynamicStarTreeCreation": false, "aggregateMetrics": false, "nullHandlingEnabled": false, "columnMajorSegmentBuilderEnabled": true, "optimizeDictionary": false, "optimizeDictionaryForMetrics": false, "optimizeDictionaryType": false, "noDictionarySizeRatioThreshold": 0.85 }, "metadata": {}, "quota": {}, "routing": {}, 
"query": {}, "ingestionConfig": { "transformConfigs": [ { "columnName": "daysSinceEpoch", "transformFunction": "toEpochDays(\"UTCTimestamp\")" } ], "aggregationConfigs": [ { "columnName": "events_count", "aggregationFunction": "COUNT(*)" } ], "continueOnError": false, "rowTimeValueCheck": false, "segmentTimeValueCheck": true }, "isDimTable": false } } ``` The table was created successfully, but it then went into a BAD status. The query console shows this error: "Error Code: 305 null: 2 segments unavailable: [sso__1__0__20250212T1236Z, sso__0__0__20250212T1236Z]" and the container logs show this error: ``` 2025/02/12 12:36:57.169 ERROR [HelixStateTransitionHandler] [HelixTaskExecutor-message_handle_thread_69] Exception while executing a state transition task sso__0__0__20250212T1236Z java.lang.reflect.InvocationTargetException: null at jdk.internal.reflect.GeneratedMethodAccessor245.invoke(Unknown Source) ~[?:?] at java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) ~[?:?] at java.base/java.lang.reflect.Method.invoke(Method.java:566) ~[?:?] at org.apache.helix.messaging.handling.HelixStateTransitionHandler.invoke(HelixStateTransitionHandler.java:350) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.helix.messaging.handling.HelixStateTransitionHandler.handleMessage(HelixStateTransitionHandler.java:278) [pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.helix.messaging.handling.HelixTask.call(HelixTask.java:97) [pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.helix.messaging.handling.HelixTask.call(HelixTask.java:49) [pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at java.base/java.util.concurrent.FutureTask.run(FutureTask.java:264) [?:?] 
at java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1128) [?:?] at java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:628) [?:?] at java.base/java.lang.Thread.run(Thread.java:829) [?:?] Caused by: org.apache.pinot.spi.utils.retry.AttemptsExceededException: Operation failed after 5 attempts at org.apache.pinot.spi.utils.retry.BaseRetryPolicy.attempt(BaseRetryPolicy.java:65) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.core.data.manager.realtime.RealtimeSegmentDataManager.<init>(RealtimeSegmentDataManager.java:1628) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.core.data.manager.realtime.RealtimeTableDataManager.doAddConsumingSegment(RealtimeTableDataManager.java:552) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.core.data.manager.realtime.RealtimeTableDataManager.addConsumingSegment(RealtimeTableDataManager.java:497) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.server.starter.helix.HelixInstanceDataManager.addConsumingSegment(HelixInstanceDataManager.java:266) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.server.starter.helix.SegmentOnlineOfflineStateModelFactory$SegmentOnlineOfflineStateModel.onBecomeConsumingFromOffline(SegmentOnlineOfflineStateModelFactory.java:81) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] ... 11 more 2025/02/12 12:36:57.169 ERROR [StateModel] [HelixTaskExecutor-message_handle_thread_69] Default rollback method invoked on error. 
Error Code: ERROR 2025/02/12 12:36:57.171 ERROR [HelixTask] [HelixTaskExecutor-message_handle_thread_69] Message execution failed. msgId: f58f06f3-06c7-4af0-a743-bb4ce810fd5d, errorMsg: java.lang.reflect.InvocationTargetException 2025/02/12 12:36:57.171 ERROR [HelixStateTransitionHandler] [HelixTaskExecutor-message_handle_thread_69] Skip internal error. errCode: ERROR, errMsg: null 2025/02/12 12:36:57.177 ERROR [MessageGenerationPhase] [HelixController-pipeline-default-QuickStartCluster-(f37f33c7_DEFAULT)] Event f37f33c7_DEFAULT : Unable to find a next state for resource: sso_REALTIME partition: sso__0__0__20250212T1236Z from stateModelDefinitionclass org.apache.helix.model.StateModelDefinition from:ERROR to:CONSUMING 2025/02/12 12:36:57.182 ERROR [MessageGenerationPhase] [HelixController-pipeline-default-QuickStartCluster-(91519c8e_DEFAULT)] Event 91519c8e_DEFAULT : Unable to find a next state for resource: sso_REALTIME partition: sso__0__0__20250212T1236Z from stateModelDefinitionclass org.apache.helix.model.StateModelDefinition from:ERROR to:CONSUMING 2025/02/12 12:36:57.235 ERROR [HelixStateTransitionHandler] [HelixTaskExecutor-message_handle_thread_73] Exception while executing a state transition task sso__1__0__20250212T1236Z java.lang.reflect.InvocationTargetException: null at jdk.internal.reflect.GeneratedMethodAccessor245.invoke(Unknown Source) ~[?:?] at java.base/jdk.internal.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43) ~[?:?] at java.base/java.lang.reflect.Method.invoke(Method.java:566) ~[?:?] 
at org.apache.helix.messaging.handling.HelixStateTransitionHandler.invoke(HelixStateTransitionHandler.java:350) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.helix.messaging.handling.HelixStateTransitionHandler.handleMessage(HelixStateTransitionHandler.java:278) [pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.helix.messaging.handling.HelixTask.call(HelixTask.java:97) [pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.helix.messaging.handling.HelixTask.call(HelixTask.java:49) [pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at java.base/java.util.concurrent.FutureTask.run(FutureTask.java:264) [?:?] at java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1128) [?:?] at java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:628) [?:?] at java.base/java.lang.Thread.run(Thread.java:829) [?:?] 
Caused by: org.apache.pinot.spi.utils.retry.AttemptsExceededException: Operation failed after 5 attempts at org.apache.pinot.spi.utils.retry.BaseRetryPolicy.attempt(BaseRetryPolicy.java:65) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.core.data.manager.realtime.RealtimeSegmentDataManager.<init>(RealtimeSegmentDataManager.java:1628) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.core.data.manager.realtime.RealtimeTableDataManager.doAddConsumingSegment(RealtimeTableDataManager.java:552) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.core.data.manager.realtime.RealtimeTableDataManager.addConsumingSegment(RealtimeTableDataManager.java:497) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.server.starter.helix.HelixInstanceDataManager.addConsumingSegment(HelixInstanceDataManager.java:266) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] at org.apache.pinot.server.starter.helix.SegmentOnlineOfflineStateModelFactory$SegmentOnlineOfflineStateModel.onBecomeConsumingFromOffline(SegmentOnlineOfflineStateModelFactory.java:81) ~[pinot-all-1.4.0-SNAPSHOT-jar-with-dependencies.jar:1.4.0-SNAPSHOT-eb9c759344502969c80e3e9ec00fe67bd24d2965] ... 11 more 2025/02/12 12:36:57.235 ERROR [StateModel] [HelixTaskExecutor-message_handle_thread_73] Default rollback method invoked on error. Error Code: ERROR 2025/02/12 12:36:57.237 ERROR [HelixTask] [HelixTaskExecutor-message_handle_thread_73] Message execution failed. 
msgId: 791de854-5de2-4014-a01c-997aaedec2c2, errorMsg: java.lang.reflect.InvocationTargetException 2025/02/12 12:36:57.237 ERROR [HelixStateTransitionHandler] [HelixTaskExecutor-message_handle_thread_73] Skip internal error. errCode: ERROR, errMsg: null 2025/02/12 12:36:57.246 ERROR [MessageGenerationPhase] [HelixController-pipeline-default-QuickStartCluster-(88af965e_DEFAULT)] Event 88af965e_DEFAULT : Unable to find a next state for resource: sso_REALTIME partition: sso__0__0__20250212T1236Z from stateModelDefinitionclass org.apache.helix.model.StateModelDefinition from:ERROR to:CONSUMING 2025/02/12 12:36:57.246 ERROR [MessageGenerationPhase] [HelixController-pipeline-default-QuickStartCluster-(88af965e_DEFAULT)] Event 88af965e_DEFAULT : Unable to find a next state for resource: sso_REALTIME partition: sso__1__0__20250212T1236Z from stateModelDefinitionclass org.apache.helix.model.StateModelDefinition from:ERROR to:CONSUMING 2025/02/12 12:36:57.255 ERROR [MessageGenerationPhase] [HelixController-pipeline-default-QuickStartCluster-(5305082a_DEFAULT)] Event 5305082a_DEFAULT : Unable to find a next state for resource: sso_REALTIME partition: sso__0__0__20250212T1236Z from stateModelDefinitionclass org.apache.helix.model.StateModelDefinition from:ERROR to:CONSUMING 2025/02/12 12:36:57.255 ERROR [MessageGenerationPhase] [HelixController-pipeline-default-QuickStartCluster-(5305082a_DEFAULT)] Event 5305082a_DEFAULT : Unable to find a next state for resource: sso_REALTIME partition: sso__1__0__20250212T1236Z from stateModelDefinitionclass org.apache.helix.model.StateModelDefinition from:ERROR to:CONSUMING 2025/02/12 12:39:54.084 ERROR [CompletionServiceHelper] [grizzly-http-server-5] Server: Server_172.17.0.2_7050 returned error: 500, reason: Internal Server Error for uri: http://172.17.0.2:7500/debug/segments/sso_REALTIME/sso__0__0__20250212T1236Z 2025/02/12 12:39:56.748 ERROR [CompletionServiceHelper] [grizzly-http-server-0] Server: Server_172.17.0.2_7050 returned 
error: 404, reason: Not Found for uri: http://172.17.0.2:7500/tables/sso_REALTIME/segments/sso__0__0__20250212T1236Z/metadata?columns=* ``` I would really appreciate your help with this. Thanks! -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: commits-unsubscr...@pinot.apache.org For queries about this service, please contact Infrastructure at: us...@infra.apache.org --------------------------------------------------------------------- To unsubscribe, e-mail: commits-unsubscr...@pinot.apache.org For additional commands, e-mail: commits-h...@pinot.apache.org