nsivabalan commented on code in PR #18132:
URL: https://github.com/apache/hudi/pull/18132#discussion_r3042686639
##########
hudi-spark-datasource/hudi-spark-common/src/main/scala/org/apache/hudi/HoodieFileIndex.scala:
##########
@@ -447,6 +452,38 @@ object HoodieFileIndex extends Logging {
schema.fieldNames.filter { colName => refs.exists(r =>
resolver.apply(colName, r.name)) }
}
+ /**
+ * Identifies timestamp-millis columns from the Avro schema. These columns are excluded from
+ * column-stats filter translation (e.g. they may have been indexed before a fix and should
+ * not be used for filtering).
+ *
+ * @param avroSchema the table's Avro schema
+ * @return set of field names whose type is timestamp-millis or local-timestamp-millis
+ */
+ def getTimestampMillisColumns(avroSchema: org.apache.avro.Schema): Set[String] = {
Review Comment:
Are we considering only top-level fields here?
--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.
To unsubscribe, e-mail: [email protected]
For queries about this service, please contact Infrastructure at:
[email protected]