rdblue commented on code in PR #12105: URL: https://github.com/apache/iceberg/pull/12105#discussion_r1932649565
########## core/src/main/java/org/apache/iceberg/variants/ShreddedObject.java: ########## @@ -35,22 +39,55 @@ * fields. This also does not allow updating or replacing the metadata for the unshredded object, * which could require recursively rewriting field IDs. */ -class ShreddedObject implements VariantObject { - private final SerializedMetadata metadata; - private final SerializedObject unshredded; +public class ShreddedObject implements VariantObject { + private final VariantMetadata metadata; + private final VariantObject unshredded; private final Map<String, VariantValue> shreddedFields = Maps.newHashMap(); + private final Set<String> removedFields = Sets.newHashSet(); private SerializationState serializationState = null; - ShreddedObject(SerializedMetadata metadata) { + ShreddedObject(VariantMetadata metadata) { this.metadata = metadata; this.unshredded = null; } - ShreddedObject(SerializedObject unshredded) { - this.metadata = unshredded.metadata(); + ShreddedObject(VariantMetadata metadata, VariantObject unshredded) { + this.metadata = metadata; this.unshredded = unshredded; } + @VisibleForTesting + VariantMetadata metadata() { + return metadata; + } + + private Set<String> nameSet() { + Set<String> names = Sets.newHashSet(shreddedFields.keySet()); + + if (unshredded != null) { + Iterables.addAll(names, unshredded.fieldNames()); + } + + names.removeAll(removedFields); + + return names; + } + + @Override + public Iterable<String> fieldNames() { + return nameSet(); + } + + @Override + public int numFields() { + return nameSet().size(); + } + + public void remove(String field) { Review Comment: That doesn't handle the case where `unshredded` incorrectly includes the field. We need to keep track of the shredded fields, whether present or missing, so that the shredded fields are always used. -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. 
To unsubscribe, e-mail: issues-unsubscribe@iceberg.apache.org For queries about this service, please contact Infrastructure at: users@infra.apache.org --------------------------------------------------------------------- To unsubscribe, e-mail: issues-unsubscribe@iceberg.apache.org For additional commands, e-mail: issues-help@iceberg.apache.org