sdd commented on code in PR #373: URL: https://github.com/apache/iceberg-rust/pull/373#discussion_r1609368600
##########
crates/iceberg/src/scan.rs:
##########
@@ -189,66 +195,20 @@ impl TableScan {
             self.case_sensitive,
         )?;

-        let mut partition_filter_cache = PartitionFilterCache::new();
-        let mut manifest_evaluator_cache = ManifestEvaluatorCache::new();
-
-        Ok(try_stream! {
-            let manifest_list = context
-            .snapshot
-            .load_manifest_list(&context.file_io, &context.table_metadata)
-            .await?;
-
-            for entry in manifest_list.entries() {
-                if !Self::content_type_is_data(entry) {
-                    continue;
-                }
+        let (sender, receiver) = channel(CHANNEL_BUFFER_SIZE);

-                let partition_spec_id = entry.partition_spec_id;
+        let manifest_list = context
+            .snapshot
+            .load_manifest_list(&context.file_io, &context.table_metadata)
+            .await?;

-                let partition_filter = partition_filter_cache.get(
-                    partition_spec_id,
-                    &context,
-                )?;
+        spawn(async move {

Review Comment:
I reverted reader.rs to be essentially the same as before, without any concurrent processing of batches from within the same file. I removed the nested try_for_each_concurrent from scan.rs but kept the mpsc channel.

--
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the URL above to go to the specific comment.

To unsubscribe, e-mail: issues-unsubscr...@iceberg.apache.org

For queries about this service, please contact Infrastructure at: us...@infra.apache.org

---------------------------------------------------------------------
To unsubscribe, e-mail: issues-unsubscr...@iceberg.apache.org
For additional commands, e-mail: issues-h...@iceberg.apache.org