BsoBird commented on code in PR #9546: URL: https://github.com/apache/iceberg/pull/9546#discussion_r1482658331
########## core/src/main/java/org/apache/iceberg/hadoop/HadoopTableOperations.java: ########## @@ -289,64 +377,153 @@ Path versionHintFile() { return metadataPath(Util.VERSION_HINT_FILENAME); } - private void writeVersionHint(int versionToWrite) { + @VisibleForTesting + boolean writeVersionHint(FileSystem fs, Integer versionToWrite) throws Exception { Path versionHintFile = versionHintFile(); - FileSystem fs = getFileSystem(versionHintFile, conf); - + Path tempVersionHintFile = metadataPath(UUID.randomUUID() + "-version-hint.temp"); try { - Path tempVersionHintFile = metadataPath(UUID.randomUUID().toString() + "-version-hint.temp"); writeVersionToPath(fs, tempVersionHintFile, versionToWrite); - fs.delete(versionHintFile, false /* recursive delete */); - fs.rename(tempVersionHintFile, versionHintFile); - } catch (IOException e) { - LOG.warn("Failed to update version hint", e); + // We can accept that version Hint fails to write, but we can't accept that version Hint + // writes the wrong version. + if (fs.exists(versionHintFile) || findVersionWithOutVersionHint(fs) != versionToWrite) { + throw new AlreadyExistsException( + "Failed to write a new versionHintFile,You are writing to an old-version-Hint,Are there other clients running in parallel with the current task?"); + } + return renameVersionHint(fs, tempVersionHintFile, versionHintFile); + } catch (Exception e) { + // Cleaning up temporary files. 
+ io().deleteFile(tempVersionHintFile.toString()); + throw e; } } - private void writeVersionToPath(FileSystem fs, Path path, int versionToWrite) throws IOException { + @VisibleForTesting + void deleteOldVersionHint(FileSystem fs, Path versionHintFile, Integer nextVersion) + throws IOException { + // In order to be compatible with scenarios where the iceberg table has just been created or Review Comment: In addition, even if the delete operation is not atomic, I don't think that is a big problem. We will move the cleanup of the versionHint to the first step, so even if something goes wrong, the metadata.json is not damaged and the client can still read normally. After all, the versionHint is not very important to us; at one point I was even tempted to remove the versionHint altogether. -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: issues-unsubscr...@iceberg.apache.org For queries about this service, please contact Infrastructure at: us...@infra.apache.org --------------------------------------------------------------------- To unsubscribe, e-mail: issues-unsubscr...@iceberg.apache.org For additional commands, e-mail: issues-h...@iceberg.apache.org