mymeiyi commented on code in PR #32980:
URL: https://github.com/apache/doris/pull/32980#discussion_r1561923173


##########
fe/fe-core/src/main/java/org/apache/doris/transaction/DatabaseTransactionMgr.java:
##########
@@ -2290,4 +2480,177 @@ protected void 
updateMultiTableRunningTransactionTableIds(long transactionId, Li
         }
         
idToRunningTransactionState.get(transactionId).setTableIdList(tableIds);
     }
+
+    private PublishResult finishCheckQuorumReplicas(TransactionState 
transactionState, Set<Long> errorReplicaIds) {
+        long now = System.currentTimeMillis();
+        long firstPublishVersionTime = 
transactionState.getFirstPublishVersionTime();
+        boolean allowPublishOneSucc = false;
+        if (Config.publish_wait_time_second > 0 && firstPublishVersionTime > 0
+                && now >= firstPublishVersionTime + 
Config.publish_wait_time_second * 1000L) {
+            allowPublishOneSucc = true;
+        }
+        List<String> logs = Lists.newArrayList();
+
+        Map<Long, List<PublishVersionTask>> publishTasks = 
transactionState.getPublishVersionTasks();
+        PublishResult publishResult = PublishResult.QUORUM_SUCC;
+        for (SubTransactionState subTransactionState : 
transactionState.getSubTransactionStates()) {
+            long subTxnId = subTransactionState.getSubTransactionId();
+            TableCommitInfo tableCommitInfo = 
transactionState.getSubTxnIdToTableCommitInfo().get(subTxnId);
+            if (tableCommitInfo == null) {
+                continue;
+            }
+            OlapTable table = (OlapTable) subTransactionState.getTable();
+            long tableId = table.getId();
+            for (Entry<Long, PartitionCommitInfo> entry : 
tableCommitInfo.getIdToPartitionCommitInfo().entrySet()) {
+                long partitionId = entry.getValue().getPartitionId();
+                Partition partition = table.getPartition(partitionId);
+                if (partition == null) {
+                    continue;
+                }
+                int loadRequiredReplicaNum = 
table.getLoadRequiredReplicaNum(partitionId);
+
+                // TODO should use sub transaction load indexes
+                List<MaterializedIndex> allIndices;
+                if (transactionState.getLoadedTblIndexes().isEmpty()) {
+                    allIndices = 
partition.getMaterializedIndices(MaterializedIndex.IndexExtState.ALL);
+                } else {
+                    allIndices = Lists.newArrayList();
+                    for (long indexId : 
transactionState.getLoadedTblIndexes().get(tableId)) {
+                        MaterializedIndex index = partition.getIndex(indexId);
+                        if (index != null) {
+                            allIndices.add(index);
+                        }
+                    }
+                }
+
+                boolean alterReplicaLoadedTxn = 
isAlterReplicaLoadedTxn(transactionState.getTransactionId(), table);
+
+                // check success replica number for each tablet.
+                // a success replica means:
+                //  1. Not in errorReplicaIds: succeed in both commit and 
publish phase
+                //  2. last failed version < 0: is a health replica before
+                //  3. version catch up: not with a stale version
+                // Here we only check number, the replica version will be 
updated in updateCatalogAfterVisible()
+                for (MaterializedIndex index : allIndices) {
+                    for (Tablet tablet : 
partition.getIndex(index.getId()).getTablets()) {
+                        List<Replica> tabletSuccReplicas = 
Lists.newArrayList();
+                        List<Replica> tabletWriteFailedReplicas = 
Lists.newArrayList();
+                        List<Replica> tabletVersionFailedReplicas = 
Lists.newArrayList();
+                        // TODO always use the visible version because the 
replica version is not changed
+                        long newVersion = partition.getVisibleVersion() + 1;
+                        for (Replica replica : tablet.getReplicas()) {
+                            for (PublishVersionTask publishVersionTask : 
publishTasks.get(replica.getBackendId())) {
+                                boolean needCheck = 
publishVersionTask.getTransactionId()
+                                        == 
subTransactionState.getSubTransactionId()
+                                        && 
publishVersionTask.getPartitionVersionInfos().stream()
+                                        .anyMatch(s -> s.getPartitionId() == 
partitionId);
+                                if (needCheck) {
+                                    
checkReplicaContinuousVersionSucc(tablet.getId(), replica, 
alterReplicaLoadedTxn,
+                                            newVersion, publishVersionTask,
+                                            errorReplicaIds, 
tabletSuccReplicas, tabletWriteFailedReplicas,
+                                            tabletVersionFailedReplicas);
+                                    LOG.debug("after 
checkReplicaContinuousVersion for txn_id={}, sub_txn_id={}, "
+                                                    + "tablet_id={}, 
new_version={}, success_replicas={}, "
+                                                    + 
"write_failed_replicas={}, version_failed_replicas={}",
+                                            
transactionState.getTransactionId(),
+                                            
subTransactionState.getSubTransactionId(), tablet.getId(), newVersion,
+                                            tabletSuccReplicas, 
tabletWriteFailedReplicas, tabletVersionFailedReplicas);
+                                }
+                            }
+                        }
+
+                        publishResult = checkQuorumReplicas(transactionState, 
tableId, partition, tablet,
+                                loadRequiredReplicaNum, allowPublishOneSucc, 
newVersion, tabletSuccReplicas,
+                                tabletWriteFailedReplicas, 
tabletVersionFailedReplicas, publishResult, logs);
+                    }
+                }
+            }
+        }
+

Review Comment:
   support it and add a ut 
`GlobalTransactionMgrTest#testCommitTransactionWithSubTxnAndReplicaFailed` 
check it. 



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org

For queries about this service, please contact Infrastructure at:
us...@infra.apache.org


---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscr...@doris.apache.org
For additional commands, e-mail: commits-h...@doris.apache.org

Reply via email to