timoninmaxim commented on code in PR #10617:
URL: https://github.com/apache/ignite/pull/10617#discussion_r1159507204


##########
modules/core/src/main/java/org/apache/ignite/internal/processors/cache/persistence/snapshot/IncrementalSnapshotVerificationTask.java:
##########
@@ -0,0 +1,421 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one or more
+ * contributor license agreements. See the NOTICE file distributed with
+ * this work for additional information regarding copyright ownership.
+ * The ASF licenses this file to You under the Apache License, Version 2.0
+ * (the "License"); you may not use this file except in compliance with
+ * the License. You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+package org.apache.ignite.internal.processors.cache.persistence.snapshot;
+
+import java.io.File;
+import java.io.IOException;
+import java.nio.file.Files;
+import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.Collection;
+import java.util.HashMap;
+import java.util.HashSet;
+import java.util.Iterator;
+import java.util.List;
+import java.util.Map;
+import java.util.Objects;
+import java.util.Set;
+import java.util.concurrent.atomic.LongAdder;
+import java.util.function.BiConsumer;
+import java.util.function.Function;
+import java.util.stream.Collectors;
+import org.apache.ignite.IgniteCheckedException;
+import org.apache.ignite.IgniteException;
+import org.apache.ignite.IgniteLogger;
+import org.apache.ignite.cache.CacheAtomicityMode;
+import org.apache.ignite.cluster.ClusterNode;
+import org.apache.ignite.compute.ComputeJob;
+import org.apache.ignite.compute.ComputeJobAdapter;
+import org.apache.ignite.compute.ComputeJobResult;
+import org.apache.ignite.internal.IgniteEx;
+import org.apache.ignite.internal.processors.cache.GridCacheOperation;
+import org.apache.ignite.internal.processors.cache.StoredCacheData;
+import org.apache.ignite.internal.processors.cache.verify.IdleVerifyResultV2;
+import org.apache.ignite.internal.processors.cache.verify.PartitionHashRecordV2;
+import org.apache.ignite.internal.processors.cache.verify.PartitionKeyV2;
+import org.apache.ignite.internal.processors.cache.verify.TransactionsHashRecord;
+import org.apache.ignite.internal.processors.cache.version.GridCacheVersion;
+import org.apache.ignite.internal.processors.cluster.BaselineTopology;
+import org.apache.ignite.internal.processors.task.GridInternal;
+import org.apache.ignite.internal.util.typedef.F;
+import org.apache.ignite.internal.util.typedef.internal.CU;
+import org.apache.ignite.resources.IgniteInstanceResource;
+import org.apache.ignite.resources.LoggerResource;
+import org.apache.ignite.transactions.TransactionState;
+import org.jetbrains.annotations.Nullable;
+
+import static org.apache.ignite.internal.managers.discovery.ConsistentIdMapper.ALL_NODES;
+import static org.apache.ignite.internal.processors.cache.persistence.file.FilePageStoreManager.CACHE_DATA_FILENAME;
+import static org.apache.ignite.internal.processors.cache.persistence.snapshot.IgniteSnapshotManager.databaseRelativePath;
+
+/** */
+@GridInternal
+public class IncrementalSnapshotVerificationTask extends AbstractSnapshotVerificationTask {
+    /** Serial version uid. */
+    private static final long serialVersionUID = 0L;
+
+    /** Ignite instance. */
+    @IgniteInstanceResource
+    private IgniteEx ignite;
+
+    /** Injected logger. */
+    @LoggerResource
+    private IgniteLogger log;
+
+    /** {@inheritDoc} */
+    @Override public SnapshotPartitionsVerifyTaskResult reduce(List<ComputeJobResult> results) throws IgniteException {
+        Map<Object, Map<Object, TransactionsHashRecord>> nodeTxHashMap = new HashMap<>();
+
+        List<List<TransactionsHashRecord>> txHashConflicts = new ArrayList<>();
+        Map<PartitionKeyV2, List<PartitionHashRecordV2>> partHashes = new HashMap<>();
+        Map<ClusterNode, Collection<GridCacheVersion>> partialCommits = new HashMap<>();
+
+        Map<ClusterNode, Exception> errors = new HashMap<>();
+
+        for (ComputeJobResult nodeRes: results) {
+            if (nodeRes.getException() != null) {
+                errors.put(nodeRes.getNode(), nodeRes.getException());
+
+                continue;
+            }
+
+            IncrementalSnapshotVerificationTaskResult res = nodeRes.getData();
+
+            if (!F.isEmpty(res.exceptions())) {
+                errors.put(nodeRes.getNode(), F.first(res.exceptions()));
+
+                continue;
+            }
+
+            if (!F.isEmpty(res.partialCommittedTxs()))
+                partialCommits.put(nodeRes.getNode(), res.partialCommittedTxs());
+
+            for (Map.Entry<PartitionKeyV2, PartitionHashRecordV2> entry: res.partHashRes().entrySet())
+                partHashes.computeIfAbsent(entry.getKey(), v -> new ArrayList<>()).add(entry.getValue());
+
+            if (log.isDebugEnabled())
+                log.debug("Handle VerifyIncrementalSnapshotJob result [node=" + nodeRes.getNode() + ", taskRes=" + res + ']');
+
+            nodeTxHashMap.put(nodeRes.getNode().consistentId(), res.txHashRes());
+
+            Iterator<Map.Entry<Object, TransactionsHashRecord>> resIt = res.txHashRes().entrySet().iterator();
+
+            while (resIt.hasNext()) {
+                Map.Entry<Object, TransactionsHashRecord> nodeTxHash = resIt.next();
+
+                Map<Object, TransactionsHashRecord> prevNodeTxHash = nodeTxHashMap.get(nodeTxHash.getKey());
+
+                if (prevNodeTxHash != null) {
+                    TransactionsHashRecord hash = nodeTxHash.getValue();
+                    TransactionsHashRecord prevHash = prevNodeTxHash.remove(hash.localConsistentId());
+
+                    if (prevHash == null || prevHash.transactionHash() != hash.transactionHash())
+                        txHashConflicts.add(F.asList(hash, prevHash));
+
+                    resIt.remove();
+                }
+            }
+        }
+
+        // Add all unmatched pairs to the conflicts.
+        nodeTxHashMap.values().stream()
+            .flatMap(e -> e.values().stream())
+            .forEach(e -> txHashConflicts.add(F.asList(e, null)));
+
+        return new SnapshotPartitionsVerifyTaskResult(
+            metas,
+            errors.isEmpty() ? new IdleVerifyResultV2(partHashes, txHashConflicts, partialCommits) : new IdleVerifyResultV2(errors));
+    }
+
+    /** {@inheritDoc} */
+    @Override protected ComputeJob createJob(
+        String name,
+        @Nullable String path,
+        int incIdx,
+        String constId,
+        Collection<String> groups,
+        boolean check
+    ) {
+        return new VerifyIncrementalSnapshotJob(name, path, incIdx, constId);
+    }
+
+    /** */
+    private static class VerifyIncrementalSnapshotJob extends ComputeJobAdapter {
+        /** Serial version uid. */
+        private static final long serialVersionUID = 0L;
+
+        /** Ignite instance. */
+        @IgniteInstanceResource
+        private IgniteEx ignite;
+
+        /** Injected logger. */
+        @LoggerResource
+        private IgniteLogger log;
+
+        /** Snapshot name to validate. */
+        private final String snpName;
+
+        /** Snapshot directory path. */
+        private final String snpPath;
+
+        /** Incremental snapshot index. */
+        private final int incIdx;
+
+        /** Consistent ID. */
+        private final String consId;
+
+        /**
+         * @param snpName Snapshot name.
+         * @param snpPath Snapshot directory path.
+         * @param incIdx Incremental snapshot index.
+         * @param consId Consistent ID.
+         */
+        public VerifyIncrementalSnapshotJob(
+            String snpName,
+            @Nullable String snpPath,
+            int incIdx,
+            String consId
+        ) {
+            this.snpName = snpName;
+            this.snpPath = snpPath;
+            this.incIdx = incIdx;
+            this.consId = consId;
+        }
+
+        /**
+         * @return Map containing the calculated transaction hashes for every remote node in the cluster.
+         */
+        @Override public IncrementalSnapshotVerificationTaskResult execute() throws IgniteException {
+            try {
+                if (log.isInfoEnabled()) {
+                    log.info("Verify incremental snapshot procedure has been initiated " +
+                        "[snpName=" + snpName + ", incrementIndex=" + incIdx + ", consId=" + consId + ']');
+                }
+
+                if (incIdx <= 0)
+                    return new IncrementalSnapshotVerificationTaskResult();
+
+                BaselineTopology blt = ignite.context().state().clusterState().baselineTopology();
+
+                checkBaseline(blt);
+
+                Map<Integer, StoredCacheData> txCaches = readTxCachesData();
+
+                IncrementalSnapshotProcessor proc = new IncrementalSnapshotProcessor(
+                    ignite.context().cache().context(), snpName, snpPath, incIdx, txCaches.keySet()
+                ) {
+                    @Override void totalWalSegments(int segCnt) {
+                        // No-op.
+                    }
+
+                    @Override void processedWalSegments(int segCnt) {
+                        // No-op.
+                    }
+
+                    @Override void initWalEntries(LongAdder entriesCnt) {
+                        // No-op.
+                    }
+                };
+
+                short locShortId = blt.consistentIdMapping().get(consId);
+
+                Set<GridCacheVersion> activeDhtTxs = new HashSet<>();
+                Map<GridCacheVersion, Set<Short>> txPrimPartNodes = new HashMap<>();
+                Map<Short, Integer> nodesTxHash = new HashMap<>();
+
+                Set<GridCacheVersion> partialCommittedTxs = new HashSet<>();
+                Map<PartitionKeyV2, PartitionHashHolder> partMap = new HashMap<>();
+                List<Exception> exceptions = new ArrayList<>();
+
+                BiConsumer<GridCacheVersion, Set<Short>> calcTransactionHash = (xid, partNodes) -> {
+                    for (short shortId: partNodes) {
+                        if (shortId != locShortId)
+                            nodesTxHash.compute(shortId, (id, hash) -> xid.hashCode() + (hash == null ? 0 : hash));
+                    }
+                };
+
+                proc.process(dataEntry -> {
+                    if (dataEntry.op() == GridCacheOperation.READ)
+                        return;
+
+                    if (!activeDhtTxs.contains(dataEntry.writeVersion()))
+                        partialCommittedTxs.add(dataEntry.nearXidVersion());
+
+                    StoredCacheData cacheData = txCaches.get(dataEntry.cacheId());
+
+                    int grpId = CU.cacheGroupId(cacheData.config().getName(), cacheData.config().getGroupName());
+
+                    PartitionKeyV2 partKey = new PartitionKeyV2(grpId, dataEntry.partitionId(), CU.cacheOrGroupName(cacheData.config()));
+
+                    partMap.compute(partKey, (k, v) -> {
+                        try {
+                            int valHash = dataEntry.key().hashCode() + Arrays.hashCode(dataEntry.value().valueBytes(null));
+                            int verHash = dataEntry.writeVersion().hashCode();
+
+                            if (v == null)
+                                v = new PartitionHashHolder();
+
+                            v.increment(valHash, verHash);
+
+                            return v;
+                        }
+                        catch (IgniteCheckedException ex) {
+                            exceptions.add(ex);
+
+                            return null;
+                        }
+                    });
+                }, txRec -> {
+                    if (txRec.state() == TransactionState.PREPARED) {
+                        // Collect only primary nodes. In some cases backup nodes are included into TxRecord#participatingNodes()
+                        // but don't actually start a transaction, for example, if a node participates only as a backup
+                        // for read-only keys.
+                        Set<Short> primPartNodes = txRec.participatingNodes().keySet();
+
+                        if (primPartNodes.contains(locShortId)) {
+                            txPrimPartNodes.put(txRec.nearXidVersion(), primPartNodes);
+                            activeDhtTxs.add(txRec.writeVersion());
+                        }
+                        else {
+                            for (Collection<Short> backups: txRec.participatingNodes().values()) {
+                                if (backups.contains(ALL_NODES) || backups.contains(locShortId))
+                                    activeDhtTxs.add(txRec.writeVersion());
+                            }
+                        }
+                    }
+                    else if (txRec.state() == TransactionState.COMMITTED) {
+                        activeDhtTxs.remove(txRec.writeVersion());
+
+                        Set<Short> partNodes = txPrimPartNodes.remove(txRec.nearXidVersion());
+
+                        // Legal cases:
+                        // 1. This node is a transaction near node, but not a primary or backup node.
+                        // 2. This node participated in the transaction multiple times (e.g., primary for one key and backup for another key).
+                        // 3. The transaction is included into a previous incremental snapshot.
+                        if (partNodes == null)
+                            return;
+
+                        calcTransactionHash.accept(txRec.nearXidVersion(), partNodes);
+                    }
+                    else if (txRec.state() == TransactionState.ROLLED_BACK) {
+                        activeDhtTxs.remove(txRec.writeVersion());
+                        txPrimPartNodes.remove(txRec.nearXidVersion());
+                    }
+                });
+
+                // All active transactions that didn't log COMMITTED or ROLLED_BACK records are considered committed.
+                // This is possible because an incremental snapshot may start after a transaction left the IgniteTxManager#activeTransactions() collection,
+                // but complete before the final TxRecord was written.
+                for (Map.Entry<GridCacheVersion, Set<Short>> tx: txPrimPartNodes.entrySet())
+                    calcTransactionHash.accept(tx.getKey(), tx.getValue());
+
+                Map<Object, TransactionsHashRecord> txHashRes = nodesTxHash.entrySet().stream()
+                    .map(e -> new TransactionsHashRecord(consId, blt.compactIdMapping().get(e.getKey()), e.getValue()))
+                    .collect(Collectors.toMap(TransactionsHashRecord::remoteConsistentId, Function.identity()));
+
+                Map<PartitionKeyV2, PartitionHashRecordV2> partHashRes = partMap.entrySet().stream()
+                    .collect(Collectors.toMap(Map.Entry::getKey, e -> new PartitionHashRecordV2(
+                        e.getKey(), false, consId, e.getValue().hash, e.getValue().verHash, null, 0, null)));
+
+                return new IncrementalSnapshotVerificationTaskResult(txHashRes, partHashRes, partialCommittedTxs, exceptions);
+            }
+            catch (IgniteCheckedException | IOException e) {
+                throw new IgniteException(e);
+            }
+        }
+
+        /** Checks that the current baseline topology matches the baseline topology of the snapshot. */
+        private void checkBaseline(BaselineTopology blt) throws IgniteCheckedException, IOException {
+            IgniteSnapshotManager snpMgr = ignite.context().cache().context().snapshotMgr();
+
+            File snpDir = snpMgr.snapshotLocalDir(snpName, snpPath);
+            SnapshotMetadata meta = snpMgr.readSnapshotMetadata(snpDir, ignite.localNode().consistentId().toString());
+
+            String errMsg = "Topologies of snapshot and current cluster are different [snp=" +
+                meta.baselineNodes() + ", current=" + blt.consistentIds() + ']';
+
+            if (blt.size() != meta.baselineNodes().size())
+                throw new IgniteCheckedException(errMsg);
+
+            for (Object consistentId: blt.consistentIds()) {
+                if (!meta.baselineNodes().contains(consistentId.toString()))
+                    throw new IgniteCheckedException(errMsg);
+            }
+        }
+
+        /** @return Collection of snapshotted transactional caches, keyed by cache ID. */
+        private Map<Integer, StoredCacheData> readTxCachesData() throws IgniteCheckedException, IOException {
+            File snpDir = ignite.context().cache().context().snapshotMgr().snapshotLocalDir(snpName, snpPath);
+
+            String folderName = ignite.context().pdsFolderResolver().resolveFolders().folderName();
+
+            File snpDbDir = new File(snpDir, databaseRelativePath(folderName));
+
+            Map<Integer, StoredCacheData> cacheData = new HashMap<>();
+
+            File[] caches = snpDbDir.listFiles();
+
+            for (File cache: caches) {
+                File[] cfgs = cache.listFiles(p -> Files.isRegularFile(p.toPath()) && p.getName().endsWith(CACHE_DATA_FILENAME));
+
+                for (File cfg: cfgs) {
+                    StoredCacheData data = ignite.context().cache().configManager().readCacheData(cfg);
+
+                    if (data.config().getAtomicityMode() == CacheAtomicityMode.TRANSACTIONAL)
+                        cacheData.put(data.cacheId(), data);
+                }
+            }
+
+            return cacheData;
+        }
+
+        /** {@inheritDoc} */
+        @Override public boolean equals(Object o) {
+            if (this == o)
+                return true;
+
+            if (o == null || getClass() != o.getClass())
+                return false;
+
+            VerifyIncrementalSnapshotJob job = (VerifyIncrementalSnapshotJob)o;
+
+            return snpName.equals(job.snpName) && incIdx == job.incIdx && Objects.equals(snpPath, job.snpPath)
+                && consId.equals(job.consId);
+        }
+
+        /** {@inheritDoc} */
+        @Override public int hashCode() {
+            return Objects.hash(snpName, incIdx, snpPath, consId);
+        }
+    }
+
+    /** Holder for partition hashes. */
+    private static class PartitionHashHolder {
+        /** */
+        private int hash;

Review Comment:
   I made it as `int`, because `PartitionHashRecordV2` stores hashes as `int` too: `partHash`, `partVerHash`.
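   For reference, both accumulators here lean on plain `int` addition being commutative and wrapping on overflow, so the totals don't depend on WAL replay order. A minimal sketch of that idea (the `verHash` field and the `increment` body are assumptions based on the visible call sites, not the exact PR code):

   ```java
   // Sketch: order-independent hash accumulation over int, mirroring
   // PartitionHashHolder and the nodesTxHash.compute(..) folding above.
   // Summing hashes is commutative and wraps on overflow, so two nodes that
   // observe the same set of updates in any order end up with equal totals.
   class PartitionHashSketch {
       private int hash;    // accumulated entry hash, like PartitionHashHolder#hash
       private int verHash; // accumulated version hash (assumed companion field)

       void increment(int valHash, int verHash) {
           this.hash += valHash;   // int overflow wraps; fine for equality checks
           this.verHash += verHash;
       }
   }
   ```

   That also matches why `int` suffices for the `partHash`/`partVerHash` comparison in `PartitionHashRecordV2`: only equality of the accumulated values matters, not their magnitude.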


