test: added new raft rejoin test

lvca · lvca · commit bfafd9bb5dae · 2026-05-05T11:11:29.000-04:00
diff --git a/ha-raft/src/test/java/com/arcadedb/server/ha/raft/RaftPriorityRejoinIT.java b/ha-raft/src/test/java/com/arcadedb/server/ha/raft/RaftPriorityRejoinIT.java
@@ -0,0 +1,250 @@
+/*
+ * Copyright 2021-present Arcade Data Ltd (info@arcadedata.com)
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ *     http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ *
+ * SPDX-FileCopyrightText: 2021-present Arcade Data Ltd (info@arcadedata.com)
+ * SPDX-License-Identifier: Apache-2.0
+ */
+package com.arcadedb.server.ha.raft;
+
+import com.arcadedb.ContextConfiguration;
+import com.arcadedb.GlobalConfiguration;
+import com.arcadedb.graph.MutableVertex;
+import com.arcadedb.log.LogManager;
+import com.arcadedb.server.ArcadeDBServer;
+import com.arcadedb.utility.CodeUtils;
+import org.junit.jupiter.api.Tag;
+import org.junit.jupiter.api.Test;
+
+import java.util.logging.Level;
+
+import static org.assertj.core.api.Assertions.assertThat;
+
+/**
+ * Regression test for issue #4081.
+ * <p>
+ * Reproduces the user's reported scenario: a 4-node cluster where node 0 has the
+ * highest leader-election priority and node 3 is a replica. After:
+ * <ol>
+ *   <li>Killing the priority leader (node 0)</li>
+ *   <li>Restarting it (Raft storage is wiped because {@code raftPersistStorage=false})</li>
+ *   <li>Letting it become leader again via priority</li>
+ *   <li>Stopping the replica (node 3)</li>
+ *   <li>Restarting the replica (Raft storage is wiped)</li>
+ * </ol>
+ * the leader must not get stuck in an INCONSISTENCY/append-entries loop. The cluster must
+ * eventually converge: writes succeed and the rejoined replica catches up.
+ *
+ * @author Luca Garulli (l.garulli@arcadedata.com)
+ */
+@Tag("slow")
+class RaftPriorityRejoinIT extends BaseRaftHATest {
+
+  private static final int BASE_RAFT_PORT = 2434;
+  private static final int BASE_HTTP_PORT = 2480;
+
+  @Override
+  protected int getServerCount() {
+    return 4;
+  }
+
+  @Override
+  protected boolean persistentRaftStorage() {
+    // The user's setup uses default (false). Storage is wiped on every restart.
+    return false;
+  }
+
+  @Override
+  protected String getServerAddresses() {
+    // Mirror the user's configuration: priorities 10/8/6/0, last node is replica role.
+    final int[] priorities = { 10, 8, 6, 0 };
+    final StringBuilder sb = new StringBuilder();
+    for (int i = 0; i < getServerCount(); i++) {
+      if (i > 0)
+        sb.append(",");
+      sb.append("localhost:").append(BASE_RAFT_PORT + i)
+          .append(":").append(BASE_HTTP_PORT + i)
+          .append(":").append(priorities[i]);
+    }
+    return sb.toString();
+  }
+
+  @Override
+  protected void onServerConfiguration(final ContextConfiguration config) {
+    super.onServerConfiguration(config);
+    config.setValue(GlobalConfiguration.HA_QUORUM, "majority");
+    // Mirror the user's adb*.sh: quorumTimeout=1000ms.
+    config.setValue(GlobalConfiguration.HA_QUORUM_TIMEOUT, 1_000L);
+
+    // Tag the last server as replica role (mirrors the user's adb4.sh).
+    final String serverName = config.getValueAsString(GlobalConfiguration.SERVER_NAME);
+    final int idx = Integer.parseInt(serverName.substring(serverName.lastIndexOf('_') + 1));
+    if (idx == getServerCount() - 1)
+      config.setValue(GlobalConfiguration.HA_SERVER_ROLE, "replica");
+
+    // Keep election timeouts small so the test runs in reasonable time.
+    config.setValue(GlobalConfiguration.HA_ELECTION_TIMEOUT_MIN, 1_000);
+    config.setValue(GlobalConfiguration.HA_ELECTION_TIMEOUT_MAX, 2_000);
+  }
+
+  @Test
+  void leaderRestartThenReplicaRestartConverges() {
+    // Step 1: write some data with all nodes online.
+    final int firstLeader = findLeaderIndex();
+    assertThat(firstLeader).as("a Raft leader must be elected at startup").isGreaterThanOrEqualTo(0);
+
+    final var leaderDb = getServerDatabase(firstLeader, getDatabaseName());
+    leaderDb.transaction(() -> {
+      if (!leaderDb.getSchema().existsType("Issue4081"))
+        leaderDb.getSchema().createVertexType("Issue4081");
+    });
+
+    // Many small transactions so the Raft log has plenty of entries to replicate.
+    for (int t = 0; t < 50; t++) {
+      final int base = t * 10;
+      leaderDb.transaction(() -> {
+        for (int i = 0; i < 10; i++) {
+          final MutableVertex v = leaderDb.newVertex("Issue4081");
+          v.set("phase", "initial");
+          v.set("idx", base + i);
+          v.save();
+        }
+      });
+    }
+
+    assertClusterConsistency();
+
+    // Step 2: kill the priority-leader (server 0).
+    LogManager.instance().log(this, Level.INFO, "TEST: stopping priority leader (server 0)");
+    getServer(0).stop();
+    while (getServer(0).getStatus() == ArcadeDBServer.STATUS.SHUTTING_DOWN)
+      CodeUtils.sleep(200);
+
+    // Step 3: wait for a new leader among the remaining nodes.
+    final int interimLeader = waitForAnyLeader(0);
+    assertThat(interimLeader).as("a new leader must be elected after stopping server 0").isGreaterThanOrEqualTo(0);
+    assertThat(interimLeader).isNotEqualTo(0);
+
+    // Write more so the interim leader's log advances beyond the killed leader's snapshot point.
+    final var interimDb = getServerDatabase(interimLeader, getDatabaseName());
+    for (int t = 0; t < 30; t++) {
+      final int base = t * 10;
+      interimDb.transaction(() -> {
+        for (int i = 0; i < 10; i++) {
+          final MutableVertex v = interimDb.newVertex("Issue4081");
+          v.set("phase", "after-leader-stop");
+          v.set("idx", base + i);
+          v.save();
+        }
+      });
+    }
+
+    // Step 4: restart server 0. Its Raft storage was wiped (persistStorage=false) so it joins fresh.
+    LogManager.instance().log(this, Level.INFO, "TEST: restarting server 0");
+    getServer(0).start();
+
+    // Step 5: with priority 10, server 0 should become the leader again. Wait for that.
+    final int reLeader = waitForLeader(0, 60_000);
+    assertThat(reLeader).as("server 0 should reclaim leadership via priority").isEqualTo(0);
+
+    // Confirm the cluster is functional with server 0 as leader.
+    final var reLeaderDb = getServerDatabase(0, getDatabaseName());
+    for (int t = 0; t < 30; t++) {
+      final int base = t * 10;
+      reLeaderDb.transaction(() -> {
+        for (int i = 0; i < 10; i++) {
+          final MutableVertex v = reLeaderDb.newVertex("Issue4081");
+          v.set("phase", "after-leader-rejoin");
+          v.set("idx", base + i);
+          v.save();
+        }
+      });
+    }
+
+    // Step 6: stop the replica (server 3).
+    LogManager.instance().log(this, Level.INFO, "TEST: stopping replica (server 3)");
+    getServer(3).stop();
+    while (getServer(3).getStatus() == ArcadeDBServer.STATUS.SHUTTING_DOWN)
+      CodeUtils.sleep(200);
+
+    // Write more so the leader's log advances while the replica is offline.
+    // Aim for enough entries to cross the snapshot threshold so the leader's log gets purged.
+    for (int t = 0; t < 30; t++) {
+      final int base = t * 10;
+      reLeaderDb.transaction(() -> {
+        for (int i = 0; i < 10; i++) {
+          final MutableVertex v = reLeaderDb.newVertex("Issue4081");
+          v.set("phase", "while-replica-down");
+          v.set("idx", base + i);
+          v.save();
+        }
+      });
+    }
+
+    // Step 7: restart the replica. Storage is wiped so it joins as a fresh peer.
+    LogManager.instance().log(this, Level.INFO, "TEST: restarting replica (server 3)");
+    getServer(3).start();
+
+    // Step 8: the replica must catch up. The leader must NOT get stuck in an INCONSISTENCY loop.
+    waitForReplicationIsCompleted(3);
+
+    // Final write to confirm the cluster is fully operational.
+    for (int t = 0; t < 30; t++) {
+      final int base = t * 10;
+      reLeaderDb.transaction(() -> {
+        for (int i = 0; i < 10; i++) {
+          final MutableVertex v = reLeaderDb.newVertex("Issue4081");
+          v.set("phase", "final");
+          v.set("idx", base + i);
+          v.save();
+        }
+      });
+    }
+
+    assertClusterConsistency();
+
+    // Every node must hold all 1700 vertices (50+30+30+30+30 transactions x 10 vertices each).
+    final long expected = (50 + 30 + 30 + 30 + 30) * 10L;
+    for (int i = 0; i < getServerCount(); i++) {
+      final long count = getServerDatabase(i, getDatabaseName()).countType("Issue4081", true);
+      assertThat(count).as("server " + i + " should have all " + expected + " records").isEqualTo(expected);
+    }
+  }
+
+  private int waitForAnyLeader(final int excludeIndex) {
+    final long deadline = System.currentTimeMillis() + 30_000;
+    while (System.currentTimeMillis() < deadline) {
+      for (int i = 0; i < getServerCount(); i++) {
+        if (i == excludeIndex)
+          continue;
+        final RaftHAPlugin plugin = getRaftPlugin(i);
+        if (plugin != null && plugin.isLeader())
+          return i;
+      }
+      CodeUtils.sleep(250);
+    }
+    return -1;
+  }
+
+  private int waitForLeader(final int expectedIndex, final long timeoutMs) {
+    final long deadline = System.currentTimeMillis() + timeoutMs;
+    while (System.currentTimeMillis() < deadline) {
+      final RaftHAPlugin plugin = getRaftPlugin(expectedIndex);
+      if (plugin != null && plugin.isLeader())
+        return expectedIndex;
+      CodeUtils.sleep(500);
+    }
+    return -1;
+  }
+}