using Akka.Cluster; using Microsoft.EntityFrameworkCore; using Microsoft.Extensions.DependencyInjection; using Shouldly; using Xunit; using ZB.MOM.WW.OtOpcUa.Commons.Interfaces; using ZB.MOM.WW.OtOpcUa.Commons.Messages.Admin; using ZB.MOM.WW.OtOpcUa.Configuration; using ZB.MOM.WW.OtOpcUa.Configuration.Enums; namespace ZB.MOM.WW.OtOpcUa.Host.IntegrationTests; /// /// Failover scenarios layered on Stop/Restart primitives. /// Covers graceful node loss, rejoin on the same Akka port, and deployment under reduced membership. /// public sealed class FailoverDuringDeployTests { private static CancellationToken Ct => TestContext.Current.CancellationToken; [Fact] public async Task Stopping_node_b_shrinks_cluster_to_one_up_member() { await using var harness = await TwoNodeClusterHarness.StartAsync(); Akka.Cluster.Cluster.Get(harness.NodeASystem).State.Members .Count(m => m.Status == MemberStatus.Up).ShouldBe(2); await harness.StopNodeBAsync(); await harness.WaitForClusterSizeAsync(1, TimeSpan.FromSeconds(20)); Akka.Cluster.Cluster.Get(harness.NodeASystem).State.Members .Count(m => m.Status == MemberStatus.Up).ShouldBe(1); } [Fact] public async Task Restarted_node_b_rejoins_cluster_on_same_port() { await using var harness = await TwoNodeClusterHarness.StartAsync(); await harness.StopNodeBAsync(); await harness.WaitForClusterSizeAsync(1, TimeSpan.FromSeconds(20)); await harness.RestartNodeBAsync(); Akka.Cluster.Cluster.Get(harness.NodeASystem).State.Members .Count(m => m.Status == MemberStatus.Up).ShouldBe(2); Akka.Cluster.Cluster.Get(harness.NodeBSystem).State.Members .Count(m => m.Status == MemberStatus.Up).ShouldBe(2); } [Fact] public async Task Deployment_started_with_node_b_down_seals_with_one_node_state() { // Establishes that ConfigPublishCoordinator.DiscoverDriverNodes snapshots membership at // dispatch time — when only node A is Up, only one ApplyAck is expected and the // deployment seals without B ever participating. await using var harness = await TwoNodeClusterHarness.StartAsync(); await harness.StopNodeBAsync(); await harness.WaitForClusterSizeAsync(1, TimeSpan.FromSeconds(20)); await using var scope = harness.NodeA.Services.CreateAsyncScope(); var client = scope.ServiceProvider.GetRequiredService(); var result = await client.StartDeploymentAsync(createdBy: "alice@test", Ct); result.Outcome.ShouldBe(StartDeploymentOutcome.Accepted); var deploymentId = result.DeploymentId!.Value.Value; await WaitForAsync(async () => { await using var db = await CreateDbAsync(harness); var d = await db.Deployments.AsNoTracking() .FirstOrDefaultAsync(d => d.DeploymentId == deploymentId, Ct); return d?.Status == DeploymentStatus.Sealed; }, TimeSpan.FromSeconds(15)); await using var db = await CreateDbAsync(harness); var nodeStates = await db.NodeDeploymentStates.AsNoTracking() .Where(s => s.DeploymentId == deploymentId) .ToListAsync(Ct); nodeStates.Count.ShouldBe(1); nodeStates[0].Status.ShouldBe(NodeDeploymentStatus.Applied); } private static async Task CreateDbAsync(TwoNodeClusterHarness harness) { var factory = harness.NodeA.Services.GetRequiredService>(); return await factory.CreateDbContextAsync(); } private static async Task WaitForAsync(Func> condition, TimeSpan timeout) { var deadline = DateTime.UtcNow + timeout; while (DateTime.UtcNow < deadline) { if (await condition()) return; await Task.Delay(200); } throw new TimeoutException($"Condition not met within {timeout}"); } }