feat: add stream replica groups and leader stepdown
This commit is contained in:
65
src/NATS.Server/JetStream/Cluster/StreamReplicaGroup.cs
Normal file
65
src/NATS.Server/JetStream/Cluster/StreamReplicaGroup.cs
Normal file
@@ -0,0 +1,65 @@
|
||||
using NATS.Server.Raft;
|
||||
|
||||
namespace NATS.Server.JetStream.Cluster;
|
||||
|
||||
/// <summary>
/// Holds the set of <see cref="RaftNode"/> replicas created for one stream and
/// tracks which of them this group currently treats as the leader.
/// </summary>
public sealed class StreamReplicaGroup
{
    private readonly List<RaftNode> _nodes;

    /// <summary>Stream name exactly as passed to the constructor.</summary>
    public string StreamName { get; }

    /// <summary>Replica nodes in creation order.</summary>
    public IReadOnlyList<RaftNode> Nodes => _nodes;

    /// <summary>The node most recently put forward as leader by this group.</summary>
    public RaftNode Leader { get; private set; }

    /// <summary>
    /// Creates the replica nodes for a stream, wires them into one cluster and
    /// runs an initial election with the first node as candidate.
    /// </summary>
    /// <param name="streamName">
    /// Stream name; its lower-invariant form is used as the prefix of each node
    /// identifier (<c>{name}-r1</c>, <c>{name}-r2</c>, ...).
    /// </param>
    /// <param name="replicas">
    /// Requested replica count. Values below 1 are clamped to 1, so the group
    /// always contains at least one node.
    /// </param>
    /// <exception cref="ArgumentNullException"><paramref name="streamName"/> is null.</exception>
    public StreamReplicaGroup(string streamName, int replicas)
    {
        // Fail at the boundary instead of with a NullReferenceException inside the LINQ lambda below.
        ArgumentNullException.ThrowIfNull(streamName);

        StreamName = streamName;

        // The prefix is the same for every replica, so compute it once.
        var idPrefix = streamName.ToLowerInvariant();
        var nodeCount = Math.Max(replicas, 1);
        _nodes = Enumerable.Range(1, nodeCount)
            .Select(i => new RaftNode($"{idPrefix}-r{i}"))
            .ToList();

        // Every node is configured with the full membership list (including itself).
        foreach (var node in _nodes)
            node.ConfigureCluster(_nodes);

        Leader = ElectLeader(_nodes[0]);
    }

    /// <summary>
    /// Proposes <paramref name="command"/> through the current leader. If the tracked
    /// leader no longer reports <c>IsLeader</c>, the next node in rotation is put
    /// through an election first and becomes the tracked leader.
    /// </summary>
    /// <param name="command">Command text forwarded to the leader's <c>ProposeAsync</c>.</param>
    /// <param name="ct">Cancellation token forwarded to the leader's <c>ProposeAsync</c>.</param>
    /// <returns>The value returned by the leader's <c>ProposeAsync</c>.</returns>
    public async ValueTask<long> ProposeAsync(string command, CancellationToken ct)
    {
        if (!Leader.IsLeader)
            Leader = ElectLeader(SelectNextCandidate(Leader));

        return await Leader.ProposeAsync(command, ct);
    }

    /// <summary>
    /// Asks the current leader to step down and runs an election for the next node
    /// in rotation, which then becomes the tracked leader.
    /// </summary>
    /// <param name="ct">Accepted for signature symmetry; not observed, the work here is synchronous.</param>
    /// <returns>An already-completed task.</returns>
    public Task StepDownAsync(CancellationToken ct)
    {
        _ = ct;

        var previous = Leader;
        previous.RequestStepDown();
        Leader = ElectLeader(SelectNextCandidate(previous));

        return Task.CompletedTask;
    }

    /// <summary>
    /// Picks the node that follows <paramref name="currentLeader"/> in <see cref="Nodes"/>,
    /// wrapping around at the end. Falls back to the first node when the group has a
    /// single member or when no node with a matching <c>Id</c> is found.
    /// </summary>
    private RaftNode SelectNextCandidate(RaftNode currentLeader)
    {
        if (_nodes.Count == 1)
            return _nodes[0];

        var index = _nodes.FindIndex(n => n.Id == currentLeader.Id);
        if (index < 0)
            return _nodes[0];

        return _nodes[(index + 1) % _nodes.Count];
    }

    /// <summary>
    /// Starts an election on <paramref name="candidate"/> and feeds it the vote response
    /// of every other node in the group.
    /// </summary>
    /// <returns>
    /// The same <paramref name="candidate"/> instance. This method does not itself check
    /// whether the candidate ended up as leader.
    /// </returns>
    private RaftNode ElectLeader(RaftNode candidate)
    {
        var clusterSize = _nodes.Count;
        candidate.StartElection(clusterSize);

        // Votes are requested at the candidate's term as it stands after StartElection.
        foreach (var voter in _nodes.Where(n => n.Id != candidate.Id))
            candidate.ReceiveVote(voter.GrantVote(candidate.Term), clusterSize);

        return candidate;
    }
}
|
||||
@@ -14,6 +14,8 @@ public sealed class StreamManager
|
||||
private readonly JetStreamMetaGroup? _metaGroup;
|
||||
private readonly ConcurrentDictionary<string, StreamHandle> _streams =
|
||||
new(StringComparer.Ordinal);
|
||||
private readonly ConcurrentDictionary<string, StreamReplicaGroup> _replicaGroups =
|
||||
new(StringComparer.Ordinal);
|
||||
private readonly ConcurrentDictionary<string, List<MirrorCoordinator>> _mirrorsByOrigin =
|
||||
new(StringComparer.Ordinal);
|
||||
private readonly ConcurrentDictionary<string, List<SourceCoordinator>> _sourcesByOrigin =
|
||||
@@ -36,6 +38,12 @@ public sealed class StreamManager
|
||||
normalized.Name,
|
||||
_ => new StreamHandle(normalized, new MemStore()),
|
||||
(_, existing) => existing with { Config = normalized });
|
||||
_replicaGroups.AddOrUpdate(
|
||||
normalized.Name,
|
||||
_ => new StreamReplicaGroup(normalized.Name, normalized.Replicas),
|
||||
(_, existing) => existing.Nodes.Count == Math.Max(normalized.Replicas, 1)
|
||||
? existing
|
||||
: new StreamReplicaGroup(normalized.Name, normalized.Replicas));
|
||||
RebuildReplicationCoordinators();
|
||||
_metaGroup?.ProposeCreateStreamAsync(normalized, default).GetAwaiter().GetResult();
|
||||
|
||||
@@ -77,6 +85,9 @@ public sealed class StreamManager
|
||||
if (stream == null)
|
||||
return null;
|
||||
|
||||
if (_replicaGroups.TryGetValue(stream.Config.Name, out var replicaGroup))
|
||||
_ = replicaGroup.ProposeAsync($"PUB {subject}", default).GetAwaiter().GetResult();
|
||||
|
||||
var seq = stream.Store.AppendAsync(subject, payload, default).GetAwaiter().GetResult();
|
||||
EnforceLimits(stream);
|
||||
var stored = stream.Store.LoadAsync(seq, default).GetAwaiter().GetResult();
|
||||
@@ -90,6 +101,14 @@ public sealed class StreamManager
|
||||
};
|
||||
}
|
||||
|
||||
/// <summary>
/// Forwards a leader step-down request to the replica group registered under
/// <paramref name="stream"/>. When no group is registered for that name the call
/// is a no-op.
/// </summary>
/// <param name="stream">Key used to look up the replica group.</param>
/// <param name="ct">Cancellation token passed through to the group's <c>StepDownAsync</c>.</param>
/// <returns>
/// The task returned by the group's <c>StepDownAsync</c>, or a completed task when
/// no group is found.
/// </returns>
public Task StepDownStreamLeaderAsync(string stream, CancellationToken ct)
    => _replicaGroups.TryGetValue(stream, out var group)
        ? group.StepDownAsync(ct)
        : Task.CompletedTask;
|
||||
|
||||
private static StreamConfig NormalizeConfig(StreamConfig config)
|
||||
{
|
||||
var copy = new StreamConfig
|
||||
|
||||
Reference in New Issue
Block a user