7b0b9c7365
Solution + 23 src projects + 26 test projects renamed; folders, csproj, namespaces, and ScadaLinkDbContext/ScadaBridgeDbContext class updated. ActorSystem "scadalink" → "scadabridge", Akka seed-node URLs migrated. SQL roles/logins, LDAP domains, CLI command name, and CLI config dir (~/.scadalink → ~/.scadabridge) also renamed. Build green; 5 Host.Tests fail awaiting SQL login rename in next commit. Pre-existing StaleTagMonitor timing flakes unchanged. Rename script committed at tools/rename-to-scadabridge.sh.
96 lines
4.3 KiB
C#
96 lines
4.3 KiB
C#
using Microsoft.Extensions.Options;
|
|
|
|
namespace ZB.MOM.WW.ScadaBridge.ClusterInfrastructure;
|
|
|
|
/// <summary>
|
|
/// CI-004: Validates <see cref="ClusterOptions"/> at startup. The values it
|
|
/// guards carry cluster-wide consequences — the design doc
|
|
/// (<c>Component-ClusterInfrastructure.md</c>) is emphatic that misconfiguring
|
|
/// them produces a total cluster shutdown or an indefinitely blocked singleton.
|
|
/// Registered with <c>ValidateOnStart()</c> so a bad <c>appsettings.json</c>
|
|
/// fails fast at boot rather than failing far from the cause.
|
|
/// </summary>
|
|
public sealed class ClusterOptionsValidator : IValidateOptions<ClusterOptions>
|
|
{
|
|
/// <summary>Split-brain resolver strategies safe for ScadaBridge's two-node clusters.</summary>
|
|
private static readonly HashSet<string> AllowedStrategies = new(StringComparer.OrdinalIgnoreCase)
|
|
{
|
|
"keep-oldest"
|
|
};
|
|
|
|
/// <summary>
|
|
/// Validates the cluster options, returning a failure result if any critical settings are misconfigured.
|
|
/// </summary>
|
|
/// <param name="name">Named options instance name (unused; all instances are validated identically).</param>
|
|
/// <param name="options">The cluster options to validate.</param>
|
|
public ValidateOptionsResult Validate(string? name, ClusterOptions options)
|
|
{
|
|
var failures = new List<string>();
|
|
|
|
if (options.SeedNodes is null || options.SeedNodes.Count < 2)
|
|
{
|
|
// CI-012: design doc states "both nodes are seed nodes — each node lists
|
|
// both itself and its partner" so a properly-configured deployment lists
|
|
// two. Accepting a single-seed configuration silently defeats the
|
|
// "no startup ordering dependency" guarantee called out by
|
|
// Component-ClusterInfrastructure.md (Node Configuration).
|
|
failures.Add(
|
|
"ClusterOptions.SeedNodes must contain at least 2 seed nodes "
|
|
+ "(Component-ClusterInfrastructure.md → Node Configuration: "
|
|
+ "both nodes are seed nodes); a single-seed configuration defeats "
|
|
+ "the no-startup-ordering-dependency guarantee.");
|
|
}
|
|
|
|
if (string.IsNullOrWhiteSpace(options.SplitBrainResolverStrategy)
|
|
|| !AllowedStrategies.Contains(options.SplitBrainResolverStrategy))
|
|
{
|
|
failures.Add(
|
|
$"ClusterOptions.SplitBrainResolverStrategy must be 'keep-oldest' for a two-node cluster; " +
|
|
$"'{options.SplitBrainResolverStrategy}' would risk a total cluster shutdown on a partition.");
|
|
}
|
|
|
|
if (options.MinNrOfMembers != 1)
|
|
{
|
|
failures.Add(
|
|
$"ClusterOptions.MinNrOfMembers must be 1 (was {options.MinNrOfMembers}); " +
|
|
"any other value blocks the cluster singleton after failover and halts all data collection.");
|
|
}
|
|
|
|
if (options.StableAfter <= TimeSpan.Zero)
|
|
{
|
|
failures.Add("ClusterOptions.StableAfter must be a positive duration.");
|
|
}
|
|
|
|
if (options.HeartbeatInterval <= TimeSpan.Zero)
|
|
{
|
|
failures.Add("ClusterOptions.HeartbeatInterval must be a positive duration.");
|
|
}
|
|
|
|
if (options.FailureDetectionThreshold <= TimeSpan.Zero)
|
|
{
|
|
failures.Add("ClusterOptions.FailureDetectionThreshold must be a positive duration.");
|
|
}
|
|
|
|
if (options.HeartbeatInterval >= options.FailureDetectionThreshold)
|
|
{
|
|
failures.Add(
|
|
$"ClusterOptions.HeartbeatInterval ({options.HeartbeatInterval}) must be well below " +
|
|
$"FailureDetectionThreshold ({options.FailureDetectionThreshold}); otherwise nodes are " +
|
|
"declared unreachable before a heartbeat can arrive.");
|
|
}
|
|
|
|
if (!options.DownIfAlone)
|
|
{
|
|
failures.Add(
|
|
"ClusterOptions.DownIfAlone must be true for the keep-oldest resolver "
|
|
+ "(Component-ClusterInfrastructure.md → Split-Brain Resolution); with it false the "
|
|
+ "oldest node can run as an isolated single-node cluster during a partition while the "
|
|
+ "younger node forms its own, producing two live clusters.");
|
|
}
|
|
|
|
return failures.Count > 0
|
|
? ValidateOptionsResult.Fail(failures)
|
|
: ValidateOptionsResult.Success;
|
|
}
|
|
}
|