Group all 69 projects into category subfolders under src/ and tests/ so the Rider Solution Explorer mirrors the module structure. Folders: Core, Server, Drivers (with a nested Driver CLIs subfolder), Client, Tooling. - Move every project folder on disk with git mv (history preserved as renames). - Recompute relative paths in 57 .csproj files: cross-category ProjectReferences, the lib/ HintPath+None refs in Driver.Historian.Wonderware, and the external mxaccessgw refs in Driver.Galaxy and its test project. - Rebuild ZB.MOM.WW.OtOpcUa.slnx with nested solution folders. - Re-prefix project paths in functional scripts (e2e, compliance, smoke SQL, integration, install). Build green (0 errors); unit tests pass. Docs left for a separate pass. Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
107 lines
6.7 KiB
C#
107 lines
6.7 KiB
C#
using ZB.MOM.WW.OtOpcUa.Core.Abstractions;
|
||
|
||
namespace ZB.MOM.WW.OtOpcUa.Core.Resilience;
|
||
|
||
/// <summary>
|
||
/// Per-tier × per-capability resilience policy configuration for a driver instance.
|
||
/// Bound from <c>DriverInstance.ResilienceConfig</c> JSON (nullable column; null = tier defaults).
|
||
/// Per <c>docs/v2/plan.md</c> decisions #143 and #144.
|
||
/// </summary>
|
||
public sealed record DriverResilienceOptions
|
||
{
|
||
/// <summary>Tier the owning driver type is registered as; drives the default map.</summary>
|
||
public required DriverTier Tier { get; init; }
|
||
|
||
/// <summary>
|
||
/// Per-capability policy overrides. Capabilities absent from this map fall back to
|
||
/// <see cref="GetTierDefaults(DriverTier)"/> for the configured <see cref="Tier"/>.
|
||
/// </summary>
|
||
public IReadOnlyDictionary<DriverCapability, CapabilityPolicy> CapabilityPolicies { get; init; }
|
||
= new Dictionary<DriverCapability, CapabilityPolicy>();
|
||
|
||
/// <summary>Bulkhead (max concurrent in-flight calls) for every capability. Default 32.</summary>
|
||
public int BulkheadMaxConcurrent { get; init; } = 32;
|
||
|
||
/// <summary>
|
||
/// Bulkhead queue depth. Zero = no queueing; overflow fails fast with
|
||
/// <c>BulkheadRejectedException</c>. Default 64.
|
||
/// </summary>
|
||
public int BulkheadMaxQueue { get; init; } = 64;
|
||
|
||
/// <summary>
|
||
/// Periodic scheduled recycle interval for Tier C out-of-process hosts, in seconds.
|
||
/// Null (the default) = no scheduled recycle; the driver's Host process keeps running
|
||
/// indefinitely unless a memory breach or operator action triggers a recycle. Only
|
||
/// respected for <see cref="DriverTier.C"/>; Tier A/B recycle would tear down every
|
||
/// OPC UA session, so the loader ignores non-null values for those tiers + logs a
|
||
/// warning (per decisions #74 / #145).
|
||
/// </summary>
|
||
public int? RecycleIntervalSeconds { get; init; }
|
||
|
||
/// <summary>
|
||
/// Look up the effective policy for a capability, falling back to tier defaults when no
|
||
/// override is configured. Never returns null.
|
||
/// </summary>
|
||
public CapabilityPolicy Resolve(DriverCapability capability)
|
||
{
|
||
if (CapabilityPolicies.TryGetValue(capability, out var policy))
|
||
return policy;
|
||
|
||
var defaults = GetTierDefaults(Tier);
|
||
return defaults[capability];
|
||
}
|
||
|
||
/// <summary>
|
||
/// Per-tier per-capability default policy table, per decisions #143-144 and the Phase 6.1
|
||
/// Stream A.2 specification. Retries skipped on <see cref="DriverCapability.Write"/> and
|
||
/// <see cref="DriverCapability.AlarmAcknowledge"/> regardless of tier.
|
||
/// </summary>
|
||
public static IReadOnlyDictionary<DriverCapability, CapabilityPolicy> GetTierDefaults(DriverTier tier) =>
|
||
tier switch
|
||
{
|
||
DriverTier.A => new Dictionary<DriverCapability, CapabilityPolicy>
|
||
{
|
||
[DriverCapability.Read] = new(TimeoutSeconds: 2, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.Write] = new(TimeoutSeconds: 2, RetryCount: 0, BreakerFailureThreshold: 5),
|
||
[DriverCapability.Discover] = new(TimeoutSeconds: 30, RetryCount: 2, BreakerFailureThreshold: 3),
|
||
[DriverCapability.Subscribe] = new(TimeoutSeconds: 5, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.Probe] = new(TimeoutSeconds: 2, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.AlarmSubscribe] = new(TimeoutSeconds: 5, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.AlarmAcknowledge] = new(TimeoutSeconds: 5, RetryCount: 0, BreakerFailureThreshold: 5),
|
||
[DriverCapability.HistoryRead] = new(TimeoutSeconds: 30, RetryCount: 2, BreakerFailureThreshold: 5),
|
||
},
|
||
DriverTier.B => new Dictionary<DriverCapability, CapabilityPolicy>
|
||
{
|
||
[DriverCapability.Read] = new(TimeoutSeconds: 4, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.Write] = new(TimeoutSeconds: 4, RetryCount: 0, BreakerFailureThreshold: 5),
|
||
[DriverCapability.Discover] = new(TimeoutSeconds: 60, RetryCount: 2, BreakerFailureThreshold: 3),
|
||
[DriverCapability.Subscribe] = new(TimeoutSeconds: 8, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.Probe] = new(TimeoutSeconds: 4, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.AlarmSubscribe] = new(TimeoutSeconds: 8, RetryCount: 3, BreakerFailureThreshold: 5),
|
||
[DriverCapability.AlarmAcknowledge] = new(TimeoutSeconds: 8, RetryCount: 0, BreakerFailureThreshold: 5),
|
||
[DriverCapability.HistoryRead] = new(TimeoutSeconds: 60, RetryCount: 2, BreakerFailureThreshold: 5),
|
||
},
|
||
DriverTier.C => new Dictionary<DriverCapability, CapabilityPolicy>
|
||
{
|
||
[DriverCapability.Read] = new(TimeoutSeconds: 10, RetryCount: 1, BreakerFailureThreshold: 0),
|
||
[DriverCapability.Write] = new(TimeoutSeconds: 10, RetryCount: 0, BreakerFailureThreshold: 0),
|
||
[DriverCapability.Discover] = new(TimeoutSeconds: 120, RetryCount: 1, BreakerFailureThreshold: 0),
|
||
[DriverCapability.Subscribe] = new(TimeoutSeconds: 15, RetryCount: 1, BreakerFailureThreshold: 0),
|
||
[DriverCapability.Probe] = new(TimeoutSeconds: 10, RetryCount: 1, BreakerFailureThreshold: 0),
|
||
[DriverCapability.AlarmSubscribe] = new(TimeoutSeconds: 15, RetryCount: 1, BreakerFailureThreshold: 0),
|
||
[DriverCapability.AlarmAcknowledge] = new(TimeoutSeconds: 15, RetryCount: 0, BreakerFailureThreshold: 0),
|
||
[DriverCapability.HistoryRead] = new(TimeoutSeconds: 120, RetryCount: 1, BreakerFailureThreshold: 0),
|
||
},
|
||
_ => throw new ArgumentOutOfRangeException(nameof(tier), tier, $"No default policy table defined for tier {tier}."),
|
||
};
|
||
}
|
||
|
||
/// <summary>Policy for one capability on one driver instance.</summary>
|
||
/// <param name="TimeoutSeconds">Per-call timeout (wraps the inner Polly execution).</param>
|
||
/// <param name="RetryCount">Number of retry attempts after the first failure; zero = no retry.</param>
|
||
/// <param name="BreakerFailureThreshold">
|
||
/// Consecutive-failure count that opens the circuit breaker; zero = no breaker
|
||
/// (Tier C uses the supervisor's process-level breaker instead, per decision #68).
|
||
/// </param>
|
||
public sealed record CapabilityPolicy(int TimeoutSeconds, int RetryCount, int BreakerFailureThreshold);
|