feat(historian-gateway): GatewayAlarmHistorianWriter — SendEvent + gRPC->outcome mapping
Claude-Session: https://claude.ai/code/session_012SDSQ3AcaXqPcBtDESBRii
This commit is contained in:
+141
@@ -0,0 +1,141 @@
|
||||
using Grpc.Core;
|
||||
using Microsoft.Extensions.Logging;
|
||||
using ZB.MOM.WW.HistorianGateway.Client;
|
||||
using ZB.MOM.WW.HistorianGateway.Contracts.Grpc;
|
||||
using ZB.MOM.WW.OtOpcUa.Core.AlarmHistorian;
|
||||
using ZB.MOM.WW.OtOpcUa.Driver.Historian.Gateway.Mapping;
|
||||
|
||||
namespace ZB.MOM.WW.OtOpcUa.Driver.Historian.Gateway;
|
||||
|
||||
/// <summary>
|
||||
/// <see cref="IAlarmHistorianWriter"/> backed by the HistorianGateway <c>SendEvent</c> path. The
|
||||
/// drain worker behind <c>SqliteStoreAndForwardSink</c> calls
|
||||
/// <see cref="WriteBatchAsync"/> and uses the returned per-event
|
||||
/// <see cref="HistorianWriteOutcome"/> to decide retry vs. dead-letter, so this writer maps every
|
||||
/// gateway result — success ack, the published client's typed exception hierarchy, raw
|
||||
/// <see cref="RpcException"/> (defensive), and any unexpected error — onto exactly one outcome per
|
||||
/// event and <b>never throws</b>.
|
||||
/// </summary>
|
||||
/// <remarks>
|
||||
/// <para>
|
||||
/// Each event is sent individually so one poison event cannot fail the whole batch: a permanent
|
||||
/// failure on event N is dead-lettered while its siblings continue. Outcomes are returned in
|
||||
/// input order, one per event; an empty batch yields an empty list with no gateway call.
|
||||
/// </para>
|
||||
/// <para>
|
||||
/// <b>Outcome mapping.</b> Success (or store-forward-queued) ack ⇒ <see cref="HistorianWriteOutcome.Ack"/>.
|
||||
/// Transient gRPC codes (<c>Unavailable</c>, <c>DeadlineExceeded</c>, <c>ResourceExhausted</c>,
|
||||
/// <c>Aborted</c>, <c>Internal</c>) and the auth codes (<c>Unauthenticated</c>,
|
||||
/// <c>PermissionDenied</c>) ⇒ <see cref="HistorianWriteOutcome.RetryPlease"/> — an auth fix
|
||||
/// re-enables the batch, so an auth blip never dead-letters. Permanent codes
|
||||
/// (<c>InvalidArgument</c>, <c>FailedPrecondition</c>, <c>OutOfRange</c>, <c>Unimplemented</c>) ⇒
|
||||
/// <see cref="HistorianWriteOutcome.PermanentFail"/> (dead-letter poison — mirrors the Wonderware
|
||||
/// <c>PerEventStatus==2</c> boundary). The typed client exceptions are classified by type, or by
|
||||
/// the <see cref="RpcException"/> they wrap; any other or unclassifiable error defaults to
|
||||
/// <see cref="HistorianWriteOutcome.PermanentFail"/> so the drain worker cannot loop a poison
|
||||
/// event forever.
|
||||
/// </para>
|
||||
/// </remarks>
|
||||
public sealed class GatewayAlarmHistorianWriter : IAlarmHistorianWriter
|
||||
{
|
||||
private readonly IHistorianGatewayClient _client;
|
||||
private readonly ILogger<GatewayAlarmHistorianWriter> _logger;
|
||||
|
||||
/// <summary>Creates the writer over a gateway client seam.</summary>
|
||||
/// <param name="client">The gateway client used for the <c>SendEvent</c> write path.</param>
|
||||
/// <param name="logger">Logger for per-event outcome diagnostics (never logs event content).</param>
|
||||
public GatewayAlarmHistorianWriter(IHistorianGatewayClient client, ILogger<GatewayAlarmHistorianWriter> logger)
|
||||
{
|
||||
_client = client ?? throw new ArgumentNullException(nameof(client));
|
||||
_logger = logger ?? throw new ArgumentNullException(nameof(logger));
|
||||
}
|
||||
|
||||
/// <inheritdoc />
|
||||
public async Task<IReadOnlyList<HistorianWriteOutcome>> WriteBatchAsync(
|
||||
IReadOnlyList<AlarmHistorianEvent> batch, CancellationToken cancellationToken)
|
||||
{
|
||||
ArgumentNullException.ThrowIfNull(batch);
|
||||
|
||||
if (batch.Count == 0)
|
||||
{
|
||||
return Array.Empty<HistorianWriteOutcome>();
|
||||
}
|
||||
|
||||
var outcomes = new HistorianWriteOutcome[batch.Count];
|
||||
|
||||
for (var i = 0; i < batch.Count; i++)
|
||||
{
|
||||
outcomes[i] = await SendOneAsync(batch[i], cancellationToken).ConfigureAwait(false);
|
||||
}
|
||||
|
||||
return outcomes;
|
||||
}
|
||||
|
||||
private async Task<HistorianWriteOutcome> SendOneAsync(AlarmHistorianEvent evt, CancellationToken cancellationToken)
|
||||
{
|
||||
try
|
||||
{
|
||||
var ack = await _client.SendEventAsync(AlarmEventMapper.ToHistorianEvent(evt), cancellationToken)
|
||||
.ConfigureAwait(false);
|
||||
return MapAck(ack);
|
||||
}
|
||||
catch (Exception exception)
|
||||
{
|
||||
// NEVER throw out of the writer — the drain worker expects a per-event outcome. Classify
|
||||
// and log only the failure category (no event content, hostnames, or credentials).
|
||||
var outcome = Classify(exception);
|
||||
if (outcome == HistorianWriteOutcome.PermanentFail)
|
||||
{
|
||||
_logger.LogWarning(
|
||||
"Alarm SendEvent permanently failed ({Exception}); dead-lettering the event.",
|
||||
exception.GetType().Name);
|
||||
}
|
||||
else
|
||||
{
|
||||
_logger.LogDebug(
|
||||
"Alarm SendEvent transiently failed ({Exception}); will retry.",
|
||||
exception.GetType().Name);
|
||||
}
|
||||
|
||||
return outcome;
|
||||
}
|
||||
}
|
||||
|
||||
// A non-success ack that the gateway durably queued (store-forward) is still accepted — do not
|
||||
// re-drain it. A non-success, non-queued ack is a soft failure: retry rather than dead-letter.
|
||||
private static HistorianWriteOutcome MapAck(WriteAck ack) =>
|
||||
ack.Success || ack.Queued ? HistorianWriteOutcome.Ack : HistorianWriteOutcome.RetryPlease;
|
||||
|
||||
private static HistorianWriteOutcome Classify(Exception exception) => exception switch
|
||||
{
|
||||
// Published client's typed hierarchy (production reality). Unavailable + both auth kinds retry.
|
||||
HistorianGatewayUnavailableException => HistorianWriteOutcome.RetryPlease,
|
||||
HistorianGatewayAuthenticationException => HistorianWriteOutcome.RetryPlease,
|
||||
HistorianGatewayAuthorizationException => HistorianWriteOutcome.RetryPlease,
|
||||
// A base client exception wrapping a permanent/transient RpcException → classify by inner status.
|
||||
HistorianGatewayException { InnerException: RpcException inner } => ClassifyStatus(inner.StatusCode),
|
||||
// Defensive raw RpcException path (the seam type signature permits it).
|
||||
RpcException rpc => ClassifyStatus(rpc.StatusCode),
|
||||
// Anything else (incl. a bare base client exception we cannot classify) → dead-letter to avoid
|
||||
// an infinite drain loop on a poison event.
|
||||
_ => HistorianWriteOutcome.PermanentFail,
|
||||
};
|
||||
|
||||
private static HistorianWriteOutcome ClassifyStatus(StatusCode code) => code switch
|
||||
{
|
||||
StatusCode.Unavailable
|
||||
or StatusCode.DeadlineExceeded
|
||||
or StatusCode.ResourceExhausted
|
||||
or StatusCode.Aborted
|
||||
or StatusCode.Internal
|
||||
// An auth fix re-enables the whole batch — never dead-letter on an auth blip.
|
||||
or StatusCode.Unauthenticated
|
||||
or StatusCode.PermissionDenied => HistorianWriteOutcome.RetryPlease,
|
||||
StatusCode.InvalidArgument
|
||||
or StatusCode.FailedPrecondition
|
||||
or StatusCode.OutOfRange
|
||||
or StatusCode.Unimplemented => HistorianWriteOutcome.PermanentFail,
|
||||
// Unknown/unclassified gRPC code → dead-letter to avoid an infinite drain loop.
|
||||
_ => HistorianWriteOutcome.PermanentFail,
|
||||
};
|
||||
}
|
||||
Reference in New Issue
Block a user