From 5a8029df19146b9beec1983cf269445e36c52d49 Mon Sep 17 00:00:00 2001 From: Martin Taillefer Date: Tue, 27 Jun 2023 07:05:32 -0700 Subject: [PATCH] Simplify task handling in MeteringCollector to avoid racy edge case (#4121) Co-authored-by: Martin Taillefer --- .../Metering/MetricCollector.cs | 53 ++++++++++++------- 1 file changed, 34 insertions(+), 19 deletions(-) diff --git a/src/Libraries/Microsoft.Extensions.Telemetry.Testing/Metering/MetricCollector.cs b/src/Libraries/Microsoft.Extensions.Telemetry.Testing/Metering/MetricCollector.cs index f6c73163a13..4d162b9b5ab 100644 --- a/src/Libraries/Microsoft.Extensions.Telemetry.Testing/Metering/MetricCollector.cs +++ b/src/Libraries/Microsoft.Extensions.Telemetry.Testing/Metering/MetricCollector.cs @@ -130,18 +130,19 @@ public void Dispose() } _disposed = true; + } - _meterListener.Dispose(); - _measurements.Clear(); - - // wake up anybody still waiting and inform them of the bad news: their horse is dead... - foreach (var w in _waiters) - { - _ = w.TaskSource.TrySetException(MakeObjectDisposedException()); - } + _meterListener.Dispose(); + _measurements.Clear(); - _waiters.Clear(); + // wake up anybody still waiting and inform them of the bad news: their horse is dead... + foreach (var w in _waiters) + { + // trigger the task from outside the lock + _ = w.TaskSource.TrySetException(MakeObjectDisposedException()); } + + _waiters.Clear(); } /// @@ -230,14 +231,15 @@ public Task WaitForMeasurementsAsync(int minCount, CancellationToken cancellatio { lock (_measurements) { + _waiters.Remove(w); + } + + // trigger the task from outside the lock #if NET6_0_OR_GREATER - w.TaskSource.TrySetCanceled(cancellationToken); + w.TaskSource.TrySetCanceled(cancellationToken); #else - w.TaskSource.TrySetCanceled(); + w.TaskSource.TrySetCanceled(); #endif - - _waiters.Remove(w); - } }); } @@ -298,6 +300,7 @@ private void OnMeasurementRecorded(Instrument instrument, T measurement, ReadOnl { var m = new CollectedMeasurement(measurement, tags, _timeProvider.GetUtcNow()); + List? toBeWoken = null; lock (_measurements) { if (!_disposed) @@ -310,13 +313,23 @@ private void OnMeasurementRecorded(Instrument instrument, T measurement, ReadOnl { if (_measurements.Count >= _waiters[i].MinCount) { - // we use TrySetResult since the task may already be in the Cancelled state due to a timeout. - _ = _waiters[i].TaskSource.TrySetResult(true); + toBeWoken ??= new(); + toBeWoken.Add(_waiters[i]); _waiters.RemoveAt(i); } } } } + + if (toBeWoken != null) + { + // trigger the task from outside the lock + foreach (var w in toBeWoken) + { + // we use TrySetResult since the task may already be in the Cancelled state due to a timeout. + _ = w.TaskSource.TrySetResult(true); + } + } } private void ThrowIfDisposed() @@ -341,8 +354,10 @@ public Waiter(int minCount) public int MinCount { get; } - // The TCS is modified in a lock. - // Use RunContinuationsAsynchronously to ensure continuations don't run when holding the lock. - public TaskCompletionSource TaskSource { get; } = new(TaskCreationOptions.RunContinuationsAsynchronously); + // NOTE: In order to avoid potential dead locks, this task should + // be completed when the main lock is not being held. Otherwise, + // application code being woken up by the task could potentially + // call back into the MetricCollector code and thus trigger a deadlock. + public TaskCompletionSource TaskSource { get; } = new(); } }