Skip to content

Commit

Permalink
HashedWheelTimer startup crash on .NET 6+ (#7174)
Browse files Browse the repository at this point in the history
* `HashedWheelTimer` startup crash on .NET 6+

More issues with the `PeriodicTimer` - this time it's a bit of a spooky heisenbug. Added a spec that can reproduce it but it must be run continuously in order to catch it.

* fixed issue with `HashedWheelTimer` startup

* restored volatile, cache value before comparand
  • Loading branch information
Aaronontheweb authored Apr 26, 2024
1 parent 906c4d1 commit 1ef1869
Show file tree
Hide file tree
Showing 2 changed files with 104 additions and 5 deletions.
97 changes: 97 additions & 0 deletions src/core/Akka.Tests/Actor/TimerStartupCrashBugFixSpec.cs
Original file line number Diff line number Diff line change
@@ -0,0 +1,97 @@
// -----------------------------------------------------------------------
// <copyright file="TimerStartupCrashBugFixSpec.cs" company="Akka.NET Project">
// Copyright (C) 2009-2024 Lightbend Inc. <http://www.lightbend.com>
// Copyright (C) 2013-2024 .NET Foundation <https://github.com/akkadotnet/akka.net>
// </copyright>
// -----------------------------------------------------------------------

#nullable enable
using System;
using System.Linq;
using System.Threading.Tasks;
using Akka.Actor;
using Akka.Event;
using Akka.Routing;
using Akka.TestKit;
using FluentAssertions;
using FsCheck;
using Xunit;
using Xunit.Abstractions;

namespace Akka.Tests.Actor;

public class TimerStartupCrashBugFixSpec : AkkaSpec
{
public TimerStartupCrashBugFixSpec(ITestOutputHelper output) : base(output: output, Akka.Configuration.Config.Empty)
{
Sys.Log.Info("Starting TimerStartupCrashBugFixSpec");
}

private class TimerActor : UntypedActor, IWithTimers
{
public sealed class Check
{
public static Check Instance { get; } = new Check();

private Check()
{
}
}

public sealed class Hit
{
public static Hit Instance { get; } = new Hit();

private Hit()
{
}
}

private readonly ILoggingAdapter _log = Context.GetLogger();
private int _counter = 0;
public ITimerScheduler? Timers { get; set; } = null;

protected override void PreStart()
{
Timers?.StartPeriodicTimer("key", Hit.Instance, TimeSpan.FromMilliseconds(1));
}

protected override void OnReceive(object message)
{
switch (message)
{
case Check _:
_log.Info("Check received");
Sender.Tell(_counter);
break;
case Hit _:
_log.Info("Hit received");
_counter++;
break;
}
}

protected override void PreRestart(Exception reason, object message)
{
_log.Error(reason, "Not restarting - shutting down");
Context.Stop(Self);
}
}

[Fact]
public async Task TimerActor_should_not_crash_on_startup()
{
var actors = Enumerable.Range(0, 10).Select(c => Sys.ActorOf(Props.Create(() => new TimerActor()))).ToList();
var watchTasks = actors.Select(actor => actor.WatchAsync()).ToList();

var i = 0;
while (i == 0)
{
// guarantee that the actor has started and processed a message from scheduler
i = await actors[0].Ask<int>(TimerActor.Check.Instance);
}


watchTasks.Any(c => c.IsCompleted).Should().BeFalse();
}
}
12 changes: 7 additions & 5 deletions src/core/Akka/Actor/Scheduler/HashedWheelTimerScheduler.cs
Original file line number Diff line number Diff line change
Expand Up @@ -147,25 +147,27 @@ private static int NormalizeTicksPerWheel(int ticksPerWheel)

private void Start()
{
if (_workerState == WORKER_STATE_STARTED)
// only read the worker state once so it can't be a moving target for else-branch
var workerStateRead = _workerState;
if (workerStateRead == WORKER_STATE_STARTED)
{
// do nothing
}
else if (_workerState == WORKER_STATE_INIT)
else if (workerStateRead == WORKER_STATE_INIT)
{
if (Interlocked.CompareExchange(ref _workerState, WORKER_STATE_STARTED, WORKER_STATE_INIT) == WORKER_STATE_INIT)
{
_timer ??= new PeriodicTimer(_timerDuration);
Task.Run(() => RunAsync(_cts.Token)); // start the clock
Task.Run(() => RunAsync(_cts.Token).ConfigureAwait(false)); // start the clock
}
}
else if (_workerState == WORKER_STATE_SHUTDOWN)
else if (workerStateRead == WORKER_STATE_SHUTDOWN)
{
throw new SchedulerException("cannot enqueue after timer shutdown");
}
else
{
throw new InvalidOperationException($"Worker in invalid state: {_workerState}");
throw new InvalidOperationException($"Worker in invalid state: {workerStateRead}");
}

if(_startTime == 0)
Expand Down

0 comments on commit 1ef1869

Please sign in to comment.