| | | 1 | | using System.Net.Sockets; |
| | | 2 | | using Microsoft.Extensions.DependencyInjection; |
| | | 3 | | using Microsoft.Extensions.Logging; |
| | | 4 | | |
| | | 5 | | namespace NLightning.Application.Node.Managers; |
| | | 6 | | |
| | | 7 | | using Domain.Channels.Enums; |
| | | 8 | | using Domain.Channels.Events; |
| | | 9 | | using Domain.Channels.Interfaces; |
| | | 10 | | using Domain.Crypto.ValueObjects; |
| | | 11 | | using Domain.Exceptions; |
| | | 12 | | using Domain.Node.Constants; |
| | | 13 | | using Domain.Node.Events; |
| | | 14 | | using Domain.Node.Interfaces; |
| | | 15 | | using Domain.Node.Models; |
| | | 16 | | using Domain.Node.ValueObjects; |
| | | 17 | | using Domain.Persistence.Interfaces; |
| | | 18 | | using Domain.Protocol.Constants; |
| | | 19 | | using Domain.Protocol.Interfaces; |
| | | 20 | | using Infrastructure.Protocol.Models; |
| | | 21 | | using Infrastructure.Transport.Events; |
| | | 22 | | using Infrastructure.Transport.Interfaces; |
| | | 23 | | |
| | | 24 | | /// <summary> |
| | | 25 | | /// Service for managing peers. |
| | | 26 | | /// </summary> |
| | | 27 | | /// <remarks> |
| | | 28 | | /// This class is used to manage peers in the network. |
| | | 29 | | /// </remarks> |
| | | 30 | | /// <seealso cref="IPeerManager" /> |
| | | 31 | | public sealed class PeerManager : IPeerManager |
| | | 32 | | { |
// Collaborators supplied through the constructor.
private readonly IChannelManager _channelManager;
private readonly ILogger<PeerManager> _logger;
private readonly IPeerServiceFactory _peerServiceFactory;
private readonly IServiceProvider _serviceProvider;
private readonly ITcpService _tcpService;

// Peers currently tracked by this manager, keyed by their compact public key.
// Entries are added when a connection is established and removed on disconnection.
private readonly Dictionary<CompactPubKey, PeerModel> _peers = new();

// Created by StartAsync as a source linked to the caller's token; null until then.
private CancellationTokenSource? _cts;
| | | 41 | | |
/// <summary>
/// Creates a peer manager and stores the supplied collaborators for later use.
/// </summary>
/// <param name="channelManager">Channel manager that receives channel messages and raises response messages.</param>
/// <param name="logger">Logger used for diagnostics.</param>
/// <param name="peerServiceFactory">Factory used to create peer services for inbound and outbound connections.</param>
/// <param name="tcpService">TCP service used to connect to peers and to listen for new connections.</param>
/// <param name="serviceProvider">Provider used to create scopes from which a unit of work is resolved.</param>
public PeerManager(IChannelManager channelManager, ILogger<PeerManager> logger,
    IPeerServiceFactory peerServiceFactory, ITcpService tcpService, IServiceProvider serviceProvider)
{
    (_channelManager, _logger, _peerServiceFactory, _tcpService, _serviceProvider) =
        (channelManager, logger, peerServiceFactory, tcpService, serviceProvider);
}
| | | 51 | | |
/// <summary>
/// Starts the peer manager: subscribes to new-peer and channel-response events, reconnects to the
/// peers returned by the unit of work for startup, registers their non-closed channels with the
/// channel manager, saves the unit of work, and finally starts the TCP listener.
/// </summary>
/// <param name="cancellationToken">
/// Token linked into the internal cancellation source whose token is handed to the TCP listener.
/// </param>
public async Task StartAsync(CancellationToken cancellationToken)
{
    _cts = CancellationTokenSource.CreateLinkedTokenSource(cancellationToken);

    _tcpService.OnNewPeerConnected += HandleNewPeerConnected;

    _channelManager.OnResponseMessageReady += HandleResponseMessageReady;

    // Load peers and initialize the channel manager
    using var scope = _serviceProvider.CreateScope();
    using var uow = scope.ServiceProvider.GetRequiredService<IUnitOfWork>();
    var peers = await uow.GetPeersForStartupAsync();
    foreach (var peer in peers)
    {
        try
        {
            _ = await ConnectToPeerAsync(peer.PeerAddressInfo, uow);
            if (!_peers.ContainsKey(peer.NodeId))
            {
                _logger.LogWarning("Unable to connect to peer {PeerId} on startup", peer.NodeId);
                // TODO: Handle this case, maybe retry or log more details
                continue;
            }

            // Register channels with peer
            if (peer.Channels is not { Count: > 0 })
                continue;

            // Only register channels that are not closed
            foreach (var channel in peer.Channels.Where(c => c.State != ChannelState.Closed))
            {
                // The registration still runs in the background (startup does not wait for it and
                // its result is not needed), but a failure is now logged instead of being lost
                // as an unobserved task exception.
                _ = _channelManager.RegisterExistingChannelAsync(channel)
                                   .ContinueWith(registration =>
                                        _logger.LogError(registration.Exception,
                                                         "Error registering existing channel for peer {PeerId} on startup",
                                                         peer.NodeId),
                                    TaskContinuationOptions.OnlyOnFaulted);
            }
        }
        catch (ConnectionException)
        {
            _logger.LogWarning("Unable to connect to peer {PeerId} on startup", peer.NodeId);
        }
        catch (Exception e)
        {
            _logger.LogError(e, "Error connecting to peer {PeerId} on startup", peer.NodeId);
        }
    }

    await uow.SaveChangesAsync();

    await _tcpService.StartListeningAsync(_cts.Token);
}
| | | 99 | | |
/// <summary>
/// Stops the peer manager: asks every tracked peer to disconnect, waits up to five seconds for
/// the peer table to drain, cancels the internal cancellation source and detaches the event
/// handlers attached by <c>StartAsync</c>.
/// </summary>
/// <exception cref="InvalidOperationException">Thrown when the manager was never started.</exception>
public async Task StopAsync()
{
    if (_cts is null)
        throw new InvalidOperationException($"{nameof(PeerManager)} is not running");

    // Iterate over a snapshot: the disconnect handler removes entries from _peers, and the
    // live key collection must not be enumerated while it is being modified.
    foreach (var peerKey in _peers.Keys.ToList())
    {
        try
        {
            DisconnectPeer(peerKey);
        }
        catch (Exception e)
        {
            _logger.LogWarning(e, "Error disconnecting peer {Peer}", peerKey);
        }
    }

    try
    {
        // Give it a 5-second timeout to disconnect all peers.
        // The timeout source owns a timer, so it is disposed as soon as the wait ends.
        using var timeoutTokenSource = new CancellationTokenSource(TimeSpan.FromSeconds(5));
        while (_peers.Count > 0 && !_cts.IsCancellationRequested)
            await Task.Delay(TimeSpan.FromSeconds(1), timeoutTokenSource.Token);
    }
    catch (TaskCanceledException)
    {
        _logger.LogWarning("Timeout while waiting for peers to disconnect");
    }

    await _cts.CancelAsync();

    // Detach the handlers attached in StartAsync so a later StartAsync does not register them twice.
    _tcpService.OnNewPeerConnected -= HandleNewPeerConnected;
    _channelManager.OnResponseMessageReady -= HandleResponseMessageReady;
}
| | | 129 | | |
/// <inheritdoc />
/// <remarks>
/// Resolves a unit of work from a fresh service scope, delegates to the private overload and
/// saves the unit of work once the peer has been connected.
/// </remarks>
/// <exception cref="ConnectionException">Thrown when the connection to the peer fails.</exception>
/// <exception cref="InvalidOperationException">Thrown when the connection to the peer already exists.</exception>
public async Task<PeerModel> ConnectToPeerAsync(PeerAddressInfo peerAddressInfo)
{
    using var serviceScope = _serviceProvider.CreateScope();
    using var unitOfWork = serviceScope.ServiceProvider.GetRequiredService<IUnitOfWork>();

    var connectedPeer = await ConnectToPeerAsync(peerAddressInfo, unitOfWork);
    await unitOfWork.SaveChangesAsync();

    return connectedPeer;
}
| | | 144 | | |
/// <inheritdoc />
/// <remarks>
/// Logs a warning and returns without disconnecting when the peer is unknown or has no peer
/// service attached.
/// </remarks>
public void DisconnectPeer(CompactPubKey pubKey, Exception? exception = null)
{
    if (!_peers.TryGetValue(pubKey, out var knownPeer))
    {
        _logger.LogWarning("Peer {Peer} not found", pubKey);
        return;
    }

    if (knownPeer.TryGetPeerService(out var service))
    {
        DisconnectPeer(service, exception);
        return;
    }

    _logger.LogWarning("PeerService not found for {Peer}", pubKey);
}
| | | 163 | | |
/// <summary>
/// Returns a new list containing every peer currently tracked by this manager.
/// </summary>
/// <returns>A copy of the tracked peers; changing the list does not affect the manager.</returns>
public List<PeerModel> ListPeers() => new(_peers.Values);
| | | 168 | | |
/// <summary>
/// Looks up a tracked peer by its public key.
/// </summary>
/// <param name="peerId">Public key of the peer to look up.</param>
/// <returns>The tracked peer, or <c>null</c> when no peer with that key is tracked.</returns>
public PeerModel? GetPeer(CompactPubKey peerId) =>
    _peers.TryGetValue(peerId, out var trackedPeer) ? trackedPeer : null;
| | | 173 | | |
/// <summary>
/// Asks the given peer service to disconnect, forwarding the optional exception that caused it.
/// </summary>
/// <param name="peerService">Peer service to disconnect.</param>
/// <param name="exception">Optional exception passed through to the peer service.</param>
private static void DisconnectPeer(IPeerService peerService, Exception? exception = null) =>
    peerService.Disconnect(exception);
| | | 178 | | |
/// <summary>
/// Connects to a peer, creates its peer service, starts tracking it in the peer table and
/// queues it for persistence on the supplied unit of work (the caller saves the unit of work).
/// </summary>
/// <param name="peerAddressInfo">Address information of the peer to connect to.</param>
/// <param name="uow">Unit of work whose peer repository receives the peer.</param>
/// <returns>The model describing the newly connected peer.</returns>
/// <exception cref="InvalidOperationException">Thrown when the peer is already tracked.</exception>
private async Task<PeerModel> ConnectToPeerAsync(PeerAddressInfo peerAddressInfo, IUnitOfWork uow)
{
    // Convert and validate the address
    var peerAddress = new PeerAddress(peerAddressInfo.Address);

    // Check if we're already connected to the peer
    if (_peers.ContainsKey(peerAddress.PubKey))
    {
        throw new InvalidOperationException($"Already connected to peer {peerAddress.PubKey}");
    }

    // Connect to the peer
    var connectedPeer = await _tcpService.ConnectToPeerAsync(peerAddress);

    var peerService = await _peerServiceFactory.CreateConnectedPeerAsync(connectedPeer.CompactPubKey,
                                                                         connectedPeer.TcpClient);
    peerService.OnDisconnect += HandlePeerDisconnection;
    peerService.OnChannelMessageReceived += HandlePeerChannelMessage;

    var preferredHost = connectedPeer.Host;
    var preferredPort = connectedPeer.Port;

    // Check if the node has set its preferred address
    if (peerService.PreferredHost is not null)
        preferredHost = peerService.PreferredHost;

    if (peerService.PreferredPort is not null)
        preferredPort = peerService.PreferredPort.Value;

    // The IP version comes from the socket's address family. Socket.ProtocolType is the transport
    // protocol (Tcp for a TcpClient), so comparing it with ProtocolType.IPv6 never matched and
    // every peer was recorded as "IPv4".
    // NOTE(review): a dual-mode socket reports InterNetworkV6 even for IPv4-mapped peers - confirm
    // whether that distinction matters here.
    var addressType = connectedPeer.TcpClient.Client.AddressFamily == AddressFamily.InterNetworkV6
                          ? "IPv6"
                          : "IPv4";

    var peer = new PeerModel(connectedPeer.CompactPubKey, preferredHost, preferredPort, addressType)
    {
        LastSeenAt = DateTime.UtcNow
    };
    peer.SetPeerService(peerService);

    _peers.Add(connectedPeer.CompactPubKey, peer);

    await uow.PeerDbRepository.AddOrUpdateAsync(peer);

    return peer;
}
| | | 221 | | |
/// <summary>
/// Handles an inbound connection reported by the TCP service: creates the peer service, builds
/// the peer model, persists it (unless the preferred host is 127.0.0.1) and starts tracking it.
/// Any failure is logged and swallowed so it does not propagate to the event source.
/// </summary>
/// <param name="_">Event sender (unused).</param>
/// <param name="args">Details of the new connection, including its TCP client, host and port.</param>
private void HandleNewPeerConnected(object? _, NewPeerConnectedEventArgs args)
{
    try
    {
        // Create the peer. This handler is synchronous, so the asynchronous factory call is
        // waited on here.
        var peerService = _peerServiceFactory.CreateConnectingPeerAsync(args.TcpClient).GetAwaiter().GetResult();
        peerService.OnDisconnect += HandlePeerDisconnection;
        peerService.OnChannelMessageReceived += HandlePeerChannelMessage;

        _logger.LogTrace("PeerService created for peer {PeerPubKey}", peerService.PeerPubKey);

        var preferredHost = args.Host;
        var preferredPort = NodeConstants.DefaultPort;

        // Check if the node has set its preferred address
        if (peerService.PreferredHost is not null)
            preferredHost = peerService.PreferredHost;

        if (peerService.PreferredPort is not null)
            preferredPort = peerService.PreferredPort.Value;

        // The IP version comes from the socket's address family. Socket.ProtocolType is the
        // transport protocol (Tcp for a TcpClient), so comparing it with ProtocolType.IPv6 never
        // matched and every peer was recorded as "IPv4".
        // NOTE(review): a dual-mode listener reports InterNetworkV6 even for IPv4-mapped peers -
        // confirm whether that distinction matters here.
        var addressType = args.TcpClient.Client.AddressFamily == AddressFamily.InterNetworkV6
                              ? "IPv6"
                              : "IPv4";

        var peer = new PeerModel(peerService.PeerPubKey, preferredHost, preferredPort, addressType)
        {
            LastSeenAt = DateTime.UtcNow
        };
        peer.SetPeerService(peerService);

        if (preferredHost != "127.0.0.1")
        {
            // Get a context to save the peer to the database
            using var scope = _serviceProvider.CreateScope();
            using var uow = scope.ServiceProvider.GetRequiredService<IUnitOfWork>();

            // Wait for the add/update to finish before saving. Previously the task was dropped,
            // so SaveChanges could run before the peer was added and a failure went unnoticed.
            uow.PeerDbRepository.AddOrUpdateAsync(peer).GetAwaiter().GetResult();
            uow.SaveChanges();
        }

        _peers.Add(peerService.PeerPubKey, peer);
    }
    catch (Exception e)
    {
        _logger.LogError(e, "Error handling new peer connection from {Host}:{Port}", args.Host, args.Port);
    }
}
| | | 267 | | |
/// <summary>
/// Handles a peer's disconnect event: stops tracking the peer, then detaches this manager's
/// handlers from the sending peer service and disposes it.
/// </summary>
/// <param name="sender">Event source; expected to be the peer service that disconnected.</param>
/// <param name="args">Event data carrying the public key of the disconnected peer.</param>
/// <exception cref="ArgumentNullException">Thrown when <paramref name="args"/> is null.</exception>
private void HandlePeerDisconnection(object? sender, PeerDisconnectedEventArgs args)
{
    ArgumentNullException.ThrowIfNull(args);

    _peers.Remove(args.PeerPubKey);
    _logger.LogInformation("Peer {Peer} disconnected", args.PeerPubKey);

    // Without the sending service there is nothing to detach from or dispose.
    if (sender is not IPeerService disconnectedService)
    {
        _logger.LogWarning("Peer {Peer} disconnected, but we were unable to detach event handlers",
                           args.PeerPubKey);
        return;
    }

    disconnectedService.OnDisconnect -= HandlePeerDisconnection;
    disconnectedService.OnChannelMessageReceived -= HandlePeerChannelMessage;
    disconnectedService.Dispose();
}
| | | 287 | | |
/// <summary>
/// Forwards a channel message received from a peer to the channel manager and, once handling
/// completes, passes the outcome to <c>HandleChannelMessageResponseAsync</c>.
/// </summary>
/// <param name="_">Event sender (unused).</param>
/// <param name="args">Event data carrying the message and the public key of the sending peer.</param>
/// <exception cref="ArgumentNullException">Thrown when <paramref name="args"/> is null.</exception>
/// <exception cref="ConnectionException">
/// Thrown when the peer is not tracked or has no peer service attached.
/// </exception>
private void HandlePeerChannelMessage(object? _, ChannelMessageEventArgs args)
{
    ArgumentNullException.ThrowIfNull(args);

    if (!_peers.TryGetValue(args.PeerPubKey, out var peer))
        throw new ConnectionException($"Peer {args.PeerPubKey} not found while handling channel message");

    if (!peer.TryGetPeerService(out var peerService))
        throw new ConnectionException(
            $"PeerService not found for peer {args.PeerPubKey} while handling channel message");

    // The first continuation returns a Task, so ContinueWith yields a Task<Task>. Unwrap it and
    // observe faults: otherwise an exception thrown while processing the response (for example
    // the peer disappearing in the meantime, or a failed send) is never logged.
    _channelManager.HandleChannelMessageAsync(args.Message, peerService.Features, peerService.PeerPubKey)
                   .ContinueWith(task => HandleChannelMessageResponseAsync(task, peerService.PeerPubKey,
                                                                           args.Message.Type))
                   .Unwrap()
                   .ContinueWith(responseTask =>
                        _logger.LogError(responseTask.Exception,
                                         "Error processing channel message response for peer {Peer}",
                                         args.PeerPubKey),
                    TaskContinuationOptions.OnlyOnFaulted);
}
| | | 303 | | |
/// <summary>
/// Processes the outcome of handling a channel message. A channel error disconnects the peer, a
/// channel warning is sent back to the peer, any other fault disconnects the peer, and a
/// successful non-null reply is sent to the peer.
/// </summary>
/// <param name="task">The channel-manager task whose outcome is processed.</param>
/// <param name="peerPubKey">Public key of the peer that sent the original message.</param>
/// <param name="messageType">Type of the original message; used for logging only.</param>
/// <exception cref="ConnectionException">
/// Thrown when the peer is no longer tracked or has no peer service attached.
/// </exception>
private async Task HandleChannelMessageResponseAsync(Task<IChannelMessage?> task, CompactPubKey peerPubKey,
    MessageTypes messageType)
{
    if (!_peers.TryGetValue(peerPubKey, out var peer))
        throw new ConnectionException($"Peer {peerPubKey} not found while handling channel response message");

    if (!peer.TryGetPeerService(out var peerService))
        throw new ConnectionException(
            $"PeerService not found for peer {peerPubKey} while handling channel response message");

    // A canceled task is neither faulted nor successful; reading its result would throw.
    if (task.IsCanceled)
    {
        _logger.LogWarning(
            "Handling of channel message ({messageType}) from peer {peer} was canceled",
            Enum.GetName(messageType), peerService.PeerPubKey);
        return;
    }

    if (task.IsFaulted)
    {
        if (task.Exception is { InnerException: ChannelErrorException cee })
        {
            _logger.LogError(
                "Error handling channel message ({messageType}) from peer {peer}: {message}",
                Enum.GetName(messageType), peerService.PeerPubKey,
                !string.IsNullOrEmpty(cee.PeerMessage)
                    ? cee.PeerMessage
                    : cee.Message);

            DisconnectPeer(peerService, cee);
            return;
        }

        if (task.Exception is { InnerException: ChannelWarningException cwe })
        {
            _logger.LogWarning(
                "Error handling channel message ({messageType}) from peer {peer}: {message}",
                Enum.GetName(messageType), peerService.PeerPubKey,
                !string.IsNullOrEmpty(cwe.PeerMessage)
                    ? cwe.PeerMessage
                    : cwe.Message);

            // The warning is sent in the background; the continuation only runs when the send faults.
            _ = peerService.SendWarningAsync(cwe)
                           .ContinueWith(warningTask =>
                                _logger.LogError(warningTask.Exception,
                                                 "Failed to send warning message to peer {Peer}",
                                                 peerService.PeerPubKey),
                            TaskContinuationOptions.OnlyOnFaulted);

            return;
        }

        _logger.LogError(
            task.Exception, "Error handling channel message ({messageType}) from peer {peer}",
            Enum.GetName(messageType), peerService.PeerPubKey);

        DisconnectPeer(peerService);
        return;
    }

    var replyMessage = await task;
    if (replyMessage is not null)
        await peerService.SendMessageAsync(replyMessage);
}
| | | 364 | | |
/// <summary>
/// Sends a response message raised by the channel manager to the peer it is addressed to.
/// The send is not awaited; a failed send is logged by a continuation.
/// </summary>
/// <param name="sender">Event sender (unused).</param>
/// <param name="args">Event data carrying the response message and the target peer's public key.</param>
/// <exception cref="ArgumentNullException">Thrown when <paramref name="args"/> is null.</exception>
/// <exception cref="ConnectionException">
/// Thrown when the target peer is not tracked or has no peer service attached.
/// </exception>
private void HandleResponseMessageReady(object? sender, ChannelResponseMessageEventArgs args)
{
    ArgumentNullException.ThrowIfNull(args);

    // Resolve the recipient's peer service from its public key
    if (!_peers.TryGetValue(args.PeerPubKey, out var recipient))
        throw new ConnectionException($"Peer {args.PeerPubKey} not found while handling response message");

    if (!recipient.TryGetPeerService(out var recipientService))
        throw new ConnectionException(
            $"PeerService not found for peer {args.PeerPubKey} while handling response message");

    // Start the send, then attach a continuation that only runs if it faults
    var pendingSend = recipientService.SendMessageAsync(args.ResponseMessage);
    pendingSend.ContinueWith(failedSend =>
    {
        _logger.LogError(failedSend.Exception, "Failed to send response message to peer {Peer}",
                         args.PeerPubKey);
    }, TaskContinuationOptions.OnlyOnFaulted);
}
| | | 385 | | } |