relay_client.py 6.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159
  1. from __future__ import annotations
  2. import asyncio
  3. import contextlib
  4. import socket
  5. from dataclasses import dataclass
  6. import time
  7. from typing import Awaitable, Callable, Dict
  8. from .config import Config, RelayNode
  9. from .protocol import AUTH, PING, PONG, STATUS_OK, Frame, encode_json, read_frame, write_frame
  10. from .scheduler import Scheduler
  11. FrameHandler = Callable[["RelayConnection", Frame], Awaitable[None]]
  12. @dataclass
  13. class RelayConnection:
  14. node: RelayNode
  15. manager: "RelayManager"
  16. reader: asyncio.StreamReader
  17. writer: asyncio.StreamWriter
  18. closed: bool = False
  19. handlers: Dict[tuple[int, int], FrameHandler] = None
  20. pump_task: asyncio.Task | None = None
  21. keepalive_task: asyncio.Task | None = None
  22. last_pong_at: float = 0.0
  23. def __post_init__(self) -> None:
  24. if self.handlers is None:
  25. self.handlers = {}
  26. async def start(self) -> None:
  27. print(f"[edge] connecting relay name={self.node.name} addr={self.node.host}:{self.node.port}")
  28. await write_frame(self.writer, Frame(AUTH, 0, 0, 0, 0, encode_json({"token": self.node.token})))
  29. frame = await read_frame(self.reader)
  30. if frame.kind != AUTH or frame.packet_id != STATUS_OK:
  31. raise ConnectionError(f"relay auth failed: {self.node.name}")
  32. print(f"[edge] relay connected name={self.node.name} addr={self.node.host}:{self.node.port}")
  33. self.last_pong_at = time.monotonic()
  34. self.keepalive_task = asyncio.create_task(self._keepalive())
  35. self.pump_task = asyncio.create_task(self._pump())
  36. async def _keepalive(self) -> None:
  37. try:
  38. while not self.closed:
  39. await asyncio.sleep(self.manager.config.relay_ping_interval)
  40. if self.closed:
  41. break
  42. if time.monotonic() - self.last_pong_at > self.manager.config.relay_ping_timeout:
  43. print(f"[edge] relay health timeout name={self.node.name} addr={self.node.host}:{self.node.port} timeout={self.manager.config.relay_ping_timeout}")
  44. await self.close()
  45. break
  46. await self.send(Frame(PING, 0, 0, 0, 0, b""))
  47. except asyncio.CancelledError:
  48. pass
  49. except Exception:
  50. await self.close()
  51. async def _pump(self) -> None:
  52. try:
  53. while True:
  54. frame = await read_frame(self.reader)
  55. if frame.kind == PONG:
  56. self.last_pong_at = time.monotonic()
  57. continue
  58. handler = self.handlers.get((frame.session_id, frame.stream_id))
  59. if handler:
  60. await handler(self, frame)
  61. except asyncio.IncompleteReadError:
  62. print(f"[edge] relay disconnected name={self.node.name} eof=true")
  63. except Exception as exc:
  64. print(f"[edge] relay pump error name={self.node.name} error={exc!r}")
  65. finally:
  66. await self.close()
  67. async def send(self, frame: Frame) -> None:
  68. if self.closed:
  69. raise ConnectionError(f"relay closed: {self.node.name}")
  70. await write_frame(self.writer, frame)
  71. def bind(self, session_id: int, stream_id: int, handler: FrameHandler) -> None:
  72. self.handlers[(session_id, stream_id)] = handler
  73. def unbind(self, session_id: int, stream_id: int) -> None:
  74. self.handlers.pop((session_id, stream_id), None)
  75. async def close(self) -> None:
  76. if self.closed:
  77. return
  78. self.closed = True
  79. self.manager.on_closed(self)
  80. if self.keepalive_task and self.keepalive_task is not asyncio.current_task():
  81. self.keepalive_task.cancel()
  82. with contextlib.suppress(Exception):
  83. await self.keepalive_task
  84. self.writer.close()
  85. with contextlib.suppress(Exception):
  86. await self.writer.wait_closed()
  87. class RelayManager:
  88. def __init__(self, config: Config) -> None:
  89. self.config = config
  90. self.scheduler = Scheduler(config)
  91. self.connections: Dict[str, RelayConnection] = {}
  92. self.tasks: list[asyncio.Task] = []
  93. async def start(self) -> None:
  94. await self.scheduler.start()
  95. for node in self.config.relays:
  96. self.tasks.append(asyncio.create_task(self._maintain(node)))
  97. async def _maintain(self, node: RelayNode) -> None:
  98. while True:
  99. if node.name in self.connections and not self.connections[node.name].closed:
  100. await asyncio.sleep(2)
  101. continue
  102. connected = False
  103. for attempt in range(1, self.config.relay_reconnect_attempts + 1):
  104. try:
  105. print(f"[edge] relay reconnect attempt name={node.name} addr={node.host}:{node.port} attempt={attempt}/{self.config.relay_reconnect_attempts}")
  106. reader, writer = await asyncio.wait_for(asyncio.open_connection(node.host, node.port), timeout=self.config.relay_open_timeout)
  107. connection = RelayConnection(node=node, manager=self, reader=reader, writer=writer)
  108. sock = writer.get_extra_info("socket")
  109. if sock is not None and self.config.relay_tcp_nodelay:
  110. with contextlib.suppress(OSError):
  111. sock.setsockopt(socket.IPPROTO_TCP, socket.TCP_NODELAY, 1)
  112. await connection.start()
  113. self.connections[node.name] = connection
  114. connected = True
  115. await connection.pump_task
  116. break
  117. except Exception as exc:
  118. print(f"[edge] relay connect failed name={node.name} addr={node.host}:{node.port} attempt={attempt}/{self.config.relay_reconnect_attempts} error={exc!r}")
  119. if attempt < self.config.relay_reconnect_attempts:
  120. await asyncio.sleep(self.config.relay_reconnect_delay)
  121. if not connected:
  122. print(f"[edge] relay reconnect exhausted name={node.name} addr={node.host}:{node.port} attempts={self.config.relay_reconnect_attempts}")
  123. await asyncio.sleep(self.config.relay_reconnect_delay)
  124. def on_closed(self, connection: RelayConnection) -> None:
  125. current = self.connections.get(connection.node.name)
  126. if current is connection:
  127. self.connections.pop(connection.node.name, None)
  128. def available(self) -> list[RelayConnection]:
  129. chosen = {node.name for node in self.scheduler.choose()}
  130. preferred = [self.connections[name] for name in chosen if name in self.connections and not self.connections[name].closed]
  131. if preferred:
  132. return preferred
  133. return [conn for conn in self.connections.values() if not conn.closed]
  134. def snapshot(self) -> list[dict[str, object]]:
  135. data = self.scheduler.snapshot()
  136. online = {name for name, conn in self.connections.items() if not conn.closed}
  137. for item in data:
  138. item["online"] = item["name"] in online
  139. return data