sentinel.py 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300
import json
import os
import random
import threading
import time
from typing import Callable, Dict, List, Optional

import redis

from toolkit.backoff import ExponentialBackoff
from toolkit.thread_pool import ThreadPool
from toolkit.vs_cloud_api import VSCloudApi
from vs_plg_factory import VSPlgFactory
from vs_types import GroupConfig, VSPlgConfig, Task, QueryWaitMode
  13. class SentinelGCO:
  14. def __init__(self, cfg: GroupConfig, redis_conf: Dict, logger: Callable[[str], None] = None):
  15. self.m_cfg = cfg
  16. self.m_factory = VSPlgFactory()
  17. self.m_logger = logger
  18. self.m_tasks: List[Task] = []
  19. self.m_lock = threading.RLock()
  20. self.m_stop_event = threading.Event()
  21. self.redis_client = redis.Redis(**redis_conf)
  22. self.m_pending_builtin = 0
  23. # 1. 全局建连退避:起步 1 分钟,封顶 1 小时 (保护登录接口)
  24. self.group_backoff = ExponentialBackoff(base_delay=60.0, max_delay=3600.0, factor=2.0)
  25. self.m_last_spawn_time = 0.0
  26. self.m_spawn_interval = 120
  27. self.m_last_group_query_time = 0.0
  28. def _log(self, message):
  29. if self.m_logger:
  30. self.m_logger(f'[SENTINEL] [{self.m_cfg.identifier}] {message}')
  31. def _get_average_interval(self) -> float:
  32. """计算当前组平均的查询间隔(秒)"""
  33. mode = self.m_cfg.query_wait.mode
  34. if mode == QueryWaitMode.Loop:
  35. return 1.0
  36. elif mode == QueryWaitMode.Fixed:
  37. return float(self.m_cfg.query_wait.fixed_wait)
  38. elif mode == QueryWaitMode.Random:
  39. return (self.m_cfg.query_wait.random_min + self.m_cfg.query_wait.random_max) / 2.0
  40. return 30.0
  41. def start(self):
  42. if not self.m_cfg.enable:
  43. return
  44. self._log("Starting Sentinel...")
  45. plugin_name = self.m_cfg.plugin_config.plugin_name
  46. class_name = "".join(part.title() for part in plugin_name.split('_'))
  47. plugin_path = os.path.join(self.m_cfg.plugin_config.lib_path, self.m_cfg.plugin_config.plugin_bin)
  48. self.m_factory.register_plugin(plugin_name, plugin_path, class_name)
  49. threading.Thread(target=self._monitor_loop, daemon=True, name="Sentinel-Monitor").start()
  50. threading.Thread(target=self._creator_loop, daemon=True, name="Sentinel-Creator").start()
  51. def stop(self):
  52. self._log("Stopping Sentinel...")
  53. self.m_stop_event.set()
  54. with self.m_lock:
  55. tasks_to_cleanup = list(self.m_tasks)
  56. self.m_tasks.clear()
  57. for task in tasks_to_cleanup:
  58. self._cleanup_task(task, "sentinel stopped")
  59. def _cleanup_task(self, task: Task, reason: str):
  60. try:
  61. if task and task.instance and hasattr(task.instance, "cleanup"):
  62. self._log(f"Cleaning up sentinel instance. reason={reason}")
  63. task.instance.cleanup()
  64. except Exception as e:
  65. self._log(f"Cleanup failed. reason={reason}, error={e}")
  66. def _remove_task(self, task: Task, reason: str):
  67. removed = False
  68. with self.m_lock:
  69. if task in self.m_tasks:
  70. self.m_tasks.remove(task)
  71. removed = True
  72. if removed:
  73. self._cleanup_task(task, reason)
  74. def _get_redis_key(self, routing_key: str) -> str:
  75. return f"vs:signal:{routing_key}"
  76. def _monitor_loop(self):
  77. self._log("Monitor loop started.")
  78. self.m_last_group_query_time = 0.0
  79. while not self.m_stop_event.is_set():
  80. try:
  81. time.sleep(0.5)
  82. now = time.time()
  83. with self.m_lock:
  84. tasks_to_check = list(self.m_tasks)
  85. active_tasks = []
  86. dead_tasks = []
  87. for t in tasks_to_check:
  88. if not t.is_querying:
  89. active_tasks.append(t)
  90. continue
  91. try:
  92. if t.instance.health_check():
  93. active_tasks.append(t)
  94. else:
  95. dead_tasks.append(t)
  96. except Exception as e:
  97. dead_tasks.append(t)
  98. self._log(f"Health check failed: {e}")
  99. if dead_tasks:
  100. with self.m_lock:
  101. current_tasks = list(self.m_tasks)
  102. self.m_tasks = [t for t in self.m_tasks if t in active_tasks]
  103. for t in dead_tasks:
  104. if t in current_tasks:
  105. self._cleanup_task(t, "health check failed")
  106. else:
  107. with self.m_lock:
  108. self.m_tasks = [t for t in self.m_tasks if t in active_tasks]
  109. if not active_tasks:
  110. continue
  111. avg_interval = self._get_average_interval()
  112. global_gap = max(1.0, avg_interval / len(active_tasks))
  113. active_tasks.sort(key=lambda x: x.next_run)
  114. for task in active_tasks:
  115. if now < task.next_run:
  116. continue
  117. if task.is_querying:
  118. continue
  119. if now - self.m_last_group_query_time < global_gap:
  120. break
  121. apt_types = self.m_cfg.appointment_types
  122. if not apt_types:
  123. continue
  124. weights = [float(item.weight) for item in apt_types]
  125. apt_type = random.choices(apt_types, weights=weights, k=1)[0]
  126. interval = 30
  127. mode = task.qw_cfg.mode
  128. if mode == QueryWaitMode.Loop:
  129. interval = 1
  130. elif mode == QueryWaitMode.Fixed:
  131. interval = task.qw_cfg.fixed_wait
  132. elif mode == QueryWaitMode.Random:
  133. interval = random.randint(task.qw_cfg.random_min, task.qw_cfg.random_max)
  134. task.is_querying = True
  135. self.m_last_group_query_time = now
  136. def _query_job(current_task=task, a_type=apt_type, wait_gap=interval):
  137. try:
  138. VSCloudApi.Instance().slot_refresh_start(a_type.routing_key, country=a_type.country, city=a_type.city, visa_type=a_type.visa_type)
  139. result = current_task.instance.query(a_type)
  140. result.apt_type = a_type
  141. if result.success:
  142. ttl = self.m_cfg.sentinel.signal_ttl
  143. self._log(f"🔥 SLOT FOUND! Writing signal to Redis (TTL: {ttl}s)")
  144. payload = {
  145. "group_id": self.m_cfg.identifier,
  146. "apt_type": a_type.model_dump(),
  147. "query_result": result.to_snapshot_payload(),
  148. "timestamp": time.time()
  149. }
  150. redis_key = self._get_redis_key(a_type.routing_key)
  151. self.redis_client.setex(redis_key, ttl, json.dumps(payload))
  152. payload["query_result"]["website"] = self.m_cfg.website
  153. VSCloudApi.Instance().slot_snapshot_report(payload["query_result"])
  154. VSCloudApi.Instance().slot_refresh_success(a_type.routing_key)
  155. except Exception as e:
  156. self._log(f"Query exception: {e}")
  157. VSCloudApi.Instance().slot_refresh_fail(a_type.routing_key, error=str(e))
  158. finally:
  159. current_task.next_run = time.time() + wait_gap
  160. current_task.is_querying = False
  161. ThreadPool.getInstance().enqueue(_query_job)
  162. break
  163. except Exception as e:
  164. self._log(f"Monitor loop error: {e}")
  165. time.sleep(2)
  166. def _creator_loop(self):
  167. self._log("Creator loop started.")
  168. group_cd_key = f"vs:group:cooldown:{self.m_cfg.identifier}"
  169. while not self.m_stop_event.is_set():
  170. time.sleep(2)
  171. with self.m_lock:
  172. if self.redis_client.exists(group_cd_key):
  173. continue
  174. current = len(self.m_tasks)
  175. pending = self.m_pending_builtin
  176. target = self.m_cfg.sentinel.target_instances
  177. if (current + pending) < target:
  178. now = time.time()
  179. if now - self.m_last_spawn_time >= self.m_spawn_interval:
  180. with self.m_lock:
  181. self.m_last_spawn_time = now
  182. self._log(f"Staggered spawn triggered. Next spawn in {self.m_spawn_interval:.1f}s")
  183. self._spawn_sentinel_worker()
  184. def _spawn_sentinel_worker(self):
  185. with self.m_lock:
  186. self.m_pending_builtin += 1
  187. def _job():
  188. instance = None
  189. success = False
  190. try:
  191. plg_cfg = VSPlgConfig()
  192. plg_cfg.debug = self.m_cfg.debug
  193. plg_cfg.free_config = self.m_cfg.free_config
  194. plg_cfg.session_max_life = self.m_cfg.session_max_life
  195. if not self.m_cfg.need_account:
  196. plg_cfg.account.id = 0
  197. plg_cfg.account.username = "Guest"
  198. else:
  199. acc = VSCloudApi.Instance().get_next_account(self.m_cfg.sentinel.account_pool_id, self.m_cfg.sentinel.account_cd)
  200. plg_cfg.account.id = acc['id']
  201. plg_cfg.account.username = acc['username']
  202. plg_cfg.account.password = acc['password']
  203. if self.m_cfg.need_proxy:
  204. proxy = VSCloudApi.Instance().get_next_proxy(self.m_cfg.proxy_pool, self.m_cfg.proxy_cd)
  205. plg_cfg.proxy.id = proxy['id']
  206. plg_cfg.proxy.ip = proxy['ip']
  207. plg_cfg.proxy.port = proxy['port']
  208. plg_cfg.proxy.proto = proxy['proto']
  209. plg_cfg.proxy.username = proxy['username']
  210. plg_cfg.proxy.password = proxy['password']
  211. instance = self.m_factory.create(self.m_cfg.identifier, self.m_cfg.plugin_config.plugin_name)
  212. instance.set_log(self.m_logger)
  213. instance.set_config(plg_cfg)
  214. instance.create_session()
  215. with self.m_lock:
  216. self.m_tasks.append(
  217. Task(instance=instance,qw_cfg=self.m_cfg.query_wait,next_run=time.time(), book_allowed=False))
  218. group_fail_key = f"vs:group:failures:{self.m_cfg.identifier}"
  219. self.redis_client.delete(group_fail_key)
  220. success = True
  221. self._log(f"+++ Sentinel spawned: {plg_cfg.account.username}")
  222. except Exception as e:
  223. err_str = str(e)
  224. resource_not_found_indicators = [
  225. "40401" in err_str,
  226. "Account not found" in err_str,
  227. "Proxy not found" in err_str,
  228. ]
  229. if any(resource_not_found_indicators):
  230. return
  231. self._log(f"Spawn failed: {e}")
  232. rate_limited_indicators = [
  233. "42901" in err_str,
  234. "Rate limited" in err_str
  235. ]
  236. if any(rate_limited_indicators):
  237. group_fail_key = f"vs:group:failures:{self.m_cfg.identifier}"
  238. group_cd_key = f"vs:group:cooldown:{self.m_cfg.identifier}"
  239. g_fails = self.redis_client.incr(group_fail_key)
  240. g_cd = self.group_backoff.calculate(g_fails)
  241. self.redis_client.set(group_cd_key, "1", ex=int(g_cd))
  242. self._log(f"📉 [Rate Limited] Sentinel Spawn failed {g_fails} times. Global Backoff: {g_cd:.1f}s.")
  243. finally:
  244. if not success and instance is not None:
  245. try:
  246. if hasattr(instance, "cleanup"):
  247. instance.cleanup()
  248. except Exception as e:
  249. self._log(f"Cleanup failed after spawn failure: {e}")
  250. with self.m_lock:
  251. self.m_pending_builtin = max(0, self.m_pending_builtin - 1)
  252. ThreadPool.getInstance().enqueue(_job)