# sentinel.py
import json
import os
import random
import threading
import time
from typing import Callable, Dict, List, Optional

import redis

from vs_types import GroupConfig, VSPlgConfig, Task, QueryWaitMode
from vs_plg_factory import VSPlgFactory
from toolkit.thread_pool import ThreadPool
from toolkit.vs_cloud_api import VSCloudApi
from toolkit.backoff import ExponentialBackoff


  13. class SentinelGCO:
  14. def __init__(self, cfg: GroupConfig, redis_conf: Dict, logger: Callable[[str], None] = None):
  15. self.m_cfg = cfg
  16. self.m_factory = VSPlgFactory()
  17. self.m_logger = logger
  18. self.m_tasks: List[Task] = []
  19. self.m_lock = threading.RLock()
  20. self.m_stop_event = threading.Event()
  21. self.redis_client = redis.Redis(**redis_conf)
  22. self.m_pending_builtin = 0
  23. # 1. 全局建连退避:起步 1 分钟,封顶 1 小时 (保护登录接口)
  24. self.group_backoff = ExponentialBackoff(base_delay=60.0, max_delay=3600.0, factor=2.0)
  25. self.m_last_spawn_time = 0.0
  26. self.m_last_group_query_time = 0.0
  27. def _log(self, message):
  28. if self.m_logger:
  29. self.m_logger(f'[SENTINEL] [{self.m_cfg.identifier}] {message}')
  30. def _get_average_interval(self) -> float:
  31. """计算当前组平均的查询间隔(秒)"""
  32. mode = self.m_cfg.query_wait.mode
  33. if mode == QueryWaitMode.Loop:
  34. return 1.0
  35. elif mode == QueryWaitMode.Fixed:
  36. return float(self.m_cfg.query_wait.fixed_wait)
  37. elif mode == QueryWaitMode.Random:
  38. return (self.m_cfg.query_wait.random_min + self.m_cfg.query_wait.random_max) / 2.0
  39. return 30.0
  40. def start(self):
  41. if not self.m_cfg.enable:
  42. return
  43. self._log("Starting Sentinel...")
  44. plugin_name = self.m_cfg.plugin_config.plugin_name
  45. class_name = "".join(part.title() for part in plugin_name.split('_'))
  46. plugin_path = os.path.join(self.m_cfg.plugin_config.lib_path, self.m_cfg.plugin_config.plugin_bin)
  47. self.m_factory.register_plugin(plugin_name, plugin_path, class_name)
  48. threading.Thread(target=self._monitor_loop, daemon=True, name="Sentinel-Monitor").start()
  49. threading.Thread(target=self._creator_loop, daemon=True, name="Sentinel-Creator").start()
  50. def stop(self):
  51. self._log("Stopping Sentinel...")
  52. self.m_stop_event.set()
  53. with self.m_lock:
  54. tasks_to_cleanup = list(self.m_tasks)
  55. self.m_tasks.clear()
  56. for task in tasks_to_cleanup:
  57. self._cleanup_task(task, "sentinel stopped")
  58. def _cleanup_task(self, task: Task, reason: str):
  59. try:
  60. if task and task.instance and hasattr(task.instance, "cleanup"):
  61. self._log(f"Cleaning up sentinel instance. reason={reason}")
  62. task.instance.cleanup()
  63. except Exception as e:
  64. self._log(f"Cleanup failed. reason={reason}, error={e}")
  65. def _remove_task(self, task: Task, reason: str):
  66. removed = False
  67. with self.m_lock:
  68. if task in self.m_tasks:
  69. self.m_tasks.remove(task)
  70. removed = True
  71. if removed:
  72. self._cleanup_task(task, reason)
  73. def _get_redis_key(self, routing_key: str) -> str:
  74. return f"vs:signal:{routing_key}"
  75. def _monitor_loop(self):
  76. self._log("Monitor loop started.")
  77. self.m_last_group_query_time = 0.0
  78. while not self.m_stop_event.is_set():
  79. try:
  80. time.sleep(0.5)
  81. now = time.time()
  82. with self.m_lock:
  83. tasks_to_check = list(self.m_tasks)
  84. active_tasks = []
  85. dead_tasks = []
  86. for t in tasks_to_check:
  87. if not t.is_querying:
  88. active_tasks.append(t)
  89. continue
  90. try:
  91. if t.instance.health_check():
  92. active_tasks.append(t)
  93. else:
  94. dead_tasks.append(t)
  95. except Exception as e:
  96. dead_tasks.append(t)
  97. self._log(f"Health check failed: {e}")
  98. if dead_tasks:
  99. with self.m_lock:
  100. current_tasks = list(self.m_tasks)
  101. self.m_tasks = [t for t in self.m_tasks if t in active_tasks]
  102. for t in dead_tasks:
  103. if t in current_tasks:
  104. self._cleanup_task(t, "health check failed")
  105. else:
  106. with self.m_lock:
  107. self.m_tasks = [t for t in self.m_tasks if t in active_tasks]
  108. if not active_tasks:
  109. continue
  110. avg_interval = self._get_average_interval()
  111. global_gap = max(1.0, avg_interval / len(active_tasks))
  112. active_tasks.sort(key=lambda x: x.next_run)
  113. for task in active_tasks:
  114. if now < task.next_run:
  115. continue
  116. if task.is_querying:
  117. continue
  118. if now - self.m_last_group_query_time < global_gap:
  119. break
  120. apt_types = self.m_cfg.appointment_types
  121. if not apt_types:
  122. continue
  123. weights = [float(item.weight) for item in apt_types]
  124. apt_type = random.choices(apt_types, weights=weights, k=1)[0]
  125. interval = 30
  126. mode = task.qw_cfg.mode
  127. if mode == QueryWaitMode.Loop:
  128. interval = 1
  129. elif mode == QueryWaitMode.Fixed:
  130. interval = task.qw_cfg.fixed_wait
  131. elif mode == QueryWaitMode.Random:
  132. interval = random.randint(task.qw_cfg.random_min, task.qw_cfg.random_max)
  133. task.is_querying = True
  134. self.m_last_group_query_time = now
  135. def _query_job(current_task=task, a_type=apt_type, wait_gap=interval):
  136. try:
  137. VSCloudApi.Instance().slot_refresh_start(a_type.routing_key, country=a_type.country, city=a_type.city, visa_type=a_type.visa_type)
  138. result = current_task.instance.query(a_type)
  139. result.apt_type = a_type
  140. if result.success:
  141. ttl = self.m_cfg.sentinel.signal_ttl
  142. self._log(f"🔥 SLOT FOUND! Writing signal to Redis (TTL: {ttl}s)")
  143. payload = {
  144. "group_id": self.m_cfg.identifier,
  145. "apt_type": a_type.model_dump(),
  146. "query_result": result.to_snapshot_payload(),
  147. "timestamp": time.time()
  148. }
  149. redis_key = self._get_redis_key(a_type.routing_key)
  150. self.redis_client.setex(redis_key, ttl, json.dumps(payload))
  151. payload["query_result"]["website"] = self.m_cfg.website
  152. VSCloudApi.Instance().slot_snapshot_report(payload["query_result"])
  153. VSCloudApi.Instance().slot_refresh_success(a_type.routing_key)
  154. except Exception as e:
  155. self._log(f"Query exception: {e}")
  156. VSCloudApi.Instance().slot_refresh_fail(a_type.routing_key, error=str(e))
  157. finally:
  158. current_task.next_run = time.time() + wait_gap
  159. current_task.is_querying = False
  160. ThreadPool.getInstance().enqueue(_query_job)
  161. break
  162. except Exception as e:
  163. self._log(f"Monitor loop error: {e}")
  164. time.sleep(2)
  165. def _creator_loop(self):
  166. self._log("Creator loop started.")
  167. group_cd_key = f"vs:group:cooldown:{self.m_cfg.identifier}"
  168. while not self.m_stop_event.is_set():
  169. time.sleep(2)
  170. with self.m_lock:
  171. if self.redis_client.exists(group_cd_key):
  172. continue
  173. current = len(self.m_tasks)
  174. pending = self.m_pending_builtin
  175. target = self.m_cfg.sentinel.target_instances
  176. if (current + pending) < target:
  177. now = time.time()
  178. avg_interval = self._get_average_interval()
  179. stagger_delay = avg_interval / max(1, target)
  180. stagger_delay = max(10.0, stagger_delay)
  181. if now - self.m_last_spawn_time >= stagger_delay:
  182. with self.m_lock:
  183. self.m_last_spawn_time = now
  184. self._log(f"Staggered spawn triggered. Next spawn in {stagger_delay:.1f}s")
  185. self._spawn_sentinel_worker()
  186. def _spawn_sentinel_worker(self):
  187. with self.m_lock:
  188. self.m_pending_builtin += 1
  189. def _job():
  190. instance = None
  191. success = False
  192. try:
  193. plg_cfg = VSPlgConfig()
  194. plg_cfg.debug = self.m_cfg.debug
  195. plg_cfg.free_config = self.m_cfg.free_config
  196. plg_cfg.session_max_life = self.m_cfg.session_max_life
  197. if not self.m_cfg.need_account:
  198. plg_cfg.account.id = 0
  199. plg_cfg.account.username = "Guest"
  200. else:
  201. acc = VSCloudApi.Instance().get_next_account(self.m_cfg.sentinel.account_pool_id, self.m_cfg.sentinel.account_cd)
  202. plg_cfg.account.id = acc['id']
  203. plg_cfg.account.username = acc['username']
  204. plg_cfg.account.password = acc['password']
  205. if self.m_cfg.need_proxy:
  206. proxy = VSCloudApi.Instance().get_next_proxy(self.m_cfg.proxy_pool, self.m_cfg.proxy_cd)
  207. plg_cfg.proxy.id = proxy['id']
  208. plg_cfg.proxy.ip = proxy['ip']
  209. plg_cfg.proxy.port = proxy['port']
  210. plg_cfg.proxy.proto = proxy['proto']
  211. plg_cfg.proxy.username = proxy['username']
  212. plg_cfg.proxy.password = proxy['password']
  213. instance = self.m_factory.create(self.m_cfg.identifier, self.m_cfg.plugin_config.plugin_name)
  214. instance.set_log(self.m_logger)
  215. instance.set_config(plg_cfg)
  216. instance.create_session()
  217. with self.m_lock:
  218. self.m_tasks.append(
  219. Task(instance=instance,qw_cfg=self.m_cfg.query_wait,next_run=time.time(), book_allowed=False))
  220. group_fail_key = f"vs:group:failures:{self.m_cfg.identifier}"
  221. self.redis_client.delete(group_fail_key)
  222. success = True
  223. self._log(f"+++ Sentinel spawned: {plg_cfg.account.username}")
  224. except Exception as e:
  225. err_str = str(e)
  226. resource_not_found_indicators = [
  227. "40401" in err_str,
  228. "Account not found" in err_str,
  229. "Proxy not found" in err_str,
  230. ]
  231. if any(resource_not_found_indicators):
  232. return
  233. self._log(f"Spawn failed: {e}")
  234. rate_limited_indicators = [
  235. "42901" in err_str,
  236. "Rate limited" in err_str
  237. ]
  238. if any(rate_limited_indicators):
  239. group_fail_key = f"vs:group:failures:{self.m_cfg.identifier}"
  240. group_cd_key = f"vs:group:cooldown:{self.m_cfg.identifier}"
  241. g_fails = self.redis_client.incr(group_fail_key)
  242. g_cd = self.group_backoff.calculate(g_fails)
  243. self.redis_client.set(group_cd_key, "1", ex=int(g_cd))
  244. self._log(f"📉 [Rate Limited] Sentinel Spawn failed {g_fails} times. Global Backoff: {g_cd:.1f}s.")
  245. finally:
  246. if not success and instance is not None:
  247. try:
  248. if hasattr(instance, "cleanup"):
  249. instance.cleanup()
  250. except Exception as e:
  251. self._log(f"Cleanup failed after spawn failure: {e}")
  252. with self.m_lock:
  253. self.m_pending_builtin = max(0, self.m_pending_builtin - 1)
  254. ThreadPool.getInstance().enqueue(_job)