tls_plugin.py 23 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559
  1. import time
  2. import json
  3. import random
  4. import re
  5. import os
  6. from datetime import datetime
  7. from typing import List, Dict, Optional, Any, Callable
  8. from urllib.parse import urljoin, urlparse
  9. from requests_toolbelt import MultipartEncoder
  10. from curl_cffi import requests, const
  11. from bs4 import BeautifulSoup
  12. from vs_plg import IVSPlg
  13. from vs_types import VSPlgConfig, AppointmentType, VSQueryResult, VSBookResult, AvailabilityStatus, TimeSlot, DateAvailability, NotFoundError, PermissionDeniedError, RateLimiteddError, SessionExpiredOrInvalidError, BizLogicError
  14. from toolkit.vs_cloud_api import VSCloudApi
  15. class TlsPlugin(IVSPlg):
  16. """
  17. TLSContact 签证预约插件
  18. 适配法国签证 (FR) 流程
  19. """
  20. def __init__(self, group_id: str):
  21. self.group_id = group_id
  22. self.config: Optional[VSPlgConfig] = None
  23. self.free_config: Dict[str, Any] = {}
  24. self.is_healthy = True
  25. self.logger = None
  26. self.session: Optional[requests.Session] = None
  27. self.travel_group: Optional[Dict] = None
  28. self.user_agent: str = "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/124.0.0.0 Safari/537.36"
  29. self.session_create_time: float = 0
  30. def get_group_id(self) -> str:
  31. return self.group_id
  32. def set_log(self, logger: Callable[[str], None]) -> None:
  33. self.logger = logger
  34. def set_config(self, config: VSPlgConfig):
  35. self.config = config
  36. self.free_config = config.free_config or {}
  37. def health_check(self) -> bool:
  38. if not self.is_healthy:
  39. return False
  40. if self.session is None:
  41. return False
  42. if self.config.session_max_life > 0:
  43. current_time = time.time()
  44. elapsed_time = current_time - self.session_create_time
  45. if elapsed_time > self.config.session_max_life * 60:
  46. self._log(f"Session Life ({int(elapsed_time)}s) out of max life limit ({self.config.session_max_life * 60}s), mark as unhealth session")
  47. return False
  48. return True
  def create_session(self):
      """Create a logged-in session and select the travel group to work with.

      Steps: validate ``apt_config``, build a ``curl_cffi`` session, obtain
      Cloudflare cookies, load the login page to discover the authentication
      form, solve the login reCAPTCHA, submit the credentials, then pick the
      travel group whose location equals ``apt_config['city']``
      (case-insensitive).

      Raises:
          NotFoundError: ``apt_config`` (or one of its ``code`` / ``country``
              / ``city`` keys) or ``capsolver_key`` is missing, the login
              form or its ``action`` cannot be found, or no travel group
              matches the configured city.
          SessionExpiredOrInvalidError: the page returned after login looks
              like a login / expired-session page.

      Errors raised by the request and solver helpers propagate unchanged.
      """
      # Validate configuration first so that nothing (in particular no
      # solver task) is started with an unusable configuration.
      apt_config = self.free_config.get('apt_config', {})
      if not apt_config:
          raise NotFoundError(message="apt_config not found in free config")
      missing_keys = [k for k in ('code', 'country', 'city') if k not in apt_config]
      if missing_keys:
          raise NotFoundError(message=f"apt_config is missing keys: {', '.join(missing_keys)}")

      # A group selected by a previous login must not survive a failed
      # re-login.
      self.travel_group = None

      # 1. Initialise the HTTP session.
      curlopt = {
          const.CurlOpt.MAXAGE_CONN: 1800,
          const.CurlOpt.MAXLIFETIME_CONN: 1800,
          const.CurlOpt.VERBOSE: self.config.debug,
      }
      self.session = requests.Session(
          proxy=self._get_proxy_url(),
          impersonate="chrome124",
          curl_options=curlopt,
          use_thread_local_curl=False,
          http_version=const.CurlHttpVersion.V2TLS
      )

      # 2. Get past the Cloudflare challenge.
      self._solve_cloudflare5S_challenge()

      # 3. Load the login page to obtain the authentication form.
      login_page = "https://visas-fr.tlscontact.com/en-us/login"
      params = {
          "issuerId": apt_config["code"],
          "country": apt_config["country"],
          "vac": apt_config["code"],
          "redirect": f"/en-us/country/{apt_config['country']}/vac/{apt_config['code']}"
      }
      headers = {
          'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
          'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8',
          'Referer': f'https://visas-fr.tlscontact.com/en-us/country/{apt_config["country"]}/vac/{apt_config["code"]}',
          'User-Agent': self.user_agent,
      }
      resp = self._perform_request("GET", login_page, headers=headers, params=params)
      if self.config.debug:
          self._save_debug_html(resp.text, prefix='Tls_Login_Page')

      # The form's action is the URL the credentials are posted to.
      soup = BeautifulSoup(resp.text, 'html.parser')
      form = soup.find('form')
      if not form:
          raise NotFoundError(message="Login form not found")
      action = form.get('action')
      if not action:
          # Without this guard a missing attribute surfaced as
          # AttributeError on None.startswith.
          raise NotFoundError(message="Login form has no action attribute")
      authenticate_url = action if action.startswith('http') else urljoin(resp.url, action)

      # 4. Solve the reCAPTCHA v2 shown on the login form.
      api_token = self.free_config.get("capsolver_key", "")
      if not api_token:
          raise NotFoundError(message="Missing 'capsolver_key' in free_config, captcha might fail.")
      rc_params = {
          "type": "ReCaptchaV2TaskProxyLess",
          "page": authenticate_url,
          "siteKey": "6LcDpXcfAAAAAM7wOEsF_38DNsL20tTvPTKxpyn0",
          "apiToken": api_token,
          "proxy": self._get_proxy_url()
      }
      g_token = self._solve_recaptcha(rc_params)

      # 5. Submit the credentials.
      payload = {
          'username': self.config.account.username,
          'password': self.config.account.password,
          'g-recaptcha-response': g_token
      }
      headers['Content-Type'] = 'application/x-www-form-urlencoded'
      resp = self._perform_request("POST", authenticate_url, headers=headers, data=payload)
      if self.config.debug:
          self._save_debug_html(resp.text, prefix='Tls_Travel_Groups_Page')

      # 6. Parse the travel groups and keep the one for the configured city.
      self._check_page_is_session_expired_or_invalid("My travel group", resp.text)
      groups = self._parse_travel_groups(resp.text)
      target_city = apt_config['city'].lower()
      # A group without a location is treated as non-matching instead of
      # crashing on None.lower().
      self.travel_group = next(
          (g for g in groups if (g.get('location') or '').lower() == target_city),
          None,
      )
      if not self.travel_group:
          raise NotFoundError(message=f"No matched group found for city {target_city}")

      self.session_create_time = time.time()
      self._log(f"Session created successfully. Group: {self.travel_group['group_number']}")
  def query(self, apt_type: AppointmentType) -> VSQueryResult:
      """Fetch the appointment-booking page and report the matching slots.

      The month queried is ``free_config['interest_month']`` (default: the
      current month formatted ``%m-%Y``). A 403 response triggers a new
      Cloudflare bypass and a retry, up to ``free_config['max_retries']``
      attempts (default 2, never fewer than 1).

      Args:
          apt_type: not used by this implementation.

      Returns:
          A ``VSQueryResult``. When slots whose label is listed in
          ``free_config['target_labels']`` (default ``["", "pta"]``) exist,
          ``success`` is True, ``earliest_date`` is the smallest date and
          ``availability`` lists the dates in ascending order; otherwise
          ``success`` is False and the status is ``NoneAvailable``.

      Raises:
          PermissionDeniedError: every attempt was answered with 403.
          SessionExpiredOrInvalidError: the page looks like a login /
              expired-session page.
      """
      res = VSQueryResult()
      res.success = False

      apt_config = self.free_config.get('apt_config', {})
      group_num = self.travel_group['group_number']
      interest_month = self.free_config.get("interest_month", time.strftime("%m-%Y"))
      # At least one attempt must run; with zero attempts there would be no
      # response to parse.
      max_retries = max(1, int(self.free_config.get("max_retries", 2)))

      url = f'https://visas-fr.tlscontact.com/en-us/{group_num}/workflow/appointment-booking'
      params = {
          'location': apt_config["code"],
          'month': interest_month,
      }
      headers = {
          'accept': '*/*',
          'accept-language': 'zh-CN,zh;q=0.9,en;q=0.8',
          'referer': f'{url}?location={apt_config["code"]}',
          'user-agent': self.user_agent,
      }

      for attempt in range(1, max_retries + 1):
          try:
              resp = self._perform_request("GET", url, headers=headers, params=params)
          except PermissionDeniedError:
              self._log(f"Query Appointment-booking blocked (403), attempt {attempt}/{max_retries}")
              # No point bypassing Cloudflare again after the last attempt;
              # re-raise the original error so its details are preserved.
              if attempt >= max_retries:
                  raise
              self._solve_cloudflare5S_challenge()
              self._log("Cloudflare bypass success, retrying...")
          else:
              break

      if self.config.debug:
          self._save_debug_html(resp.text, prefix='Tls_Query_Slot_Page')

      self._check_page_is_session_expired_or_invalid('Book your appointment', resp.text)

      # Keep only the slots whose label the caller is interested in.
      all_slots = self._parse_appointment_slots(resp.text)
      target_labels = self.free_config.get("target_labels", ["", "pta"])
      available = [s for s in all_slots if s.get("label") in target_labels]

      # Group the slots by calendar day.
      date_map = {}
      for s in available:
          day = datetime.strptime(s["date"], "%Y-%m-%d")
          date_map.setdefault(day, []).append(
              TimeSlot(time=s["time"], label=str(s.get("label", "")))
          )

      if date_map:
          res.success = True
          res.availability_status = AvailabilityStatus.Available
          # Use the real minimum instead of trusting the page's ordering.
          res.earliest_date = min(date_map)
          res.availability = [
              DateAvailability(date=day, times=date_map[day]) for day in sorted(date_map)
          ]
      else:
          res.success = False
          res.availability_status = AvailabilityStatus.NoneAvailable
      return res
  def book(self, slot_info: VSQueryResult, user_inputs: Dict = None) -> VSBookResult:
      """Try to book the first acceptable slot found in ``slot_info``.

      Args:
          slot_info: result of ``query``; its ``availability`` entries supply
              the candidate dates and time slots.
          user_inputs: optional mapping with ``expected_start_date`` /
              ``expected_end_date`` (``YYYY-MM-DD``; both must be set for the
              range to apply) and ``support_pta`` (default True, also accept
              slots labelled ``"pta"``). ``None`` is treated as empty.

      Returns:
          A ``VSBookResult``; ``success`` is True only when the server
          answers the booking request with HTTP 303.

      Raises:
          NotFoundError: no date lies in the requested range, or no slot on
              those dates carries an accepted label.
      """
      res = VSBookResult()
      res.success = False
      user_inputs = user_inputs or {}

      # 1. Gather the inputs.
      apt_config = self.free_config.get('apt_config', {})
      group_num = self.travel_group['group_number']
      exp_start = user_inputs.get('expected_start_date', '')
      exp_end = user_inputs.get('expected_end_date', '')
      target_labels = ['']
      if user_inputs.get('support_pta', True):
          target_labels.append('pta')

      # Index the slots by "YYYY-MM-DD". _filter_dates, the page URL and the
      # form fields all work on date strings, while query() stores datetime
      # objects in DateAvailability.date.
      times_by_date = {}
      for da in slot_info.availability or []:
          day = da.date
          day_key = day[:10] if isinstance(day, str) else day.strftime("%Y-%m-%d")
          times_by_date.setdefault(day_key, []).extend(da.times)

      valid_dates = self._filter_dates(list(times_by_date), exp_start, exp_end)
      if not valid_dates:
          raise NotFoundError(message="No dates match user constraints")

      # Take the first (date, slot) pair with an accepted label, following
      # the order returned by _filter_dates.
      chosen = next(
          (
              (day_key, slot)
              for day_key in valid_dates
              for slot in times_by_date[day_key]
              if slot.label in target_labels
          ),
          None,
      )
      if chosen is None:
          raise NotFoundError(message="No time slot matches the accepted labels")
      selected_date, selected_slot = chosen
      selected_time = selected_slot.time
      selected_label = selected_slot.label

      # 2. Solve reCAPTCHA v3 with action "book".
      # NOTE(review): this URL uses a YYYY-MM month while query() sends
      # MM-YYYY as the month parameter - confirm which form the site expects.
      page_url = f'https://visas-fr.tlscontact.com/en-us/{group_num}/workflow/appointment-booking?location={apt_config["code"]}&month={selected_date[:7]}'
      api_token = self.free_config.get("capsolver_key", "")
      rc_params = {
          "type": "ReCaptchaV3Task",
          "page": page_url,
          "action": "book",
          "siteKey": "6LcTpXcfAAAAAM3VojNhyV-F1z92ADJIvcSZ39Y9",
          "apiToken": api_token,
          "proxy": self._get_proxy_url()
      }
      g_token = self._solve_recaptcha(rc_params)

      # 3. Build the multipart payload for the Next.js server action.
      ACTION_ID = "60d0616946df1fc4e7c094ca6a7a04f134d0be3d53"
      fields = {
          '1_formGroupId': str(group_num),
          '1_lang': 'en-us',
          '1_process': 'APPOINTMENT',
          '1_location': apt_config["code"],
          '1_date': selected_date,
          '1_time': selected_time,
          # NOTE(review): standard slots are sent with an empty label here;
          # confirm whether the server expects "" or "regular".
          '1_appointmentLabel': selected_label,
          '1_captcha_token': g_token,
          '0': '[{"status":"IDLE"},"$K1"]'
      }
      m = MultipartEncoder(fields=fields)

      # 4. Send the request.
      url = f'https://visas-fr.tlscontact.com/en-us/{group_num}/workflow/appointment-booking'
      headers = {
          'Next-Action': ACTION_ID,
          'Referer': page_url,
          'Origin': 'https://visas-fr.tlscontact.com',
          'Accept': 'text/x-component',
          'User-Agent': self.user_agent,
          'Content-Type': m.content_type,
          'Next-Router-State-Tree': '%5B%22%22%2C%7B%22children%22%3A%5B%5B%22lang%22%2C%22en-us%22%2C%22d%22%5D%2C%7B%22children%22%3A%5B%5B%22groupId%22%2C%22'+str(group_num)+'%22%2C%22d%22%5D%2C%7B%22children%22%3A%5B%22workflow%22%2C%7B%22children%22%3A%5B%22appointment-booking%22%2C%7B%22children%22%3A%5B%22__PAGE__%22%2C%7B%7D%2Cnull%2Cnull%5D%7D%2Cnull%2Cnull%2Ctrue%5D%7D%2Cnull%2Cnull%5D%7D%2Cnull%2Cnull%5D%7D%2Cnull%2Cnull%2Ctrue%5D%7D%2Cnull%2Cnull%5D'
      }
      # Redirects are not followed: the 303 itself is the success signal.
      # Same timeout as _perform_request.
      resp = self.session.post(url, data=m.to_string(), headers=headers, allow_redirects=False, timeout=30)
      if self.config.debug:
          self._save_debug_html(resp.text, prefix='Tls_Book_Result')

      # 5. Interpret the outcome.
      if resp.status_code == 303:
          location = resp.headers.get('Location', '')
          self._log(f"Booking Success! Redirecting to: {location}")
          res.success = True
          # NOTE(review): stored as the strings sent to the server; confirm
          # the types VSBookResult expects for book_date / book_time.
          res.book_date = selected_date
          res.book_time = selected_time
          return res
      elif resp.status_code == 200:
          # A 200 response can still carry a business error in its body.
          if "APPOINTMENT_LIMIT_REACHED" in resp.text:
              self._log("Failed: 限制/无号")
          elif "Invalid captcha" in resp.text:
              self._log("Failed: 验证码错误")
          else:
              self._log(f"Booking Failed (200 OK but error content): {resp.text[:200]}")
      else:
          self._log(f'Booking Failed. Status: {resp.status_code}')
      return res
  281. def _log(self, message):
  282. if self.logger:
  283. self.logger(f'[TlsPlugin] [{self.group_id}] {message}')
  284. def _save_debug_html(self, content: str, prefix: str = "debug"):
  285. save_dir = "debug_pages"
  286. if not os.path.exists(save_dir):
  287. os.makedirs(save_dir)
  288. timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
  289. filename = f"{save_dir}/{prefix}_{timestamp}.html"
  290. with open(filename, "w", encoding="utf-8") as f:
  291. f.write(content)
  292. self._log(f"HTML saved to: {filename}")
  293. def _get_proxy_url(self):
  294. # 构造代理
  295. proxy_url = ""
  296. if self.config.proxy.ip:
  297. s = self.config.proxy
  298. if s.username:
  299. proxy_url = f"{s.scheme}://{s.username}:{s.password}@{s.ip}:{s.port}"
  300. else:
  301. proxy_url = f"{s.scheme}://{s.ip}:{s.port}"
  302. return proxy_url
  303. def _perform_request(self, method, url, headers=None, data=None, json_data=None, params=None):
  304. """
  305. 统一 HTTP 请求封装,严格复刻 C++ 逻辑:
  306. 1. 发送 OPTIONS 请求
  307. 2. 发送实际请求
  308. """
  309. resp = self.session.request(method, url, headers=headers, data=data, json=json_data, params=params, timeout=30)
  310. if self.config.debug:
  311. self._log(f'[perform request] Response={resp.text}\nMethod={method}, Url={url}, Data={data}, JsonData={json_data}, Params={params}')
  312. if resp.status_code == 200:
  313. return resp
  314. elif resp.status_code == 401:
  315. self.is_healthy = False
  316. raise SessionExpiredOrInvalidError()
  317. elif resp.status_code == 403:
  318. raise PermissionDeniedError()
  319. elif resp.status_code == 429:
  320. self.is_healthy = False
  321. raise RateLimiteddError()
  322. else:
  323. raise BizLogicError(message=f"HTTP Error {resp.status_code}: {resp.text[:100]}")
  def _solve_cloudflare5S_challenge(self):
      """Obtain Cloudflare clearance cookies through the cloud task API.

      Submits an ``AntiCloudflareTask`` for the country landing page, waits
      up to 60 s for its result, copies the ``__cf_bm`` / ``cf_clearance``
      cookies into the session and, when the result carries a ``userAgent``,
      adopts it for later requests.
      """
      self._log("Solving Cloudflare 5s...")
      apt_config = self.free_config.get('apt_config', {})
      website_url = f'https://visas-fr.tlscontact.com/en-us/country/{apt_config["country"]}'

      # The task takes the proxy as "ip:port" or "ip:port:user:pass".
      proxy_cfg = self.config.proxy
      proxy_parts = [proxy_cfg.ip, proxy_cfg.port]
      if proxy_cfg.username:
          proxy_parts.extend([proxy_cfg.username, proxy_cfg.password])
      proxy_str = ":".join(f"{part}" for part in proxy_parts)

      # Submit the task, then wait for its result.
      task_args = {"proxy": proxy_str, "websiteUrl": website_url}
      task_id = VSCloudApi.Instance().create_task(command="AntiCloudflareTask", args=task_args)
      result_data = VSCloudApi.Instance().get_task_result(task_id, timeout=60)
      task_result = result_data.get("result", {})

      # Only the two Cloudflare cookies are copied into the session.
      wanted_cookies = ['__cf_bm', 'cf_clearance']
      for cookie in task_result.get('cookies', []):
          if cookie['name'] not in wanted_cookies:
              continue
          self.session.cookies.set(
              cookie['name'],
              cookie['value'],
              domain=cookie['domain'],
              path='/'
          )

      solver_ua = task_result.get('userAgent')
      if solver_ua:
          self.user_agent = solver_ua
          self.session.headers['User-Agent'] = solver_ua
      self._log("Cloudflare 5s challenge solved.")
  def _solve_recaptcha(self, params) -> str:
      """Solve a reCAPTCHA through the Capsolver HTTP API and return its token.

      Args:
          params: mapping with ``apiToken``, ``type``, ``page`` and
              ``siteKey``, plus optional ``action`` (sent as ``pageAction``)
              and ``proxy`` (a proxy URL, split into the task's proxy fields).

      Returns:
          The ``gRecaptchaResponse`` token of the solved task.

      Raises:
          NotFoundError: ``apiToken`` is missing.
          BizLogicError: the task could not be submitted, was rejected,
              failed, or was not ready after 20 polls (3 s apart).
      """
      key = params.get("apiToken")
      if not key:
          raise NotFoundError(message="Api-token is required for recaptcha solver")

      submit_url = "https://api.capsolver.com/createTask"
      task = {
          "type": params.get("type"),
          "websiteURL": params.get("page"),
          "websiteKey": params.get("siteKey"),
      }
      if params.get("action"):
          task["pageAction"] = params.get("action")
      if params.get("proxy"):
          p = urlparse(params.get("proxy"))
          task["proxyType"] = p.scheme
          task["proxyAddress"] = p.hostname
          task["proxyPort"] = p.port
          if p.username:
              task["proxyLogin"] = p.username
              task["proxyPassword"] = p.password

      payload = {"clientKey": key, "task": task}
      r = requests.post(submit_url, json=payload, timeout=20)
      if r.status_code != 200:
          raise BizLogicError(message="Failed to submit capsolver task")

      created = r.json()
      task_id = created.get("taskId")
      # Without a task id every poll below would be wasted; fail right away
      # instead of waiting out the whole polling window.
      if created.get("errorId") or not task_id:
          reason = created.get("errorDescription") or created.get("errorCode") or "no taskId returned"
          raise BizLogicError(message=f"Capsolver rejected task: {reason}")

      for _ in range(20):
          r = requests.post("https://api.capsolver.com/getTaskResult", json={"clientKey": key, "taskId": task_id}, timeout=20)
          if r.status_code == 200:
              d = r.json()
              status = d.get("status")
              if status == "ready":
                  return d["solution"]["gRecaptchaResponse"]
              # A task reported as failed will never become ready.
              if status == "failed" or d.get("errorId"):
                  reason = d.get("errorDescription") or d.get("errorCode") or status
                  raise BizLogicError(message=f"Capsolver task failed: {reason}")
          time.sleep(3)
      raise BizLogicError(message="Capsolver task timeout")
  397. def _parse_travel_groups(self, html: str) -> List[Dict]:
  398. groups = []
  399. js_pattern = r'\\"travelGroups\\":\s*(\[.*?\]),\\"availableCountriesToCreateGroups'
  400. js_match = re.search(js_pattern, html, re.DOTALL)
  401. if js_match:
  402. json_str = js_match.group(1).replace(r'\"', '"')
  403. data = json.loads(json_str)
  404. for g in data:
  405. groups.append({
  406. 'group_name': g.get('groupName'),
  407. 'group_number': g.get('formGroupId'),
  408. 'location': g.get('vacName')
  409. })
  410. else:
  411. self._log('Parsed travel group page, but not found travelGroups')
  412. return groups
  413. def _parse_appointment_slots(self, html: str) -> List[Dict]:
  414. slots = []
  415. pattern = r'"availableAppointments\\":\s*(\[.*\]),\\"showFlexiAppointment'
  416. match = re.search(pattern, html, re.DOTALL)
  417. if match:
  418. json_str = match.group(1).replace(r'\"', '"')
  419. data = json.loads(json_str)
  420. for day in data:
  421. d_str = day.get('day')
  422. for s in day.get('slots', []):
  423. labels = s.get('labels', [])
  424. lbl = ""
  425. stype = ""
  426. cost = ""
  427. if 'pta' in labels:
  428. lbl = 'pta'
  429. stype = "Prime"
  430. elif 'ptaw' in labels:
  431. lbl = 'ptaw'
  432. stype = "Prime Weekend"
  433. elif '' in labels:
  434. lbl = ''
  435. stype = "Standard"
  436. if lbl or not labels:
  437. slots.append({
  438. 'date': d_str,
  439. 'time': s.get('time'),
  440. 'label': lbl,
  441. 'type': stype,
  442. 'cost': cost
  443. })
  444. return slots
  445. else:
  446. self._log('Parsed appointment slot page, but not found availableAppointments')
  447. return slots
  448. def _check_page_is_session_expired_or_invalid(self, keyword, html: str) -> bool:
  449. if not html:
  450. self.is_healthy = False
  451. raise SessionExpiredOrInvalidError()
  452. if keyword not in html:
  453. if 'redirected automatically' in html.lower():
  454. self.is_healthy = False
  455. raise SessionExpiredOrInvalidError()
  456. if 'login' in html.lower() and 'password' in html.lower():
  457. self.is_healthy = False
  458. raise SessionExpiredOrInvalidError()
  459. if 'session expired!' in html.lower() and 'for security reasons, your session has expired. please log in again to continue.' in html.lower() and 'you will be redirected automatically in 10 seconds.' in html.lower():
  460. self.is_healthy = False
  461. raise SessionExpiredOrInvalidError()
  462. if 'temporarily blocked!' in html.lower() and 'Your session has been temporarily suspended due to the high number of your access to this page.' in html.lower() and 'You can try to access your account again in 2 hours.' in html.lower():
  463. self.is_healthy = False
  464. raise SessionExpiredOrInvalidError()
  465. def _filter_dates(self, dates: List[str], start_str: str, end_str: str) -> List[str]:
  466. """
  467. 根据用户的期望范围筛选可用日期
  468. :param dates: API 返回的可用日期列表 (YYYY-MM-DD)
  469. :param start_str: 用户期望开始日期 (YYYY-MM-DD)
  470. :param end_str: 用户期望结束日期 (YYYY-MM-DD)
  471. :return: 符合要求的日期列表
  472. """
  473. # 如果没有设置范围,则不过滤,返回所有日期
  474. if not start_str or not end_str:
  475. return dates
  476. valid_dates = []
  477. # 截取前10位以防带有时分秒
  478. s_date = datetime.strptime(start_str[:10], "%Y-%m-%d")
  479. e_date = datetime.strptime(end_str[:10], "%Y-%m-%d")
  480. for date_str in dates:
  481. curr_date = datetime.strptime(date_str, "%Y-%m-%d")
  482. # 比较范围 (闭区间)
  483. if s_date <= curr_date <= e_date:
  484. valid_dates.append(date_str)
  485. random.shuffle(valid_dates)
  486. return valid_dates