base.py 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306
  1. # mautrix-instagram - A Matrix-Instagram puppeting bridge.
  2. # Copyright (C) 2023 Tulir Asokan
  3. #
  4. # This program is free software: you can redistribute it and/or modify
  5. # it under the terms of the GNU Affero General Public License as published by
  6. # the Free Software Foundation, either version 3 of the License, or
  7. # (at your option) any later version.
  8. #
  9. # This program is distributed in the hope that it will be useful,
  10. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. # GNU Affero General Public License for more details.
  13. #
  14. # You should have received a copy of the GNU Affero General Public License
  15. # along with this program. If not, see <https://www.gnu.org/licenses/>.
  16. from __future__ import annotations
  17. from typing import Any, Type, TypeVar
  18. import json
  19. import logging
  20. import random
  21. import time
  22. from aiohttp import ClientResponse, ClientSession, ContentTypeError, CookieJar
  23. from yarl import URL
  24. from mautrix.types import JSON, Serializable
  25. from mautrix.util.logging import TraceLogger
  26. from ..errors import (
  27. IG2FACodeExpiredError,
  28. IGActionSpamError,
  29. IGBad2FACodeError,
  30. IGChallengeError,
  31. IGCheckpointError,
  32. IGConsentRequiredError,
  33. IGFBEmailTaken,
  34. IGFBNoContactPointFoundError,
  35. IGFBSSODisabled,
  36. IGInactiveUserError,
  37. IGLoginBadPasswordError,
  38. IGLoginInvalidUserError,
  39. IGLoginRequiredError,
  40. IGLoginTwoFactorRequiredError,
  41. IGLoginUnusablePasswordError,
  42. IGNotFoundError,
  43. IGPrivateUserError,
  44. IGRateLimitError,
  45. IGResponseError,
  46. IGSentryBlockError,
  47. IGUnknownError,
  48. IGUserHasLoggedOutError,
  49. )
  50. from ..proxy import ProxyHandler
  51. from ..state import AndroidState
  52. from ..types import ChallengeContext
  53. try:
  54. from aiohttp_socks import ProxyConnector
  55. except ImportError:
  56. ProxyConnector = None
  57. T = TypeVar("T")
  58. def remove_nulls(d: dict) -> dict:
  59. return {
  60. k: remove_nulls(v) if isinstance(v, dict) else v for k, v in d.items() if v is not None
  61. }
  62. class BaseAndroidAPI:
  63. url = URL("https://i.instagram.com")
  64. http: ClientSession
  65. state: AndroidState
  66. log: TraceLogger
  67. def __init__(
  68. self,
  69. state: AndroidState,
  70. log: TraceLogger | None = None,
  71. proxy_handler: ProxyHandler | None = None,
  72. ) -> None:
  73. self.log = log or logging.getLogger("mauigpapi.http")
  74. self.proxy_handler = proxy_handler
  75. self.setup_http(cookie_jar=state.cookies.jar)
  76. self.state = state
  77. @staticmethod
  78. def sign(req: Any, filter_nulls: bool = False) -> dict[str, str]:
  79. if isinstance(req, Serializable):
  80. req = req.serialize()
  81. if isinstance(req, dict):
  82. req = json.dumps(remove_nulls(req) if filter_nulls else req)
  83. return {"signed_body": f"SIGNATURE.{req}"}
  84. @property
  85. def _headers(self) -> dict[str, str]:
  86. headers = {
  87. "x-ads-opt-out": str(int(self.state.session.ads_opt_out)),
  88. "x-device-id": self.state.device.uuid,
  89. "x-ig-app-locale": self.state.device.language,
  90. "x-ig-device-locale": self.state.device.language,
  91. "x-ig-mapped-locale": self.state.device.language,
  92. "x-pigeon-session-id": f"UFS-{self.state.pigeon_session_id}-0",
  93. "x-pigeon-rawclienttime": str(round(time.time(), 3)),
  94. "x-ig-bandwidth-speed-kbps": "-1.000",
  95. "x-ig-bandwidth-totalbytes-b": "0",
  96. "x-ig-bandwidth-totaltime-ms": "0",
  97. "x-ig-app-startup-country": self.state.device.language.split("_")[1],
  98. "x-bloks-version-id": self.state.application.BLOKS_VERSION_ID,
  99. "x-ig-www-claim": self.state.session.ig_www_claim or "0",
  100. "x-bloks-is-layout-rtl": str(self.state.device.is_layout_rtl).lower(),
  101. "x-ig-timezone-offset": self.state.device.timezone_offset,
  102. "x-ig-device-id": self.state.device.uuid,
  103. "x-ig-family-device-id": self.state.device.fdid,
  104. "x-ig-android-id": self.state.device.id,
  105. "x-ig-connection-type": self.state.device.connection_type,
  106. "x-fb-connection-type": self.state.device.connection_type,
  107. "x-ig-capabilities": self.state.application.CAPABILITIES,
  108. "x-ig-app-id": self.state.application.FACEBOOK_ANALYTICS_APPLICATION_ID,
  109. "user-agent": self.state.user_agent,
  110. "accept-language": self.state.device.language.replace("_", "-"),
  111. "authorization": self.state.session.authorization,
  112. "x-mid": self.state.cookies.get_value("mid"),
  113. "ig-u-ig-direct-region-hint": self.state.session.region_hint,
  114. "ig-u-shbid": self.state.session.shbid,
  115. "ig-u-shbts": self.state.session.shbts,
  116. "ig-u-ds-user-id": self.state.session.ds_user_id,
  117. "ig-u-rur": self.state.session.rur,
  118. "ig-intended-user-id": self.state.session.ds_user_id or "0",
  119. "ig-client-endpoint": "unknown",
  120. "x-fb-http-engine": "Liger",
  121. "x-fb-client-ip": "True",
  122. "x-fb-rmd": "cached=0;state=NO_MATCH",
  123. "x-fb-server-cluster": "True",
  124. "x-tigon-is-retry": "False",
  125. "accept-encoding": "gzip",
  126. }
  127. return {k: v for k, v in headers.items() if v is not None}
  128. def setup_http(self, cookie_jar: CookieJar) -> None:
  129. connector = None
  130. http_proxy = self.proxy_handler.get_proxy_url()
  131. if http_proxy:
  132. if ProxyConnector:
  133. connector = ProxyConnector.from_url(http_proxy)
  134. else:
  135. self.log.warning("http_proxy is set, but aiohttp-socks is not installed")
  136. self.http = ClientSession(connector=connector, cookie_jar=cookie_jar)
  137. return None
  138. def raw_http_get(self, url: URL | str):
  139. if isinstance(url, str):
  140. url = URL(url, encoded=True)
  141. return self.http.get(
  142. url,
  143. headers={
  144. "user-agent": self.state.user_agent,
  145. "accept-language": self.state.device.language.replace("_", "-"),
  146. },
  147. )
  148. async def std_http_post(
  149. self,
  150. path: str,
  151. data: JSON = None,
  152. raw: bool = False,
  153. filter_nulls: bool = False,
  154. headers: dict[str, str] | None = None,
  155. query: dict[str, str] | None = None,
  156. response_type: Type[T] | None = JSON,
  157. ) -> T:
  158. headers = {**self._headers, **headers} if headers else self._headers
  159. if not raw:
  160. data = self.sign(data, filter_nulls=filter_nulls)
  161. url = self.url.with_path(path).with_query(query or {})
  162. resp = await self.http.post(url=url, headers=headers, data=data)
  163. self.log.trace(f"{path} response: {await resp.text()}")
  164. if response_type is str or response_type is None:
  165. self._handle_response_headers(resp)
  166. if response_type is str:
  167. return await resp.text()
  168. return None
  169. json_data = await self._handle_response(resp)
  170. if response_type is not JSON:
  171. return response_type.deserialize(json_data)
  172. return json_data
  173. async def std_http_get(
  174. self,
  175. path: str,
  176. query: dict[str, str] | None = None,
  177. headers: dict[str, str] | None = None,
  178. response_type: Type[T] | None = JSON,
  179. ) -> T:
  180. headers = {**self._headers, **headers} if headers else self._headers
  181. query = {k: v for k, v in (query or {}).items() if v is not None}
  182. resp = await self.http.get(url=self.url.with_path(path).with_query(query), headers=headers)
  183. self.log.trace(f"{path} response: {await resp.text()}")
  184. if response_type is None:
  185. self._handle_response_headers(resp)
  186. return None
  187. json_data = await self._handle_response(resp)
  188. if response_type is not JSON:
  189. return response_type.deserialize(json_data)
  190. return json_data
  191. async def _handle_response(self, resp: ClientResponse) -> JSON:
  192. self._handle_response_headers(resp)
  193. try:
  194. body = await resp.json()
  195. except (json.JSONDecodeError, ContentTypeError) as e:
  196. raise IGUnknownError(resp) from e
  197. if body.get("status", "fail") == "ok":
  198. return body
  199. else:
  200. await self._raise_response_error(resp)
  201. async def _raise_response_error(self, resp: ClientResponse) -> None:
  202. try:
  203. data = await resp.json()
  204. except json.JSONDecodeError:
  205. data = {}
  206. if data.get("spam", False):
  207. raise IGActionSpamError(resp, data)
  208. elif data.get("two_factor_required", False):
  209. raise IGLoginTwoFactorRequiredError(resp, data)
  210. elif resp.status == 404:
  211. raise IGNotFoundError(resp, data)
  212. elif resp.status == 429:
  213. raise IGRateLimitError(resp, data)
  214. message = data.get("message")
  215. if isinstance(message, str):
  216. if message == "challenge_required":
  217. err = IGChallengeError(resp, data)
  218. self.log.debug(f"Storing challenge URL {err.url}")
  219. self.state.challenge_path = err.url
  220. try:
  221. self.state.challenge_context = ChallengeContext.parse_json(
  222. err.body.challenge.challenge_context
  223. )
  224. except Exception:
  225. self.log.exception(
  226. "Failed to deserialize challenge_context %s",
  227. err.body.challenge.challenge_context,
  228. )
  229. raise err
  230. elif message == "checkpoint_required":
  231. raise IGCheckpointError(resp, data)
  232. elif message == "consent_required":
  233. raise IGConsentRequiredError(resp, data)
  234. elif message == "user_has_logged_out":
  235. raise IGUserHasLoggedOutError(resp, data)
  236. elif message == "login_required":
  237. raise IGLoginRequiredError(resp, data)
  238. elif message.lower() == "not authorized to view user":
  239. raise IGPrivateUserError(resp, data)
  240. error_type = data.get("error_type")
  241. if error_type == "sentry_block":
  242. raise IGSentryBlockError(resp, data)
  243. elif error_type == "inactive_user":
  244. raise IGInactiveUserError(resp, data)
  245. elif error_type == "bad_password":
  246. raise IGLoginBadPasswordError(resp, data)
  247. elif error_type == "unusable_password":
  248. raise IGLoginUnusablePasswordError(resp, data)
  249. elif error_type == "invalid_user":
  250. raise IGLoginInvalidUserError(resp, data)
  251. elif error_type == "sms_code_validation_code_invalid":
  252. raise IGBad2FACodeError(resp, data)
  253. elif error_type == "invalid_nonce":
  254. raise IG2FACodeExpiredError(resp, data)
  255. elif error_type == "fb_no_contact_point_found":
  256. raise IGFBNoContactPointFoundError(resp, data)
  257. elif error_type == "fb_email_taken":
  258. raise IGFBEmailTaken(resp, data)
  259. elif error_type == "sso_disabled":
  260. raise IGFBSSODisabled(resp, data)
  261. elif error_type == "rate_limit_error":
  262. raise IGRateLimitError(resp, data)
  263. raise IGResponseError(resp, data)
  264. def _handle_response_headers(self, resp: ClientResponse) -> None:
  265. fields = {
  266. "x-ig-set-www-claim": "ig_www_claim",
  267. "ig-set-authorization": "authorization",
  268. "ig-set-password-encryption-key-id": "password_encryption_key_id",
  269. "ig-set-password-encryption-pub-key": "password_encryption_pubkey",
  270. "ig-set-ig-u-ig-direct-region-hint": "region_hint",
  271. "ig-set-ig-u-shbid": "shbid",
  272. "ig-set-ig-u-shbts": "shbts",
  273. "ig-set-ig-u-rur": "rur",
  274. "ig-set-ig-u-ds-user-id": "ds_user_id",
  275. }
  276. for header, field in fields.items():
  277. value = resp.headers.get(header)
  278. if value and (header != "IG-Set-Authorization" or not value.endswith(":")):
  279. setattr(self.state.session, field, value)