portal.py 84 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123
  1. # mautrix-instagram - A Matrix-Instagram puppeting bridge.
  2. # Copyright (C) 2022 Tulir Asokan
  3. #
  4. # This program is free software: you can redistribute it and/or modify
  5. # it under the terms of the GNU Affero General Public License as published by
  6. # the Free Software Foundation, either version 3 of the License, or
  7. # (at your option) any later version.
  8. #
  9. # This program is distributed in the hope that it will be useful,
  10. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. # GNU Affero General Public License for more details.
  13. #
  14. # You should have received a copy of the GNU Affero General Public License
  15. # along with this program. If not, see <https://www.gnu.org/licenses/>.
  16. from __future__ import annotations
  17. from typing import TYPE_CHECKING, Any, AsyncGenerator, Awaitable, Callable, Union, cast
  18. from collections import deque
  19. from io import BytesIO
  20. import asyncio
  21. import html
  22. import json
  23. import mimetypes
  24. import re
  25. import sqlite3
  26. import time
  27. from yarl import URL
  28. import asyncpg
  29. import magic
  30. from mauigpapi.types import (
  31. AnimatedMediaItem,
  32. CommandResponse,
  33. ExpiredMediaItem,
  34. MediaShareItem,
  35. MediaType,
  36. MessageSyncMessage,
  37. Reaction,
  38. ReactionStatus,
  39. ReelMediaShareItem,
  40. ReelShareType,
  41. RegularMediaItem,
  42. Thread,
  43. ThreadItem,
  44. ThreadItemType,
  45. ThreadUser,
  46. ThreadUserLastSeenAt,
  47. TypingStatus,
  48. VoiceMediaItem,
  49. XMAMediaShareItem,
  50. )
  51. from mautrix.appservice import AppService, IntentAPI
  52. from mautrix.bridge import BasePortal, NotificationDisabler, async_getter_lock
  53. from mautrix.errors import MatrixError, MForbidden, MNotFound, SessionNotFound
  54. from mautrix.types import (
  55. AudioInfo,
  56. BeeperMessageStatusEventContent,
  57. ContentURI,
  58. EventID,
  59. EventType,
  60. Format,
  61. ImageInfo,
  62. LocationMessageEventContent,
  63. MediaMessageEventContent,
  64. MessageEventContent,
  65. MessageStatus,
  66. MessageStatusReason,
  67. MessageType,
  68. RelatesTo,
  69. RelationType,
  70. RoomID,
  71. TextMessageEventContent,
  72. UserID,
  73. VideoInfo,
  74. )
  75. from mautrix.util import ffmpeg
  76. from mautrix.util.message_send_checkpoint import MessageSendCheckpointStatus
  77. from mautrix.util.simple_lock import SimpleLock
  78. from . import matrix as m, puppet as p, user as u
  79. from .config import Config
  80. from .db import Message as DBMessage, Portal as DBPortal, Reaction as DBReaction
  81. if TYPE_CHECKING:
  82. from .__main__ import InstagramBridge
  83. try:
  84. from mautrix.crypto.attachments import decrypt_attachment, encrypt_attachment
  85. except ImportError:
  86. encrypt_attachment = decrypt_attachment = None
  87. try:
  88. from PIL import Image
  89. except ImportError:
  90. Image = None
# State event types resolved by name through EventType.find.
# NOTE(review): presumably used when publishing bridge info into portal rooms; the
# usage is outside this part of the file — confirm there.
StateBridge = EventType.find("m.bridge", EventType.Class.STATE)
StateHalfShotBridge = EventType.find("uk.half-shot.bridge", EventType.Class.STATE)

# Union of the Instagram media item types accepted by MediaUploadFunc callbacks.
MediaData = Union[
    AnimatedMediaItem,
    ExpiredMediaItem,
    MediaShareItem,
    ReelMediaShareItem,
    RegularMediaItem,
    VoiceMediaItem,
    XMAMediaShareItem,
]
# Signature of a media reupload callback: (user, media item, intent) -> awaitable that
# resolves to the Matrix media message content.
MediaUploadFunc = Callable[["u.User", MediaData, IntentAPI], Awaitable[MediaMessageEventContent]]
  103. # This doesn't need to capture all valid URLs, it's enough to catch most of them.
  104. # False negatives simply mean the link won't be linkified on Instagram,
  105. # but false positives will cause the message to fail to send.
  106. SIMPLE_URL_REGEX = re.compile(
  107. r"(?P<url>https?://[\da-z.-]+\.[a-z]{2,}(?:/[^\s]*)?)", flags=re.IGNORECASE
  108. )
  109. class UnsupportedAttachmentError(NotImplementedError):
  110. pass
class Portal(DBPortal, BasePortal):
    """Portal for one Instagram thread: the database row plus the bridging logic."""

    # Class-level lookup tables shared by every instance.
    # NOTE(review): the tuple key is presumably (thread_id, receiver) — confirm against
    # the code that fills these dicts, which is outside this part of the file.
    by_mxid: dict[RoomID, Portal] = {}
    by_thread_id: dict[tuple[str, int], Portal] = {}
    # Bridge-wide singletons, assigned in init_cls().
    config: Config
    matrix: m.MatrixHandler
    az: AppService
    private_chat_portal_meta: bool

    # Per-instance runtime state, initialised in __init__().
    _main_intent: IntentAPI | None
    _create_room_lock: asyncio.Lock
    backfill_lock: SimpleLock
    # Item IDs of recently sent messages (bounded deque, see __init__).
    _msgid_dedup: deque[str]
    # Request IDs (client contexts) of Matrix->Instagram sends that are in flight.
    _reqid_dedup: set[str]
    _last_participant_update: set[int]
    _reaction_lock: asyncio.Lock
    _backfill_leave: set[IntentAPI] | None
    # Matrix users most recently reported as typing (see handle_matrix_typing).
    _typing: set[UserID]
  127. def __init__(
  128. self,
  129. thread_id: str,
  130. receiver: int,
  131. other_user_pk: int | None,
  132. mxid: RoomID | None = None,
  133. name: str | None = None,
  134. avatar_url: ContentURI | None = None,
  135. encrypted: bool = False,
  136. name_set: bool = False,
  137. avatar_set: bool = False,
  138. relay_user_id: UserID | None = None,
  139. first_event_id: EventID | None = None,
  140. next_batch_id: BatchID | None = None,
  141. historical_base_insertion_event_id: EventID | None = None,
  142. ) -> None:
  143. super().__init__(
  144. thread_id,
  145. receiver,
  146. other_user_pk,
  147. mxid,
  148. name,
  149. avatar_url,
  150. encrypted,
  151. name_set,
  152. avatar_set,
  153. relay_user_id,
  154. first_event_id,
  155. next_batch_id,
  156. historical_base_insertion_event_id,
  157. )
  158. self._create_room_lock = asyncio.Lock()
  159. self.log = self.log.getChild(thread_id)
  160. self._msgid_dedup = deque(maxlen=100)
  161. self._reqid_dedup = set()
  162. self._last_participant_update = set()
  163. self.backfill_lock = SimpleLock(
  164. "Waiting for backfilling to finish before handling %s", log=self.log
  165. )
  166. self._backfill_leave = None
  167. self._main_intent = None
  168. self._reaction_lock = asyncio.Lock()
  169. self._typing = set()
  170. self._relay_user = None
  171. @property
  172. def is_direct(self) -> bool:
  173. return self.other_user_pk is not None
  174. @property
  175. def main_intent(self) -> IntentAPI:
  176. if not self._main_intent:
  177. raise ValueError("Portal must be postinit()ed before main_intent can be used")
  178. return self._main_intent
  179. @classmethod
  180. def init_cls(cls, bridge: "InstagramBridge") -> None:
  181. cls.config = bridge.config
  182. cls.matrix = bridge.matrix
  183. cls.az = bridge.az
  184. cls.loop = bridge.loop
  185. cls.bridge = bridge
  186. cls.private_chat_portal_meta = cls.config["bridge.private_chat_portal_meta"]
  187. NotificationDisabler.puppet_cls = p.Puppet
  188. NotificationDisabler.config_enabled = cls.config["bridge.backfill.disable_notifications"]
  189. # region Misc
  190. async def _send_delivery_receipt(self, event_id: EventID) -> None:
  191. if event_id and self.config["bridge.delivery_receipts"]:
  192. try:
  193. await self.az.intent.mark_read(self.mxid, event_id)
  194. except Exception:
  195. self.log.exception("Failed to send delivery receipt for %s", event_id)
  196. async def _send_bridge_success(
  197. self,
  198. sender: u.User,
  199. event_id: EventID,
  200. event_type: EventType,
  201. msgtype: MessageType | None = None,
  202. ) -> None:
  203. sender.send_remote_checkpoint(
  204. status=MessageSendCheckpointStatus.SUCCESS,
  205. event_id=event_id,
  206. room_id=self.mxid,
  207. event_type=event_type,
  208. message_type=msgtype,
  209. )
  210. asyncio.create_task(self._send_message_status(event_id, err=None))
  211. await self._send_delivery_receipt(event_id)
  212. async def _send_bridge_error(
  213. self,
  214. sender: u.User,
  215. err: Exception,
  216. event_id: EventID,
  217. event_type: EventType,
  218. message_type: MessageType | None = None,
  219. confirmed: bool = False,
  220. ) -> None:
  221. sender.send_remote_checkpoint(
  222. self._status_from_exception(err),
  223. event_id,
  224. self.mxid,
  225. event_type,
  226. message_type=message_type,
  227. error=err,
  228. )
  229. if self.config["bridge.delivery_error_reports"]:
  230. event_type_str = {
  231. EventType.REACTION: "reaction",
  232. EventType.ROOM_REDACTION: "redaction",
  233. }.get(event_type, "message")
  234. error_type = "was not" if confirmed else "may not have been"
  235. await self._send_message(
  236. self.main_intent,
  237. TextMessageEventContent(
  238. msgtype=MessageType.NOTICE,
  239. body=f"\u26a0 Your {event_type_str} {error_type} bridged: {str(err)}",
  240. ),
  241. )
  242. asyncio.create_task(self._send_message_status(event_id, err))
  243. async def _send_message_status(self, event_id: EventID, err: Exception | None) -> None:
  244. if not self.config["bridge.message_status_events"]:
  245. return
  246. intent = self.az.intent if self.encrypted else self.main_intent
  247. status = BeeperMessageStatusEventContent(
  248. network=self.bridge_info_state_key,
  249. relates_to=RelatesTo(
  250. rel_type=RelationType.REFERENCE,
  251. event_id=event_id,
  252. ),
  253. )
  254. if err:
  255. status.error = str(err)
  256. if isinstance(err, NotImplementedError):
  257. if isinstance(err, UnsupportedAttachmentError):
  258. status.message = str(err)
  259. status.reason = MessageStatusReason.UNSUPPORTED
  260. status.status = MessageStatus.FAIL
  261. else:
  262. status.reason = MessageStatusReason.GENERIC_ERROR
  263. status.status = MessageStatus.RETRIABLE
  264. else:
  265. status.status = MessageStatus.SUCCESS
  266. status.fill_legacy_booleans()
  267. await intent.send_message_event(
  268. room_id=self.mxid,
  269. event_type=EventType.BEEPER_MESSAGE_STATUS,
  270. content=status,
  271. )
  272. async def _upsert_reaction(
  273. self,
  274. existing: DBReaction | None,
  275. intent: IntentAPI,
  276. mxid: EventID,
  277. message: DBMessage,
  278. sender: u.User | p.Puppet,
  279. reaction: str,
  280. mx_timestamp: int,
  281. ) -> None:
  282. if existing:
  283. self.log.debug(
  284. f"_upsert_reaction redacting {existing.mxid} and inserting {mxid}"
  285. f" (message: {message.mxid})"
  286. )
  287. await intent.redact(existing.mx_room, existing.mxid)
  288. await existing.edit(
  289. reaction=reaction, mxid=mxid, mx_room=message.mx_room, mx_timestamp=mx_timestamp
  290. )
  291. else:
  292. self.log.debug(f"_upsert_reaction inserting {mxid} (message: {message.mxid})")
  293. await DBReaction(
  294. mxid=mxid,
  295. mx_room=message.mx_room,
  296. ig_item_id=message.item_id,
  297. ig_receiver=self.receiver,
  298. ig_sender=sender.igpk,
  299. reaction=reaction,
  300. mx_timestamp=mx_timestamp,
  301. ).insert()
  302. # endregion
  303. # region Matrix event handling
  304. @staticmethod
  305. def _status_from_exception(e: Exception) -> MessageSendCheckpointStatus:
  306. if isinstance(e, NotImplementedError):
  307. return MessageSendCheckpointStatus.UNSUPPORTED
  308. elif isinstance(e, asyncio.TimeoutError):
  309. return MessageSendCheckpointStatus.TIMEOUT
  310. return MessageSendCheckpointStatus.PERM_FAILURE
  311. async def handle_matrix_message(
  312. self, sender: u.User, message: MessageEventContent, event_id: EventID
  313. ) -> None:
  314. try:
  315. await self._handle_matrix_message(sender, message, event_id)
  316. except Exception as e:
  317. self.log.exception(f"Error handling Matrix event {event_id}")
  318. await self._send_bridge_error(
  319. sender,
  320. e,
  321. event_id,
  322. EventType.ROOM_MESSAGE,
  323. message_type=message.msgtype,
  324. confirmed=True,
  325. )
  326. else:
  327. await self._send_bridge_success(
  328. sender, event_id, EventType.ROOM_MESSAGE, message.msgtype
  329. )
  330. async def _handle_matrix_giphy(
  331. self,
  332. sender: u.User,
  333. event_id: EventID,
  334. request_id: str,
  335. giphy_id: str,
  336. ) -> CommandResponse:
  337. self.log.trace(f"Broadcasting giphy from {event_id} with request ID {request_id}")
  338. return await sender.client.broadcast(
  339. self.thread_id,
  340. ThreadItemType.ANIMATED_MEDIA,
  341. client_context=request_id,
  342. id=giphy_id,
  343. )
  344. async def _handle_matrix_image(
  345. self,
  346. sender: u.User,
  347. event_id: EventID,
  348. request_id: str,
  349. data: bytes,
  350. mime_type: str,
  351. width: int | None = None,
  352. height: int | None = None,
  353. ) -> CommandResponse:
  354. if mime_type != "image/jpeg":
  355. if Image is None:
  356. raise UnsupportedAttachmentError(
  357. "Instagram does not allow non-JPEG images, and Pillow is not installed, "
  358. "so the bridge couldn't convert the image automatically"
  359. )
  360. with BytesIO(data) as inp, BytesIO() as out:
  361. img = Image.open(inp)
  362. img.convert("RGB").save(out, format="JPEG", quality=80)
  363. data = out.getvalue()
  364. mime_type = "image/jpeg"
  365. self.log.trace(f"Uploading photo from {event_id} (mime: {mime_type})")
  366. upload_resp = await sender.client.upload_photo(
  367. data, mime=mime_type, width=width, height=height
  368. )
  369. self.log.trace(f"Broadcasting uploaded photo with request ID {request_id}")
  370. return await sender.client.broadcast(
  371. self.thread_id,
  372. ThreadItemType.CONFIGURE_PHOTO,
  373. client_context=request_id,
  374. upload_id=upload_resp.upload_id,
  375. allow_full_aspect_ratio="true",
  376. )
  377. async def _handle_matrix_video(
  378. self,
  379. sender: u.User,
  380. event_id: EventID,
  381. request_id: str,
  382. data: bytes,
  383. mime_type: str,
  384. duration: int | None = None,
  385. width: int | None = None,
  386. height: int | None = None,
  387. ) -> CommandResponse:
  388. if mime_type != "video/mp4":
  389. data = await ffmpeg.convert_bytes(
  390. data,
  391. output_extension=".mp4",
  392. output_args=("-c:v", "libx264", "-c:a", "aac"),
  393. input_mime=mime_type,
  394. )
  395. self.log.trace(f"Uploading video from {event_id}")
  396. _, upload_id = await sender.client.upload_mp4(
  397. data, duration_ms=duration, width=width, height=height
  398. )
  399. self.log.trace(f"Broadcasting uploaded video with request ID {request_id}")
  400. return await sender.client.broadcast(
  401. self.thread_id,
  402. ThreadItemType.CONFIGURE_VIDEO,
  403. client_context=request_id,
  404. upload_id=upload_id,
  405. video_result="",
  406. )
  407. async def _handle_matrix_audio(
  408. self,
  409. sender: u.User,
  410. event_id: EventID,
  411. request_id: str,
  412. data: bytes,
  413. mime_type: str,
  414. waveform: list[int],
  415. duration: int | None = None,
  416. ) -> CommandResponse:
  417. if mime_type != "audio/mp4":
  418. data = await ffmpeg.convert_bytes(
  419. data, output_extension=".m4a", output_args=("-c:a", "aac"), input_mime=mime_type
  420. )
  421. self.log.trace(f"Uploading audio from {event_id}")
  422. _, upload_id = await sender.client.upload_mp4(data, audio=True, duration_ms=duration)
  423. self.log.trace(f"Broadcasting uploaded audio with request ID {request_id}")
  424. return await sender.client.broadcast(
  425. self.thread_id,
  426. ThreadItemType.SHARE_VOICE,
  427. client_context=request_id,
  428. upload_id=upload_id,
  429. waveform=json.dumps([(part or 0) / 1024 for part in waveform], separators=(",", ":")),
  430. waveform_sampling_frequency_hz="10",
  431. )
  432. async def _handle_matrix_message(
  433. self, orig_sender: u.User, message: MessageEventContent, event_id: EventID
  434. ) -> None:
  435. sender, is_relay = await self.get_relay_sender(orig_sender, f"message {event_id}")
  436. assert sender, "user is not logged in"
  437. assert sender.is_connected, "You're not connected to Instagram"
  438. if is_relay:
  439. await self.apply_relay_message_format(orig_sender, message)
  440. reply_to = {}
  441. if message.get_reply_to():
  442. msg = await DBMessage.get_by_mxid(message.get_reply_to(), self.mxid)
  443. if msg and msg.client_context:
  444. reply_to = {
  445. "replied_to_item_id": msg.item_id,
  446. "replied_to_client_context": msg.client_context,
  447. }
  448. request_id = sender.state.gen_client_context()
  449. self._reqid_dedup.add(request_id)
  450. self.log.debug(
  451. f"Handling Matrix message {event_id} from {sender.mxid}/{sender.igpk} "
  452. f"with request ID {request_id}"
  453. )
  454. if message.msgtype == MessageType.NOTICE and not self.config["bridge.bridge_notices"]:
  455. return
  456. if message.msgtype in (MessageType.EMOTE, MessageType.TEXT, MessageType.NOTICE):
  457. text = message.body
  458. if message.msgtype == MessageType.EMOTE:
  459. text = f"/me {text}"
  460. self.log.trace(f"Sending Matrix text from {event_id} with request ID {request_id}")
  461. urls = SIMPLE_URL_REGEX.findall(text) or None
  462. if not self.is_direct:
  463. # Instagram groups don't seem to support sending link previews,
  464. # and the client_context-based deduplication breaks when trying to send them.
  465. urls = None
  466. resp = await sender.mqtt.send_text(
  467. self.thread_id, text=text, urls=urls, client_context=request_id, **reply_to
  468. )
  469. elif message.msgtype.is_media and "fi.mau.instagram.giphy_id" in message:
  470. resp = await self._handle_matrix_giphy(
  471. sender, event_id, request_id, message["fi.mau.instagram.giphy_id"]
  472. )
  473. elif message.msgtype.is_media:
  474. if message.file and decrypt_attachment:
  475. data = await self.main_intent.download_media(message.file.url)
  476. data = decrypt_attachment(
  477. data, message.file.key.key, message.file.hashes.get("sha256"), message.file.iv
  478. )
  479. else:
  480. data = await self.main_intent.download_media(message.url)
  481. mime_type = message.info.mimetype or magic.from_buffer(data, mime=True)
  482. if message.msgtype == MessageType.IMAGE:
  483. resp = await self._handle_matrix_image(
  484. sender,
  485. event_id,
  486. request_id,
  487. data,
  488. mime_type,
  489. width=message.info.width,
  490. height=message.info.height,
  491. )
  492. elif message.msgtype == MessageType.AUDIO:
  493. waveform = message.get("org.matrix.msc1767.audio", {}).get("waveform", [0] * 30)
  494. resp = await self._handle_matrix_audio(
  495. sender,
  496. event_id,
  497. request_id,
  498. data,
  499. mime_type,
  500. waveform,
  501. duration=message.info.duration,
  502. )
  503. elif message.msgtype == MessageType.VIDEO:
  504. resp = await self._handle_matrix_video(
  505. sender,
  506. event_id,
  507. request_id,
  508. data,
  509. mime_type,
  510. duration=message.info.duration,
  511. width=message.info.width,
  512. height=message.info.height,
  513. )
  514. else:
  515. raise UnsupportedAttachmentError(
  516. "Non-image/video/audio files are currently not supported"
  517. )
  518. else:
  519. raise NotImplementedError(f"Unknown message type {message.msgtype}")
  520. self.log.trace(f"Got response to message send {request_id}: {resp}")
  521. if resp.status != "ok" or not resp.payload:
  522. self.log.warning(f"Failed to handle {event_id}: {resp}")
  523. raise Exception(f"Sending message failed: {resp.error_message}")
  524. else:
  525. self._msgid_dedup.appendleft(resp.payload.item_id)
  526. try:
  527. await DBMessage(
  528. mxid=event_id,
  529. mx_room=self.mxid,
  530. item_id=resp.payload.item_id,
  531. client_context=resp.payload.client_context,
  532. receiver=self.receiver,
  533. sender=sender.igpk,
  534. ig_timestamp=int(resp.payload.timestamp),
  535. ).insert()
  536. except (asyncpg.UniqueViolationError, sqlite3.IntegrityError) as e:
  537. self.log.warning(
  538. f"Error while persisting {event_id} ({resp.payload.client_context}) "
  539. f"-> {resp.payload.item_id}: {e}"
  540. )
  541. self._reqid_dedup.remove(request_id)
  542. self.log.debug(
  543. f"Handled Matrix message {event_id} ({resp.payload.client_context}) "
  544. f"-> {resp.payload.item_id}"
  545. )
  546. async def handle_matrix_reaction(
  547. self, sender: u.User, event_id: EventID, reacting_to: EventID, emoji: str, timestamp: int
  548. ) -> None:
  549. try:
  550. await self._handle_matrix_reaction(sender, event_id, reacting_to, emoji, timestamp)
  551. except Exception as e:
  552. self.log.exception(f"Error handling Matrix reaction {event_id}")
  553. await self._send_bridge_error(
  554. sender,
  555. e,
  556. event_id,
  557. EventType.REACTION,
  558. confirmed=True,
  559. )
  560. else:
  561. await self._send_bridge_success(sender, event_id, EventType.REACTION)
  562. async def _handle_matrix_reaction(
  563. self, sender: u.User, event_id: EventID, reacting_to: EventID, emoji: str, timestamp: int
  564. ) -> None:
  565. if not await sender.is_logged_in():
  566. self.log.debug(f"Ignoring reaction by non-logged-in user {sender.mxid}")
  567. raise NotImplementedError("User is not logged in")
  568. message = await DBMessage.get_by_mxid(reacting_to, self.mxid)
  569. if not message or message.is_internal:
  570. self.log.debug(f"Ignoring reaction to unknown event {reacting_to}")
  571. await self.main_intent.redact(self.mxid, event_id, reason="Unknown target message")
  572. raise NotImplementedError("Unknown target message")
  573. existing = await DBReaction.get_by_item_id(message.item_id, message.receiver, sender.igpk)
  574. if existing and existing.reaction == emoji:
  575. return
  576. async with self._reaction_lock:
  577. resp = await sender.mqtt.send_reaction(
  578. self.thread_id, item_id=message.item_id, emoji=emoji
  579. )
  580. if resp.status != "ok":
  581. if resp.payload and resp.payload.message == "invalid unicode emoji":
  582. # Instagram doesn't support this reaction. Notify the user, and redact it
  583. # so that it doesn't get confusing.
  584. await self.main_intent.redact(self.mxid, event_id, reason="Unsupported emoji")
  585. raise NotImplementedError(f"Instagram does not support the {emoji} emoji.")
  586. raise Exception(f"Unknown response error: {resp}")
  587. self.log.trace(f"{sender.mxid} reacted to {message.item_id} with {emoji}")
  588. await self._upsert_reaction(
  589. existing, self.main_intent, event_id, message, sender, emoji, timestamp
  590. )
  591. async def handle_matrix_redaction(
  592. self, orig_sender: u.User, event_id: EventID, redaction_event_id: EventID
  593. ) -> None:
  594. sender = None
  595. try:
  596. sender, _ = await self.get_relay_sender(orig_sender, f"redaction {event_id}")
  597. if not sender:
  598. raise Exception("User is not logged in")
  599. await self._handle_matrix_redaction(sender, event_id)
  600. except Exception as e:
  601. self.log.exception(f"Error handling Matrix redaction {event_id}")
  602. await self._send_bridge_error(
  603. sender or orig_sender,
  604. e,
  605. redaction_event_id,
  606. EventType.ROOM_REDACTION,
  607. confirmed=True,
  608. )
  609. else:
  610. await self._send_bridge_success(sender, redaction_event_id, EventType.ROOM_REDACTION)
  611. async def _handle_matrix_redaction(self, sender: u.User, event_id: EventID) -> None:
  612. if not sender.is_connected:
  613. raise Exception("You're not connected to Instagram")
  614. reaction = await DBReaction.get_by_mxid(event_id, self.mxid)
  615. if reaction:
  616. try:
  617. await reaction.delete()
  618. await sender.mqtt.send_reaction(
  619. self.thread_id,
  620. item_id=reaction.ig_item_id,
  621. reaction_status=ReactionStatus.DELETED,
  622. emoji="",
  623. )
  624. except Exception as e:
  625. raise Exception(f"Removing reaction failed: {e}")
  626. else:
  627. self.log.trace(f"Removed reaction to {reaction.ig_item_id} after Matrix redaction")
  628. return
  629. message = await DBMessage.get_by_mxid(event_id, self.mxid)
  630. if message and not message.is_internal:
  631. try:
  632. await message.delete()
  633. await sender.client.delete_item(self.thread_id, message.item_id)
  634. self.log.trace(f"Removed {message} after Matrix redaction")
  635. except Exception as e:
  636. raise Exception(f"Removing message failed: {e}")
  637. else:
  638. self.log.trace(f"Removed message {message.item_id} after Matrix redaction")
  639. return
  640. raise NotImplementedError("No message or reaction found for redaction")
  641. async def handle_matrix_typing(self, users: set[UserID]) -> None:
  642. if users == self._typing:
  643. return
  644. old_typing = self._typing
  645. self._typing = users
  646. await self._handle_matrix_typing(old_typing - users, TypingStatus.OFF)
  647. await self._handle_matrix_typing(users - old_typing, TypingStatus.TEXT)
  async def _handle_matrix_typing(self, users: set[UserID], status: TypingStatus) -> None:
      """Send the given typing status to this thread for each eligible user.

      A user is skipped when they are unknown, not logged in, already have
      ``status`` recorded as their remote typing status, or are not connected.
      """
      for user_id in users:
          candidate = await u.User.get_by_mxid(user_id, create=False)
          if not candidate:
              continue
          if not await candidate.is_logged_in():
              continue
          if candidate.remote_typing_status == status:
              continue
          if not candidate.is_connected:
              continue
          candidate.remote_typing_status = None
          await candidate.mqtt.indicate_activity(self.thread_id, status)
  async def handle_matrix_leave(self, user: u.User) -> None:
      """React to a Matrix user leaving the portal room.

      For direct chats the portal is cleaned up and deleted when the leaving
      user is the portal's receiver. Other rooms only get a debug log line.
      Users that are not logged in are ignored.
      """
      logged_in = await user.is_logged_in()
      if not logged_in:
          return

      if not self.is_direct:
          self.log.debug(f"{user.mxid} left portal to {self.thread_id}")
          # TODO cleanup if empty
          return

      self.log.info(f"{user.mxid} left private chat portal with {self.other_user_pk}")
      if user.igpk == self.receiver:
          self.log.info(
              f"{user.mxid} was the recipient of this portal. Cleaning up and deleting..."
          )
          await self.cleanup_and_delete()
  673. # endregion
  674. # region Instagram event handling
  async def _reupload_instagram_media(
      self, source: u.User, media: RegularMediaItem, intent: IntentAPI
  ) -> MediaMessageEventContent:
      """Reupload a regular image or video item to Matrix.

      Picks the best available image/video variant and hands its URL to
      ``_reupload_instagram_file``.

      Raises:
          ValueError: With a user-facing message when no variant is available
              or when the media type (carousel or anything else) is unsupported.
      """
      kind = media.media_type
      if kind == MediaType.IMAGE:
          variant = media.best_image
          if not variant:
              raise ValueError("Attachment not available: didn't find photo URL")
          msgtype = MessageType.IMAGE
          info = ImageInfo(height=variant.height, width=variant.width)
      elif kind == MediaType.VIDEO:
          variant = media.best_video
          if not variant:
              raise ValueError("Attachment not available: didn't find video URL")
          msgtype = MessageType.VIDEO
          info = VideoInfo(height=variant.height, width=variant.width)
      elif kind == MediaType.CAROUSEL:
          raise ValueError(
              "Carousel media is not currently supported, "
              "please view the post on Instagram via the link below"
          )
      else:
          raise ValueError(
              f"Attachment not available: unsupported media type {media.media_type.human_name}"
          )
      return await self._reupload_instagram_file(source, variant.url, msgtype, info, intent)
  async def _reupload_instagram_animated(
      self, source: u.User, media: AnimatedMediaItem, intent: IntentAPI
  ) -> MediaMessageEventContent:
      """Reupload an animated media item as an image.

      Uses the ``fixed_height`` variant's webp URL. Its width and height are
      converted with ``int()`` before being stored in the image info.
      """
      variant = media.images.fixed_height
      dimensions = ImageInfo(height=int(variant.height), width=int(variant.width))
      return await self._reupload_instagram_file(
          source, variant.webp, MessageType.IMAGE, dimensions, intent
      )
  async def _reupload_instagram_xma(
      self, source: u.User, media: XMAMediaShareItem, intent: IntentAPI
  ) -> MediaMessageEventContent:
      """Reupload the preview image of an XMA share item as an image message."""
      preview_info = ImageInfo(mimetype=media.preview_url_mime_type)
      return await self._reupload_instagram_file(
          source, media.preview_url, MessageType.IMAGE, preview_info, intent
      )
  async def _reupload_instagram_voice(
      self, source: u.User, media: VoiceMediaItem, intent: IntentAPI
  ) -> MediaMessageEventContent:
      """Reupload a voice message, converting it to ogg/opus on the way.

      The returned content additionally carries the MSC1767 audio block
      (duration and waveform scaled by 1024) and the MSC3245 voice marker.
      """

      async def to_ogg(raw, input_mime):
          # Re-encode with libopus; the resulting mimetype is always audio/ogg.
          ogg_bytes = await ffmpeg.convert_bytes(
              raw, ".ogg", output_args=("-c:a", "libopus"), input_mime=input_mime
          )
          return ogg_bytes, "audio/ogg"

      audio = media.media.audio
      source_url = audio.audio_src
      audio_info = AudioInfo(duration=audio.duration)
      scaled_waveform = [int(sample * 1024) for sample in audio.waveform_data]
      content = await self._reupload_instagram_file(
          source, source_url, MessageType.AUDIO, audio_info, intent, to_ogg
      )
      content["org.matrix.msc1767.audio"] = {
          "duration": audio.duration,
          "waveform": scaled_waveform,
      }
      content["org.matrix.msc3245.voice"] = {}
      return content
  async def _reupload_instagram_file(
      self,
      source: u.User,
      url: str,
      msgtype: MessageType | None,
      info: ImageInfo | VideoInfo | AudioInfo,
      intent: IntentAPI,
      convert_fn: Callable[[bytes, str], Awaitable[tuple[bytes, str]]] | None = None,
      allow_encrypt: bool = True,
  ) -> MediaMessageEventContent:
      """Download a file from Instagram and upload it to the Matrix media repo.

      Args:
          source: User whose Instagram client performs the download.
          url: Remote URL to fetch.
          msgtype: Matrix message type of the resulting content. When ``None``
              no file name (body) is generated.
          info: Media info object; ``mimetype``, ``size`` and (for images with
              no dimensions set) ``width``/``height`` are filled in here.
          intent: Intent used for the upload.
          convert_fn: Optional coroutine that receives ``(data, mimetype)`` and
              returns the converted ``(data, mimetype)``.
          allow_encrypt: When true and the portal is encrypted, the attachment
              is encrypted before upload and returned via ``file`` instead of
              ``url``.

      Returns:
          The media message content pointing at the uploaded file.

      Raises:
          ValueError: With a user-facing message when the file exceeds the
              homeserver's upload size limit.
      """
      max_size = self.matrix.media_config.upload_size
      async with source.client.raw_http_get(url) as resp:
          try:
              length = int(resp.headers["Content-Length"])
          except (KeyError, ValueError):
              # TODO can the download be short-circuited if there's too much data?
              self.log.warning(
                  "Got file download response with no valid Content-Length header, "
                  "reading data dangerously"
              )
              length = 0
          if length > max_size:
              self.log.debug(f"{url} was too large ({length} > {max_size})")
              raise ValueError("Attachment not available: too large")
          data = await resp.read()
          # .get() so that a missing header falls through to content sniffing
          # below instead of raising KeyError.
          header_mimetype = resp.headers.get("Content-Type")

      # The Content-Length header may have been absent or wrong, so check the
      # actual size as well before attempting the upload.
      if len(data) > max_size:
          self.log.debug(f"{url} was too large ({len(data)} > {max_size})")
          raise ValueError("Attachment not available: too large")

      info.mimetype = header_mimetype or magic.from_buffer(data, mime=True)

      # Run the conversion function on the data.
      if convert_fn is not None:
          data, info.mimetype = await convert_fn(data, info.mimetype)

      if info.mimetype.startswith("image/") and not info.width and not info.height:
          with BytesIO(data) as inp, Image.open(inp) as img:
              info.width, info.height = img.size
      info.size = len(data)

      extension = {
          "image/webp": ".webp",
          "image/jpeg": ".jpg",
          "video/mp4": ".mp4",
          "audio/mp4": ".m4a",
          "audio/ogg": ".ogg",
      }.get(info.mimetype)
      extension = extension or mimetypes.guess_extension(info.mimetype) or ""
      # msgtype values look like "m.image"; strip the "m." prefix for the name.
      file_name = f"{msgtype.value[2:]}{extension}" if msgtype else None

      upload_mime_type = info.mimetype
      upload_file_name = file_name
      decryption_info = None
      if allow_encrypt and self.encrypted and encrypt_attachment:
          data, decryption_info = encrypt_attachment(data)
          # Encrypted blobs are uploaded without revealing type or name.
          upload_mime_type = "application/octet-stream"
          upload_file_name = None

      mxc = await intent.upload_media(
          data,
          mime_type=upload_mime_type,
          filename=upload_file_name,
          async_upload=self.config["homeserver.async_media"],
      )

      if decryption_info:
          # For encrypted files the URL lives inside the `file` object only.
          decryption_info.url = mxc
          mxc = None

      return MediaMessageEventContent(
          body=file_name,
          external_url=url,
          url=mxc,
          file=decryption_info,
          info=info,
          msgtype=msgtype,
      )
  def _get_instagram_media_info(self, item: ThreadItem) -> tuple[MediaUploadFunc, MediaData]:
      """Pick the media payload of a thread item and the method that reuploads it.

      Returns:
          A ``(reupload_method, media_data)`` pair.

      Raises:
          ValueError: With a user-facing message when the item carries no
              recognised media, the media payload is empty, or it has expired.
      """
      # TODO maybe use a dict and item.item_type instead of a ton of ifs
      uploader = self._reupload_instagram_media
      xma_items = (
          item.xma_media_share
          or item.xma_story_share
          or item.xma_reel_share
          or item.xma_reel_mention
          or item.generic_xma
      )
      if xma_items:
          # Only the first XMA entry is used.
          media_data = xma_items[0]
          uploader = self._reupload_instagram_xma
      elif item.media:
          media_data = item.media
      elif item.visual_media:
          media_data = item.visual_media.media
      elif item.animated_media:
          media_data = item.animated_media
          uploader = self._reupload_instagram_animated
      elif item.voice_media:
          media_data = item.voice_media
          uploader = self._reupload_instagram_voice
      elif item.reel_share:
          media_data = item.reel_share.media
      elif item.story_share:
          media_data = item.story_share.media
      elif item.clip:
          media_data = item.clip.clip
      elif item.felix_share and item.felix_share.video:
          media_data = item.felix_share.video
      elif item.media_share:
          media_data = item.media_share
      elif item.direct_media_share:
          media_data = item.direct_media_share.media
      else:
          self.log.debug(f"Unknown media type in {item}")
          raise ValueError("Attachment not available: unsupported media type")

      if not media_data:
          self.log.debug(f"Didn't get media_data in {item}")
          raise ValueError("Attachment not available: unsupported media type")
      if isinstance(media_data, ExpiredMediaItem):
          self.log.debug(f"Expired media in item {item}")
          raise ValueError("Attachment not available: media expired")
      return uploader, media_data
  async def _convert_instagram_media(
      self, source: u.User, intent: IntentAPI, item: ThreadItem
  ) -> ConvertedMessage:
      """Convert the media of a thread item into a Matrix room message.

      Failures never propagate: a ``ValueError`` becomes a notice carrying its
      message, any other exception is logged and becomes a generic notice.
      Reply metadata is attached to whatever content results.
      """
      try:
          uploader, payload = self._get_instagram_media_info(item)
          content = await uploader(source, payload, intent)
      except ValueError as err:
          # ValueError messages are written to be shown to the user as-is.
          content = TextMessageEventContent(body=str(err), msgtype=MessageType.NOTICE)
      except Exception:
          self.log.warning("Failed to upload media", exc_info=True)
          content = TextMessageEventContent(
              body="Attachment not available: failed to copy file", msgtype=MessageType.NOTICE
          )

      await self._add_instagram_reply(content, item.replied_to_message)
      return EventType.ROOM_MESSAGE, content
  873. # TODO this might be unused
  async def _convert_instagram_media_share(
      self, source: u.User, intent: IntentAPI, item: ThreadItem
  ) -> list[ConvertedMessage]:
      """Convert a shared post/clip/story/video into Matrix messages.

      Three parts are produced: a notice prefix ("Sent @user's ..."), the media
      itself and a caption with a link to the post. When the
      ``bridge.caption_in_message`` option is set they are merged into a single
      event, otherwise they are returned as three separate events.

      Returns:
          The converted messages, or an empty list when the item carries no
          media share.
      """
      item_type_name = None
      if item.media_share:
          share_item = item.media_share
      elif item.clip:
          share_item = item.clip.clip
          item_type_name = "clip"
      elif item.felix_share and item.felix_share.video:
          share_item = item.felix_share.video
      elif item.story_share:
          share_item = item.story_share.media
          item_type_name = "story"
      elif item.direct_media_share:
          share_item = item.direct_media_share.media
      else:
          self.log.debug("No media share to bridge")
          return []

      item_type_name = item_type_name or share_item.media_type.human_name
      user_text = f"@{share_item.user.username}"
      user_link = (
          f'<a href="https://www.instagram.com/{share_item.user.username}/">{user_text}</a>'
      )
      prefix = TextMessageEventContent(
          msgtype=MessageType.NOTICE,
          format=Format.HTML,
          body=f"Sent {user_text}'s {item_type_name}",
          formatted_body=f"Sent {user_link}'s {item_type_name}",
      )
      if item.direct_media_share and item.direct_media_share.media_share_type == "tag":
          tagged_user_id = item.direct_media_share.tagged_user_id
          if tagged_user_id == source.igpk and share_item.user.pk == self.other_user_pk:
              prefix.body = prefix.formatted_body = "Tagged you in their post"
          elif share_item.user.pk == source.igpk and tagged_user_id == self.other_user_pk:
              prefix.body = prefix.formatted_body = "Tagged them in your post"

      _, content = await self._convert_instagram_media(source, intent, item)

      external_url = f"https://www.instagram.com/p/{share_item.code}/"
      if share_item.caption:
          caption_body = (
              f"> {share_item.caption.user.username}: {share_item.caption.text}\n\n"
              f"{external_url}"
          )
          caption_formatted_body = (
              f"<blockquote><strong>{share_item.caption.user.username}</strong>"
              f" {html.escape(share_item.caption.text)}</blockquote>"
              f'<a href="{external_url}">instagram.com/p/{share_item.code}</a>'
          )
      else:
          caption_body = external_url
          caption_formatted_body = (
              f'<a href="{external_url}">instagram.com/p/{share_item.code}</a>'
          )
      caption = TextMessageEventContent(
          msgtype=MessageType.TEXT,
          body=caption_body,
          formatted_body=caption_formatted_body,
          format=Format.HTML,
          external_url=external_url,
      )

      if self.bridge.config["bridge.caption_in_message"]:
          if isinstance(content, TextMessageEventContent):
              # Media conversion failed and produced a notice; merge all text.
              content.ensure_has_html()
              prefix.ensure_has_html()
              caption.ensure_has_html()
              combined = TextMessageEventContent(
                  msgtype=MessageType.TEXT,
                  body="\n".join((content.body, prefix.body, caption.body)),
                  formatted_body=(
                      f"<p><b>{content.formatted_body}</b></p>"
                      # The closing </i> was missing here, leaving the tag open.
                      f"<p><i>{prefix.formatted_body}</i></p>"
                      f"<p>{caption.formatted_body}</p>"
                  ),
                  format=Format.HTML,
                  external_url=external_url,
              )
          else:
              prefix.ensure_has_html()
              caption.ensure_has_html()
              combined_body = "\n".join((prefix.body, caption.body))
              combined_formatted_body = (
                  f"<p><i>{prefix.formatted_body}</i></p><p>{caption.formatted_body}</p>"
              )
              # Reuse the media event: the old body becomes the file name and
              # the caption text takes over body/formatted_body.
              combined = content
              combined["filename"] = content.body
              combined.body = combined_body
              combined["format"] = str(Format.HTML)
              combined["org.matrix.msc1767.caption"] = {
                  "org.matrix.msc1767.text": combined_body,
                  "org.matrix.msc1767.html": combined_formatted_body,
              }
              combined["formatted_body"] = combined_formatted_body
          return [(EventType.ROOM_MESSAGE, combined)]
      else:
          return [
              (EventType.ROOM_MESSAGE, prefix),
              (EventType.ROOM_MESSAGE, content),
              (EventType.ROOM_MESSAGE, caption),
          ]
  async def _convert_instagram_xma_media_share(
      self, source: u.User, intent: IntentAPI, item: ThreadItem
  ) -> list[ConvertedMessage]:
      """Convert an XMA share (post, story, reel share/mention, generic) to Matrix.

      The first XMA entry's preview is reuploaded as the media event and a
      caption is built from its title, subtitle, target URL and the item's
      auxiliary text. With ``bridge.caption_in_message`` enabled the caption is
      folded into the media event, otherwise both are returned separately.

      Returns:
          One or two converted room messages.
      """
      # N.B. _get_instagram_media_info also only supports downloading the first xma item
      xma_list = (
          item.xma_media_share
          or item.xma_story_share
          or item.xma_reel_share
          or item.xma_reel_mention
          or item.generic_xma
      )
      media = xma_list[0]
      if len(xma_list) != 1:
          self.log.warning(f"Item {item.item_id} has multiple xma media share parts")
      if media.xma_layout_type not in (0, 4):
          self.log.warning(f"Unrecognized xma layout type {media.xma_layout_type}")

      _, content = await self._convert_instagram_media(source, intent, item)

      # Post shares (layout type 0): media title text
      # Reel shares/replies/reactions (layout type 4): item text
      caption_text = media.title_text or item.text or ""
      if media.subtitle_text:
          caption_text = (
              f"{caption_text}\n{media.subtitle_text}" if caption_text else media.subtitle_text
          )
      if media.target_url:
          caption_body = (
              f"> {caption_text}\n\n{media.target_url}" if caption_text else media.target_url
          )
      else:
          caption_body = f"> {caption_text}"

      escaped_caption_text = html.escape(caption_text).replace("\n", "<br>")
      escaped_header_text = html.escape(media.header_title_text or "")
      # For post shares, the media title starts with the username, which is also the header.
      # That part should be bolded.
      if (
          escaped_header_text
          and escaped_caption_text
          and escaped_caption_text.startswith(escaped_header_text)
      ):
          escaped_caption_text = (
              f"<strong>{escaped_header_text}</strong>"
              f"{escaped_caption_text[len(escaped_header_text):]}"
          )

      if item.message_item_type == "animated_media":
          anim = await self._reupload_instagram_file(
              source,
              url=item.animated_media.images.fixed_height.webp,
              msgtype=MessageType.IMAGE,
              info=ImageInfo(
                  width=int(item.animated_media.images.fixed_height.width),
                  height=int(item.animated_media.images.fixed_height.height),
              ),
              intent=intent,
              # The result is referenced from an inline <img src>, which needs a
              # plain mxc URL. With encryption the returned `url` is None and
              # the tag would read src="None".
              allow_encrypt=False,
          )
          inline_img = (
              f'<img src="{anim.url}" width={anim.info.width} height={anim.info.height}/>'
          )
          escaped_caption_text = (
              f"{escaped_caption_text}<br/>{inline_img}" if escaped_caption_text else inline_img
          )

      caption_formatted_body = (
          f"<blockquote>{escaped_caption_text}</blockquote>" if escaped_caption_text else ""
      )
      if media.target_url:
          target_url_pretty = str(URL(media.target_url).with_query(None)).replace(
              "https://www.", ""
          )
          # Escape before embedding in HTML so `&`, quotes etc. in the URL can't
          # break out of the attribute or the link text.
          caption_formatted_body += (
              f'<p><a href="{html.escape(media.target_url)}">'
              f"{html.escape(target_url_pretty)}</a></p>"
          )
      # Add auxiliary text as prefix for caption
      if item.auxiliary_text:
          caption_formatted_body = (
              f"<p>{html.escape(item.auxiliary_text)}</p>{caption_formatted_body}"
          )
          caption_body = f"{item.auxiliary_text}\n\n{caption_body}"

      caption = TextMessageEventContent(
          msgtype=MessageType.TEXT,
          body=caption_body,
          formatted_body=caption_formatted_body,
          format=Format.HTML,
      )
      if media.target_url:
          content.external_url = media.target_url
          caption.external_url = media.target_url

      if self.bridge.config["bridge.caption_in_message"]:
          if isinstance(content, TextMessageEventContent):
              # Media conversion produced a notice; append the caption to it.
              content.ensure_has_html()
              caption.ensure_has_html()
              content.body += f"\n\n{caption.body}"
              content.formatted_body = (
                  f"<p><b>{content.formatted_body}</b></p>{caption.formatted_body}"
              )
          else:
              # The old body becomes the file name, the caption takes its place.
              content["filename"] = content.body
              content.body = caption.body
              content["format"] = str(Format.HTML)
              content["formatted_body"] = caption.formatted_body
              content["org.matrix.msc1767.caption"] = {
                  "org.matrix.msc1767.text": content.body,
                  "org.matrix.msc1767.html": content["formatted_body"],
              }
          return [(EventType.ROOM_MESSAGE, content)]
      else:
          return [(EventType.ROOM_MESSAGE, content), (EventType.ROOM_MESSAGE, caption)]
  1078. # TODO this is probably unused
  async def _convert_instagram_reel_share(
      self, source: u.User, intent: IntentAPI, item: ThreadItem
  ) -> list[ConvertedMessage]:
      """Convert a reel share (story reply, reaction or mention) to Matrix.

      Builds a notice prefix describing the action, a caption and, unless the
      same story was already bridged for this user, the story media. With
      ``bridge.caption_in_message`` enabled everything is merged into a single
      event; otherwise the prefix is sent immediately and the remaining parts
      are returned.

      Returns:
          The converted messages, or an empty list for unsupported share types.
      """
      assert item.reel_share
      share = item.reel_share
      media = share.media
      prefix_html = None
      if share.type == ReelShareType.REPLY:
          if share.reel_owner_id == source.igpk:
              prefix = "Replied to your story"
          else:
              username = media.user.username
              prefix = f"Sent @{username}'s story"
              user_link = f'<a href="https://www.instagram.com/{username}/">@{username}</a>'
              prefix_html = f"Sent {user_link}'s story"
      elif share.type == ReelShareType.REACTION:
          if share.reel_owner_id == source.igpk:
              prefix = "Reacted to your story"
          elif item.user_id == source.igpk:
              prefix = "You reacted to their story"
          else:
              prefix = "Reacted to a story"
      elif share.type == ReelShareType.MENTION:
          if share.mentioned_user_id == source.igpk:
              prefix = "Mentioned you in their story"
          else:
              prefix = "You mentioned them in your story"
      else:
          self.log.debug(f"Unsupported reel share type {item.reel_share.type}")
          return []

      prefix_content = TextMessageEventContent(msgtype=MessageType.NOTICE, body=prefix)
      if prefix_html:
          prefix_content.format = Format.HTML
          prefix_content.formatted_body = prefix_html

      caption_content = TextMessageEventContent(msgtype=MessageType.TEXT, body=share.text)
      # Fall back to the post's own caption, then to a placeholder.
      if not caption_content.body and isinstance(media, MediaShareItem):
          caption_content.body = media.caption.text if media.caption else ""
      if not caption_content.body:
          caption_content.body = "<no caption>"

      media_content = None
      fake_item_id = f"fi.mau.instagram.reel_share.{item.user_id}.{media.pk}"
      if isinstance(media, ExpiredMediaItem):
          media_content = TextMessageEventContent(
              msgtype=MessageType.NOTICE, body="Story expired"
          )
      else:
          existing = await DBMessage.get_by_item_id(fake_item_id, self.receiver)
          if existing:
              # If the user already reacted or replied to the same reel share item,
              # use a Matrix reply instead of reposting the image.
              caption_content.set_reply(existing.mxid)
          else:
              _, media_content = await self._convert_instagram_media(source, intent, item)

      if not self.bridge.config["bridge.caption_in_message"]:
          # Separate-events mode: the prefix is sent right away, the rest is
          # handed back to the caller.
          await self._send_message(intent, prefix_content, timestamp=item.timestamp_ms)
          converted: list[ConvertedMessage] = []
          if media_content:
              converted.append((EventType.ROOM_MESSAGE, media_content))
          converted.append((EventType.ROOM_MESSAGE, caption_content))
          return converted

      if not media_content:
          combined = caption_content
      elif isinstance(media_content, TextMessageEventContent):
          media_content.ensure_has_html()
          prefix_content.ensure_has_html()
          caption_content.ensure_has_html()
          combined = TextMessageEventContent(
              msgtype=MessageType.TEXT,
              body="\n".join(
                  (media_content.body, prefix_content.body, caption_content.body)
              ),
              formatted_body=(
                  f"<p><b>{media_content.formatted_body}</b></p>"
                  f"<p><i>{prefix_content.formatted_body}</i></p>"
                  f"<p>{caption_content.formatted_body}</p>"
              ),
              format=Format.HTML,
          )
      else:
          prefix_content.ensure_has_html()
          caption_content.ensure_has_html()
          combined_body = "\n".join((prefix_content.body, caption_content.body))
          combined_formatted_body = (
              f"<p><i>{prefix_content.formatted_body}</i></p>"
              f"<p>{caption_content.formatted_body}</p>"
          )
          # Reuse the media event; its old body becomes the file name.
          combined = media_content
          combined["filename"] = combined.body
          combined.body = combined_body
          combined["format"] = str(Format.HTML)
          combined["org.matrix.msc1767.caption"] = {
              "org.matrix.msc1767.text": combined_body,
              "org.matrix.msc1767.html": combined_formatted_body,
          }
          combined["formatted_body"] = combined_formatted_body
      return [(EventType.ROOM_MESSAGE, combined)]
  async def _convert_instagram_link(
      self,
      source: u.User,
      intent: IntentAPI,
      item: ThreadItem,
  ) -> ConvertedMessage:
      """Convert a link item into a text message with a Beeper link preview.

      The preview is built from the link context. Its image, when present, is
      reuploaded to Matrix. Empty preview fields are dropped, and the preview
      is only attached when it still has a title.
      """
      content = TextMessageEventContent(msgtype=MessageType.TEXT, body=item.link.text)
      context = item.link.link_context
      preview = {
          "og:url": context.link_url,
          "og:title": context.link_title,
          "og:description": context.link_summary,
      }
      if context.link_image_url:
          image = await self._reupload_instagram_file(
              source, context.link_image_url, msgtype=None, info=ImageInfo(), intent=intent
          )
          preview.update(
              {
                  "og:image": image.url,
                  "og:image:type": image.info.mimetype,
                  "og:image:width": image.info.width,
                  "og:image:height": image.info.height,
                  "matrix:image:size": image.info.size,
              }
          )
          if image.file:
              preview["beeper:image:encryption"] = image.file.serialize()

      # Drop every field that ended up empty/None.
      preview = {key: value for key, value in preview.items() if value}
      previews = [preview] if "og:title" in preview else []
      content["com.beeper.linkpreviews"] = previews
      await self._add_instagram_reply(content, item.replied_to_message)
      return EventType.ROOM_MESSAGE, content
  async def _convert_instagram_text(self, item: ThreadItem, text: str) -> ConvertedMessage:
      """Wrap plain text in a Matrix text message with an empty link preview list."""
      message = TextMessageEventContent(msgtype=MessageType.TEXT, body=text)
      message["com.beeper.linkpreviews"] = []
      await self._add_instagram_reply(message, item.replied_to_message)
      return (EventType.ROOM_MESSAGE, message)
  async def _convert_instagram_unhandled(self, item: ThreadItem) -> ConvertedMessage:
      """Produce a notice telling the room that the item type is not supported."""
      notice_text = f"Unsupported message type {item.item_type.value}"
      notice = TextMessageEventContent(msgtype=MessageType.NOTICE, body=notice_text)
      await self._add_instagram_reply(notice, item.replied_to_message)
      return (EventType.ROOM_MESSAGE, notice)
  async def _convert_instagram_location(self, item: ThreadItem) -> ConvertedMessage | None:
      """Convert a location item into a Matrix location message.

      The plain body contains the location name, rounded coordinates and an
      OpenStreetMap link. The HTML body links the description to the same map.
      For Facebook Places locations the Facebook page is set as external URL.

      Returns:
          The converted message, or ``None`` when the item has no location or
          the location lacks a (truthy) latitude/longitude.
      """
      loc = item.location
      if not loc or not loc.lng or not loc.lat:
          # TODO handle somehow
          return None

      long_char = "E" if loc.lng > 0 else "W"
      lat_char = "N" if loc.lat > 0 else "S"
      body = (
          f"{loc.name} - {round(abs(loc.lat), 4)}° {lat_char}, "
          f"{round(abs(loc.lng), 4)}° {long_char}"
      )
      url = f"https://www.openstreetmap.org/#map=15/{loc.lat}/{loc.lng}"
      external_url = None
      if loc.external_source == "facebook_places":
          external_url = f"https://www.facebook.com/{loc.short_name}-{loc.facebook_places_id}"

      content = LocationMessageEventContent(
          msgtype=MessageType.LOCATION,
          geo_uri=f"geo:{loc.lat},{loc.lng}",
          body=f"Location: {body}\n{url}",
          external_url=external_url,
      )
      content["format"] = str(Format.HTML)
      # The location name comes from the remote side; escape it so it cannot
      # inject markup into the HTML body.
      content["formatted_body"] = f"Location: <a href='{url}'>{html.escape(body)}</a>"

      await self._add_instagram_reply(content, item.replied_to_message)
      return EventType.ROOM_MESSAGE, content
  async def _convert_instagram_profile(self, item: ThreadItem) -> ConvertedMessage:
      """Convert a shared profile into a text message linking to that profile."""
      handle = item.profile.username
      profile_link = f'<a href="https://www.instagram.com/{handle}/">@{handle}</a>'
      content = TextMessageEventContent(
          msgtype=MessageType.TEXT,
          format=Format.HTML,
          body=f"Shared @{handle}'s profile",
          formatted_body=f"Shared {profile_link}'s profile",
      )
      await self._add_instagram_reply(content, item.replied_to_message)
      return EventType.ROOM_MESSAGE, content
  async def _add_instagram_reply(
      self, content: MessageEventContent, reply_to: ThreadItem | None
  ) -> None:
      """Mark ``content`` as a reply to the bridged copy of ``reply_to``.

      Does nothing when there is no reply target or the target was never
      bridged. Text content additionally gets a reply set from the full target
      event, provided the event can be fetched (and decrypted, if encrypted).
      """
      if not reply_to:
          return
      target = await DBMessage.get_by_item_id(reply_to.item_id, self.receiver)
      if not target:
          return

      # Event-ID-only reply; this is all that non-text content receives.
      content.set_reply(target.mxid)
      if not isinstance(content, TextMessageEventContent):
          return

      try:
          original = await self.main_intent.get_event(target.mx_room, target.mxid)
      except (MNotFound, MForbidden):
          return
      if not original:
          return

      if original.type == EventType.ROOM_ENCRYPTED:
          try:
              original = await self.matrix.e2ee.decrypt(original, wait_session_timeout=0)
          except SessionNotFound:
              return

      if isinstance(original.content, TextMessageEventContent):
          # Strip the target's own fallback so quotes don't nest.
          original.content.trim_reply_fallback()
      content.set_reply(original)
  async def handle_instagram_item(self, source: u.User, sender: p.Puppet, item: ThreadItem):
      """Bridge a single incoming Instagram thread item to Matrix.

      The item is dropped when it is an echo of something sent through the
      bridge (client context in the request dedup queue) or has already been
      handled (item ID in the in-memory dedup queue or in the database). The
      Matrix room is created on demand. Each converted part is sent as the
      sender's puppet, and the last resulting event is stored as the item's
      Matrix counterpart.

      Args:
          source: The user whose Instagram connection delivered the item.
          sender: Puppet of the Instagram user who sent the item.
          item: The thread item to bridge.
      """
      client_context = item.client_context
      link_client_context = item.link.client_context if item.link else None
      # `cc` is only used for logging: it combines both context IDs.
      cc = client_context
      if link_client_context:
          if not client_context:
              cc = f"link:{link_client_context}"
          elif client_context != link_client_context:
              cc = f"{client_context}/link:{link_client_context}"
      if client_context and client_context in self._reqid_dedup:
          self.log.debug(
              f"Ignoring message {item.item_id} ({cc}) by {item.user_id}"
              " as it was sent by us (client_context in dedup queue)"
          )
          return []
      elif link_client_context and link_client_context in self._reqid_dedup:
          self.log.debug(
              f"Ignoring message {item.item_id} ({cc}) by {item.user_id}"
              " as it was sent by us (link.client_context in dedup queue)"
          )
          return []

      # Check in-memory queues for duplicates
      if item.item_id in self._msgid_dedup:
          self.log.debug(
              f"Ignoring message {item.item_id} ({item.client_context}) by {item.user_id}"
              " as it was already handled (message.id in dedup queue)"
          )
          return
      self._msgid_dedup.appendleft(item.item_id)

      # Check database for duplicates
      if await DBMessage.get_by_item_id(item.item_id, self.receiver) is not None:
          self.log.debug(
              f"Ignoring message {item.item_id} ({item.client_context}) by {item.user_id}"
              " as it was already handled (message.id in database)"
          )
          return

      self.log.debug(
          f"Handling Instagram message {item.item_id} ({item.client_context}) by {item.user_id}"
      )

      if not self.mxid:
          # TODO figure out where to get the info from
          mxid = await self.create_matrix_room(source)
          if not mxid:
              # Failed to create
              return

          if self.config["bridge.backfill.enable"]:
              await self.enqueue_immediate_backfill(source, 0)

      intent = sender.intent_for(self)
      # Fire-and-forget: clear the puppet's typing indicator.
      # NOTE(review): the task reference is not retained — confirm this is OK.
      asyncio.create_task(intent.set_typing(self.mxid, is_typing=False))

      event_ids = []
      for event_type, content in await self.convert_instagram_item(source, sender, item):
          event_ids.append(
              await self._send_message(
                  intent, content, event_type=event_type, timestamp=item.timestamp_ms
              )
          )
      event_ids = [event_id for event_id in event_ids if event_id]
      if not event_ids:
          self.log.warning(f"Unhandled Instagram message {item.item_id}")
          return
      self.log.debug(f"Handled Instagram message {item.item_id} -> {event_ids}")

      # Only the last event is recorded as the Matrix counterpart of the item.
      await DBMessage(
          mxid=event_ids[-1],
          mx_room=self.mxid,
          item_id=item.item_id,
          client_context=item.client_context,
          receiver=self.receiver,
          sender=sender.igpk,
          ig_timestamp=item.timestamp_ms,
      ).insert()
      await self._send_delivery_receipt(event_ids[-1])
      # TODO handle reactions
      # (An unreachable snippet that referenced undefined names used to follow
      # an unconditional return here; it has been removed.)
  async def convert_instagram_item(
      self, source: u.User, sender: p.Puppet, item: ThreadItem
  ) -> list[ConvertedMessage]:
      """Convert a thread item to Matrix events without ever raising.

      Returns an empty list for anything that is not a ``ThreadItem`` and for
      items whose conversion fails. Conversion failures are logged.
      """
      if isinstance(item, ThreadItem):
          try:
              return await self._convert_instagram_item(source, sender, item)
          except Exception:
              self.log.exception("Fatal error converting Instagram item")
              self.log.trace("Item content: %s", item.serialize())
      # Either conversion failed, or parsing failed earlier (in which case the
      # item should have been logged already).
      return []
  async def _convert_instagram_item(
      self, source: u.User, sender: p.Puppet, item: ThreadItem
  ) -> list[ConvertedMessage]:
      """Dispatch a thread item to the matching converter(s).

      XMA shares are handled exclusively by the XMA converter. Otherwise at
      most one attachment-like part (media, location, profile, reel share or
      media share) is converted, followed by at most one text-like part (text,
      like or link). Action log items are ignored. If nothing was produced, an
      "unsupported" notice is returned.

      Returns:
          The converted messages. Empty only for action log items, or when a
          delegated converter itself returns nothing.
      """
      intent = sender.intent_for(self)
      if (
          item.xma_media_share
          or item.xma_reel_share
          or item.xma_reel_mention
          or item.xma_story_share
          or item.generic_xma
      ):
          return await self._convert_instagram_xma_media_share(source, intent, item)

      converted: list[ConvertedMessage] = []
      if item.media or item.animated_media or item.voice_media or item.visual_media:
          converted.append(await self._convert_instagram_media(source, intent, item))
      elif item.location:
          if loc_content := await self._convert_instagram_location(item):
              converted.append(loc_content)
      elif item.profile:
          converted.append(await self._convert_instagram_profile(item))
      elif item.reel_share:
          converted.extend(await self._convert_instagram_reel_share(source, intent, item))
      elif (
          item.media_share
          or item.direct_media_share
          or item.story_share
          or item.clip
          or item.felix_share
      ):
          converted.extend(await self._convert_instagram_media_share(source, intent, item))
      elif item.action_log:
          # These probably don't need to be bridged
          self.log.debug(f"Ignoring action log message {item.item_id}")
          return []

      # TODO handle item.clip?
      # TODO should these be put into a caption?
      if item.text:
          converted.append(await self._convert_instagram_text(item, item.text))
      elif item.like:
          # We handle likes as text because Matrix clients do big emoji on their own.
          converted.append(await self._convert_instagram_text(item, item.like))
      elif item.link:
          converted.append(await self._convert_instagram_link(source, intent, item))

      if not converted:
          self.log.debug(f"Unhandled Instagram message {item.item_id}")
          converted.append(await self._convert_instagram_unhandled(item))
      # TODO HANDLE REACTIONS
      # (An unreachable snippet that referenced undefined names used to follow
      # the return below; it has been removed.)
      return converted
  async def handle_instagram_remove(self, item_id: str) -> None:
      """
      Handle an Instagram unsend by deleting the stored message and redacting it on Matrix.

      Nothing happens when the item is not in the database. The redaction is attempted
      with the original sender's intent first; if that is forbidden, the portal's main
      intent is used instead.

      Args:
          item_id: The Instagram item ID of the removed message.
      """
      message = await DBMessage.get_by_item_id(item_id, self.receiver)
      if message is None:
          return

      await message.delete()
      if not message.mxid:
          # There is no Matrix event to redact.
          return

      sender = await p.Puppet.get_by_pk(message.sender)
      try:
          await sender.intent_for(self).redact(self.mxid, message.mxid)
      except MForbidden:
          await self.main_intent.redact(self.mxid, message.mxid)
      self.log.debug(f"Redacted {message.mxid} after Instagram unsend")
  async def handle_instagram_reaction(self, item: ThreadItem, remove: bool) -> None:
      """
      Bridge a single reaction change (added or removed) from Instagram to Matrix.

      Reactions to unknown messages, removals of reactions that are not stored, and
      re-sends of an identical stored reaction are logged and dropped.

      Args:
          item: The thread item carrying ``new_reaction`` and the target ``item_id``.
          remove: True when the reaction was removed, False when it was added or changed.
      """
      sender = await p.Puppet.get_by_pk(item.new_reaction.sender_id)
      target = await DBMessage.get_by_item_id(item.item_id, self.receiver)
      if not target:
          self.log.debug(f"Dropping reaction by {sender.pk} to unknown message {item.item_id}")
          return

      key = item.new_reaction.emoji
      async with self._reaction_lock:
          existing = await DBReaction.get_by_item_id(item.item_id, self.receiver, sender.pk)
          if remove and not existing:
              self.log.debug(
                  f"Ignoring duplicate reaction removal by {sender.pk} to {item.item_id}"
              )
              return
          if existing and not remove and existing.reaction == key:
              self.log.debug(f"Ignoring duplicate reaction by {sender.pk} to {item.item_id}")
              return

          puppet_intent = sender.intent_for(self)
          if not remove:
              sent_at = item.new_reaction.timestamp_ms
              reaction_event_id = await puppet_intent.react(
                  self.mxid, target.mxid, key=key, timestamp=sent_at
              )
              await self._upsert_reaction(
                  existing, puppet_intent, reaction_event_id, target, sender, key, sent_at
              )
              self.log.debug(
                  f"Handled {sender.pk}'s reaction to {item.item_id} -> {reaction_event_id}"
              )
              return

          # Removal: drop the database row first, then redact the Matrix reaction event.
          await existing.delete()
          await puppet_intent.redact(self.mxid, existing.mxid)
          self.log.debug(
              f"Removed {sender.pk}'s reaction to {item.item_id} (redacted {existing.mxid})"
          )
  async def _handle_instagram_reactions(
      self, message: DBMessage, reactions: list[Reaction], is_backfill: bool = False
  ) -> None:
      """
      Synchronize the stored reactions of a message with the full list from Instagram.

      Reactions that are new or whose emoji changed are sent and upserted; stored
      reactions whose sender is absent from ``reactions`` are deleted and redacted.

      Args:
          message: The database message the reactions belong to.
          reactions: The complete current reaction list for the message.
          is_backfill: When true, the reaction's own timestamp is used (plus a growing
              offset so that no two sent reactions share a timestamp) instead of the
              current time.
      """
      stored: dict[int, DBReaction] = {}
      for db_reaction in await DBReaction.get_all_by_item_id(message.item_id, self.receiver):
          stored[db_reaction.ig_sender] = db_reaction

      dedup_offset = 1
      for incoming in reactions:
          previous = stored.pop(incoming.sender_id, None)
          if previous and previous.reaction == incoming.emoji:
              # Already bridged with the same emoji.
              continue
          puppet = await p.Puppet.get_by_pk(incoming.sender_id)
          intent = puppet.intent_for(self)
          if is_backfill:
              timestamp = incoming.timestamp_ms + dedup_offset
              dedup_offset += 1
          else:
              timestamp = int(time.time() * 1000)
          reaction_event_id = await intent.react(
              self.mxid, message.mxid, incoming.emoji, timestamp=timestamp
          )
          await self._upsert_reaction(
              previous,
              intent,
              reaction_event_id,
              message,
              puppet,
              incoming.emoji,
              timestamp,
          )

      # Whatever is left in ``stored`` was not in the new list, so it has been removed.
      for stale in stored.values():
          await stale.delete()
          puppet = await p.Puppet.get_by_pk(stale.ig_sender)
          await puppet.intent_for(self).redact(self.mxid, stale.mxid)
  async def handle_instagram_update(self, item: MessageSyncMessage) -> None:
      """
      Handle an update to an already bridged Instagram item.

      An update with ``has_seen`` set is bridged as a read receipt from that user's
      puppet (if the puppet exists). Any other update is treated as a reaction list
      change. Updates for items that are not in the database are ignored.

      Args:
          item: The sync message describing the update.
      """
      message = await DBMessage.get_by_item_id(item.item_id, self.receiver)
      if not message:
          return

      if not item.has_seen:
          async with self._reaction_lock:
              await self._handle_instagram_reactions(
                  message, (item.reactions.emojis if item.reactions else [])
              )
          return

      # create=False: only bridge the receipt when the reader's puppet already exists.
      reader = await p.Puppet.get_by_pk(item.has_seen, create=False)
      if reader:
          await reader.intent_for(self).mark_read(self.mxid, message.mxid)
  1511. # endregion
  1512. # region Updating portal info
  def _get_thread_name(self, thread: Thread) -> str:
      """
      Compute the Matrix room name for this portal from an Instagram thread.

      Args:
          thread: The Instagram thread to derive the name from.

      Returns:
          For direct chats: a fixed name for a chat with yourself, or the configured
          private chat template formatted with the single other user. For other chats:
          the configured group template formatted with the thread title. An empty string
          when no name can be derived (untitled group, or a direct chat with an
          unexpected number of users).
      """
      if not self.is_direct:
          if thread.thread_title:
              return self.config["bridge.group_chat_name_template"].format(
                  name=thread.thread_title
              )
          return ""

      if self.other_user_pk == thread.viewer_id and len(thread.users) == 0:
          return "Instagram chat with yourself"
      if len(thread.users) == 1:
          tpl = self.config["bridge.private_chat_name_template"]
          ui = thread.users[0]
          return tpl.format(
              displayname=ui.full_name or ui.username, id=ui.pk, username=ui.username
          )
      # Previously this path fell through and implicitly returned None, contradicting
      # the declared ``str`` return type. An empty string is equally falsy for callers.
      return ""
  async def update_info(self, thread: Thread, source: u.User) -> None:
      """
      Refresh the portal's name and participants from an Instagram thread.

      The bridge info state events and the portal's database row are only updated when
      either the name update or the participant update reports a change.

      Args:
          thread: The Instagram thread holding the current title and users.
          source: The user through whom the thread was fetched.
      """
      name_changed = await self._update_name(self._get_thread_name(thread))
      # The participant sync always runs, regardless of whether the name changed.
      participants_changed = await self._update_participants(thread.users, source)
      if participants_changed or name_changed:
          await self.update_bridge_info()
          await self.update()
      # TODO update power levels with thread.admin_user_ids
  async def update_info_from_puppet(self, puppet: p.Puppet | None = None) -> None:
      """
      Update a direct chat portal's avatar (and pending name) from the other user's puppet.

      Does nothing for portals that are not direct chats.

      Args:
          puppet: The puppet to copy the photo from. When omitted, it is looked up with
              ``get_dm_puppet``.
      """
      if not self.is_direct:
          return
      dm_puppet = puppet if puppet else await self.get_dm_puppet()
      await self._update_photo_from_puppet(dm_puppet)
      # Retry setting a name that is known but was never successfully applied.
      if self.name and not self.name_set:
          await self._update_name(self.name)
  async def _update_name(self, name: str) -> bool:
      """
      Store a new portal name and, if a Matrix room exists, apply it to the room.

      Args:
          name: The desired room name. Falsy values are ignored.

      Returns:
          True when the name was stored (even if applying it to the room failed), False
          when ``name`` is empty or is already both stored and marked as set.
      """
      if not name or (self.name == name and self.name_set):
          return False

      self.name = name
      if self.mxid:
          try:
              await self.main_intent.set_room_name(self.mxid, name)
              self.name_set = True
          except Exception:
              self.log.exception("Failed to update name")
              # Leave the flag unset so a later update retries.
              self.name_set = False
      return True
  async def _update_photo_from_puppet(self, puppet: p.Puppet) -> bool:
      """
      Copy the puppet's photo to the portal avatar and, if a room exists, to the room.

      Args:
          puppet: The puppet whose ``photo_mxc`` should become the portal avatar.

      Returns:
          False when the portal is neither encrypted nor has ``private_chat_portal_meta``
          set, or when the avatar is already set to the same URL. True otherwise, even if
          applying the avatar to the room failed.
      """
      if not (self.private_chat_portal_meta or self.encrypted):
          return False
      already_current = self.avatar_set and self.avatar_url == puppet.photo_mxc
      if already_current:
          return False

      self.avatar_url = puppet.photo_mxc
      if self.mxid:
          try:
              await self.main_intent.set_room_avatar(self.mxid, puppet.photo_mxc)
              self.avatar_set = True
          except Exception:
              self.log.exception("Failed to set room avatar")
              # Leave the flag unset so a later update retries.
              self.avatar_set = False
      return True
  async def _update_participants(self, users: list[ThreadUser], source: u.User) -> bool:
      """
      Sync puppet info and room membership with the thread's user list.

      Every listed user's puppet is updated and, if a room exists, joined to it. Puppets
      in the room that are neither listed nor the portal's ``other_user_pk`` are kicked.

      Args:
          users: The users currently in the Instagram thread.
          source: The user through whom the thread was fetched.

      Returns:
          The result of ``_update_photo_from_puppet`` for the puppet matching
          ``other_user_pk``, or False if no listed user matched.
      """
      meta_changed = False
      room_id = self.mxid

      # Make sure puppets who should be here are here
      for thread_user in users:
          puppet = await p.Puppet.get_by_pk(thread_user.pk)
          await puppet.update_info(thread_user, source)
          if room_id:
              await puppet.intent_for(self).ensure_joined(room_id)
          if puppet.pk == self.other_user_pk:
              meta_changed = await self._update_photo_from_puppet(puppet)

      if not room_id:
          return meta_changed

      # Kick puppets who shouldn't be here
      expected_pks = {int(thread_user.pk) for thread_user in users}
      for member_mxid in await self.main_intent.get_room_members(room_id):
          member_pk = p.Puppet.get_id_from_mxid(member_mxid)
          if not member_pk:
              # Not a puppet user ID.
              continue
          if member_pk in expected_pks or member_pk == self.other_user_pk:
              continue
          await self.main_intent.kick_user(
              room_id,
              p.Puppet.get_mxid_from_id(member_pk),
              reason="User had left this Instagram DM",
          )
      return meta_changed
  async def _update_read_receipts(self, receipts: dict[int | str, ThreadUserLastSeenAt]) -> None:
      """
      Bridge Instagram "last seen" markers to Matrix read receipts.

      For each receipt the exact item is looked up first. If it is unknown, the closest
      stored message and the closest stored reaction are fetched and one of them is used
      as the read marker target. Receipts without a usable target, or from users without
      an existing puppet, are skipped. Failures to send a receipt are logged, not raised.

      Args:
          receipts: Mapping of Instagram user ID to that user's last-seen record.
      """
      for user_id, receipt in receipts.items():
          message: DBMessage | DBReaction
          message = await DBMessage.get_by_item_id(receipt.item_id, self.receiver)
          if not message:
              reaction: DBReaction
              message, reaction = await asyncio.gather(
                  DBMessage.get_closest(self.mxid, int(receipt.timestamp)),
                  DBReaction.get_closest(self.mxid, receipt.timestamp_ms),
              )
              if not reaction and (not message or not message.mxid):
                  self.log.debug(
                      "Couldn't find message %s to mark as read by %s", receipt, user_id
                  )
                  continue
              # Use the reaction when there is no message, or when the reaction's
              # timestamp is greater than the message's.
              prefer_reaction = not message or (
                  reaction and reaction.mx_timestamp > message.ig_timestamp_ms
              )
              if prefer_reaction:
                  message = reaction

          puppet = await p.Puppet.get_by_pk(int(user_id), create=False)
          if not puppet:
              continue
          try:
              await puppet.intent_for(self).mark_read(message.mx_room, message.mxid)
          except Exception:
              self.log.warning(
                  f"Failed to mark {message.mxid} in {message.mx_room} "
                  f"as read by {puppet.intent.mxid}",
                  exc_info=True,
              )
  async def get_dm_puppet(self) -> p.Puppet | None:
      """
      Return the puppet of the other user in a direct chat.

      Returns:
          The puppet for ``other_user_pk``, or None when this portal is not a direct chat.
      """
      return await p.Puppet.get_by_pk(self.other_user_pk) if self.is_direct else None
  1623. # endregion
  1624. # region Backfilling
  async def backfill(self, source: u.User, thread: Thread, is_initial: bool = False) -> None:
      """
      Backfill message history into the portal while holding ``backfill_lock``.

      The limit comes from ``bridge.backfill.initial_limit`` or
      ``bridge.backfill.missed_limit`` depending on ``is_initial``. A limit of zero skips
      backfilling; a negative limit is passed on to ``_backfill`` as ``None``.

      Args:
          source: The user whose client is used to fetch history.
          thread: The thread to backfill.
          is_initial: Whether this is the first backfill of a newly created portal.
      """
      limit_key = "bridge.backfill.initial_limit" if is_initial else "bridge.backfill.missed_limit"
      limit = self.config[limit_key]
      if limit == 0:
          return
      if limit < 0:
          limit = None
      with self.backfill_lock:
          await self._backfill(source, thread, is_initial, limit)
  async def _backfill(
      self, source: u.User, thread: Thread, is_initial: bool, limit: int
  ) -> None:
      """
      Fetch history items and bridge them oldest-first with notifications disabled.

      While items are handled, ``_backfill_leave`` is a set; afterwards every intent in
      it leaves the room and the attribute is reset to None.

      Args:
          source: The user whose client is used to fetch history.
          thread: The thread to backfill.
          is_initial: Whether this is the first backfill of a newly created portal.
          limit: Passed through to ``_fetch_backfill_items``.
      """
      self.log.debug("Backfilling history through %s", source.mxid)

      entries = await self._fetch_backfill_items(source, thread, is_initial, limit)
      if not entries:
          self.log.debug("Didn't get any items to backfill from server")
          return
      self.log.debug("Got %d entries from server", len(entries))

      self._backfill_leave = set()
      async with NotificationDisabler(self.mxid, source):
          # Entries are handled in the reverse of the order they were fetched in.
          for entry in entries[::-1]:
              entry_sender = await p.Puppet.get_by_pk(int(entry.user_id))
              await self.handle_instagram_item(source, entry_sender, entry, is_backfill=True)
      for intent in self._backfill_leave:
          self.log.trace("Leaving room with %s post-backfill", intent.mxid)
          await intent.leave_room(self.mxid)
      self._backfill_leave = None
      self.log.info("Backfilled %d messages through %s", len(entries), source.mxid)
  async def _fetch_backfill_items(
      self, source: u.User, thread: Thread, is_initial: bool, limit: int | None
  ) -> list[ThreadItem]:
      """
      Collect thread items to backfill, in the order the client yields them.

      Iteration stops when the limit is reached or, for non-initial backfills, when an
      item that is already in the database is encountered.

      Args:
          source: The user whose client is used to iterate the thread.
          thread: The thread to start iterating from.
          is_initial: Whether this is the first backfill of the portal. Only then are
              unhandleable items excluded from the limit count.
          limit: Maximum number of counted items, or None for no limit. ``backfill``
              passes None when the configured limit is negative; comparing against it
              previously raised ``TypeError``.

      Returns:
          The fetched items, including unhandleable ones.
      """
      items = []
      excluded_count = 0
      # %s rather than %d so that an unlimited (None) limit can be logged as well.
      self.log.debug(
          "Fetching up to %s messages through %s",
          "unlimited" if limit is None else limit,
          source.igpk,
      )
      async for item in source.client.iter_thread(self.thread_id, start_at=thread):
          if limit is not None and len(items) - excluded_count >= limit:
              self.log.debug(f"Fetched {len(items)} messages (the limit)")
              break
          elif not is_initial:
              msg = await DBMessage.get_by_item_id(item.item_id, receiver=self.receiver)
              if msg is not None:
                  self.log.debug(
                      f"Fetched {len(items)} messages and hit a message"
                      " that's already in the database."
                  )
                  break
          elif not item.is_handleable:
              # NOTE(review): because this is an elif, it only runs for initial
              # backfills — confirm that is intended.
              self.log.debug(
                  f"Not counting {item.unhandleable_type} item {item.item_id}"
                  " against backfill limit"
              )
              excluded_count += 1
          items.append(item)
      return items
  1682. # endregion
  1683. # region Bridge info state event
  @property
  def bridge_info_state_key(self) -> str:
      """State key of the bridge info state events: a URI built from the thread ID."""
      state_key = f"net.maunium.instagram://instagram/{self.thread_id}"
      return state_key
  @property
  def bridge_info(self) -> dict[str, Any]:
      """
      Content of the bridge info state events for this portal.

      Returns:
          A dict naming the bridge bot, the creator (the main intent's user ID), the
          protocol (Instagram DM) and the channel (this thread's ID, name and avatar).
      """
      protocol = {
          "id": "instagram",
          "displayname": "Instagram DM",
          "avatar_url": self.config["appservice.bot_avatar"],
      }
      channel = {
          "id": self.thread_id,
          "displayname": self.name,
          "avatar_url": self.avatar_url,
      }
      info: dict[str, Any] = {
          "bridgebot": self.az.bot_mxid,
          "creator": self.main_intent.mxid,
      }
      info["protocol"] = protocol
      info["channel"] = channel
      return info
  async def update_bridge_info(self) -> None:
      """
      Send the bridge info state events to the portal's Matrix room.

      Does nothing (apart from a debug log) when no room exists. Failures are logged as
      warnings and not raised.
      """
      if not self.mxid:
          self.log.debug("Not updating bridge info: no Matrix room created")
          return
      try:
          self.log.debug("Updating bridge info...")
          # TODO remove the StateHalfShotBridge event once
          #      https://github.com/matrix-org/matrix-doc/pull/2346 is in spec
          for event_type in (StateBridge, StateHalfShotBridge):
              await self.main_intent.send_state_event(
                  self.mxid, event_type, self.bridge_info, self.bridge_info_state_key
              )
      except Exception:
          self.log.warning("Failed to update bridge info", exc_info=True)
  1718. # endregion
  1719. # region Creating Matrix rooms
  async def create_matrix_room(self, source: u.User, info: Thread) -> RoomID | None:
      """
      Ensure a Matrix room exists for this portal.

      An existing room is updated instead (update failures are logged, not raised).
      Otherwise the room is created while holding ``_create_room_lock``.

      Args:
          source: The user on whose behalf the room is created or updated.
          info: The Instagram thread backing this portal.

      Returns:
          The Matrix room ID.
      """
      if not self.mxid:
          async with self._create_room_lock:
              return await self._create_matrix_room(source, info)

      try:
          await self.update_matrix_room(source, info)
      except Exception:
          self.log.exception("Failed to update portal")
      return self.mxid
  def _get_invite_content(self, double_puppet: p.Puppet | None) -> dict[str, bool]:
      """
      Build the extra content for the invite sent to the portal's Matrix user.

      Args:
          double_puppet: The invited user's custom puppet, if they have one.

      Returns:
          A dict with ``fi.mau.will_auto_accept`` set when a double puppet is given and
          ``is_direct`` set when the portal is a direct chat; empty otherwise.
      """
      flags = (
          ("fi.mau.will_auto_accept", double_puppet),
          ("is_direct", self.is_direct),
      )
      return {key: True for key, enabled in flags if enabled}
  async def update_matrix_room(
      self, source: u.User, info: Thread, backfill: bool = False
  ) -> None:
      """
      Bring an existing portal room up to date for a user.

      The user is invited, their custom puppet (if any) is joined, portal info is
      refreshed, missed messages are optionally backfilled, and read receipts are synced.

      Args:
          source: The user to invite and to fetch data through.
          info: The Instagram thread backing this portal.
          backfill: When true, backfill if the thread's last permanent item is not yet in
              the database.
      """
      double_puppet = await p.Puppet.get_by_custom_mxid(source.mxid)
      await self.main_intent.invite_user(
          self.mxid,
          source.mxid,
          check_cache=True,
          extra_content=self._get_invite_content(double_puppet),
      )
      if double_puppet:
          did_join = await double_puppet.intent.ensure_joined(self.mxid)
          if did_join and self.is_direct:
              await source.update_direct_chats({self.main_intent.mxid: [self.mxid]})

      await self.update_info(info, source)

      if backfill:
          last_msg = await DBMessage.get_by_item_id(
              info.last_permanent_item.item_id, receiver=self.receiver
          )
          # A missing last item means messages arrived that were never bridged.
          if last_msg is None:
              self.log.debug(
                  f"Last permanent item ({info.last_permanent_item.item_id})"
                  " not found in database, starting backfilling"
              )
              await self.backfill(source, thread=info, is_initial=False)

      await self._update_read_receipts(info.last_seen_at)
  async def _create_matrix_room(self, source: u.User, info: Thread) -> RoomID | None:
      """
      Create the Matrix room for this portal and populate it.

      If a room already exists it is updated instead. Otherwise the room is created with
      the bridge info state events (plus encryption state when enabled), the source user
      is invited, participants are synced, history is backfilled and read receipts are
      applied.

      Args:
          source: The user on whose behalf the room is created.
          info: The Instagram thread backing this portal.

      Returns:
          The Matrix room ID.

      Raises:
          Exception: If room creation returns no room ID.
      """
      if self.mxid:
          await self.update_matrix_room(source, info)
          return self.mxid
      await self.update_info(info, source)
      self.log.debug("Creating Matrix room")

      # TODO remove the StateHalfShotBridge event once
      #      https://github.com/matrix-org/matrix-doc/pull/2346 is in spec
      state_events = [
          {
              "type": str(event_type),
              "state_key": self.bridge_info_state_key,
              "content": self.bridge_info,
          }
          for event_type in (StateBridge, StateHalfShotBridge)
      ]
      invitees = []
      if self.config["bridge.encryption.default"] and self.matrix.e2ee:
          self.encrypted = True
          state_events.append(
              {
                  "type": "m.room.encryption",
                  "content": self.get_encryption_state_event_json(),
              }
          )
          if self.is_direct:
              invitees.append(self.az.bot_mxid)

      room_name: str | None = None
      if self.encrypted or self.private_chat_portal_meta or not self.is_direct:
          room_name = self.name

      # We lock backfill lock here so any messages that come between the room being created
      # and the initial backfill finishing wouldn't be bridged before the backfill messages.
      with self.backfill_lock:
          creation_content = (
              {} if self.config["bridge.federate_rooms"] else {"m.federate": False}
          )
          self.mxid = await self.main_intent.create_room(
              name=room_name,
              is_direct=self.is_direct,
              initial_state=state_events,
              invitees=invitees,
              creation_content=creation_content,
          )
          if not self.mxid:
              raise Exception("Failed to create room: no mxid returned")

          if self.encrypted and self.matrix.e2ee and self.is_direct:
              try:
                  await self.az.intent.ensure_joined(self.mxid)
              except Exception:
                  self.log.warning(f"Failed to add bridge bot to new private chat {self.mxid}")

          await self.update()
          self.log.debug(f"Matrix room created: {self.mxid}")
          self.by_mxid[self.mxid] = self

          double_puppet = await p.Puppet.get_by_custom_mxid(source.mxid)
          await self.main_intent.invite_user(
              self.mxid, source.mxid, extra_content=self._get_invite_content(double_puppet)
          )
          if double_puppet:
              try:
                  if self.is_direct:
                      await source.update_direct_chats({self.main_intent.mxid: [self.mxid]})
                  await double_puppet.intent.join_room_by_id(self.mxid)
              except MatrixError:
                  self.log.debug(
                      "Failed to join custom puppet into newly created portal", exc_info=True
                  )

          await self._update_participants(info.users, source)

          # A failed backfill must not prevent the room from being returned.
          try:
              await self.backfill(source, thread=info, is_initial=True)
          except Exception:
              self.log.exception("Failed to backfill new portal")
          await self._update_read_receipts(info.last_seen_at)

      return self.mxid
  1838. # endregion
  1839. # region Database getters
  async def postinit(self) -> None:
      """
      Register the portal in the class-level caches and resolve its main intent.

      The main intent is the other user's puppet's ``default_mxid_intent`` when
      ``other_user_pk`` is set, and the appservice's own intent otherwise.
      """
      cache_key = (self.thread_id, self.receiver)
      self.by_thread_id[cache_key] = self
      if self.mxid:
          self.by_mxid[self.mxid] = self

      if self.other_user_pk:
          other_puppet = await p.Puppet.get_by_pk(self.other_user_pk)
          self._main_intent = other_puppet.default_mxid_intent
      else:
          self._main_intent = self.az.intent
  async def delete(self) -> None:
      """
      Detach the portal from its Matrix room.

      All stored messages for the room are deleted, the room is dropped from the
      ``by_mxid`` cache, and the portal row is saved with no room and encryption off.
      """
      room_id = self.mxid
      await DBMessage.delete_all(room_id)
      self.by_mxid.pop(room_id, None)
      self.mxid = None
      self.encrypted = False
      await self.update()
  async def save(self) -> None:
      """Persist the portal by delegating to ``update``."""
      await self.update()
  @classmethod
  def all_with_room(cls) -> AsyncGenerator[Portal, None]:
      """Iterate the portals returned by the parent class's ``all_with_room`` query."""
      query = super().all_with_room()
      return cls._db_to_portals(query)
  @classmethod
  def find_private_chats_with(cls, other_user: int) -> AsyncGenerator[Portal, None]:
      """
      Iterate the portals returned by the parent class's ``find_private_chats_with``.

      Args:
          other_user: The Instagram user ID passed through to the parent query.
      """
      query = super().find_private_chats_with(other_user)
      return cls._db_to_portals(query)
  @classmethod
  async def find_private_chat(cls, receiver: int, other_user: int) -> Portal | None:
      """
      Find the private chat portal between a receiver and another user.

      Args:
          receiver: The Instagram user ID of the receiving (bridge) user.
          other_user: The Instagram user ID of the other participant.

      Returns:
          The portal, or None when the parent lookup finds no thread ID.
      """
      thread_id = await super().find_private_chat_id(receiver, other_user)
      if thread_id:
          return await cls.get_by_thread_id(thread_id, receiver=receiver, is_group=False)
      return None
  @classmethod
  async def _db_to_portals(cls, query: Awaitable[list[Portal]]) -> AsyncGenerator[Portal, None]:
      """
      Yield cached portal instances for the rows returned by a database query.

      For each row, the instance already cached under its ``(thread_id, receiver)`` key is
      yielded if there is one; otherwise the row itself is initialized with ``postinit``
      and yielded.

      Args:
          query: An awaitable resolving to the portals loaded from the database.
      """
      for portal in await query:
          # Only the cache lookup is guarded, so a KeyError raised elsewhere (for
          # example thrown into the generator by its consumer) is not mistaken for a
          # cache miss.
          try:
              result = cls.by_thread_id[(portal.thread_id, portal.receiver)]
          except KeyError:
              await portal.postinit()
              result = portal
          yield result
  @classmethod
  @async_getter_lock
  async def get_by_mxid(cls, mxid: RoomID) -> Portal | None:
      """
      Get the portal for a Matrix room, from the cache or else the database.

      Args:
          mxid: The Matrix room ID.

      Returns:
          The portal (initialized with ``postinit`` when freshly loaded), or None if no
          portal has that room.
      """
      if mxid in cls.by_mxid:
          return cls.by_mxid[mxid]

      portal = cast(cls, await super().get_by_mxid(mxid))
      if portal is None:
          return None
      await portal.postinit()
      return portal
  @classmethod
  @async_getter_lock
  async def get_by_thread_id(
      cls,
      thread_id: str,
      *,
      receiver: int,
      is_group: bool | None = None,
      other_user_pk: int | None = None,
  ) -> Portal | None:
      """
      Get a portal by Instagram thread ID, creating it when the chat type is known.

      Args:
          thread_id: The Instagram thread ID.
          receiver: The receiving user's Instagram ID. Forced to 0 for group chats.
          is_group: Whether the thread is a group. When None, the chat type is unknown:
              the cache is also checked under receiver 0, the database lookup does not
              require the receiver to match, and no portal is created.
          other_user_pk: The other user's ID, used only when a new portal is created.

      Returns:
          The cached, loaded or newly inserted portal, or None when nothing was found
          and ``is_group`` is None.
      """
      if is_group and receiver != 0:
          receiver = 0

      cache_keys = [(thread_id, receiver)]
      if is_group is None and receiver != 0:
          cache_keys.append((thread_id, 0))
      for cache_key in cache_keys:
          try:
              return cls.by_thread_id[cache_key]
          except KeyError:
              continue

      type_known = is_group is not None
      portal = cast(
          cls,
          await super().get_by_thread_id(
              thread_id, receiver=receiver, rec_must_match=type_known
          ),
      )
      if portal is None:
          if not type_known:
              return None
          portal = cls(thread_id, receiver, other_user_pk=other_user_pk)
          await portal.insert()
      await portal.postinit()
      return portal
  @classmethod
  async def get_by_thread(cls, thread: Thread, receiver: int) -> Portal | None:
      """
      Get (or create) the portal for an Instagram thread.

      Group threads use receiver 0 and no other user. For non-group threads the other
      user is the first thread user, or the receiver itself when the user list is empty.

      Args:
          thread: The Instagram thread.
          receiver: The receiving user's Instagram ID.

      Returns:
          The result of ``get_by_thread_id`` for the thread.
      """
      if thread.is_group:
          receiver, other_user_pk = 0, None
      else:
          other_user_pk = receiver if len(thread.users) == 0 else thread.users[0].pk
      return await cls.get_by_thread_id(
          thread.thread_id,
          receiver=receiver,
          is_group=thread.is_group,
          other_user_pk=other_user_pk,
      )
  1942. # endregion