backfill.go 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340
  1. // mautrix-whatsapp - A Matrix-WhatsApp puppeting bridge.
  2. // Copyright (C) 2021 Tulir Asokan, Sumner Evans
  3. //
  4. // This program is free software: you can redistribute it and/or modify
  5. // it under the terms of the GNU Affero General Public License as published by
  6. // the Free Software Foundation, either version 3 of the License, or
  7. // (at your option) any later version.
  8. //
  9. // This program is distributed in the hope that it will be useful,
  10. // but WITHOUT ANY WARRANTY; without even the implied warranty of
  11. // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  12. // GNU Affero General Public License for more details.
  13. //
  14. // You should have received a copy of the GNU Affero General Public License
  15. // along with this program. If not, see <https://www.gnu.org/licenses/>.
  16. package database
  17. import (
  18. "database/sql"
  19. "errors"
  20. "fmt"
  21. "strconv"
  22. "strings"
  23. "sync"
  24. "time"
  25. "go.mau.fi/util/dbutil"
  26. log "maunium.net/go/maulogger/v2"
  27. "maunium.net/go/mautrix/id"
  28. )
  29. type BackfillType int
  30. const (
  31. BackfillImmediate BackfillType = 0
  32. BackfillForward BackfillType = 100
  33. BackfillDeferred BackfillType = 200
  34. )
  35. func (bt BackfillType) String() string {
  36. switch bt {
  37. case BackfillImmediate:
  38. return "IMMEDIATE"
  39. case BackfillForward:
  40. return "FORWARD"
  41. case BackfillDeferred:
  42. return "DEFERRED"
  43. }
  44. return "UNKNOWN"
  45. }
  46. type BackfillQuery struct {
  47. db *Database
  48. log log.Logger
  49. backfillQueryLock sync.Mutex
  50. }
  51. func (bq *BackfillQuery) New() *Backfill {
  52. return &Backfill{
  53. db: bq.db,
  54. log: bq.log,
  55. Portal: &PortalKey{},
  56. }
  57. }
  58. func (bq *BackfillQuery) NewWithValues(userID id.UserID, backfillType BackfillType, priority int, portal *PortalKey, timeStart *time.Time, maxBatchEvents, maxTotalEvents, batchDelay int) *Backfill {
  59. return &Backfill{
  60. db: bq.db,
  61. log: bq.log,
  62. UserID: userID,
  63. BackfillType: backfillType,
  64. Priority: priority,
  65. Portal: portal,
  66. TimeStart: timeStart,
  67. MaxBatchEvents: maxBatchEvents,
  68. MaxTotalEvents: maxTotalEvents,
  69. BatchDelay: batchDelay,
  70. }
  71. }
  72. const (
  73. getNextBackfillQuery = `
  74. SELECT queue_id, user_mxid, type, priority, portal_jid, portal_receiver, time_start, max_batch_events, max_total_events, batch_delay
  75. FROM backfill_queue
  76. WHERE user_mxid=$1
  77. AND type IN (%s)
  78. AND (
  79. dispatch_time IS NULL
  80. OR (
  81. dispatch_time < $2
  82. AND completed_at IS NULL
  83. )
  84. )
  85. ORDER BY type, priority, queue_id
  86. LIMIT 1
  87. `
  88. getUnstartedOrInFlightQuery = `
  89. SELECT 1
  90. FROM backfill_queue
  91. WHERE user_mxid=$1
  92. AND type IN (%s)
  93. AND (dispatch_time IS NULL OR completed_at IS NULL)
  94. LIMIT 1
  95. `
  96. )
  97. // GetNext returns the next backfill to perform
  98. func (bq *BackfillQuery) GetNext(userID id.UserID, backfillTypes []BackfillType) (backfill *Backfill) {
  99. bq.backfillQueryLock.Lock()
  100. defer bq.backfillQueryLock.Unlock()
  101. var types []string
  102. for _, backfillType := range backfillTypes {
  103. types = append(types, strconv.Itoa(int(backfillType)))
  104. }
  105. rows, err := bq.db.Query(fmt.Sprintf(getNextBackfillQuery, strings.Join(types, ",")), userID, time.Now().Add(-15*time.Minute))
  106. if err != nil || rows == nil {
  107. bq.log.Errorfln("Failed to query next backfill queue job: %v", err)
  108. return
  109. }
  110. defer rows.Close()
  111. if rows.Next() {
  112. backfill = bq.New().Scan(rows)
  113. }
  114. return
  115. }
  116. func (bq *BackfillQuery) HasUnstartedOrInFlightOfType(userID id.UserID, backfillTypes []BackfillType) bool {
  117. if len(backfillTypes) == 0 {
  118. return false
  119. }
  120. bq.backfillQueryLock.Lock()
  121. defer bq.backfillQueryLock.Unlock()
  122. types := []string{}
  123. for _, backfillType := range backfillTypes {
  124. types = append(types, strconv.Itoa(int(backfillType)))
  125. }
  126. rows, err := bq.db.Query(fmt.Sprintf(getUnstartedOrInFlightQuery, strings.Join(types, ",")), userID)
  127. if err != nil || rows == nil {
  128. if err != nil && !errors.Is(err, sql.ErrNoRows) {
  129. bq.log.Warnfln("Failed to query backfill queue jobs: %v", err)
  130. }
  131. // No rows means that there are no unstarted or in flight backfill
  132. // requests.
  133. return false
  134. }
  135. defer rows.Close()
  136. return rows.Next()
  137. }
  138. func (bq *BackfillQuery) DeleteAll(userID id.UserID) {
  139. bq.backfillQueryLock.Lock()
  140. defer bq.backfillQueryLock.Unlock()
  141. _, err := bq.db.Exec("DELETE FROM backfill_queue WHERE user_mxid=$1", userID)
  142. if err != nil {
  143. bq.log.Warnfln("Failed to delete backfill queue items for %s: %v", userID, err)
  144. }
  145. }
  146. func (bq *BackfillQuery) DeleteAllForPortal(userID id.UserID, portalKey PortalKey) {
  147. bq.backfillQueryLock.Lock()
  148. defer bq.backfillQueryLock.Unlock()
  149. _, err := bq.db.Exec(`
  150. DELETE FROM backfill_queue
  151. WHERE user_mxid=$1
  152. AND portal_jid=$2
  153. AND portal_receiver=$3
  154. `, userID, portalKey.JID, portalKey.Receiver)
  155. if err != nil {
  156. bq.log.Warnfln("Failed to delete backfill queue items for %s/%s: %v", userID, portalKey.JID, err)
  157. }
  158. }
  159. type Backfill struct {
  160. db *Database
  161. log log.Logger
  162. // Fields
  163. QueueID int
  164. UserID id.UserID
  165. BackfillType BackfillType
  166. Priority int
  167. Portal *PortalKey
  168. TimeStart *time.Time
  169. MaxBatchEvents int
  170. MaxTotalEvents int
  171. BatchDelay int
  172. DispatchTime *time.Time
  173. CompletedAt *time.Time
  174. }
  175. func (b *Backfill) String() string {
  176. return fmt.Sprintf("Backfill{QueueID: %d, UserID: %s, BackfillType: %s, Priority: %d, Portal: %s, TimeStart: %s, MaxBatchEvents: %d, MaxTotalEvents: %d, BatchDelay: %d, DispatchTime: %s, CompletedAt: %s}",
  177. b.QueueID, b.UserID, b.BackfillType, b.Priority, b.Portal, b.TimeStart, b.MaxBatchEvents, b.MaxTotalEvents, b.BatchDelay, b.CompletedAt, b.DispatchTime,
  178. )
  179. }
  180. func (b *Backfill) Scan(row dbutil.Scannable) *Backfill {
  181. var maxTotalEvents, batchDelay sql.NullInt32
  182. err := row.Scan(&b.QueueID, &b.UserID, &b.BackfillType, &b.Priority, &b.Portal.JID, &b.Portal.Receiver, &b.TimeStart, &b.MaxBatchEvents, &maxTotalEvents, &batchDelay)
  183. if err != nil {
  184. if !errors.Is(err, sql.ErrNoRows) {
  185. b.log.Errorln("Database scan failed:", err)
  186. }
  187. return nil
  188. }
  189. b.MaxTotalEvents = int(maxTotalEvents.Int32)
  190. b.BatchDelay = int(batchDelay.Int32)
  191. return b
  192. }
  193. func (b *Backfill) Insert() {
  194. b.db.Backfill.backfillQueryLock.Lock()
  195. defer b.db.Backfill.backfillQueryLock.Unlock()
  196. rows, err := b.db.Query(`
  197. INSERT INTO backfill_queue
  198. (user_mxid, type, priority, portal_jid, portal_receiver, time_start, max_batch_events, max_total_events, batch_delay, dispatch_time, completed_at)
  199. VALUES ($1, $2, $3, $4, $5, $6, $7, $8, $9, $10, $11)
  200. RETURNING queue_id
  201. `, b.UserID, b.BackfillType, b.Priority, b.Portal.JID, b.Portal.Receiver, b.TimeStart, b.MaxBatchEvents, b.MaxTotalEvents, b.BatchDelay, b.DispatchTime, b.CompletedAt)
  202. defer rows.Close()
  203. if err != nil || !rows.Next() {
  204. b.log.Warnfln("Failed to insert %v/%s with priority %d: %v", b.BackfillType, b.Portal.JID, b.Priority, err)
  205. return
  206. }
  207. err = rows.Scan(&b.QueueID)
  208. if err != nil {
  209. b.log.Warnfln("Failed to insert %s/%s with priority %s: %v", b.BackfillType, b.Portal.JID, b.Priority, err)
  210. }
  211. }
  212. func (b *Backfill) MarkDispatched() {
  213. b.db.Backfill.backfillQueryLock.Lock()
  214. defer b.db.Backfill.backfillQueryLock.Unlock()
  215. if b.QueueID == 0 {
  216. b.log.Errorfln("Cannot mark backfill as dispatched without queue_id. Maybe it wasn't actually inserted in the database?")
  217. return
  218. }
  219. _, err := b.db.Exec("UPDATE backfill_queue SET dispatch_time=$1 WHERE queue_id=$2", time.Now(), b.QueueID)
  220. if err != nil {
  221. b.log.Warnfln("Failed to mark %s/%s as dispatched: %v", b.BackfillType, b.Priority, err)
  222. }
  223. }
  224. func (b *Backfill) MarkDone() {
  225. b.db.Backfill.backfillQueryLock.Lock()
  226. defer b.db.Backfill.backfillQueryLock.Unlock()
  227. if b.QueueID == 0 {
  228. b.log.Errorfln("Cannot mark backfill done without queue_id. Maybe it wasn't actually inserted in the database?")
  229. return
  230. }
  231. _, err := b.db.Exec("UPDATE backfill_queue SET completed_at=$1 WHERE queue_id=$2", time.Now(), b.QueueID)
  232. if err != nil {
  233. b.log.Warnfln("Failed to mark %s/%s as complete: %v", b.BackfillType, b.Priority, err)
  234. }
  235. }
  236. func (bq *BackfillQuery) NewBackfillState(userID id.UserID, portalKey *PortalKey) *BackfillState {
  237. return &BackfillState{
  238. db: bq.db,
  239. log: bq.log,
  240. UserID: userID,
  241. Portal: portalKey,
  242. }
  243. }
  244. const (
  245. getBackfillState = `
  246. SELECT user_mxid, portal_jid, portal_receiver, processing_batch, backfill_complete, first_expected_ts
  247. FROM backfill_state
  248. WHERE user_mxid=$1
  249. AND portal_jid=$2
  250. AND portal_receiver=$3
  251. `
  252. )
  253. type BackfillState struct {
  254. db *Database
  255. log log.Logger
  256. // Fields
  257. UserID id.UserID
  258. Portal *PortalKey
  259. ProcessingBatch bool
  260. BackfillComplete bool
  261. FirstExpectedTimestamp uint64
  262. }
  263. func (b *BackfillState) Scan(row dbutil.Scannable) *BackfillState {
  264. err := row.Scan(&b.UserID, &b.Portal.JID, &b.Portal.Receiver, &b.ProcessingBatch, &b.BackfillComplete, &b.FirstExpectedTimestamp)
  265. if err != nil {
  266. if !errors.Is(err, sql.ErrNoRows) {
  267. b.log.Errorln("Database scan failed:", err)
  268. }
  269. return nil
  270. }
  271. return b
  272. }
  273. func (b *BackfillState) Upsert() {
  274. _, err := b.db.Exec(`
  275. INSERT INTO backfill_state
  276. (user_mxid, portal_jid, portal_receiver, processing_batch, backfill_complete, first_expected_ts)
  277. VALUES ($1, $2, $3, $4, $5, $6)
  278. ON CONFLICT (user_mxid, portal_jid, portal_receiver)
  279. DO UPDATE SET
  280. processing_batch=EXCLUDED.processing_batch,
  281. backfill_complete=EXCLUDED.backfill_complete,
  282. first_expected_ts=EXCLUDED.first_expected_ts`,
  283. b.UserID, b.Portal.JID, b.Portal.Receiver, b.ProcessingBatch, b.BackfillComplete, b.FirstExpectedTimestamp)
  284. if err != nil {
  285. b.log.Warnfln("Failed to insert backfill state for %s: %v", b.Portal.JID, err)
  286. }
  287. }
  288. func (b *BackfillState) SetProcessingBatch(processing bool) {
  289. b.ProcessingBatch = processing
  290. b.Upsert()
  291. }
  292. func (bq *BackfillQuery) GetBackfillState(userID id.UserID, portalKey *PortalKey) (backfillState *BackfillState) {
  293. rows, err := bq.db.Query(getBackfillState, userID, portalKey.JID, portalKey.Receiver)
  294. if err != nil || rows == nil {
  295. bq.log.Error(err)
  296. return
  297. }
  298. defer rows.Close()
  299. if rows.Next() {
  300. backfillState = bq.NewBackfillState(userID, portalKey).Scan(rows)
  301. }
  302. return
  303. }