| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226 | // mautrix-discord - A Matrix-Discord puppeting bridge.// Copyright (C) 2023 Tulir Asokan//// This program is free software: you can redistribute it and/or modify// it under the terms of the GNU Affero General Public License as published by// the Free Software Foundation, either version 3 of the License, or// (at your option) any later version.//// This program is distributed in the hope that it will be useful,// but WITHOUT ANY WARRANTY; without even the implied warranty of// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the// GNU Affero General Public License for more details.//// You should have received a copy of the GNU Affero General Public License// along with this program.  If not, see <https://www.gnu.org/licenses/>.package mainimport (	"fmt"	"regexp"	"strings"	"github.com/bwmarrin/discordgo"	"github.com/yuin/goldmark"	"github.com/yuin/goldmark/extension"	"github.com/yuin/goldmark/parser"	"github.com/yuin/goldmark/util"	"maunium.net/go/mautrix/event"	"maunium.net/go/mautrix/format"	"maunium.net/go/mautrix/format/mdext"	"maunium.net/go/mautrix/id"	"maunium.net/go/mautrix/util/variationselector")// escapeFixer is a hacky partial fix for the difference in escaping markdown, used with escapeReplacement//// Discord allows escaping with just one backslash, e.g. \__a__,// but standard markdown requires both to be escaped (\_\_a__)var escapeFixer = regexp.MustCompile(`\\(__[^_]|\*\*[^*])`)func escapeReplacement(s string) string {	return s[:2] + `\` + s[2:]}// indentableParagraphParser is the default paragraph parser with CanAcceptIndentedLine.// Used when disabling CodeBlockParser (as disabling it without a replacement will make indented blocks disappear).type indentableParagraphParser struct {	parser.BlockParser}var defaultIndentableParagraphParser = &indentableParagraphParser{BlockParser: parser.NewParagraphParser()}func (b *indentableParagraphParser) CanAcceptIndentedLine() bool {	return true}var removeFeaturesExceptLinks = []any{	parser.NewListParser(), parser.NewListItemParser(), parser.NewHTMLBlockParser(), parser.NewRawHTMLParser(),	parser.NewSetextHeadingParser(), parser.NewATXHeadingParser(), parser.NewThematicBreakParser(),	parser.NewCodeBlockParser(),}var removeFeaturesAndLinks = append(removeFeaturesExceptLinks, parser.NewLinkParser())var fixIndentedParagraphs = goldmark.WithParserOptions(parser.WithBlockParsers(util.Prioritized(defaultIndentableParagraphParser, 500)))var discordExtensions = goldmark.WithExtensions(extension.Strikethrough, mdext.SimpleSpoiler, mdext.DiscordUnderline, ExtDiscordEveryone, ExtDiscordTag)var discordRenderer = goldmark.New(	goldmark.WithParser(mdext.ParserWithoutFeatures(removeFeaturesAndLinks...)),	fixIndentedParagraphs, format.HTMLOptions, discordExtensions,)var discordRendererWithInlineLinks = goldmark.New(	goldmark.WithParser(mdext.ParserWithoutFeatures(removeFeaturesExceptLinks...)),	fixIndentedParagraphs, format.HTMLOptions, discordExtensions,)func (portal *Portal) renderDiscordMarkdownOnlyHTML(text string, allowInlineLinks bool) string {	text = escapeFixer.ReplaceAllStringFunc(text, escapeReplacement)	var buf strings.Builder	ctx := parser.NewContext()	ctx.Set(parserContextPortal, portal)	renderer := discordRenderer	if allowInlineLinks {		renderer = discordRendererWithInlineLinks	}	err := renderer.Convert([]byte(text), &buf, parser.WithContext(ctx))	if err != nil {		panic(fmt.Errorf("markdown parser errored: %w", err))	}	return format.UnwrapSingleParagraph(buf.String())}const formatterContextPortalKey = "fi.mau.discord.portal"const formatterContextAllowedMentionsKey = "fi.mau.discord.allowed_mentions"func appendIfNotContains(arr []string, newItem string) []string {	for _, item := range arr {		if item == newItem {			return arr		}	}	return append(arr, newItem)}func (br *DiscordBridge) pillConverter(displayname, mxid, eventID string, ctx format.Context) string {	if len(mxid) == 0 {		return displayname	}	if mxid[0] == '#' {		alias, err := br.Bot.ResolveAlias(id.RoomAlias(mxid))		if err != nil {			return displayname		}		mxid = alias.RoomID.String()	}	if mxid[0] == '!' {		portal := br.GetPortalByMXID(id.RoomID(mxid))		if portal != nil {			if eventID == "" {				//currentPortal := ctx[formatterContextPortalKey].(*Portal)				return fmt.Sprintf("<#%s>", portal.Key.ChannelID)				//if currentPortal.GuildID == portal.GuildID {				//} else if portal.GuildID != "" {				//	return fmt.Sprintf("<#%s:%s:%s>", portal.Key.ChannelID, portal.GuildID, portal.Name)				//} else {				//	// TODO is mentioning private channels possible at all?				//}			} else if msg := br.DB.Message.GetByMXID(portal.Key, id.EventID(eventID)); msg != nil {				guildID := portal.GuildID				if guildID == "" {					guildID = "@me"				}				return fmt.Sprintf("https://discord.com/channels/%s/%s/%s", guildID, msg.DiscordProtoChannelID(), msg.DiscordID)			}		}	} else if mxid[0] == '@' {		mentions := ctx.ReturnData[formatterContextAllowedMentionsKey].(*discordgo.MessageAllowedMentions)		parsedID, ok := br.ParsePuppetMXID(id.UserID(mxid))		if ok {			mentions.Users = appendIfNotContains(mentions.Users, parsedID)			return fmt.Sprintf("<@%s>", parsedID)		}		mentionedUser := br.GetUserByMXID(id.UserID(mxid))		if mentionedUser != nil && mentionedUser.DiscordID != "" {			mentions.Users = appendIfNotContains(mentions.Users, mentionedUser.DiscordID)			return fmt.Sprintf("<@%s>", mentionedUser.DiscordID)		}	}	return displayname}// Discord links start with http:// or https://, contain at least two characters afterwards,// don't contain < or whitespace anywhere, and don't end with "'),.:;]//// Zero-width whitespace is mostly in the Format category and is allowed, except \uFEFF isn't for some reasonvar discordLinkRegex = regexp.MustCompile(`https?://[^<\p{Zs}\x{feff}]*[^"'),.:;\]\p{Zs}\x{feff}]`)var discordMarkdownEscaper = strings.NewReplacer(	`\`, `\\`,	`_`, `\_`,	`*`, `\*`,	`~`, `\~`,	"`", "\\`",	`|`, `\|`,	`<`, `\<`,)func escapeDiscordMarkdown(s string) string {	submatches := discordLinkRegex.FindAllStringIndex(s, -1)	if submatches == nil {		return discordMarkdownEscaper.Replace(s)	}	var builder strings.Builder	offset := 0	for _, match := range submatches {		start := match[0]		end := match[1]		builder.WriteString(discordMarkdownEscaper.Replace(s[offset:start]))		builder.WriteString(s[start:end])		offset = end	}	builder.WriteString(discordMarkdownEscaper.Replace(s[offset:]))	return builder.String()}var matrixHTMLParser = &format.HTMLParser{	TabsToSpaces:   4,	Newline:        "\n",	HorizontalLine: "\n---\n",	ItalicConverter: func(s string, ctx format.Context) string {		return fmt.Sprintf("*%s*", s)	},	UnderlineConverter: func(s string, ctx format.Context) string {		return fmt.Sprintf("__%s__", s)	},	TextConverter: func(s string, ctx format.Context) string {		if ctx.TagStack.Has("pre") || ctx.TagStack.Has("code") {			// If we're in a code block, don't escape markdown			return s		}		return escapeDiscordMarkdown(s)	},	SpoilerConverter: func(text, reason string, ctx format.Context) string {		if reason != "" {			return fmt.Sprintf("(%s) ||%s||", reason, text)		}		return fmt.Sprintf("||%s||", text)	},}func (portal *Portal) parseMatrixHTML(content *event.MessageEventContent) (string, *discordgo.MessageAllowedMentions) {	allowedMentions := &discordgo.MessageAllowedMentions{		Parse:       []discordgo.AllowedMentionType{},		Users:       []string{},		RepliedUser: true,	}	if content.Format == event.FormatHTML && len(content.FormattedBody) > 0 {		ctx := format.NewContext()		ctx.ReturnData[formatterContextPortalKey] = portal		ctx.ReturnData[formatterContextAllowedMentionsKey] = allowedMentions		return variationselector.FullyQualify(matrixHTMLParser.Parse(content.FormattedBody, ctx)), allowedMentions	} else {		return variationselector.FullyQualify(escapeDiscordMarkdown(content.Body)), allowedMentions	}}
 |