2018-08-26 00:26:24 +03:00
|
|
|
// mautrix-whatsapp - A Matrix-WhatsApp puppeting bridge.
|
2021-10-22 20:14:34 +03:00
|
|
|
// Copyright (C) 2021 Tulir Asokan
|
2018-08-26 00:26:24 +03:00
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful,
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"fmt"
|
2018-08-29 00:40:54 +03:00
|
|
|
"html"
|
2018-08-26 00:26:24 +03:00
|
|
|
"regexp"
|
|
|
|
"strings"
|
|
|
|
|
2021-10-22 20:14:34 +03:00
|
|
|
"go.mau.fi/whatsmeow/types"
|
2021-02-17 01:21:30 +02:00
|
|
|
|
2020-05-08 22:32:22 +03:00
|
|
|
"maunium.net/go/mautrix/event"
|
2019-01-11 21:17:31 +02:00
|
|
|
"maunium.net/go/mautrix/format"
|
2020-05-08 22:32:22 +03:00
|
|
|
"maunium.net/go/mautrix/id"
|
2018-08-26 00:26:24 +03:00
|
|
|
)
|
|
|
|
|
|
|
|
// Patterns used when translating WhatsApp's inline markup into HTML.
var (
	// The three inline-style patterns share one shape: an opening boundary
	// (start of input, whitespace, '>' or one of the other style markers),
	// the marker-delimited text captured lazily, and a closing boundary
	// (end of input or any non-alphanumeric character). The boundaries are
	// captured as $1 and $3 so that replacements can put them back.
	italicRegex        = regexp.MustCompile("([\\s>~*]|^)_(.+?)_([^a-zA-Z\\d]|$)")
	boldRegex          = regexp.MustCompile("([\\s>_~]|^)\\*(.+?)\\*([^a-zA-Z\\d]|$)")
	strikethroughRegex = regexp.MustCompile("([\\s>_*]|^)~(.+?)~([^a-zA-Z\\d]|$)")

	// codeBlockRegex matches the shortest run of one or more characters
	// (newlines included) enclosed in triple backticks.
	codeBlockRegex = regexp.MustCompile("```(?:.|\n)+?```")

	// inlineURLRegex matches markdown-style links of the form [text](url),
	// capturing the text as group 1 and the URL as group 2.
	inlineURLRegex = regexp.MustCompile(`\[(.+?)]\((.+?)\)`)
)

// mentionedJIDsContextKey is the format.Context key under which the pill
// converter accumulates the JIDs (as strings) of mentioned puppets.
const mentionedJIDsContextKey = "net.maunium.whatsapp.mentioned_jids"
|
2018-08-26 00:26:24 +03:00
|
|
|
|
2018-08-29 00:40:54 +03:00
|
|
|
type Formatter struct {
|
2022-05-22 01:06:30 +03:00
|
|
|
bridge *WABridge
|
2018-08-29 00:40:54 +03:00
|
|
|
|
|
|
|
matrixHTMLParser *format.HTMLParser
|
|
|
|
|
|
|
|
waReplString map[*regexp.Regexp]string
|
|
|
|
waReplFunc map[*regexp.Regexp]func(string) string
|
|
|
|
waReplFuncText map[*regexp.Regexp]func(string) string
|
|
|
|
}
|
|
|
|
|
2022-05-22 01:06:30 +03:00
|
|
|
func NewFormatter(bridge *WABridge) *Formatter {
|
2018-08-29 00:40:54 +03:00
|
|
|
formatter := &Formatter{
|
|
|
|
bridge: bridge,
|
|
|
|
matrixHTMLParser: &format.HTMLParser{
|
|
|
|
TabsToSpaces: 4,
|
|
|
|
Newline: "\n",
|
|
|
|
|
2021-06-17 12:38:04 +03:00
|
|
|
PillConverter: func(displayname, mxid, eventID string, ctx format.Context) string {
|
2018-08-29 00:40:54 +03:00
|
|
|
if mxid[0] == '@' {
|
2020-05-08 22:32:22 +03:00
|
|
|
puppet := bridge.GetPuppetByMXID(id.UserID(mxid))
|
2018-08-29 00:40:54 +03:00
|
|
|
if puppet != nil {
|
2021-10-22 20:14:34 +03:00
|
|
|
jids, ok := ctx[mentionedJIDsContextKey].([]string)
|
2020-07-31 14:30:58 +03:00
|
|
|
if !ok {
|
2021-10-22 20:14:34 +03:00
|
|
|
ctx[mentionedJIDsContextKey] = []string{puppet.JID.String()}
|
2020-07-31 14:30:58 +03:00
|
|
|
} else {
|
2021-10-22 20:14:34 +03:00
|
|
|
ctx[mentionedJIDsContextKey] = append(jids, puppet.JID.String())
|
2020-07-31 14:30:58 +03:00
|
|
|
}
|
2021-10-22 20:14:34 +03:00
|
|
|
return "@" + puppet.JID.User
|
2018-08-29 00:40:54 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
return mxid
|
|
|
|
},
|
2021-10-22 20:14:34 +03:00
|
|
|
BoldConverter: func(text string, _ format.Context) string { return fmt.Sprintf("*%s*", text) },
|
|
|
|
ItalicConverter: func(text string, _ format.Context) string { return fmt.Sprintf("_%s_", text) },
|
|
|
|
StrikethroughConverter: func(text string, _ format.Context) string { return fmt.Sprintf("~%s~", text) },
|
|
|
|
MonospaceConverter: func(text string, _ format.Context) string { return fmt.Sprintf("```%s```", text) },
|
|
|
|
MonospaceBlockConverter: func(text, language string, _ format.Context) string { return fmt.Sprintf("```%s```", text) },
|
2018-08-29 00:40:54 +03:00
|
|
|
},
|
|
|
|
waReplString: map[*regexp.Regexp]string{
|
|
|
|
italicRegex: "$1<em>$2</em>$3",
|
|
|
|
boldRegex: "$1<strong>$2</strong>$3",
|
|
|
|
strikethroughRegex: "$1<del>$2</del>$3",
|
|
|
|
},
|
|
|
|
}
|
|
|
|
formatter.waReplFunc = map[*regexp.Regexp]func(string) string{
|
2018-08-26 00:26:24 +03:00
|
|
|
codeBlockRegex: func(str string) string {
|
|
|
|
str = str[3 : len(str)-3]
|
|
|
|
if strings.ContainsRune(str, '\n') {
|
|
|
|
return fmt.Sprintf("<pre><code>%s</code></pre>", str)
|
|
|
|
}
|
|
|
|
return fmt.Sprintf("<code>%s</code>", str)
|
|
|
|
},
|
2018-08-29 00:40:54 +03:00
|
|
|
}
|
2021-10-22 20:14:34 +03:00
|
|
|
formatter.waReplFuncText = map[*regexp.Regexp]func(string) string{}
|
2018-08-29 00:40:54 +03:00
|
|
|
return formatter
|
|
|
|
}
|
|
|
|
|
2022-02-16 01:00:49 +02:00
|
|
|
func (formatter *Formatter) getMatrixInfoByJID(roomID id.RoomID, jid types.JID) (mxid id.UserID, displayname string) {
|
|
|
|
if puppet := formatter.bridge.GetPuppetByJID(jid); puppet != nil {
|
2018-08-29 00:40:54 +03:00
|
|
|
mxid = puppet.MXID
|
|
|
|
displayname = puppet.Displayname
|
|
|
|
}
|
2022-02-16 01:00:49 +02:00
|
|
|
if user := formatter.bridge.GetUserByJID(jid); user != nil {
|
|
|
|
mxid = user.MXID
|
|
|
|
member := formatter.bridge.StateStore.GetMember(roomID, user.MXID)
|
|
|
|
if len(member.Displayname) > 0 {
|
|
|
|
displayname = member.Displayname
|
|
|
|
}
|
|
|
|
}
|
2018-08-29 00:40:54 +03:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2022-06-24 23:25:37 +03:00
|
|
|
func (formatter *Formatter) ParseWhatsApp(roomID id.RoomID, content *event.MessageEventContent, mentionedJIDs []string, allowInlineURL, forceHTML bool) {
|
2018-08-29 00:40:54 +03:00
|
|
|
output := html.EscapeString(content.Body)
|
|
|
|
for regex, replacement := range formatter.waReplString {
|
|
|
|
output = regex.ReplaceAllString(output, replacement)
|
|
|
|
}
|
|
|
|
for regex, replacer := range formatter.waReplFunc {
|
|
|
|
output = regex.ReplaceAllStringFunc(output, replacer)
|
|
|
|
}
|
2022-06-24 21:50:58 +03:00
|
|
|
if allowInlineURL {
|
|
|
|
output = inlineURLRegex.ReplaceAllStringFunc(output, func(s string) string {
|
|
|
|
groups := inlineURLRegex.FindStringSubmatch(s)
|
|
|
|
return fmt.Sprintf(`<a href="%s">%s</a>`, groups[2], groups[1])
|
|
|
|
})
|
|
|
|
}
|
2021-10-22 20:14:34 +03:00
|
|
|
for _, rawJID := range mentionedJIDs {
|
|
|
|
jid, err := types.ParseJID(rawJID)
|
|
|
|
if err != nil {
|
|
|
|
continue
|
|
|
|
} else if jid.Server == types.LegacyUserServer {
|
|
|
|
jid.Server = types.DefaultUserServer
|
|
|
|
}
|
2022-02-16 01:00:49 +02:00
|
|
|
mxid, displayname := formatter.getMatrixInfoByJID(roomID, jid)
|
2021-10-22 20:14:34 +03:00
|
|
|
number := "@" + jid.User
|
|
|
|
output = strings.ReplaceAll(output, number, fmt.Sprintf(`<a href="https://matrix.to/#/%s">%s</a>`, mxid, displayname))
|
|
|
|
content.Body = strings.ReplaceAll(content.Body, number, displayname)
|
2020-07-31 14:30:58 +03:00
|
|
|
}
|
2022-06-24 23:25:37 +03:00
|
|
|
if output != content.Body || forceHTML {
|
2021-10-22 20:14:34 +03:00
|
|
|
output = strings.ReplaceAll(output, "\n", "<br/>")
|
2018-08-29 00:40:54 +03:00
|
|
|
content.FormattedBody = output
|
2020-05-08 22:32:22 +03:00
|
|
|
content.Format = event.FormatHTML
|
2018-08-29 00:40:54 +03:00
|
|
|
for regex, replacer := range formatter.waReplFuncText {
|
|
|
|
content.Body = regex.ReplaceAllStringFunc(content.Body, replacer)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2021-10-22 20:14:34 +03:00
|
|
|
func (formatter *Formatter) ParseMatrix(html string) (string, []string) {
|
2020-07-31 14:30:58 +03:00
|
|
|
ctx := make(format.Context)
|
|
|
|
result := formatter.matrixHTMLParser.Parse(html, ctx)
|
2021-10-22 20:14:34 +03:00
|
|
|
mentionedJIDs, _ := ctx[mentionedJIDsContextKey].([]string)
|
2020-07-31 14:30:58 +03:00
|
|
|
return result, mentionedJIDs
|
2018-08-26 00:26:24 +03:00
|
|
|
}
|