forked from MirrorHub/mautrix-whatsapp
a948ea0146
See d578d1a610
Database upgrades from before v0.4.0 were squashed, users must update
to at least v0.4.0 before updating beyond this commit.
146 lines
5.2 KiB
Go
146 lines
5.2 KiB
Go
// mautrix-whatsapp - A Matrix-WhatsApp puppeting bridge.
|
|
// Copyright (C) 2021 Tulir Asokan
|
|
//
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// This program is distributed in the hope that it will be useful,
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Affero General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
// along with this program. If not, see <https://www.gnu.org/licenses/>.
|
|
|
|
package main
|
|
|
|
import (
|
|
"fmt"
|
|
"html"
|
|
"regexp"
|
|
"strings"
|
|
|
|
"go.mau.fi/whatsmeow/types"
|
|
|
|
"maunium.net/go/mautrix/event"
|
|
"maunium.net/go/mautrix/format"
|
|
"maunium.net/go/mautrix/id"
|
|
)
|
|
|
|
var italicRegex = regexp.MustCompile("([\\s>~*]|^)_(.+?)_([^a-zA-Z\\d]|$)")
|
|
var boldRegex = regexp.MustCompile("([\\s>_~]|^)\\*(.+?)\\*([^a-zA-Z\\d]|$)")
|
|
var strikethroughRegex = regexp.MustCompile("([\\s>_*]|^)~(.+?)~([^a-zA-Z\\d]|$)")
|
|
var codeBlockRegex = regexp.MustCompile("```(?:.|\n)+?```")
|
|
|
|
const mentionedJIDsContextKey = "net.maunium.whatsapp.mentioned_jids"
|
|
|
|
type Formatter struct {
|
|
bridge *WABridge
|
|
|
|
matrixHTMLParser *format.HTMLParser
|
|
|
|
waReplString map[*regexp.Regexp]string
|
|
waReplFunc map[*regexp.Regexp]func(string) string
|
|
waReplFuncText map[*regexp.Regexp]func(string) string
|
|
}
|
|
|
|
func NewFormatter(bridge *WABridge) *Formatter {
|
|
formatter := &Formatter{
|
|
bridge: bridge,
|
|
matrixHTMLParser: &format.HTMLParser{
|
|
TabsToSpaces: 4,
|
|
Newline: "\n",
|
|
|
|
PillConverter: func(displayname, mxid, eventID string, ctx format.Context) string {
|
|
if mxid[0] == '@' {
|
|
puppet := bridge.GetPuppetByMXID(id.UserID(mxid))
|
|
if puppet != nil {
|
|
jids, ok := ctx[mentionedJIDsContextKey].([]string)
|
|
if !ok {
|
|
ctx[mentionedJIDsContextKey] = []string{puppet.JID.String()}
|
|
} else {
|
|
ctx[mentionedJIDsContextKey] = append(jids, puppet.JID.String())
|
|
}
|
|
return "@" + puppet.JID.User
|
|
}
|
|
}
|
|
return mxid
|
|
},
|
|
BoldConverter: func(text string, _ format.Context) string { return fmt.Sprintf("*%s*", text) },
|
|
ItalicConverter: func(text string, _ format.Context) string { return fmt.Sprintf("_%s_", text) },
|
|
StrikethroughConverter: func(text string, _ format.Context) string { return fmt.Sprintf("~%s~", text) },
|
|
MonospaceConverter: func(text string, _ format.Context) string { return fmt.Sprintf("```%s```", text) },
|
|
MonospaceBlockConverter: func(text, language string, _ format.Context) string { return fmt.Sprintf("```%s```", text) },
|
|
},
|
|
waReplString: map[*regexp.Regexp]string{
|
|
italicRegex: "$1<em>$2</em>$3",
|
|
boldRegex: "$1<strong>$2</strong>$3",
|
|
strikethroughRegex: "$1<del>$2</del>$3",
|
|
},
|
|
}
|
|
formatter.waReplFunc = map[*regexp.Regexp]func(string) string{
|
|
codeBlockRegex: func(str string) string {
|
|
str = str[3 : len(str)-3]
|
|
if strings.ContainsRune(str, '\n') {
|
|
return fmt.Sprintf("<pre><code>%s</code></pre>", str)
|
|
}
|
|
return fmt.Sprintf("<code>%s</code>", str)
|
|
},
|
|
}
|
|
formatter.waReplFuncText = map[*regexp.Regexp]func(string) string{}
|
|
return formatter
|
|
}
|
|
|
|
func (formatter *Formatter) getMatrixInfoByJID(roomID id.RoomID, jid types.JID) (mxid id.UserID, displayname string) {
|
|
if puppet := formatter.bridge.GetPuppetByJID(jid); puppet != nil {
|
|
mxid = puppet.MXID
|
|
displayname = puppet.Displayname
|
|
}
|
|
if user := formatter.bridge.GetUserByJID(jid); user != nil {
|
|
mxid = user.MXID
|
|
member := formatter.bridge.StateStore.GetMember(roomID, user.MXID)
|
|
if len(member.Displayname) > 0 {
|
|
displayname = member.Displayname
|
|
}
|
|
}
|
|
return
|
|
}
|
|
|
|
func (formatter *Formatter) ParseWhatsApp(roomID id.RoomID, content *event.MessageEventContent, mentionedJIDs []string) {
|
|
output := html.EscapeString(content.Body)
|
|
for regex, replacement := range formatter.waReplString {
|
|
output = regex.ReplaceAllString(output, replacement)
|
|
}
|
|
for regex, replacer := range formatter.waReplFunc {
|
|
output = regex.ReplaceAllStringFunc(output, replacer)
|
|
}
|
|
for _, rawJID := range mentionedJIDs {
|
|
jid, err := types.ParseJID(rawJID)
|
|
if err != nil {
|
|
continue
|
|
} else if jid.Server == types.LegacyUserServer {
|
|
jid.Server = types.DefaultUserServer
|
|
}
|
|
mxid, displayname := formatter.getMatrixInfoByJID(roomID, jid)
|
|
number := "@" + jid.User
|
|
output = strings.ReplaceAll(output, number, fmt.Sprintf(`<a href="https://matrix.to/#/%s">%s</a>`, mxid, displayname))
|
|
content.Body = strings.ReplaceAll(content.Body, number, displayname)
|
|
}
|
|
if output != content.Body {
|
|
output = strings.ReplaceAll(output, "\n", "<br/>")
|
|
content.FormattedBody = output
|
|
content.Format = event.FormatHTML
|
|
for regex, replacer := range formatter.waReplFuncText {
|
|
content.Body = regex.ReplaceAllStringFunc(content.Body, replacer)
|
|
}
|
|
}
|
|
}
|
|
|
|
func (formatter *Formatter) ParseMatrix(html string) (string, []string) {
|
|
ctx := make(format.Context)
|
|
result := formatter.matrixHTMLParser.Parse(html, ctx)
|
|
mentionedJIDs, _ := ctx[mentionedJIDsContextKey].([]string)
|
|
return result, mentionedJIDs
|
|
}
|