2017-06-28 17:10:17 +02:00
|
|
|
// Copyright 2017 Vector Creations Ltd
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package queue
|
|
|
|
|
|
|
|
import (
|
2020-07-01 12:46:38 +02:00
|
|
|
"context"
|
2020-06-10 17:54:43 +02:00
|
|
|
"crypto/ed25519"
|
2020-07-01 12:46:38 +02:00
|
|
|
"encoding/json"
|
2017-06-28 17:10:17 +02:00
|
|
|
"fmt"
|
|
|
|
"sync"
|
2020-09-03 22:17:55 +02:00
|
|
|
"time"
|
2017-06-28 17:10:17 +02:00
|
|
|
|
2020-07-22 18:01:29 +02:00
|
|
|
"github.com/matrix-org/dendrite/federationsender/statistics"
|
2020-07-01 12:46:38 +02:00
|
|
|
"github.com/matrix-org/dendrite/federationsender/storage"
|
2020-06-10 17:54:43 +02:00
|
|
|
"github.com/matrix-org/dendrite/roomserver/api"
|
2017-06-28 17:10:17 +02:00
|
|
|
"github.com/matrix-org/gomatrixserverlib"
|
2017-11-16 11:12:02 +01:00
|
|
|
log "github.com/sirupsen/logrus"
|
2020-08-13 15:23:37 +02:00
|
|
|
"github.com/tidwall/gjson"
|
2017-06-28 17:10:17 +02:00
|
|
|
)
|
|
|
|
|
|
|
|
// OutgoingQueues is a collection of queues for sending transactions to other
|
|
|
|
// matrix servers
|
|
|
|
type OutgoingQueues struct {
|
2020-07-01 12:46:38 +02:00
|
|
|
db storage.Database
|
2020-12-02 16:10:03 +01:00
|
|
|
disabled bool
|
2020-06-10 17:54:43 +02:00
|
|
|
rsAPI api.RoomserverInternalAPI
|
Improve federation sender performance, implement backoff and blacklisting, fix up invites a bit (#1007)
* Improve federation sender performance and behaviour, add backoff
* Tweaks
* Tweaks
* Tweaks
* Take copies of events before passing to destination queues
* Don't accidentally drop queued messages
* Don't take copies again
* Tidy up a bit
* Break out statistics (tracked component-wide), report success and failures from Perform actions
* Fix comment, use atomic add
* Improve logic a bit, don't block on wakeup, move idle check
* Don't retry sucessful invites, don't dispatch sendEvent, sendInvite etc
* Dedupe destinations, fix other bug hopefully
* Dispatch sends again
* Federation sender to ignore invites that are destined locally
* Loopback invite events
* Remodel a bit with channels
* Linter
* Only loopback invite event if we know the room
* We should tell other resident servers about the invite if we know about the room
* Correct invite signing
* Fix invite loopback
* Check HTTP response codes, push new invites to front of queue
* Review comments
2020-05-07 13:42:06 +02:00
|
|
|
origin gomatrixserverlib.ServerName
|
|
|
|
client *gomatrixserverlib.FederationClient
|
2020-07-22 18:01:29 +02:00
|
|
|
statistics *statistics.Statistics
|
2020-06-10 17:54:43 +02:00
|
|
|
signing *SigningInfo
|
Improve federation sender performance, implement backoff and blacklisting, fix up invites a bit (#1007)
* Improve federation sender performance and behaviour, add backoff
* Tweaks
* Tweaks
* Tweaks
* Take copies of events before passing to destination queues
* Don't accidentally drop queued messages
* Don't take copies again
* Tidy up a bit
* Break out statistics (tracked component-wide), report success and failures from Perform actions
* Fix comment, use atomic add
* Improve logic a bit, don't block on wakeup, move idle check
* Don't retry sucessful invites, don't dispatch sendEvent, sendInvite etc
* Dedupe destinations, fix other bug hopefully
* Dispatch sends again
* Federation sender to ignore invites that are destined locally
* Loopback invite events
* Remodel a bit with channels
* Linter
* Only loopback invite event if we know the room
* We should tell other resident servers about the invite if we know about the room
* Correct invite signing
* Fix invite loopback
* Check HTTP response codes, push new invites to front of queue
* Review comments
2020-05-07 13:42:06 +02:00
|
|
|
queuesMutex sync.Mutex // protects the below
|
2017-06-28 17:10:17 +02:00
|
|
|
queues map[gomatrixserverlib.ServerName]*destinationQueue
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewOutgoingQueues makes a new OutgoingQueues
|
2020-04-28 11:53:07 +02:00
|
|
|
func NewOutgoingQueues(
|
2020-07-01 12:46:38 +02:00
|
|
|
db storage.Database,
|
2020-12-02 16:10:03 +01:00
|
|
|
disabled bool,
|
2020-04-28 11:53:07 +02:00
|
|
|
origin gomatrixserverlib.ServerName,
|
|
|
|
client *gomatrixserverlib.FederationClient,
|
2020-06-10 17:54:43 +02:00
|
|
|
rsAPI api.RoomserverInternalAPI,
|
2020-07-22 18:01:29 +02:00
|
|
|
statistics *statistics.Statistics,
|
2020-06-10 17:54:43 +02:00
|
|
|
signing *SigningInfo,
|
2020-04-28 11:53:07 +02:00
|
|
|
) *OutgoingQueues {
|
2020-07-03 12:49:49 +02:00
|
|
|
queues := &OutgoingQueues{
|
2020-12-02 16:10:03 +01:00
|
|
|
disabled: disabled,
|
2020-07-01 12:46:38 +02:00
|
|
|
db: db,
|
2020-06-10 17:54:43 +02:00
|
|
|
rsAPI: rsAPI,
|
2020-04-28 11:53:07 +02:00
|
|
|
origin: origin,
|
|
|
|
client: client,
|
Improve federation sender performance, implement backoff and blacklisting, fix up invites a bit (#1007)
* Improve federation sender performance and behaviour, add backoff
* Tweaks
* Tweaks
* Tweaks
* Take copies of events before passing to destination queues
* Don't accidentally drop queued messages
* Don't take copies again
* Tidy up a bit
* Break out statistics (tracked component-wide), report success and failures from Perform actions
* Fix comment, use atomic add
* Improve logic a bit, don't block on wakeup, move idle check
* Don't retry sucessful invites, don't dispatch sendEvent, sendInvite etc
* Dedupe destinations, fix other bug hopefully
* Dispatch sends again
* Federation sender to ignore invites that are destined locally
* Loopback invite events
* Remodel a bit with channels
* Linter
* Only loopback invite event if we know the room
* We should tell other resident servers about the invite if we know about the room
* Correct invite signing
* Fix invite loopback
* Check HTTP response codes, push new invites to front of queue
* Review comments
2020-05-07 13:42:06 +02:00
|
|
|
statistics: statistics,
|
2020-06-10 17:54:43 +02:00
|
|
|
signing: signing,
|
2020-04-28 11:53:07 +02:00
|
|
|
queues: map[gomatrixserverlib.ServerName]*destinationQueue{},
|
2017-06-28 17:10:17 +02:00
|
|
|
}
|
2020-07-03 12:49:49 +02:00
|
|
|
// Look up which servers we have pending items for and then rehydrate those queues.
|
2020-12-02 16:10:03 +01:00
|
|
|
if !disabled {
|
|
|
|
time.AfterFunc(time.Second*5, func() {
|
|
|
|
serverNames := map[gomatrixserverlib.ServerName]struct{}{}
|
|
|
|
if names, err := db.GetPendingPDUServerNames(context.Background()); err == nil {
|
|
|
|
for _, serverName := range names {
|
|
|
|
serverNames[serverName] = struct{}{}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
log.WithError(err).Error("Failed to get PDU server names for destination queue hydration")
|
2020-09-03 22:17:55 +02:00
|
|
|
}
|
2020-12-02 16:10:03 +01:00
|
|
|
if names, err := db.GetPendingEDUServerNames(context.Background()); err == nil {
|
|
|
|
for _, serverName := range names {
|
|
|
|
serverNames[serverName] = struct{}{}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
log.WithError(err).Error("Failed to get EDU server names for destination queue hydration")
|
2020-09-03 22:17:55 +02:00
|
|
|
}
|
2020-12-02 16:10:03 +01:00
|
|
|
for serverName := range serverNames {
|
|
|
|
if !queues.getQueue(serverName).statistics.Blacklisted() {
|
|
|
|
queues.getQueue(serverName).wakeQueueIfNeeded()
|
|
|
|
}
|
2020-09-03 22:17:55 +02:00
|
|
|
}
|
2020-12-02 16:10:03 +01:00
|
|
|
})
|
|
|
|
}
|
2020-07-03 12:49:49 +02:00
|
|
|
return queues
|
2017-06-28 17:10:17 +02:00
|
|
|
}
|
|
|
|
|
2020-06-10 17:54:43 +02:00
|
|
|
// TODO: Move this somewhere useful for other components as we often need to ferry these 3 variables
|
|
|
|
// around together
|
|
|
|
type SigningInfo struct {
|
|
|
|
ServerName gomatrixserverlib.ServerName
|
|
|
|
KeyID gomatrixserverlib.KeyID
|
|
|
|
PrivateKey ed25519.PrivateKey
|
|
|
|
}
|
|
|
|
|
Improve federation sender performance, implement backoff and blacklisting, fix up invites a bit (#1007)
* Improve federation sender performance and behaviour, add backoff
* Tweaks
* Tweaks
* Tweaks
* Take copies of events before passing to destination queues
* Don't accidentally drop queued messages
* Don't take copies again
* Tidy up a bit
* Break out statistics (tracked component-wide), report success and failures from Perform actions
* Fix comment, use atomic add
* Improve logic a bit, don't block on wakeup, move idle check
* Don't retry sucessful invites, don't dispatch sendEvent, sendInvite etc
* Dedupe destinations, fix other bug hopefully
* Dispatch sends again
* Federation sender to ignore invites that are destined locally
* Loopback invite events
* Remodel a bit with channels
* Linter
* Only loopback invite event if we know the room
* We should tell other resident servers about the invite if we know about the room
* Correct invite signing
* Fix invite loopback
* Check HTTP response codes, push new invites to front of queue
* Review comments
2020-05-07 13:42:06 +02:00
|
|
|
func (oqs *OutgoingQueues) getQueue(destination gomatrixserverlib.ServerName) *destinationQueue {
|
|
|
|
oqs.queuesMutex.Lock()
|
|
|
|
defer oqs.queuesMutex.Unlock()
|
|
|
|
oq := oqs.queues[destination]
|
|
|
|
if oq == nil {
|
|
|
|
oq = &destinationQueue{
|
2020-07-03 17:31:56 +02:00
|
|
|
db: oqs.db,
|
|
|
|
rsAPI: oqs.rsAPI,
|
|
|
|
origin: oqs.origin,
|
|
|
|
destination: destination,
|
|
|
|
client: oqs.client,
|
|
|
|
statistics: oqs.statistics.ForServer(destination),
|
2020-07-07 17:36:10 +02:00
|
|
|
notifyPDUs: make(chan bool, 1),
|
2020-07-20 17:55:20 +02:00
|
|
|
notifyEDUs: make(chan bool, 1),
|
2020-07-03 17:31:56 +02:00
|
|
|
interruptBackoff: make(chan bool),
|
|
|
|
signing: oqs.signing,
|
Improve federation sender performance, implement backoff and blacklisting, fix up invites a bit (#1007)
* Improve federation sender performance and behaviour, add backoff
* Tweaks
* Tweaks
* Tweaks
* Take copies of events before passing to destination queues
* Don't accidentally drop queued messages
* Don't take copies again
* Tidy up a bit
* Break out statistics (tracked component-wide), report success and failures from Perform actions
* Fix comment, use atomic add
* Improve logic a bit, don't block on wakeup, move idle check
* Don't retry sucessful invites, don't dispatch sendEvent, sendInvite etc
* Dedupe destinations, fix other bug hopefully
* Dispatch sends again
* Federation sender to ignore invites that are destined locally
* Loopback invite events
* Remodel a bit with channels
* Linter
* Only loopback invite event if we know the room
* We should tell other resident servers about the invite if we know about the room
* Correct invite signing
* Fix invite loopback
* Check HTTP response codes, push new invites to front of queue
* Review comments
2020-05-07 13:42:06 +02:00
|
|
|
}
|
|
|
|
oqs.queues[destination] = oq
|
|
|
|
}
|
|
|
|
return oq
|
|
|
|
}
|
|
|
|
|
2017-06-28 17:10:17 +02:00
|
|
|
// SendEvent sends an event to the destinations
|
|
|
|
func (oqs *OutgoingQueues) SendEvent(
|
2020-03-27 17:28:22 +01:00
|
|
|
ev *gomatrixserverlib.HeaderedEvent, origin gomatrixserverlib.ServerName,
|
2017-06-28 17:10:17 +02:00
|
|
|
destinations []gomatrixserverlib.ServerName,
|
|
|
|
) error {
|
2020-12-02 16:10:03 +01:00
|
|
|
if oqs.disabled {
|
|
|
|
return fmt.Errorf("federation is disabled")
|
|
|
|
}
|
2017-06-28 17:10:17 +02:00
|
|
|
if origin != oqs.origin {
|
2018-08-10 17:26:57 +02:00
|
|
|
// TODO: Support virtual hosting; gh issue #577.
|
2017-06-28 17:10:17 +02:00
|
|
|
return fmt.Errorf(
|
|
|
|
"sendevent: unexpected server to send as: got %q expected %q",
|
|
|
|
origin, oqs.origin,
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
2020-08-13 15:23:37 +02:00
|
|
|
// Deduplicate destinations and remove the origin from the list of
|
|
|
|
// destinations just to be sure.
|
|
|
|
destmap := map[gomatrixserverlib.ServerName]struct{}{}
|
|
|
|
for _, d := range destinations {
|
|
|
|
destmap[d] = struct{}{}
|
|
|
|
}
|
|
|
|
delete(destmap, oqs.origin)
|
|
|
|
|
|
|
|
// Check if any of the destinations are prohibited by server ACLs.
|
|
|
|
for destination := range destmap {
|
2020-09-04 11:40:58 +02:00
|
|
|
if api.IsServerBannedFromRoom(
|
2020-08-13 15:23:37 +02:00
|
|
|
context.TODO(),
|
2020-09-04 11:40:58 +02:00
|
|
|
oqs.rsAPI,
|
2020-08-13 15:23:37 +02:00
|
|
|
ev.RoomID(),
|
|
|
|
destination,
|
|
|
|
) {
|
|
|
|
delete(destmap, destination)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// If there are no remaining destinations then give up.
|
|
|
|
if len(destmap) == 0 {
|
2020-06-12 16:11:33 +02:00
|
|
|
return nil
|
|
|
|
}
|
2017-06-28 17:10:17 +02:00
|
|
|
|
|
|
|
log.WithFields(log.Fields{
|
2020-08-13 15:23:37 +02:00
|
|
|
"destinations": len(destmap), "event": ev.EventID(),
|
2020-08-07 16:00:23 +02:00
|
|
|
}).Infof("Sending event")
|
2017-06-28 17:10:17 +02:00
|
|
|
|
2020-07-01 12:46:38 +02:00
|
|
|
headeredJSON, err := json.Marshal(ev)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("json.Marshal: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
nid, err := oqs.db.StoreJSON(context.TODO(), string(headeredJSON))
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("sendevent: oqs.db.StoreJSON: %w", err)
|
|
|
|
}
|
|
|
|
|
2020-08-13 15:23:37 +02:00
|
|
|
for destination := range destmap {
|
2020-07-01 12:46:38 +02:00
|
|
|
oqs.getQueue(destination).sendEvent(nid)
|
2017-06-28 17:10:17 +02:00
|
|
|
}
|
2018-08-10 17:26:57 +02:00
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-07-14 13:33:37 +02:00
|
|
|
// SendEDU sends an EDU event to the destinations.
|
2018-08-10 17:26:57 +02:00
|
|
|
func (oqs *OutgoingQueues) SendEDU(
|
|
|
|
e *gomatrixserverlib.EDU, origin gomatrixserverlib.ServerName,
|
|
|
|
destinations []gomatrixserverlib.ServerName,
|
|
|
|
) error {
|
2020-12-02 16:10:03 +01:00
|
|
|
if oqs.disabled {
|
|
|
|
return fmt.Errorf("federation is disabled")
|
|
|
|
}
|
2018-08-10 17:26:57 +02:00
|
|
|
if origin != oqs.origin {
|
|
|
|
// TODO: Support virtual hosting; gh issue #577.
|
|
|
|
return fmt.Errorf(
|
|
|
|
"sendevent: unexpected server to send as: got %q expected %q",
|
|
|
|
origin, oqs.origin,
|
|
|
|
)
|
|
|
|
}
|
|
|
|
|
2020-08-13 15:23:37 +02:00
|
|
|
// Deduplicate destinations and remove the origin from the list of
|
|
|
|
// destinations just to be sure.
|
|
|
|
destmap := map[gomatrixserverlib.ServerName]struct{}{}
|
|
|
|
for _, d := range destinations {
|
|
|
|
destmap[d] = struct{}{}
|
|
|
|
}
|
|
|
|
delete(destmap, oqs.origin)
|
2018-08-10 17:26:57 +02:00
|
|
|
|
2020-08-13 15:23:37 +02:00
|
|
|
// There is absolutely no guarantee that the EDU will have a room_id
|
|
|
|
// field, as it is not required by the spec. However, if it *does*
|
|
|
|
// (e.g. typing notifications) then we should try to make sure we don't
|
|
|
|
// bother sending them to servers that are prohibited by the server
|
|
|
|
// ACLs.
|
|
|
|
if result := gjson.GetBytes(e.Content, "room_id"); result.Exists() {
|
|
|
|
for destination := range destmap {
|
2020-09-04 11:40:58 +02:00
|
|
|
if api.IsServerBannedFromRoom(
|
2020-08-13 15:23:37 +02:00
|
|
|
context.TODO(),
|
2020-09-04 11:40:58 +02:00
|
|
|
oqs.rsAPI,
|
2020-08-13 15:23:37 +02:00
|
|
|
result.Str,
|
|
|
|
destination,
|
|
|
|
) {
|
|
|
|
delete(destmap, destination)
|
|
|
|
}
|
|
|
|
}
|
2019-07-01 17:04:49 +02:00
|
|
|
}
|
2018-08-10 17:26:57 +02:00
|
|
|
|
2020-08-13 15:23:37 +02:00
|
|
|
// If there are no remaining destinations then give up.
|
|
|
|
if len(destmap) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
log.WithFields(log.Fields{
|
|
|
|
"destinations": len(destmap), "edu_type": e.Type,
|
|
|
|
}).Info("Sending EDU event")
|
|
|
|
|
2020-07-20 17:55:20 +02:00
|
|
|
ephemeralJSON, err := json.Marshal(e)
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("json.Marshal: %w", err)
|
|
|
|
}
|
|
|
|
|
|
|
|
nid, err := oqs.db.StoreJSON(context.TODO(), string(ephemeralJSON))
|
|
|
|
if err != nil {
|
|
|
|
return fmt.Errorf("sendevent: oqs.db.StoreJSON: %w", err)
|
|
|
|
}
|
|
|
|
|
2020-08-13 15:23:37 +02:00
|
|
|
for destination := range destmap {
|
2020-07-20 17:55:20 +02:00
|
|
|
oqs.getQueue(destination).sendEDU(nid)
|
2018-08-10 17:26:57 +02:00
|
|
|
}
|
|
|
|
|
2017-06-28 17:10:17 +02:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-06-01 19:34:08 +02:00
|
|
|
// RetryServer attempts to resend events to the given server if we had given up.
|
|
|
|
func (oqs *OutgoingQueues) RetryServer(srv gomatrixserverlib.ServerName) {
|
2020-12-02 16:10:03 +01:00
|
|
|
if oqs.disabled {
|
|
|
|
return
|
|
|
|
}
|
2020-07-03 17:31:56 +02:00
|
|
|
q := oqs.getQueue(srv)
|
2020-06-01 19:34:08 +02:00
|
|
|
if q == nil {
|
|
|
|
return
|
|
|
|
}
|
2020-07-03 17:31:56 +02:00
|
|
|
q.wakeQueueIfNeeded()
|
2020-06-01 19:34:08 +02:00
|
|
|
}
|