mirror of
https://github.com/mattermost/mattermost.git
synced 2025-02-25 18:55:24 -06:00
Remote Cluster Service - provides ability for multiple Mattermost cluster instances to create a trusted connection with each other and exchange messages - trusted connections are managed via slash commands (for now) - facilitates features requiring inter-cluster communication, such as Shared Channels Shared Channels Service - provides ability to shared channels between one or more Mattermost cluster instances (using trusted connection) - sharing/unsharing of channels is managed via slash commands (for now)
175 lines
4.6 KiB
Go
175 lines
4.6 KiB
Go
// Copyright (c) 2015-present Mattermost, Inc. All Rights Reserved.
|
|
// See LICENSE.txt for license information.
|
|
|
|
package remotecluster
|
|
|
|
import (
|
|
"encoding/json"
|
|
"fmt"
|
|
"time"
|
|
|
|
"github.com/mattermost/mattermost-server/v5/model"
|
|
"github.com/mattermost/mattermost-server/v5/shared/mlog"
|
|
)
|
|
|
|
// pingLoop periodically sends a ping to all remote clusters.
|
|
func (rcs *Service) pingLoop(done <-chan struct{}) {
|
|
pingChan := make(chan *model.RemoteCluster, MaxConcurrentSends*2)
|
|
|
|
// create a thread pool to send pings concurrently to remotes.
|
|
for i := 0; i < MaxConcurrentSends; i++ {
|
|
go rcs.pingEmitter(pingChan, done)
|
|
}
|
|
|
|
go rcs.pingGenerator(pingChan, done)
|
|
}
|
|
|
|
func (rcs *Service) pingGenerator(pingChan chan *model.RemoteCluster, done <-chan struct{}) {
|
|
defer close(pingChan)
|
|
|
|
for {
|
|
start := time.Now()
|
|
|
|
// get all remotes, including any previously offline.
|
|
remotes, err := rcs.server.GetStore().RemoteCluster().GetAll(model.RemoteClusterQueryFilter{})
|
|
if err != nil {
|
|
rcs.server.GetLogger().Log(mlog.LvlRemoteClusterServiceError, "Ping remote cluster failed (could not get list of remotes)", mlog.Err(err))
|
|
select {
|
|
case <-time.After(PingFreq):
|
|
continue
|
|
case <-done:
|
|
return
|
|
}
|
|
}
|
|
|
|
for _, rc := range remotes {
|
|
if rc.SiteURL != "" { // filter out unconfirmed invites
|
|
pingChan <- rc
|
|
}
|
|
}
|
|
|
|
// try to maintain frequency
|
|
elapsed := time.Since(start)
|
|
if elapsed < PingFreq {
|
|
sleep := time.Until(start.Add(PingFreq))
|
|
select {
|
|
case <-time.After(sleep):
|
|
case <-done:
|
|
return
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// pingEmitter pulls Remotes from the ping queue (pingChan) and pings them.
|
|
// Pinging a remote cannot take longer than PingTimeoutMillis.
|
|
func (rcs *Service) pingEmitter(pingChan <-chan *model.RemoteCluster, done <-chan struct{}) {
|
|
for {
|
|
select {
|
|
case rc := <-pingChan:
|
|
if rc == nil {
|
|
return
|
|
}
|
|
|
|
online := rc.IsOnline()
|
|
|
|
if err := rcs.pingRemote(rc); err != nil {
|
|
rcs.server.GetLogger().Log(mlog.LvlRemoteClusterServiceWarn, "Remote cluster ping failed",
|
|
mlog.String("remote", rc.DisplayName),
|
|
mlog.String("remoteId", rc.RemoteId),
|
|
mlog.Err(err),
|
|
)
|
|
}
|
|
|
|
if online != rc.IsOnline() {
|
|
if metrics := rcs.server.GetMetrics(); metrics != nil {
|
|
metrics.IncrementRemoteClusterConnStateChangeCounter(rc.RemoteId, rc.IsOnline())
|
|
}
|
|
rcs.fireConnectionStateChgEvent(rc)
|
|
}
|
|
case <-done:
|
|
return
|
|
}
|
|
}
|
|
}
|
|
|
|
// pingRemote make a synchronous ping to a remote cluster. Return is error if ping is
|
|
// unsuccessful and nil on success.
|
|
func (rcs *Service) pingRemote(rc *model.RemoteCluster) error {
|
|
frame, err := makePingFrame(rc)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
url := fmt.Sprintf("%s/%s", rc.SiteURL, PingURL)
|
|
|
|
resp, err := rcs.sendFrameToRemote(PingTimeout, rc, frame, url)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
ping := model.RemoteClusterPing{}
|
|
err = json.Unmarshal(resp, &ping)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
if err := rcs.server.GetStore().RemoteCluster().SetLastPingAt(rc.RemoteId); err != nil {
|
|
rcs.server.GetLogger().Log(mlog.LvlRemoteClusterServiceError, "Failed to update LastPingAt for remote cluster",
|
|
mlog.String("remote", rc.DisplayName),
|
|
mlog.String("remoteId", rc.RemoteId),
|
|
mlog.Err(err),
|
|
)
|
|
}
|
|
rc.LastPingAt = model.GetMillis()
|
|
|
|
if metrics := rcs.server.GetMetrics(); metrics != nil {
|
|
sentAt := time.Unix(0, ping.SentAt*int64(time.Millisecond))
|
|
elapsed := time.Since(sentAt).Seconds()
|
|
metrics.ObserveRemoteClusterPingDuration(rc.RemoteId, elapsed)
|
|
|
|
// we approximate clock skew between remotes.
|
|
skew := elapsed/2 - float64(ping.RecvAt-ping.SentAt)/1000
|
|
metrics.ObserveRemoteClusterClockSkew(rc.RemoteId, skew)
|
|
}
|
|
|
|
rcs.server.GetLogger().Log(mlog.LvlRemoteClusterServiceDebug, "Remote cluster ping",
|
|
mlog.String("remote", rc.DisplayName),
|
|
mlog.String("remoteId", rc.RemoteId),
|
|
mlog.Int64("SentAt", ping.SentAt),
|
|
mlog.Int64("RecvAt", ping.RecvAt),
|
|
mlog.Int64("Diff", ping.RecvAt-ping.SentAt),
|
|
)
|
|
return nil
|
|
}
|
|
|
|
func makePingFrame(rc *model.RemoteCluster) (*model.RemoteClusterFrame, error) {
|
|
ping := model.RemoteClusterPing{
|
|
SentAt: model.GetMillis(),
|
|
}
|
|
pingRaw, err := json.Marshal(ping)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
|
|
msg := model.NewRemoteClusterMsg(PingTopic, pingRaw)
|
|
|
|
frame := &model.RemoteClusterFrame{
|
|
RemoteId: rc.RemoteId,
|
|
Msg: msg,
|
|
}
|
|
return frame, nil
|
|
}
|
|
|
|
func (rcs *Service) fireConnectionStateChgEvent(rc *model.RemoteCluster) {
|
|
rcs.mux.RLock()
|
|
listeners := make([]ConnectionStateListener, 0, len(rcs.connectionStateListeners))
|
|
for _, l := range rcs.connectionStateListeners {
|
|
listeners = append(listeners, l)
|
|
}
|
|
rcs.mux.RUnlock()
|
|
|
|
for _, l := range listeners {
|
|
l(rc, rc.IsOnline())
|
|
}
|
|
}
|