2017-08-02 15:21:35 +00:00
|
|
|
// Copyright 2017 Vector Creations Ltd
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package consumers
|
|
|
|
|
|
|
|
import (
|
2017-09-18 15:52:22 +00:00
|
|
|
"context"
|
2017-08-02 15:21:35 +00:00
|
|
|
"encoding/json"
|
2022-09-27 16:06:49 +00:00
|
|
|
"strings"
|
|
|
|
"time"
|
2017-08-02 15:21:35 +00:00
|
|
|
|
2021-03-24 10:25:24 +00:00
|
|
|
"github.com/getsentry/sentry-go"
|
2022-08-05 13:37:13 +00:00
|
|
|
"github.com/matrix-org/gomatrixserverlib"
|
|
|
|
"github.com/nats-io/nats.go"
|
|
|
|
"github.com/sirupsen/logrus"
|
|
|
|
log "github.com/sirupsen/logrus"
|
2022-09-27 16:06:49 +00:00
|
|
|
"github.com/tidwall/gjson"
|
2022-08-05 13:37:13 +00:00
|
|
|
|
2020-06-12 13:55:57 +00:00
|
|
|
"github.com/matrix-org/dendrite/internal/eventutil"
|
2022-09-27 16:06:49 +00:00
|
|
|
"github.com/matrix-org/dendrite/internal/fulltext"
|
2020-12-02 17:41:00 +00:00
|
|
|
"github.com/matrix-org/dendrite/setup/config"
|
2022-01-05 17:44:49 +00:00
|
|
|
"github.com/matrix-org/dendrite/setup/jetstream"
|
2021-01-26 12:56:20 +00:00
|
|
|
"github.com/matrix-org/dendrite/setup/process"
|
2021-01-08 16:59:06 +00:00
|
|
|
"github.com/matrix-org/dendrite/syncapi/notifier"
|
2017-08-02 15:21:35 +00:00
|
|
|
"github.com/matrix-org/dendrite/syncapi/storage"
|
2019-07-12 14:59:53 +00:00
|
|
|
"github.com/matrix-org/dendrite/syncapi/types"
|
2017-08-02 15:21:35 +00:00
|
|
|
)
|
|
|
|
|
2017-10-11 17:13:43 +00:00
|
|
|
// OutputClientDataConsumer consumes events that originated in the client API server.
|
|
|
|
type OutputClientDataConsumer struct {
|
2022-09-27 16:06:49 +00:00
|
|
|
ctx context.Context
|
|
|
|
jetstream nats.JetStreamContext
|
|
|
|
nats *nats.Conn
|
|
|
|
durable string
|
|
|
|
topic string
|
|
|
|
topicReIndex string
|
|
|
|
db storage.Database
|
|
|
|
stream types.StreamProvider
|
|
|
|
notifier *notifier.Notifier
|
|
|
|
serverName gomatrixserverlib.ServerName
|
|
|
|
fts *fulltext.Search
|
|
|
|
cfg *config.SyncAPI
|
2017-08-02 15:21:35 +00:00
|
|
|
}
|
|
|
|
|
2017-10-11 17:13:43 +00:00
|
|
|
// NewOutputClientDataConsumer creates a new OutputClientData consumer. Call Start() to begin consuming from room servers.
|
|
|
|
func NewOutputClientDataConsumer(
|
2021-01-26 12:56:20 +00:00
|
|
|
process *process.ProcessContext,
|
2020-08-10 13:18:04 +00:00
|
|
|
cfg *config.SyncAPI,
|
2022-01-05 17:44:49 +00:00
|
|
|
js nats.JetStreamContext,
|
2022-09-27 16:06:49 +00:00
|
|
|
nats *nats.Conn,
|
2020-01-03 14:07:05 +00:00
|
|
|
store storage.Database,
|
2021-01-08 16:59:06 +00:00
|
|
|
notifier *notifier.Notifier,
|
|
|
|
stream types.StreamProvider,
|
2022-09-27 16:06:49 +00:00
|
|
|
fts *fulltext.Search,
|
2017-10-11 17:13:43 +00:00
|
|
|
) *OutputClientDataConsumer {
|
2022-01-05 17:44:49 +00:00
|
|
|
return &OutputClientDataConsumer{
|
2022-09-27 16:06:49 +00:00
|
|
|
ctx: process.Context(),
|
|
|
|
jetstream: js,
|
|
|
|
topic: cfg.Matrix.JetStream.Prefixed(jetstream.OutputClientData),
|
|
|
|
topicReIndex: cfg.Matrix.JetStream.Prefixed(jetstream.InputFulltextReindex),
|
|
|
|
durable: cfg.Matrix.JetStream.Durable("SyncAPIAccountDataConsumer"),
|
|
|
|
nats: nats,
|
|
|
|
db: store,
|
|
|
|
notifier: notifier,
|
|
|
|
stream: stream,
|
|
|
|
serverName: cfg.Matrix.ServerName,
|
|
|
|
fts: fts,
|
|
|
|
cfg: cfg,
|
2017-08-02 15:21:35 +00:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Start consuming from room servers
|
2017-10-11 17:13:43 +00:00
|
|
|
func (s *OutputClientDataConsumer) Start() error {
|
2022-09-27 16:06:49 +00:00
|
|
|
_, err := s.nats.Subscribe(s.topicReIndex, func(msg *nats.Msg) {
|
|
|
|
if err := msg.Ack(); err != nil {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if !s.cfg.Fulltext.Enabled {
|
|
|
|
logrus.Warn("Fulltext indexing is disabled")
|
|
|
|
return
|
|
|
|
}
|
|
|
|
ctx := context.Background()
|
|
|
|
logrus.Debugf("Starting to index events")
|
|
|
|
var offset int
|
|
|
|
start := time.Now()
|
|
|
|
count := 0
|
|
|
|
var id int64 = 0
|
|
|
|
for {
|
|
|
|
evs, err := s.db.ReIndex(ctx, 1000, id)
|
|
|
|
if err != nil {
|
|
|
|
logrus.WithError(err).Errorf("unable to get events to index")
|
|
|
|
return
|
|
|
|
}
|
|
|
|
if len(evs) == 0 {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
logrus.Debugf("Indexing %d events", len(evs))
|
|
|
|
elements := make([]fulltext.IndexElement, 0, len(evs))
|
|
|
|
|
|
|
|
for streamPos, ev := range evs {
|
|
|
|
id = streamPos
|
|
|
|
e := fulltext.IndexElement{
|
|
|
|
EventID: ev.EventID(),
|
|
|
|
RoomID: ev.RoomID(),
|
|
|
|
StreamPosition: streamPos,
|
|
|
|
}
|
|
|
|
e.SetContentType(ev.Type())
|
|
|
|
|
|
|
|
switch ev.Type() {
|
|
|
|
case "m.room.message":
|
|
|
|
e.Content = gjson.GetBytes(ev.Content(), "body").String()
|
|
|
|
case gomatrixserverlib.MRoomName:
|
|
|
|
e.Content = gjson.GetBytes(ev.Content(), "name").String()
|
|
|
|
case gomatrixserverlib.MRoomTopic:
|
|
|
|
e.Content = gjson.GetBytes(ev.Content(), "topic").String()
|
|
|
|
default:
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
if strings.TrimSpace(e.Content) == "" {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
elements = append(elements, e)
|
|
|
|
}
|
|
|
|
if err = s.fts.Index(elements...); err != nil {
|
|
|
|
logrus.WithError(err).Error("unable to index events")
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
offset += len(evs)
|
|
|
|
count += len(elements)
|
|
|
|
}
|
|
|
|
logrus.Debugf("Indexed %d events in %v", count, time.Since(start))
|
|
|
|
})
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2022-02-02 13:32:48 +00:00
|
|
|
return jetstream.JetStreamConsumer(
|
2022-08-31 11:21:56 +00:00
|
|
|
s.ctx, s.jetstream, s.topic, s.durable, 1,
|
|
|
|
s.onMessage, nats.DeliverAll(), nats.ManualAck(),
|
2022-02-02 13:32:48 +00:00
|
|
|
)
|
2017-08-02 15:21:35 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// onMessage is called when the sync server receives a new event from the client API server output log.
|
|
|
|
// It is not safe for this function to be called from multiple goroutines, or else the
|
|
|
|
// sync stream position may race and be incorrectly calculated.
|
2022-08-31 11:21:56 +00:00
|
|
|
func (s *OutputClientDataConsumer) onMessage(ctx context.Context, msgs []*nats.Msg) bool {
|
|
|
|
msg := msgs[0] // Guaranteed to exist if onMessage is called
|
2022-02-02 13:32:48 +00:00
|
|
|
// Parse out the event JSON
|
|
|
|
userID := msg.Header.Get(jetstream.UserID)
|
|
|
|
var output eventutil.AccountData
|
|
|
|
if err := json.Unmarshal(msg.Data, &output); err != nil {
|
|
|
|
// If the message was invalid, log it and move on to the next message in the stream
|
|
|
|
log.WithError(err).Errorf("client API server output log: message parse failure")
|
|
|
|
sentry.CaptureException(err)
|
|
|
|
return true
|
|
|
|
}
|
2017-08-02 15:21:35 +00:00
|
|
|
|
2022-02-02 13:32:48 +00:00
|
|
|
log.WithFields(log.Fields{
|
|
|
|
"type": output.Type,
|
|
|
|
"room_id": output.RoomID,
|
|
|
|
}).Debug("Received data from client API server")
|
2022-01-05 17:44:49 +00:00
|
|
|
|
2022-02-02 13:32:48 +00:00
|
|
|
streamPos, err := s.db.UpsertAccountData(
|
|
|
|
s.ctx, userID, output.RoomID, output.Type,
|
|
|
|
)
|
|
|
|
if err != nil {
|
|
|
|
sentry.CaptureException(err)
|
|
|
|
log.WithFields(log.Fields{
|
|
|
|
"type": output.Type,
|
|
|
|
"room_id": output.RoomID,
|
|
|
|
log.ErrorKey: err,
|
2022-08-05 13:37:13 +00:00
|
|
|
}).Errorf("could not save account data")
|
|
|
|
return false
|
2022-02-02 13:32:48 +00:00
|
|
|
}
|
2017-08-02 15:21:35 +00:00
|
|
|
|
2022-04-07 14:08:19 +00:00
|
|
|
if output.IgnoredUsers != nil {
|
|
|
|
if err := s.db.UpdateIgnoresForUser(ctx, userID, output.IgnoredUsers); err != nil {
|
|
|
|
log.WithError(err).WithFields(logrus.Fields{
|
|
|
|
"user_id": userID,
|
|
|
|
}).Errorf("Failed to update ignored users")
|
|
|
|
sentry.CaptureException(err)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-02-02 13:32:48 +00:00
|
|
|
s.stream.Advance(streamPos)
|
|
|
|
s.notifier.OnNewAccountData(userID, types.StreamingToken{AccountDataPosition: streamPos})
|
2017-08-02 15:21:35 +00:00
|
|
|
|
2022-02-02 13:32:48 +00:00
|
|
|
return true
|
2017-08-02 15:21:35 +00:00
|
|
|
}
|