components-contrib/pubsub/mqtt/mqtt.go

479 lines
14 KiB
Go

/*
Copyright 2021 The Dapr Authors
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
*/
package mqtt
import (
"context"
"crypto/tls"
"errors"
"fmt"
"net/url"
"regexp"
"strconv"
"strings"
"sync"
"time"
mqtt "github.com/eclipse/paho.mqtt.golang"
"go.uber.org/ratelimit"
"github.com/dapr/components-contrib/pubsub"
"github.com/dapr/kit/logger"
)
const (
// errors.
errorMsgPrefix = "mqtt pub sub error:"
)
// mqttPubSub type allows sending and receiving data to/from MQTT broker.
type mqttPubSub struct {
producer mqtt.Client
consumer mqtt.Client
metadata *metadata
logger logger.Logger
topics map[string]mqttPubSubSubscription
retriableErrLimit ratelimit.Limiter
subscribingLock sync.RWMutex
ctx context.Context
cancel context.CancelFunc
}
type mqttPubSubSubscription struct {
handler pubsub.Handler
alias string
matcher func(topic string) bool
}
// NewMQTTPubSub returns a new mqttPubSub instance.
func NewMQTTPubSub(logger logger.Logger) pubsub.PubSub {
return &mqttPubSub{
logger: logger,
subscribingLock: sync.RWMutex{},
}
}
// Init parses metadata and creates a new Pub Sub client.
func (m *mqttPubSub) Init(metadata pubsub.Metadata) error {
mqttMeta, err := parseMQTTMetaData(metadata, m.logger)
if err != nil {
return err
}
m.metadata = mqttMeta
if m.metadata.maxRetriableErrorsPerSec > 0 {
m.retriableErrLimit = ratelimit.New(m.metadata.maxRetriableErrorsPerSec)
} else {
m.retriableErrLimit = ratelimit.NewUnlimited()
}
m.ctx, m.cancel = context.WithCancel(context.Background())
// mqtt broker allows only one connection at a given time from a clientID.
producerClientID := m.metadata.producerID
if producerClientID == "" {
// for backwards-compatibility; see: https://github.com/dapr/components-contrib/pull/2104
producerClientID = m.metadata.consumerID + "-producer"
}
connCtx, connCancel := context.WithTimeout(m.ctx, defaultWait)
p, err := m.connect(connCtx, producerClientID)
connCancel()
if err != nil {
return err
}
m.producer = p
m.topics = make(map[string]mqttPubSubSubscription)
m.logger.Debug("mqtt message bus initialization complete")
return nil
}
// Publish the topic to mqtt pub sub.
func (m *mqttPubSub) Publish(_ context.Context, req *pubsub.PublishRequest) error {
if req.Topic == "" {
return errors.New("topic name is empty")
}
// Note this can contain PII
// m.logger.Debugf("mqtt publishing topic %s with data: %v", req.Topic, req.Data)
m.logger.Debugf("mqtt publishing topic %s", req.Topic)
retain := m.metadata.retain
if val, ok := req.Metadata[mqttRetain]; ok && val != "" {
var err error
retain, err = strconv.ParseBool(val)
if err != nil {
return fmt.Errorf("mqtt invalid retain %s, %s", val, err)
}
}
token := m.producer.Publish(req.Topic, m.metadata.qos, retain, req.Data)
t := time.NewTimer(defaultWait)
defer func() {
if !t.Stop() {
<-t.C
}
}()
select {
case <-token.Done():
// Operation completed
case <-m.ctx.Done():
// Context canceled
return m.ctx.Err()
case <-t.C:
return fmt.Errorf("mqtt timeout while publishing")
}
if !token.WaitTimeout(defaultWait) || token.Error() != nil {
return fmt.Errorf("mqtt error from publish: %v", token.Error())
}
return nil
}
// Subscribe to the mqtt pub sub topic.
func (m *mqttPubSub) Subscribe(ctx context.Context, req pubsub.SubscribeRequest, handler pubsub.Handler) error {
if ctxErr := m.ctx.Err(); ctxErr != nil {
// If the global context has been canceled, we do not allow more subscriptions
return ctxErr
}
if req.Topic == "" {
return errors.New("topic name is empty")
}
m.subscribingLock.Lock()
defer m.subscribingLock.Unlock()
// Reset subscription if active
m.resetSubscription()
// Add the topic then start the subscription
m.addTopic(req.Topic, handler)
// Use the global context here to maintain the connection
m.startSubscription(m.ctx)
// Listen for context cancelation to remove the subscription
go func() {
select {
case <-ctx.Done():
case <-m.ctx.Done():
}
m.subscribingLock.Lock()
defer m.subscribingLock.Unlock()
// If this is the last subscription or if the global context is done, close the connection entirely
if len(m.topics) <= 1 || m.ctx.Err() != nil {
m.closeSubscription()
delete(m.topics, req.Topic)
return
}
// Reconnect with one less topic
m.resetSubscription()
delete(m.topics, req.Topic)
m.startSubscription(m.ctx)
}()
return nil
}
func (m *mqttPubSub) closeSubscription() {
m.consumer.Disconnect(5)
m.consumer = nil
}
// resetSubscription closes the subscription if it's currently active
func (m *mqttPubSub) resetSubscription() {
if m.consumer != nil && m.consumer.IsConnectionOpen() {
m.logger.Infof("re-initializing the subscriber")
m.closeSubscription()
} else {
m.logger.Infof("initializing the subscriber")
}
}
// startSubscription connects to the server and begins receiving messages
func (m *mqttPubSub) startSubscription(ctx context.Context) error {
// mqtt broker allows only one connection at a given time from a clientID.
consumerClientID := m.metadata.consumerID
if m.metadata.producerID == "" {
// for backwards-compatibility; see: https://github.com/dapr/components-contrib/pull/2104
consumerClientID += "-consumer"
}
connCtx, connCancel := context.WithTimeout(ctx, defaultWait)
c, err := m.connect(connCtx, consumerClientID)
connCancel()
if err != nil {
return err
}
m.consumer = c
subscribeTopics := make(map[string]byte, len(m.topics))
for k := range m.topics {
subscribeTopics[k] = m.metadata.qos
}
token := m.consumer.SubscribeMultiple(
subscribeTopics,
m.onMessage(ctx),
)
subscribeCtx, subscribeCancel := context.WithTimeout(m.ctx, defaultWait)
defer subscribeCancel()
select {
case <-token.Done():
// Subscription went through
case <-subscribeCtx.Done():
return subscribeCtx.Err()
}
if err := token.Error(); err != nil {
return fmt.Errorf("mqtt error from subscribe: %v", err)
}
return nil
}
// onMessage returns the callback to be invoked when there's a new message from a topic
func (m *mqttPubSub) onMessage(ctx context.Context) func(client mqtt.Client, mqttMsg mqtt.Message) {
return func(client mqtt.Client, mqttMsg mqtt.Message) {
ack := false
defer func() {
// MQTT does not support NACK's, so in case of error we need to re-enqueue the message and then send a positive ACK for this message
// Note that if the connection drops before the message is explicitly ACK'd below, then it's automatically re-sent (assuming QoS is 1 or greater, which is the default). So we do not risk losing messages.
// Problem with this approach is that if the service crashes between the time the message is re-enqueued and when the ACK is sent, the message may be delivered twice
if !ack {
m.logger.Debugf("Re-publishing message %s#%d", mqttMsg.Topic(), mqttMsg.MessageID())
publishErr := m.Publish(ctx, &pubsub.PublishRequest{
Topic: mqttMsg.Topic(),
Data: mqttMsg.Payload(),
})
if publishErr != nil {
m.logger.Errorf("Failed to re-publish message %s#%d. Error: %v", mqttMsg.Topic(), mqttMsg.MessageID(), publishErr)
// Return so Ack() isn't invoked
return
}
}
mqttMsg.Ack()
// If we re-published the message, consume a retriable error token
if !ack {
m.logger.Debugf("Taking a retriable error token")
before := time.Now()
_ = m.retriableErrLimit.Take()
m.logger.Debugf("Resumed after pausing for %v", time.Now().Sub(before))
}
}()
msg := pubsub.NewMessage{
Topic: mqttMsg.Topic(),
Data: mqttMsg.Payload(),
Metadata: map[string]string{"retained": strconv.FormatBool(mqttMsg.Retained())},
}
topicHandler := m.handlerForTopic(msg.Topic)
if topicHandler == nil {
m.logger.Errorf("no handler defined for topic %s", msg.Topic)
return
}
m.logger.Debugf("Processing MQTT message %s#%d (retained=%v)", mqttMsg.Topic(), mqttMsg.MessageID(), mqttMsg.Retained())
err := topicHandler(ctx, &msg)
if err != nil {
m.logger.Errorf("Failed processing MQTT message %s#%d: %v", mqttMsg.Topic(), mqttMsg.MessageID(), err)
return
}
m.logger.Debugf("Done processing MQTT message %s#%d; sending ACK", mqttMsg.Topic(), mqttMsg.MessageID())
ack = true
}
}
// Returns the handler for a message sent to a given topic, supporting wildcards and other special syntaxes.
func (m *mqttPubSub) handlerForTopic(topic string) pubsub.Handler {
m.subscribingLock.RLock()
defer m.subscribingLock.RUnlock()
// First, try to see if we have a handler for the exact topic (no wildcards etc)
topicHandler, ok := m.topics[topic]
if ok && topicHandler.handler != nil {
return topicHandler.handler
}
// Iterate through the topics and run the matchers
for _, obj := range m.topics {
if obj.alias == topic {
return obj.handler
}
if obj.matcher != nil && obj.matcher(topic) {
return obj.handler
}
}
return nil
}
func (m *mqttPubSub) connect(ctx context.Context, clientID string) (mqtt.Client, error) {
uri, err := url.Parse(m.metadata.url)
if err != nil {
return nil, err
}
opts := m.createClientOptions(uri, clientID)
// Turn off auto-ack
opts.SetAutoAckDisabled(true)
client := mqtt.NewClient(opts)
// Add all routes before we connect to catch messages that may be delivered before client.Subscribe is invoked
// The routes will be overwritten later
for topic := range m.topics {
client.AddRoute(topic, m.onMessage(ctx))
}
token := client.Connect()
select {
case <-token.Done():
// Connection went through
case <-ctx.Done():
return nil, ctx.Err()
}
if err := token.Error(); err != nil {
return nil, err
}
return client, nil
}
func (m *mqttPubSub) newTLSConfig() *tls.Config {
tlsConfig, err := pubsub.ConvertTLSPropertiesToTLSConfig(m.metadata.TLSProperties)
if err != nil {
m.logger.Warnf("failed to load TLS config: %s", err)
}
return tlsConfig
}
func (m *mqttPubSub) createClientOptions(uri *url.URL, clientID string) *mqtt.ClientOptions {
opts := mqtt.NewClientOptions()
opts.SetClientID(clientID)
opts.SetCleanSession(m.metadata.cleanSession)
// URL scheme backward compatibility
scheme := uri.Scheme
switch scheme {
case "mqtt":
scheme = "tcp"
case "mqtts", "tcps", "tls":
scheme = "ssl"
}
opts.AddBroker(scheme + "://" + uri.Host)
opts.SetUsername(uri.User.Username())
password, _ := uri.User.Password()
opts.SetPassword(password)
// tls config
opts.SetTLSConfig(m.newTLSConfig())
return opts
}
func (m *mqttPubSub) Close() error {
m.subscribingLock.Lock()
defer m.subscribingLock.Unlock()
m.cancel()
if m.consumer != nil {
m.consumer.Disconnect(5)
}
m.producer.Disconnect(5)
return nil
}
func (m *mqttPubSub) Features() []pubsub.Feature {
return []pubsub.Feature{pubsub.FeatureSubscribeWildcards}
}
var sharedSubscriptionMatch = regexp.MustCompile(`^\$share\/(.*?)\/.`)
// Adds a topic to the list of subscriptions.
func (m *mqttPubSub) addTopic(origTopicName string, handler pubsub.Handler) {
obj := mqttPubSubSubscription{
handler: handler,
}
// Shared subscriptions begin with "$share/GROUPID/" and we can remove that prefix
topicName := origTopicName
if found := sharedSubscriptionMatch.FindStringIndex(origTopicName); found != nil && found[0] == 0 {
topicName = topicName[(found[1] - 1):]
obj.alias = topicName
}
// If the topic name contains a wildcard, we need to add a matcher
regexStr := buildRegexForTopic(topicName)
if regexStr != "" {
// We built our own regex and this should never panic
match := regexp.MustCompile(regexStr)
obj.matcher = func(topic string) bool {
return match.MatchString(topic)
}
}
m.topics[origTopicName] = obj
}
// Returns a regular expression string that matches the topic, with support for wildcards.
func buildRegexForTopic(topicName string) string {
// This is a bit more lax than the specs, which for example require "#" to be at the end of the string only:
// in practice, seems that (at least some) brokers are more flexible and allow "#" in the middle of a string too
var (
regexStr string
lastPos int = -1
start int
okPos bool
)
if strings.ContainsAny(topicName, "#+") {
regexStr = "^"
// It's ok to iterate over bytes here (rather than codepoints) because all characters we're looking for are always single-byte
for i := 0; i < len(topicName); i++ {
// Wildcard chars must either be at the beginning of the string or must follow a /
okPos = (i == 0 || topicName[i-1] == '/')
if topicName[i] == '#' && okPos {
lastPos = i
if i > 0 && i == (len(topicName)-1) {
// Edge case: we're at the end of the string so we can allow omitting the preceding /
regexStr += regexp.QuoteMeta(topicName[start:(i-1)]) + "(.*)"
} else {
regexStr += regexp.QuoteMeta(topicName[start:i]) + "(.*)"
}
start = i + 1
} else if topicName[i] == '+' && okPos {
lastPos = i
if i > 0 && i == (len(topicName)-1) {
// Edge case: we're at the end of the string so we can allow omitting the preceding /
regexStr += regexp.QuoteMeta(topicName[start:(i-1)]) + `((\/|)[^\/]*)`
} else {
regexStr += regexp.QuoteMeta(topicName[start:i]) + `([^\/]*)`
}
start = i + 1
}
}
regexStr += regexp.QuoteMeta(topicName[(lastPos+1):]) + "$"
}
if lastPos == -1 {
return ""
}
return regexStr
}