forked from wenjianzhang/redisqueue
-
Notifications
You must be signed in to change notification settings - Fork 10
/
consumer.go
416 lines (371 loc) · 13 KB
/
consumer.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
package redisqueue
import (
"context"
"net"
"os"
"sync"
"time"
"github.com/pkg/errors"
"github.com/redis/go-redis/v9"
)
// ConsumerFunc is a type alias for the functions that will be used to handle
// and process Messages.
type ConsumerFunc func(*Message) error
type registeredConsumer struct {
fn ConsumerFunc
id string
}
// ConsumerOptions provide options to configure the Consumer.
type ConsumerOptions struct {
// Name sets the name of this consumer. This will be used when fetching from
// Redis. If empty, the hostname will be used.
Name string
// GroupName sets the name of the consumer group. This will be used when
// coordinating in Redis. If empty, the hostname will be used.
GroupName string
// VisibilityTimeout dictates the maximum amount of time a message should
// stay in pending. If there is a message that has been idle for more than
// this duration, the consumer will attempt to claim it.
VisibilityTimeout time.Duration
// BlockingTimeout designates how long the XREADGROUP call blocks for. If
// this is 0, it will block indefinitely. While this is the most efficient
// from a polling perspective, if this call never times out, there is no
// opportunity to yield back to Go at a regular interval. This means it's
// possible that if no messages are coming in, the consumer cannot
// gracefully shutdown. Instead, it's recommended to set this to 1-5
// seconds, or even longer, depending on how long your application can wait
// to shutdown.
BlockingTimeout time.Duration
// ReclaimInterval is the amount of time in between calls to XPENDING to
// attempt to reclaim jobs that have been idle for more than the visibility
// timeout. A smaller duration will result in more frequent checks. This
// will allow messages to be reaped faster, but it will put more load on
// Redis.
ReclaimInterval time.Duration
// BufferSize determines the size of the channel uses to coordinate the
// processing of the messages. This determines the maximum number of
// in-flight messages.
BufferSize int
// Concurrency dictates how many goroutines to spawn to handle the messages.
Concurrency int
// RedisClient supersedes the RedisOptions field, and allows you to inject
// an already-made Redis Client for use in the consumer. This may be either
// the standard client or a cluster client.
RedisClient redis.UniversalClient
// RedisOptions allows you to configure the underlying Redis connection.
// More info here:
// https://pkg.go.dev/github.com/go-redis/redis/v7?tab=doc#Options.
//
// This field is used if RedisClient field is nil.
RedisOptions *RedisOptions
}
// Consumer adds a convenient wrapper around dequeuing and managing concurrency.
type Consumer struct {
// Errors is a channel that you can receive from to centrally handle any
// errors that may occur either by your ConsumerFuncs or by internal
// processing functions. Because this is an unbuffered channel, you must
// have a listener on it. If you don't parts of the consumer could stop
// functioning when errors occur due to the blocking nature of unbuffered
// channels.
Errors chan error
options *ConsumerOptions
redis redis.UniversalClient
consumers map[string]registeredConsumer
streams []string
queue chan *Message
wg *sync.WaitGroup
stopReclaim chan struct{}
stopPoll chan struct{}
stopWorkers chan struct{}
}
var defaultConsumerOptions = &ConsumerOptions{
VisibilityTimeout: 60 * time.Second,
BlockingTimeout: 5 * time.Second,
ReclaimInterval: 1 * time.Second,
BufferSize: 100,
Concurrency: 10,
}
// NewConsumer uses a default set of options to create a Consumer. It sets Name
// to the hostname, GroupName to "redisqueue", VisibilityTimeout to 60 seconds,
// BufferSize to 100, and Concurrency to 10. In most production environments,
// you'll want to use NewConsumerWithOptions.
func NewConsumer() (*Consumer, error) {
return NewConsumerWithOptions(defaultConsumerOptions)
}
// NewConsumerWithOptions creates a Consumer with custom ConsumerOptions. If
// Name is left empty, it defaults to the hostname; if GroupName is left empty,
// it defaults to "redisqueue"; if BlockingTimeout is 0, it defaults to 5
// seconds; if ReclaimInterval is 0, it defaults to 1 second.
func NewConsumerWithOptions(options *ConsumerOptions) (*Consumer, error) {
hostname, _ := os.Hostname()
if options.Name == "" {
options.Name = hostname
}
if options.GroupName == "" {
options.GroupName = "redisqueue"
}
if options.BlockingTimeout == 0 {
options.BlockingTimeout = 5 * time.Second
}
if options.ReclaimInterval == 0 {
options.ReclaimInterval = 1 * time.Second
}
var r redis.UniversalClient
if options.RedisClient != nil {
r = options.RedisClient
} else {
r = newRedisClient(options.RedisOptions)
}
if err := redisPreflightChecks(r); err != nil {
return nil, err
}
return &Consumer{
Errors: make(chan error),
options: options,
redis: r,
consumers: make(map[string]registeredConsumer),
streams: make([]string, 0),
queue: make(chan *Message, options.BufferSize),
wg: &sync.WaitGroup{},
stopReclaim: make(chan struct{}, 1),
stopPoll: make(chan struct{}, 1),
stopWorkers: make(chan struct{}, options.Concurrency),
}, nil
}
// RegisterWithLastID is the same as Register, except that it also lets you
// specify the oldest message to receive when first creating the consumer group.
// This can be any valid message ID, "0" for all messages in the stream, or "$"
// for only new messages.
//
// If the consumer group already exists the id field is ignored, meaning you'll
// receive unprocessed messages.
func (c *Consumer) RegisterWithLastID(stream string, id string, fn ConsumerFunc) {
if len(id) == 0 {
id = "0"
}
c.consumers[stream] = registeredConsumer{
fn: fn,
id: id,
}
}
// Register takes in a stream name and a ConsumerFunc that will be called when a
// message comes in from that stream. Register must be called at least once
// before Run is called. If the same stream name is passed in twice, the first
// ConsumerFunc is overwritten by the second.
func (c *Consumer) Register(stream string, fn ConsumerFunc) {
c.RegisterWithLastID(stream, "0", fn)
}
// Run starts all of the worker goroutines and starts processing from the
// streams that have been registered with Register. All errors will be sent to
// the Errors channel. If Register was never called, an error will be sent and
// Run will terminate early. The same will happen if an error occurs when
// creating the consumer group in Redis. Run will block until Shutdown is called
// and all of the in-flight messages have been processed.
func (c *Consumer) Run() {
if len(c.consumers) == 0 {
c.Errors <- errors.New("at least one consumer function needs to be registered")
return
}
for stream, consumer := range c.consumers {
c.streams = append(c.streams, stream)
err := c.redis.XGroupCreateMkStream(context.TODO(), stream, c.options.GroupName, consumer.id).Err()
// ignoring the BUSYGROUP error makes this a noop
if err != nil && err.Error() != "BUSYGROUP Consumer Group name already exists" {
c.Errors <- errors.Wrap(err, "error creating consumer group")
return
}
}
for i := 0; i < len(c.consumers); i++ {
c.streams = append(c.streams, ">")
}
go c.reclaim()
go c.poll()
stop := newSignalHandler()
go func() {
<-stop
c.Shutdown()
}()
c.wg.Add(c.options.Concurrency)
for i := 0; i < c.options.Concurrency; i++ {
go c.work()
}
c.wg.Wait()
}
// Shutdown stops new messages from being processed and tells the workers to
// wait until all in-flight messages have been processed, and then they exit.
// The order that things stop is 1) the reclaim process (if it's running), 2)
// the polling process, and 3) the worker processes.
func (c *Consumer) Shutdown() {
c.stopReclaim <- struct{}{}
if c.options.VisibilityTimeout == 0 {
c.stopPoll <- struct{}{}
}
}
// reclaim runs in a separate goroutine and checks the list of pending messages
// in every stream. For every message, if it's been idle for longer than the
// VisibilityTimeout, it will attempt to claim that message for this consumer.
// If VisibilityTimeout is 0, this function returns early and no messages are
// reclaimed. It checks the list of pending messages according to
// ReclaimInterval.
func (c *Consumer) reclaim() {
if c.options.VisibilityTimeout == 0 {
return
}
ticker := time.NewTicker(c.options.ReclaimInterval)
for {
select {
case <-c.stopReclaim:
// once the reclaim process has stopped, stop the polling process
c.stopPoll <- struct{}{}
return
case <-ticker.C:
for stream := range c.consumers {
start := "-"
end := "+"
for {
res, err := c.redis.XPendingExt(context.TODO(), &redis.XPendingExtArgs{
Stream: stream,
Group: c.options.GroupName,
Start: start,
End: end,
Count: int64(c.options.BufferSize - len(c.queue)),
}).Result()
if err != nil && err != redis.Nil {
c.Errors <- errors.Wrap(err, "error listing pending messages")
break
}
if len(res) == 0 {
break
}
msgs := make([]string, 0)
for _, r := range res {
if r.Idle >= c.options.VisibilityTimeout {
claimres, err := c.redis.XClaim(context.TODO(), &redis.XClaimArgs{
Stream: stream,
Group: c.options.GroupName,
Consumer: c.options.Name,
MinIdle: c.options.VisibilityTimeout,
Messages: []string{r.ID},
}).Result()
if err != nil && err != redis.Nil {
c.Errors <- errors.Wrapf(err, "error claiming %d message(s)", len(msgs))
break
}
// If the Redis nil error is returned, it means that
// the message no longer exists in the stream.
// However, it is still in a pending state. This
// could happen if a message was claimed by a
// consumer, that consumer died, and the message
// gets deleted (either through a XDEL call or
// through MAXLEN). Since the message no longer
// exists, the only way we can get it out of the
// pending state is to acknowledge it.
if err == redis.Nil {
err = c.redis.XAck(context.TODO(), stream, c.options.GroupName, r.ID).Err()
if err != nil {
c.Errors <- errors.Wrapf(err, "error acknowledging after failed claim for %q stream and %q message", stream, r.ID)
continue
}
}
c.enqueue(stream, claimres)
}
}
newID, err := incrementMessageID(res[len(res)-1].ID)
if err != nil {
c.Errors <- err
break
}
start = newID
}
}
}
}
}
// poll constantly checks the streams using XREADGROUP to see if there are any
// messages for this consumer to process. It blocks for up to 5 seconds instead
// of blocking indefinitely so that it can periodically check to see if Shutdown
// was called.
func (c *Consumer) poll() {
for {
select {
case <-c.stopPoll:
// once the polling has stopped (i.e. there will be no more messages
// put onto c.queue), stop all of the workers
for i := 0; i < c.options.Concurrency; i++ {
c.stopWorkers <- struct{}{}
}
return
default:
res, err := c.redis.XReadGroup(context.TODO(), &redis.XReadGroupArgs{
Group: c.options.GroupName,
Consumer: c.options.Name,
Streams: c.streams,
Count: int64(c.options.BufferSize - len(c.queue)),
Block: c.options.BlockingTimeout,
}).Result()
if err != nil {
if err, ok := err.(net.Error); ok && err.Timeout() {
continue
}
if err == redis.Nil {
continue
}
c.Errors <- errors.Wrap(err, "error reading redis stream")
continue
}
for _, r := range res {
c.enqueue(r.Stream, r.Messages)
}
}
}
}
// enqueue takes a slice of XMessages, creates corresponding Messages, and sends
// them on the centralized channel for worker goroutines to process.
func (c *Consumer) enqueue(stream string, msgs []redis.XMessage) {
for _, m := range msgs {
msg := &Message{
ID: m.ID,
Stream: stream,
Values: m.Values,
}
c.queue <- msg
}
}
// work is called in a separate goroutine. The number of work goroutines is
// determined by Concurreny. Once it gets a message from the centralized
// channel, it calls the corrensponding ConsumerFunc depending on the stream it
// came from. If no error is returned from the ConsumerFunc, the message is
// acknowledged in Redis.
func (c *Consumer) work() {
defer c.wg.Done()
for {
select {
case msg := <-c.queue:
err := c.process(msg)
if err != nil {
c.Errors <- errors.Wrapf(err, "error calling ConsumerFunc for %q stream and %q message", msg.Stream, msg.ID)
continue
}
err = c.redis.XAck(context.TODO(), msg.Stream, c.options.GroupName, msg.ID).Err()
if err != nil {
c.Errors <- errors.Wrapf(err, "error acknowledging after success for %q stream and %q message", msg.Stream, msg.ID)
continue
}
case <-c.stopWorkers:
return
}
}
}
func (c *Consumer) process(msg *Message) (err error) {
defer func() {
if r := recover(); r != nil {
if e, ok := r.(error); ok {
err = errors.Wrap(e, "ConsumerFunc panic")
return
}
err = errors.Errorf("ConsumerFunc panic: %v", r)
}
}()
err = c.consumers[msg.Stream].fn(msg)
return
}