forked from robinjoseph08/redisqueue
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconsumer.go
More file actions
515 lines (460 loc) · 15.4 KB
/
consumer.go
File metadata and controls
515 lines (460 loc) · 15.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
package redisqueue
import (
"context"
"net"
"os"
"sync"
"time"
"github.com/pkg/errors"
"github.com/redis/go-redis/v9"
)
// ConsumerFunc is the signature of the functions that handle and process
// Messages. When a ConsumerFunc returns nil, the worker acknowledges the
// message in Redis. When it returns an error, the error is reported on
// Consumer.Errors and the message is left unacknowledged.
type ConsumerFunc func(*Message) error
// registeredConsumer is the per-stream entry stored by RegisterWithLastID: the
// handler for the stream plus the ID used when creating its consumer group.
type registeredConsumer struct {
// fn is the handler invoked for each message that arrives on the stream.
fn ConsumerFunc
// id is the start ID passed to XGroupCreateMkStream when Run creates the
// consumer group for the stream.
id string
}
// ConsumerOptions provide options to configure the Consumer.
type ConsumerOptions struct {
// Name sets the name of this consumer. This will be used when fetching from
// Redis. If empty, the hostname will be used.
Name string
// GroupName sets the name of the consumer group. This will be used when
// coordinating in Redis. If empty, "redisqueue" will be used.
GroupName string
// VisibilityTimeout dictates the maximum amount of time a message should
// stay in pending. If there is a message that has been idle for more than
// this duration, the consumer will attempt to claim it. If this is 0, the
// reclaim process is disabled and no pending messages are claimed.
VisibilityTimeout time.Duration
// BlockingTimeout designates how long the XREADGROUP call blocks for. If
// this is 0, NewConsumerWithOptions replaces it with 5 seconds. The polling
// loop only checks whether Shutdown was called in between XREADGROUP calls,
// so a longer timeout means fewer round trips to Redis but a longer wait
// before the consumer can gracefully shutdown. It's recommended to set this
// to 1-5 seconds, or even longer, depending on how long your application
// can wait to shutdown.
BlockingTimeout time.Duration
// ReclaimInterval is the amount of time in between calls to XPENDING to
// attempt to reclaim jobs that have been idle for more than the visibility
// timeout. A smaller duration will result in more frequent checks. This
// will allow messages to be reaped faster, but it will put more load on
// Redis. If this is 0, it defaults to 1 second.
ReclaimInterval time.Duration
// BufferSize determines the size of the channel used to coordinate the
// processing of the messages. This determines the maximum number of
// in-flight messages. If this is 0, it defaults to 100; a negative value is
// rejected by NewConsumerWithOptions.
BufferSize int
// Concurrency dictates how many goroutines to spawn to handle the messages.
// If this is 0, it defaults to 10; a negative value is rejected by
// NewConsumerWithOptions.
Concurrency int
// ErrorChannelBuffer sets the size of the Errors channel buffer. If this is
// 0, it defaults to 100. Errors are sent in a non-blocking way to avoid
// stalling processing when no listener is present.
ErrorChannelBuffer int
// MaxDeliveryCount is the maximum number of times a message can be delivered
// before it is considered failed. The limit is enforced by the reclaim
// process, which acknowledges a pending message once its delivery count
// reaches this value; it therefore has no effect when VisibilityTimeout is
// 0. If this is set to 0, the message will be retried indefinitely.
MaxDeliveryCount int64
// RedisClient supersedes the RedisOptions field, and allows you to inject
// an already-made Redis Client for use in the consumer. This may be either
// the standard client or a cluster client.
RedisClient redis.UniversalClient
// RedisOptions allows you to configure the underlying Redis connection.
// More info here:
// https://pkg.go.dev/github.com/redis/go-redis/v9#Options.
//
// This field is used if RedisClient field is nil.
RedisOptions *RedisOptions
}
// Consumer adds a convenient wrapper around dequeuing and managing concurrency.
type Consumer struct {
// Errors is a channel that you can receive from to centrally handle any
// errors that may occur either by your ConsumerFuncs or by internal
// processing functions. Errors are sent in a non-blocking manner, so if the
// channel buffer is full or no listener is present, errors may be dropped.
Errors chan error
// options is the configuration the Consumer was created with, after
// defaults have been filled in.
options *ConsumerOptions
// redis is the client used for every Redis command issued by the Consumer.
redis redis.UniversalClient
// consumers maps a stream name to the handler and start ID registered for
// it.
consumers map[string]registeredConsumer
// streams is the Streams argument handed to XREADGROUP. Run fills it with
// every registered stream name followed by one ">" per stream.
streams []string
// queue carries messages from the poll and reclaim goroutines to the
// workers. It is closed once polling has stopped so the workers can exit.
queue chan *Message
// wg tracks the worker goroutines; Run waits on it before returning.
wg *sync.WaitGroup
// stopReclaim is signaled by Shutdown to stop the reclaim goroutine.
stopReclaim chan struct{}
// stopPoll is signaled (see signalPollStop) to stop the poll goroutine.
stopPoll chan struct{}
// shutdownOnce ensures the body of Shutdown runs at most once.
shutdownOnce sync.Once
// closeQueueOnce ensures queue is closed at most once.
closeQueueOnce sync.Once
}
// defaultConsumerOptions holds the option values used by NewConsumer. Its
// BufferSize, Concurrency, and ErrorChannelBuffer also serve as the fallbacks
// NewConsumerWithOptions applies when those fields are left at 0.
var defaultConsumerOptions = &ConsumerOptions{
VisibilityTimeout: 60 * time.Second,
BlockingTimeout: 5 * time.Second,
ReclaimInterval: 1 * time.Second,
BufferSize: 100,
Concurrency: 10,
ErrorChannelBuffer: 100,
}
// NewConsumer uses a default set of options to create a Consumer. It sets Name
// to the hostname, GroupName to "redisqueue", VisibilityTimeout to 60 seconds,
// BlockingTimeout to 5 seconds, ReclaimInterval to 1 second, BufferSize to 100,
// Concurrency to 10, and ErrorChannelBuffer to 100. In most production
// environments, you'll want to use NewConsumerWithOptions.
func NewConsumer() (*Consumer, error) {
	// Pass a private copy so the shared package-level defaults can never be
	// modified through the pointer handed to the constructor.
	options := *defaultConsumerOptions
	return NewConsumerWithOptions(context.Background(), &options)
}
// NewConsumerWithOptions creates a Consumer with custom ConsumerOptions. A nil
// options value is treated as an empty ConsumerOptions. Zero-valued fields are
// replaced with defaults: Name defaults to the hostname, GroupName to
// "redisqueue", BufferSize to 100, Concurrency to 10, BlockingTimeout to 5
// seconds, ReclaimInterval to 1 second, and ErrorChannelBuffer to 100.
//
// The options struct passed in is copied, so it is never modified and later
// changes to it do not affect the returned Consumer.
//
// An error is returned if BufferSize, Concurrency, ErrorChannelBuffer, or
// ReclaimInterval is negative, or if the Redis preflight checks fail. ctx is
// only used for those preflight checks.
func NewConsumerWithOptions(ctx context.Context, options *ConsumerOptions) (*Consumer, error) {
	// Work on a private copy so that filling in defaults never writes to the
	// caller's struct (which may be shared between several consumers).
	var opts ConsumerOptions
	if options != nil {
		opts = *options
	}

	// Reject values that would otherwise panic later: a negative channel size
	// panics in make, and a negative interval panics in time.NewTicker.
	switch {
	case opts.BufferSize < 0:
		return nil, errors.New("buffer size must be greater than 0")
	case opts.Concurrency < 0:
		return nil, errors.New("concurrency must be greater than 0")
	case opts.ErrorChannelBuffer < 0:
		return nil, errors.New("error channel buffer must be greater than 0")
	case opts.ReclaimInterval < 0:
		return nil, errors.New("reclaim interval must be greater than 0")
	}

	if opts.Name == "" {
		// Best effort: if the hostname cannot be determined, the name is left
		// empty rather than failing construction.
		opts.Name, _ = os.Hostname()
	}
	if opts.GroupName == "" {
		opts.GroupName = "redisqueue"
	}
	if opts.BufferSize == 0 {
		opts.BufferSize = defaultConsumerOptions.BufferSize
	}
	if opts.Concurrency == 0 {
		opts.Concurrency = defaultConsumerOptions.Concurrency
	}
	if opts.BlockingTimeout == 0 {
		opts.BlockingTimeout = 5 * time.Second
	}
	if opts.ReclaimInterval == 0 {
		opts.ReclaimInterval = 1 * time.Second
	}
	if opts.ErrorChannelBuffer == 0 {
		opts.ErrorChannelBuffer = defaultConsumerOptions.ErrorChannelBuffer
	}

	// An injected client takes precedence over RedisOptions.
	r := opts.RedisClient
	if r == nil {
		r = newRedisClient(opts.RedisOptions)
	}

	if err := redisPreflightChecks(ctx, r); err != nil {
		return nil, err
	}

	return &Consumer{
		Errors: make(chan error, opts.ErrorChannelBuffer),

		options:   &opts,
		redis:     r,
		consumers: make(map[string]registeredConsumer),
		streams:   make([]string, 0),
		queue:     make(chan *Message, opts.BufferSize),
		wg:        &sync.WaitGroup{},

		// Both stop channels have room for one signal so that signaling never
		// blocks, even if the receiving goroutine has already exited.
		stopReclaim: make(chan struct{}, 1),
		stopPoll:    make(chan struct{}, 1),
	}, nil
}
// RegisterWithLastID behaves like Register, but additionally lets you choose
// the oldest message to receive when the consumer group is first created. id
// may be any valid message ID, "0" for every message in the stream, or "$" for
// new messages only. An empty id is treated as "0".
//
// If the consumer group already exists the id field is ignored, meaning you'll
// receive unprocessed messages.
//
// Registering the same stream again replaces the previous entry.
func (c *Consumer) RegisterWithLastID(stream string, id string, fn ConsumerFunc) {
	entry := registeredConsumer{fn: fn, id: "0"}
	if id != "" {
		entry.id = id
	}
	c.consumers[stream] = entry
}
// Register associates fn with stream so that fn is called for every message
// that comes in from that stream. It must be called at least once before Run.
// Registering the same stream name twice replaces the first ConsumerFunc with
// the second. The registration uses "0" as its start ID; use
// RegisterWithLastID to choose a different one.
func (c *Consumer) Register(stream string, fn ConsumerFunc) {
	const startID = "0"
	c.RegisterWithLastID(stream, startID, fn)
}
// Run starts all of the worker goroutines and starts processing from the
// streams that have been registered with Register. All errors will be sent to
// the Errors channel. If Register was never called, an error will be sent and
// Run will terminate early. The same will happen if an error occurs when
// creating the consumer group in Redis.
//
// Run blocks until the consumer is shut down and all of the in-flight messages
// have been processed. A shutdown is triggered by calling Shutdown, by ctx
// being cancelled, or by the channel returned from newSignalHandler firing.
func (c *Consumer) Run(ctx context.Context) {
	runCtx, cancel := context.WithCancel(ctx)
	defer cancel()

	// Translate cancellation (including the deferred cancel above) into a
	// Shutdown so every exit path releases the background goroutines.
	go func() {
		<-runCtx.Done()
		c.Shutdown()
	}()

	if len(c.consumers) == 0 {
		c.sendError(errors.New("at least one consumer function needs to be registered"))
		return
	}

	// Build the XREADGROUP Streams argument from scratch: every stream name
	// first, followed by one ">" ID per stream. Using a local slice keeps
	// c.streams free of duplicates or partial state if group creation fails.
	streams := make([]string, 0, 2*len(c.consumers))
	for stream, consumer := range c.consumers {
		streams = append(streams, stream)
		err := c.redis.XGroupCreateMkStream(runCtx, stream, c.options.GroupName, consumer.id).Err()
		// ignoring the BUSYGROUP error makes this a noop
		if err != nil && err.Error() != "BUSYGROUP Consumer Group name already exists" {
			c.sendError(errors.Wrap(err, "error creating consumer group"))
			return
		}
	}
	for i := 0; i < len(c.consumers); i++ {
		streams = append(streams, ">")
	}
	c.streams = streams

	go c.reclaim(runCtx)
	go c.poll(runCtx)

	stop := newSignalHandler()
	go func() {
		select {
		case <-stop:
			c.Shutdown()
		case <-runCtx.Done():
			// Run is finishing without a signal; exit instead of blocking on
			// stop forever. Shutdown is handled by the goroutine above.
		}
	}()

	c.wg.Add(c.options.Concurrency)
	for i := 0; i < c.options.Concurrency; i++ {
		go c.work(runCtx)
	}

	c.wg.Wait()
}
// Shutdown stops new messages from being processed and lets the workers finish
// every in-flight message before they exit. Things stop in this order: 1) the
// reclaim process (if it's running), 2) the polling process, and 3) the worker
// processes.
//
// Shutdown is safe to call more than once; only the first call has any effect.
func (c *Consumer) Shutdown() {
	c.shutdownOnce.Do(func() {
		c.stopReclaim <- struct{}{}

		// With reclaiming enabled, the reclaim goroutine passes the stop signal
		// on to the poller itself.
		if c.options.VisibilityTimeout != 0 {
			return
		}
		// Otherwise no reclaim goroutine is running, so signal the poller here.
		c.signalPollStop()
	})
}
// reclaim runs in a separate goroutine and checks the list of pending messages
// in every stream. For every message, if it's been idle for longer than the
// VisibilityTimeout, it will attempt to claim that message for this consumer.
// If VisibilityTimeout is 0, this function returns early and no messages are
// reclaimed. It checks the list of pending messages according to
// ReclaimInterval.
//
// Whenever the loop exits (stop signal, cancelled ctx, or a Redis call failing
// because ctx was cancelled) it signals the polling process to stop as well.
func (c *Consumer) reclaim(ctx context.Context) {
	if c.options.VisibilityTimeout == 0 {
		return
	}

	ticker := time.NewTicker(c.options.ReclaimInterval)
	defer ticker.Stop()

	for {
		select {
		case <-c.stopReclaim:
			// once the reclaim process has stopped, stop the polling process
			c.signalPollStop()
			return
		case <-ctx.Done():
			c.signalPollStop()
			return
		case <-ticker.C:
			for stream := range c.consumers {
				if !c.reclaimStream(ctx, stream) {
					c.signalPollStop()
					return
				}
			}
		}
	}
}

// reclaimStream pages through the pending entries of one stream and claims the
// ones that have been idle for at least VisibilityTimeout, enqueueing them for
// the workers. Pending entries whose delivery count has reached
// MaxDeliveryCount (when set) are acknowledged instead of being retried.
//
// It returns false when a Redis call failed because ctx was cancelled, telling
// the caller to stop reclaiming altogether. In every other case (done, queue
// full, or an error that was reported on Errors) it returns true.
func (c *Consumer) reclaimStream(ctx context.Context, stream string) bool {
	start := "-"

	for {
		// Never fetch more than the queue can currently hold.
		available := c.availableCapacity()
		if available <= 0 {
			return true
		}

		pending, err := c.redis.XPendingExt(ctx, &redis.XPendingExtArgs{
			Stream: stream,
			Group:  c.options.GroupName,
			Start:  start,
			End:    "+",
			Count:  int64(available),
		}).Result()
		if err != nil && err != redis.Nil {
			if ctx.Err() != nil {
				return false
			}
			c.sendError(errors.Wrap(err, "error listing pending messages"))
			return true
		}
		if len(pending) == 0 {
			return true
		}

		for _, p := range pending {
			if c.options.MaxDeliveryCount > 0 && p.RetryCount >= c.options.MaxDeliveryCount {
				// The message has used up its deliveries: acknowledge it so it
				// leaves the pending list, and never claim it again.
				if err := c.redis.XAck(ctx, stream, c.options.GroupName, p.ID).Err(); err != nil {
					if ctx.Err() != nil {
						return false
					}
					c.sendError(errors.Wrapf(err, "error acknowledging after retry count exceeded for %q stream and %q message", stream, p.ID))
				}
				continue
			}

			if p.Idle < c.options.VisibilityTimeout {
				continue
			}

			claimed, err := c.redis.XClaim(ctx, &redis.XClaimArgs{
				Stream:   stream,
				Group:    c.options.GroupName,
				Consumer: c.options.Name,
				MinIdle:  c.options.VisibilityTimeout,
				Messages: []string{p.ID},
			}).Result()
			if err != nil && err != redis.Nil {
				if ctx.Err() != nil {
					return false
				}
				c.sendError(errors.Wrapf(err, "error claiming %q message for %q stream", p.ID, stream))
				// Give up on the rest of this page; the next page is still
				// attempted below.
				break
			}

			// If the Redis nil error is returned, it means that the message no
			// longer exists in the stream. However, it is still in a pending
			// state. This could happen if a message was claimed by a consumer,
			// that consumer died, and the message gets deleted (either through
			// a XDEL call or through MAXLEN). Since the message no longer
			// exists, the only way we can get it out of the pending state is
			// to acknowledge it.
			if err == redis.Nil {
				if err := c.redis.XAck(ctx, stream, c.options.GroupName, p.ID).Err(); err != nil {
					if ctx.Err() != nil {
						return false
					}
					c.sendError(errors.Wrapf(err, "error acknowledging after failed claim for %q stream and %q message", stream, p.ID))
					continue
				}
			}

			c.enqueue(stream, claimed)
		}

		// Continue with the entries that come after the last one on this page.
		next, err := incrementMessageID(pending[len(pending)-1].ID)
		if err != nil {
			c.sendError(err)
			return true
		}
		start = next
	}
}
// poll repeatedly issues XREADGROUP against the registered streams to fetch
// new messages for this consumer and hands them to the workers. Each call
// blocks for at most BlockingTimeout rather than indefinitely, so the loop
// regularly gets a chance to notice that Shutdown was called.
//
// When polling ends, the queue is closed so the workers can drain what is left
// and exit.
func (c *Consumer) poll(ctx context.Context) {
	// stopAfterCancel handles a cancelled ctx: it triggers Shutdown, waits for
	// the stop signal to arrive, and only then closes the queue.
	stopAfterCancel := func() {
		c.Shutdown()
		<-c.stopPoll
		c.closeQueue()
	}

	for {
		select {
		case <-c.stopPoll:
			// once polling has stopped (i.e. there will be no more messages
			// put onto c.queue), close the queue so workers can drain and exit
			c.closeQueue()
			return
		case <-ctx.Done():
			stopAfterCancel()
			return
		default:
		}

		// Only ask Redis for as many messages as the queue can take right now.
		free := c.availableCapacity()
		if free <= 0 {
			time.Sleep(10 * time.Millisecond)
			continue
		}

		batches, err := c.redis.XReadGroup(ctx, &redis.XReadGroupArgs{
			Group:    c.options.GroupName,
			Consumer: c.options.Name,
			Streams:  c.streams,
			Count:    int64(free),
			Block:    c.options.BlockingTimeout,
		}).Result()
		if err == nil {
			for _, batch := range batches {
				c.enqueue(batch.Stream, batch.Messages)
			}
			continue
		}

		if ctx.Err() != nil {
			stopAfterCancel()
			return
		}
		// Timeouts and empty reads are expected; just poll again.
		if netErr, ok := err.(net.Error); ok && netErr.Timeout() {
			continue
		}
		if err != redis.Nil {
			c.sendError(errors.Wrap(err, "error reading redis stream"))
		}
	}
}
// enqueue converts each XMessage read from stream into a Message and sends it
// on the centralized channel for the worker goroutines to pick up. The send
// blocks while the channel is full.
func (c *Consumer) enqueue(stream string, msgs []redis.XMessage) {
	for i := range msgs {
		c.queue <- &Message{
			ID:     msgs[i].ID,
			Stream: stream,
			Values: msgs[i].Values,
		}
	}
}
// work is called in a separate goroutine. The number of work goroutines is
// determined by Concurrency. For each message it receives from the centralized
// channel, it calls the corresponding ConsumerFunc depending on the stream the
// message came from. If no error is returned from the ConsumerFunc, the
// message is acknowledged in Redis; otherwise the error is reported and the
// message stays unacknowledged. The goroutine exits once the channel has been
// closed and drained.
//
// NOTE(review): the acknowledgement uses ctx, so messages drained after ctx
// has been cancelled presumably fail to be acknowledged - confirm whether that
// is intended.
func (c *Consumer) work(ctx context.Context) {
	defer c.wg.Done()

	for msg := range c.queue {
		if err := c.process(msg); err != nil {
			c.sendError(errors.Wrapf(err, "error calling ConsumerFunc for %q stream and %q message", msg.Stream, msg.ID))
			continue
		}

		ack := c.redis.XAck(ctx, msg.Stream, c.options.GroupName, msg.ID)
		if err := ack.Err(); err != nil {
			c.sendError(errors.Wrapf(err, "error acknowledging after success for %q stream and %q message", msg.Stream, msg.ID))
		}
	}
}
// closeQueue closes the message queue so that workers ranging over it can
// finish. Only the first call closes the channel; later calls do nothing.
func (c *Consumer) closeQueue() {
	shut := func() { close(c.queue) }
	c.closeQueueOnce.Do(shut)
}
// signalPollStop asks the polling process to stop. The send never blocks: if a
// stop signal is already waiting in the channel, this call is a no-op.
func (c *Consumer) signalPollStop() {
	select {
	case c.stopPoll <- struct{}{}:
		// signal queued for the poller
	default:
		// a signal is already pending; nothing more to do
	}
}
// availableCapacity reports how many more messages the queue can buffer right
// now: its capacity minus the number of messages currently waiting in it.
func (c *Consumer) availableCapacity() int {
	total := cap(c.queue)
	used := len(c.queue)
	return total - used
}
// sendError reports err on the Errors channel without ever blocking. If the
// channel cannot accept the error immediately (its buffer is full), the error
// is dropped.
func (c *Consumer) sendError(err error) {
	select {
	case c.Errors <- err:
		// delivered to the Errors channel
	default:
		// nobody can take it right now; drop it instead of stalling the caller
	}
}
// process calls the ConsumerFunc registered for msg.Stream and returns its
// result. A panic raised during that call is recovered and returned as an
// error instead of propagating to the calling goroutine: a panic value that is
// itself an error is wrapped, any other value is formatted into the message.
func (c *Consumer) process(msg *Message) (err error) {
	defer func() {
		switch cause := recover().(type) {
		case nil:
			// no panic: keep whatever the ConsumerFunc returned
		case error:
			err = errors.Wrap(cause, "ConsumerFunc panic")
		default:
			err = errors.Errorf("ConsumerFunc panic: %v", cause)
		}
	}()

	handler := c.consumers[msg.Stream].fn
	return handler(msg)
}