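// Package consumer provides a Kinesis stream consumer that launches a
// goroutine per shard and checkpoints scan progress through a pluggable
// Store.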
package consumer

import (
	"context"
	"errors"
	"fmt"
	"io"
	"log"
	"sync"
	"time"

	"github.com/aws/aws-sdk-go-v2/aws"
	"github.com/aws/aws-sdk-go-v2/config"
	"github.com/aws/aws-sdk-go-v2/service/kinesis"
	"github.com/aws/aws-sdk-go-v2/service/kinesis/types"

	"github.com/harlow/kinesis-consumer/internal/deaggregator"
)

// Record wraps the record returned from the Kinesis library and
// extends it to include the shard id and how far the reader is
// behind the tip of the stream.
type Record struct {
	types.Record
	ShardID            string
	MillisBehindLatest *int64
}

// New creates a kinesis consumer with default settings. Use Option to override
// any of the optional attributes.
func New(streamName string, opts ...Option) (*Consumer, error) {
	if streamName == "" {
		return nil, errors.New("must provide stream name")
	}

	// new consumer with noop storage, counter, and logger
	c := &Consumer{
		streamName:               streamName,
		initialShardIteratorType: types.ShardIteratorTypeLatest,
		store:                    &noopStore{},
		counter:                  &noopCounter{},
		logger: &noopLogger{
			logger: log.New(io.Discard, "", log.LstdFlags),
		},
		scanInterval: 250 * time.Millisecond,
		maxRecords:   10000,
	}

	// override defaults
	for _, opt := range opts {
		opt(c)
	}

	// default client; a failed config load is returned to the caller
	// rather than terminating the process
	if c.client == nil {
		cfg, err := config.LoadDefaultConfig(context.TODO())
		if err != nil {
			return nil, fmt.Errorf("unable to load SDK config: %w", err)
		}
		c.client = kinesis.NewFromConfig(cfg)
	}

	// default group consumes all shards
	if c.group == nil {
		c.group = NewAllGroup(c.client, c.store, streamName, c.logger)
	}

	return c, nil
}
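
// A minimal usage sketch (the fmt.Println handler stands in for real
// application logic):
//
//	c, err := consumer.New("my-stream")
//	if err != nil {
//		log.Fatal(err)
//	}
//	// Scan blocks until the context is canceled or a shard reports an error.
//	if err := c.Scan(context.TODO(), func(r *consumer.Record) error {
//		fmt.Println(string(r.Data))
//		return nil
//	}); err != nil {
//		log.Fatal(err)
//	}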

// Consumer wraps the interaction with the Kinesis stream
type Consumer struct {
	streamName               string
	initialShardIteratorType types.ShardIteratorType
	initialTimestamp         *time.Time
	client                   kinesisClient
	counter                  Counter
	group                    Group
	logger                   Logger
	store                    Store
	scanInterval             time.Duration
	maxRecords               int64
	isAggregated             bool
	shardClosedHandler       ShardClosedHandler
}

// ScanFunc is the type of the function called for each message read
// from the stream. The record argument contains the original record
// returned from the AWS Kinesis library.
// If an error is returned, scanning stops. The sole exception is when the
// function returns the special value ErrSkipCheckpoint, which continues
// the scan without checkpointing the record.
type ScanFunc func(*Record) error

// ErrSkipCheckpoint is used as a return value from ScanFunc to indicate that
// the current checkpoint should be skipped. It is not returned
// as an error by any function.
var ErrSkipCheckpoint = errors.New("skip checkpoint")
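
// For example, a ScanFunc that processes non-empty records and skips
// checkpointing everything else (process is a hypothetical application
// handler):
//
//	fn := func(r *consumer.Record) error {
//		if len(r.Data) == 0 {
//			return consumer.ErrSkipCheckpoint // keep scanning, skip the checkpoint
//		}
//		return process(r)
//	}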

// Scan launches a goroutine to process each of the shards in the stream. The ScanFunc
// is passed through to each of the goroutines and called with each message pulled from
// the stream.
func (c *Consumer) Scan(ctx context.Context, fn ScanFunc) error {
	ctx, cancel := context.WithCancel(ctx)
	defer cancel()

	var (
		errC   = make(chan error, 1)
		shardC = make(chan types.Shard, 1)
	)

	go func() {
		err := c.group.Start(ctx, shardC)
		if err != nil {
			errC <- fmt.Errorf("error starting scan: %w", err)
			cancel()
		}
		<-ctx.Done()
		close(shardC)
	}()

	wg := new(sync.WaitGroup)
	// process each of the shards
	s := newShardsInProcess()
	for shard := range shardC {
		shardID := aws.ToString(shard.ShardId)
		if s.doesShardExist(shardID) {
			// safety net: the shard is already being processed by another
			// goroutine, so skip this delivery
			continue
		}
		// mark the shard as in process before launching the goroutine so the
		// same shard cannot be picked up twice
		s.addShard(shardID)
		wg.Add(1)
		go func(shardID string) {
			defer wg.Done()
			defer s.deleteShard(shardID)

			var err error
			if err = c.ScanShard(ctx, shardID, fn); err != nil {
				err = fmt.Errorf("shard %s error: %w", shardID, err)
			} else if closeable, ok := c.group.(CloseableGroup); ok {
				// the group supports closure; record that the shard is done
				if err = closeable.CloseShard(ctx, shardID); err != nil {
					err = fmt.Errorf("shard %s close error: %w", shardID, err)
				}
			}
			if err != nil {
				select {
				case errC <- err:
					cancel()
				default:
				}
			}
		}(shardID)
	}

	go func() {
		wg.Wait()
		close(errC)
	}()

	return <-errC
}

// ScanShard loops over records on a specific shard, calls the callback func
// for each record and checkpoints the progress of scan.
func (c *Consumer) ScanShard(ctx context.Context, shardID string, fn ScanFunc) error {
	// get last seq number from checkpoint
	lastSeqNum, err := c.group.GetCheckpoint(c.streamName, shardID)
	if err != nil {
		return fmt.Errorf("get checkpoint error: %w", err)
	}

	// get shard iterator
	shardIterator, err := c.getShardIterator(ctx, c.streamName, shardID, lastSeqNum)
	if err != nil {
		return fmt.Errorf("get shard iterator error: %w", err)
	}

	c.logger.Log("[CONSUMER] start scan:", shardID, lastSeqNum)
	defer func() {
		c.logger.Log("[CONSUMER] stop scan:", shardID)
	}()

	scanTicker := time.NewTicker(c.scanInterval)
	defer scanTicker.Stop()

	for {
		resp, err := c.client.GetRecords(ctx, &kinesis.GetRecordsInput{
			Limit:         aws.Int32(int32(c.maxRecords)),
			ShardIterator: shardIterator,
		})

		// attempt to recover from GetRecords error by refreshing the iterator
		if err != nil {
			c.logger.Log("[CONSUMER] get records error:", err.Error())

			if !isRetriableError(err) {
				return fmt.Errorf("get records error: %w", err)
			}

			shardIterator, err = c.getShardIterator(ctx, c.streamName, shardID, lastSeqNum)
			if err != nil {
				return fmt.Errorf("get shard iterator error: %w", err)
			}
		} else {
			// deaggregate records when the producer aggregated them (KPL)
			var records []types.Record
			if c.isAggregated {
				records, err = deaggregateRecords(resp.Records)
				if err != nil {
					return err
				}
			} else {
				records = resp.Records
			}

			// loop over records, call callback func
			for _, r := range records {
				select {
				case <-ctx.Done():
					return nil
				default:
					err := fn(&Record{r, shardID, resp.MillisBehindLatest})
					if err != nil && !errors.Is(err, ErrSkipCheckpoint) {
						return err
					}

					// honor ErrSkipCheckpoint: advance without storing a checkpoint
					if !errors.Is(err, ErrSkipCheckpoint) {
						if err := c.group.SetCheckpoint(c.streamName, shardID, *r.SequenceNumber); err != nil {
							return err
						}
					}

					c.counter.Add("records", 1)
					lastSeqNum = *r.SequenceNumber
				}
			}

			if isShardClosed(resp.NextShardIterator, shardIterator) {
				c.logger.Log("[CONSUMER] shard closed:", shardID)

				if c.shardClosedHandler != nil {
					if err := c.shardClosedHandler(c.streamName, shardID); err != nil {
						return fmt.Errorf("shard closed handler error: %w", err)
					}
				}
				return nil
			}

			shardIterator = resp.NextShardIterator
		}

		// wait for next scan
		select {
		case <-ctx.Done():
			return nil
		case <-scanTicker.C:
			continue
		}
	}
}

// deaggregateRecords is a temporary conversion func:
// []types.Record -> DeaggregateRecords([]*types.Record) -> []types.Record
func deaggregateRecords(in []types.Record) ([]types.Record, error) {
	var recs []*types.Record
	for i := range in {
		// take the address of the slice element, not the loop variable,
		// so each pointer refers to a distinct record
		recs = append(recs, &in[i])
	}

	deagg, err := deaggregator.DeaggregateRecords(recs)
	if err != nil {
		return nil, err
	}

	var out []types.Record
	for _, rec := range deagg {
		out = append(out, *rec)
	}
	return out, nil
}

// getShardIterator returns an iterator for the shard, resuming after the
// checkpointed sequence number when one exists and otherwise falling back
// to the configured timestamp or initial iterator type.
func (c *Consumer) getShardIterator(ctx context.Context, streamName, shardID, seqNum string) (*string, error) {
	params := &kinesis.GetShardIteratorInput{
		ShardId:    aws.String(shardID),
		StreamName: aws.String(streamName),
	}

	if seqNum != "" {
		params.ShardIteratorType = types.ShardIteratorTypeAfterSequenceNumber
		params.StartingSequenceNumber = aws.String(seqNum)
	} else if c.initialTimestamp != nil {
		params.ShardIteratorType = types.ShardIteratorTypeAtTimestamp
		params.Timestamp = c.initialTimestamp
	} else {
		params.ShardIteratorType = c.initialShardIteratorType
	}

	res, err := c.client.GetShardIterator(ctx, params)
	if err != nil {
		return nil, err
	}
	return res.ShardIterator, nil
}

// isRetriableError reports whether scanning should continue after a
// GetRecords error: an expired iterator can be refreshed, and a
// throughput exception clears once the shard's read capacity recovers.
func isRetriableError(err error) bool {
	if oe := (*types.ExpiredIteratorException)(nil); errors.As(err, &oe) {
		return true
	}
	if oe := (*types.ProvisionedThroughputExceededException)(nil); errors.As(err, &oe) {
		return true
	}
	return false
}
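
// The check could plausibly be broadened; for example, treating KMS
// throttling on an encrypted stream as retriable (an assumption, not
// current behavior of this package):
//
//	if oe := (*types.KMSThrottlingException)(nil); errors.As(err, &oe) {
//		return true
//	}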

// isShardClosed reports whether the shard has been closed (e.g. after a
// reshard): Kinesis returns a nil NextShardIterator once a closed shard's
// records are exhausted.
func isShardClosed(nextShardIterator, currentShardIterator *string) bool {
	return nextShardIterator == nil || currentShardIterator == nextShardIterator
}

// shards tracks which shard ids currently have a scan goroutine running,
// guarding against processing the same shard twice.
type shards struct {
	shardsInProcess sync.Map
}

func newShardsInProcess() *shards {
	return &shards{}
}

func (s *shards) addShard(shardID string) {
	s.shardsInProcess.Store(shardID, struct{}{})
}

func (s *shards) doesShardExist(shardID string) bool {
	_, ok := s.shardsInProcess.Load(shardID)
	return ok
}

func (s *shards) deleteShard(shardID string) {
	s.shardsInProcess.Delete(shardID)
}