kinesis-consumer/consumer.go

145 lines
3 KiB
Go
Raw Normal View History

package connector
import (
"os"
"github.com/apex/log"
"github.com/apex/log/handlers/text"
"github.com/aws/aws-sdk-go/aws"
"github.com/aws/aws-sdk-go/aws/session"
"github.com/aws/aws-sdk-go/service/kinesis"
)
// Package-level defaults. They are plain globals, so they are shared by every
// Consumer created in the process.
var (
// maxRecordCount is copied into Buffer.MaxRecordCount when a shard loop starts
// (see handlerLoop) and can be overridden with Consumer.Set("maxRecordCount", n).
maxRecordCount = 1000
// maxBufferTime is not referenced by any code visible in this part of the file.
// NOTE(review): presumably a duration string intended for time-based
// flushing — confirm it is used elsewhere or remove it.
maxBufferTime = "30s"
)
// NewConsumer creates a new kinesis connection and returns a
// new consumer initialized with app and stream name
func NewConsumer(appName, streamName string) *Consumer {
log.SetHandler(text.New(os.Stderr))
svc := kinesis.New(
session.New(
aws.NewConfig().WithMaxRetries(10),
),
2016-05-01 00:04:44 +00:00
)
return &Consumer{
appName: appName,
streamName: streamName,
svc: svc,
}
}
// Consumer reads records from every shard of a single Kinesis stream on behalf
// of one named application. Create it with NewConsumer.
type Consumer struct {
	// appName and streamName are attached to log entries and passed to the
	// Checkpoint created for each shard loop.
	appName, streamName string

	// svc is the Kinesis API client used for all stream calls.
	svc *kinesis.Kinesis
}
// Set assigns value to the configuration option named by option.
//
// The only recognised option is "maxRecordCount"; its value must be an int
// (any other dynamic type makes the type assertion panic). The setting is
// stored in a package-level variable, so it applies to every Consumer in the
// process, not only to c.
//
// An unrecognised option name is logged as an error and terminates the
// process with exit status 1.
func (c *Consumer) Set(option string, value interface{}) {
	if option == "maxRecordCount" {
		maxRecordCount = value.(int)
	} else {
		log.Error("invalid option")
		os.Exit(1)
	}
}
// SetLogHandler lets callers override the log handler.
//
// It forwards handler to the package-level log.SetHandler; the receiver is not
// used, so the change is not scoped to this Consumer instance.
func (c *Consumer) SetLogHandler(handler log.Handler) {
log.SetHandler(handler)
}
2016-05-01 00:04:44 +00:00
// Start takes a handler and then loops over each of the shards
// processing each one with the handler.
func (c *Consumer) Start(handler Handler) {
2016-05-01 00:04:44 +00:00
resp, err := c.svc.DescribeStream(
&kinesis.DescribeStreamInput{
StreamName: aws.String(c.streamName),
},
)
if err != nil {
log.WithError(err).Error("DescribeStream")
os.Exit(1)
}
for _, shard := range resp.StreamDescription.Shards {
go c.handlerLoop(*shard.ShardId, handler)
}
}
func (c *Consumer) handlerLoop(shardID string, handler Handler) {
ctx := log.WithFields(log.Fields{
"app": c.appName,
"stream": c.streamName,
"shard": shardID,
})
buf := &Buffer{
MaxRecordCount: maxRecordCount,
}
checkpoint := &Checkpoint{
AppName: c.appName,
StreamName: c.streamName,
}
params := &kinesis.GetShardIteratorInput{
ShardId: aws.String(shardID),
StreamName: aws.String(c.streamName),
}
if checkpoint.CheckpointExists(shardID) {
params.ShardIteratorType = aws.String("AFTER_SEQUENCE_NUMBER")
params.StartingSequenceNumber = aws.String(checkpoint.SequenceNumber())
} else {
params.ShardIteratorType = aws.String("TRIM_HORIZON")
}
resp, err := c.svc.GetShardIterator(params)
if err != nil {
ctx.WithError(err).Error("getShardIterator")
os.Exit(1)
}
shardIterator := resp.ShardIterator
ctx.Info("processing")
for {
resp, err := c.svc.GetRecords(
&kinesis.GetRecordsInput{
ShardIterator: shardIterator,
},
)
if err != nil {
ctx.WithError(err).Error("getRecords")
2016-05-01 00:04:44 +00:00
os.Exit(1)
}
if len(resp.Records) > 0 {
for _, r := range resp.Records {
buf.AddRecord(r)
if buf.ShouldFlush() {
handler.HandleRecords(*buf)
ctx.WithField("count", buf.RecordCount()).Info("emitted")
checkpoint.SetCheckpoint(shardID, buf.LastSeq())
buf.Flush()
2016-02-08 21:21:54 +00:00
}
}
} else if resp.NextShardIterator == aws.String("") || shardIterator == resp.NextShardIterator {
ctx.Error("nextShardIterator")
os.Exit(1)
}
shardIterator = resp.NextShardIterator
}
}