Users of this library can now cache the checkpointer object

This commit is contained in:
Xavi Ramirez 2017-05-19 22:01:57 +00:00
parent 8da04c944f
commit 17cfe98efa
2 changed files with 28 additions and 26 deletions

View file

@ -10,6 +10,7 @@ import (
) )
type SampleRecordProcessor struct { type SampleRecordProcessor struct {
checkpointer *kcl.Checkpointer
sleepDuration time.Duration sleepDuration time.Duration
checkpointRetries int checkpointRetries int
checkpointFreq time.Duration checkpointFreq time.Duration
@ -26,14 +27,15 @@ func New() *SampleRecordProcessor {
} }
} }
func (srp *SampleRecordProcessor) Initialize(shardID string) error { func (srp *SampleRecordProcessor) Initialize(shardID string, checkpointer *kcl.Checkpointer) error {
srp.lastCheckpoint = time.Now() srp.lastCheckpoint = time.Now()
srp.checkpointer = checkpointer
return nil return nil
} }
func (srp *SampleRecordProcessor) checkpoint(checkpointer kcl.Checkpointer, sequenceNumber *string, subSequenceNumber *int) { func (srp *SampleRecordProcessor) checkpoint(sequenceNumber *string, subSequenceNumber *int) {
for n := -1; n < srp.checkpointRetries; n++ { for n := 0; n < srp.checkpointRetries+1; n++ {
err := checkpointer.Checkpoint(sequenceNumber, subSequenceNumber) err := srp.checkpointer.Checkpoint(sequenceNumber, subSequenceNumber)
if err == nil { if err == nil {
return return
} }
@ -66,7 +68,7 @@ func (srp *SampleRecordProcessor) shouldUpdateSequence(sequenceNumber *big.Int,
(sequenceNumber.Cmp(srp.largestSeq) == 0 && subSequenceNumber > srp.largestSubSeq) (sequenceNumber.Cmp(srp.largestSeq) == 0 && subSequenceNumber > srp.largestSubSeq)
} }
func (srp *SampleRecordProcessor) ProcessRecords(records []kcl.Record, checkpointer kcl.Checkpointer) error { func (srp *SampleRecordProcessor) ProcessRecords(records []kcl.Record) error {
for _, record := range records { for _, record := range records {
seqNumber := new(big.Int) seqNumber := new(big.Int)
if _, ok := seqNumber.SetString(record.SequenceNumber, 10); !ok { if _, ok := seqNumber.SetString(record.SequenceNumber, 10); !ok {
@ -80,16 +82,16 @@ func (srp *SampleRecordProcessor) ProcessRecords(records []kcl.Record, checkpoin
} }
if time.Now().Sub(srp.lastCheckpoint) > srp.checkpointFreq { if time.Now().Sub(srp.lastCheckpoint) > srp.checkpointFreq {
largestSeq := srp.largestSeq.String() largestSeq := srp.largestSeq.String()
srp.checkpoint(checkpointer, &largestSeq, &srp.largestSubSeq) srp.checkpoint(&largestSeq, &srp.largestSubSeq)
srp.lastCheckpoint = time.Now() srp.lastCheckpoint = time.Now()
} }
return nil return nil
} }
func (srp *SampleRecordProcessor) Shutdown(checkpointer kcl.Checkpointer, reason string) error { func (srp *SampleRecordProcessor) Shutdown(reason string) error {
if reason == "TERMINATE" { if reason == "TERMINATE" {
fmt.Fprintf(os.Stderr, "Was told to terminate, will attempt to checkpoint.\n") fmt.Fprintf(os.Stderr, "Was told to terminate, will attempt to checkpoint.\n")
srp.checkpoint(checkpointer, nil, nil) srp.checkpoint(nil, nil)
} else { } else {
fmt.Fprintf(os.Stderr, "Shutting down due to failover. Will not checkpoint.\n") fmt.Fprintf(os.Stderr, "Shutting down due to failover. Will not checkpoint.\n")
} }

View file

@ -9,16 +9,24 @@ import (
) )
type RecordProcessor interface { type RecordProcessor interface {
Initialize(shardID string) error Initialize(shardID string, checkpointer *Checkpointer) error
ProcessRecords(records []Record, checkpointer Checkpointer) error ProcessRecords(records []Record) error
Shutdown(checkpointer Checkpointer, reason string) error Shutdown(reason string) error
}
type CheckpointError struct {
e string
}
func (ce CheckpointError) Error() string {
return ce.e
} }
type Checkpointer struct { type Checkpointer struct {
ioHandler ioHandler ioHandler ioHandler
} }
func (c Checkpointer) getAction() (interface{}, error) { func (c *Checkpointer) getAction() (interface{}, error) {
line, err := c.ioHandler.readLine() line, err := c.ioHandler.readLine()
if err != nil { if err != nil {
return nil, err return nil, err
@ -30,15 +38,7 @@ func (c Checkpointer) getAction() (interface{}, error) {
return action, nil return action, nil
} }
type CheckpointError struct { func (c *Checkpointer) Checkpoint(sequenceNumber *string, subSequenceNumber *int) error {
e string
}
func (ce CheckpointError) Error() string {
return ce.e
}
func (c Checkpointer) Checkpoint(sequenceNumber *string, subSequenceNumber *int) error {
c.ioHandler.writeAction(ActionCheckpoint{ c.ioHandler.writeAction(ActionCheckpoint{
Action: "checkpoint", Action: "checkpoint",
SequenceNumber: sequenceNumber, SequenceNumber: sequenceNumber,
@ -178,7 +178,7 @@ func New(inputFile io.Reader, outputFile, errorFile io.Writer, recordProcessor R
} }
return &KCLProcess{ return &KCLProcess{
ioHandler: i, ioHandler: i,
checkpointer: Checkpointer{ checkpointer: &Checkpointer{
ioHandler: i, ioHandler: i,
}, },
recordProcessor: recordProcessor, recordProcessor: recordProcessor,
@ -187,7 +187,7 @@ func New(inputFile io.Reader, outputFile, errorFile io.Writer, recordProcessor R
type KCLProcess struct { type KCLProcess struct {
ioHandler ioHandler ioHandler ioHandler
checkpointer Checkpointer checkpointer *Checkpointer
recordProcessor RecordProcessor recordProcessor RecordProcessor
} }
@ -204,11 +204,11 @@ func (kclp *KCLProcess) reportDone(responseFor string) error {
func (kclp *KCLProcess) performAction(a interface{}) (string, error) { func (kclp *KCLProcess) performAction(a interface{}) (string, error) {
switch action := a.(type) { switch action := a.(type) {
case ActionInitialize: case ActionInitialize:
return action.Action, kclp.recordProcessor.Initialize(action.ShardID) return action.Action, kclp.recordProcessor.Initialize(action.ShardID, kclp.checkpointer)
case ActionProcessRecords: case ActionProcessRecords:
return action.Action, kclp.recordProcessor.ProcessRecords(action.Records, kclp.checkpointer) return action.Action, kclp.recordProcessor.ProcessRecords(action.Records)
case ActionShutdown: case ActionShutdown:
return action.Action, kclp.recordProcessor.Shutdown(kclp.checkpointer, action.Reason) return action.Action, kclp.recordProcessor.Shutdown(action.Reason)
default: default:
return "", fmt.Errorf("unknown action to dispatch: %s", action) return "", fmt.Errorf("unknown action to dispatch: %s", action)
} }