mirror of
https://github.com/seaweedfs/seaweedfs.git
synced 2024-01-19 02:48:24 +00:00
add message pipeline
This commit is contained in:
parent
15b6c7a6f0
commit
600d2f92a4
|
@ -80,12 +80,12 @@ func (p *PublishStreamProcessor) doFlush(stream mq_pb.SeaweedMessaging_PublishMe
|
||||||
}
|
}
|
||||||
|
|
||||||
builder := <-p.builders
|
builder := <-p.builders
|
||||||
bb := segment.NewMessageBatchBuilder(builder, p.ProducerId, p.ProducerEpoch, 3, 4)
|
bb := segment.NewMessageBatchBuilder(builder)
|
||||||
for _, m := range messages {
|
for _, m := range messages {
|
||||||
bb.AddMessage(p.messagesSequence, m.Ts.UnixNano(), m.Properties, m.Key, m.Content)
|
bb.AddMessage(p.messagesSequence, m.Ts.UnixNano(), m.Properties, m.Key, m.Content)
|
||||||
p.messagesSequence++
|
p.messagesSequence++
|
||||||
}
|
}
|
||||||
bb.BuildMessageBatch()
|
bb.BuildMessageBatch(p.ProducerId, p.ProducerEpoch, 3, 4)
|
||||||
defer func() {
|
defer func() {
|
||||||
p.builders <- builder
|
p.builders <- builder
|
||||||
}()
|
}()
|
||||||
|
|
53
weed/mq/messages/message_buffer.go
Normal file
53
weed/mq/messages/message_buffer.go
Normal file
|
@ -0,0 +1,53 @@
|
||||||
|
package messages
|
||||||
|
|
||||||
|
import (
|
||||||
|
flatbuffers "github.com/google/flatbuffers/go"
|
||||||
|
"github.com/seaweedfs/seaweedfs/weed/mq/segment"
|
||||||
|
)
|
||||||
|
|
||||||
|
type MessageBuffer struct {
|
||||||
|
fbsBuffer *flatbuffers.Builder
|
||||||
|
sequenceBase int64
|
||||||
|
counter int64
|
||||||
|
bb *segment.MessageBatchBuilder
|
||||||
|
isSealed bool
|
||||||
|
}
|
||||||
|
|
||||||
|
func NewMessageBuffer() *MessageBuffer {
|
||||||
|
t := &MessageBuffer{
|
||||||
|
fbsBuffer: flatbuffers.NewBuilder(4 * 1024 * 1024),
|
||||||
|
}
|
||||||
|
t.bb = segment.NewMessageBatchBuilder(t.fbsBuffer)
|
||||||
|
return t
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mb *MessageBuffer) Reset(sequenceBase int64) {
|
||||||
|
mb.sequenceBase = sequenceBase
|
||||||
|
mb.counter = 0
|
||||||
|
mb.bb.Reset()
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mb *MessageBuffer) AddMessage(message *Message) {
|
||||||
|
mb.bb.AddMessage(mb.sequenceBase, message.Ts.UnixMilli(), message.Properties, message.Key, message.Content)
|
||||||
|
mb.sequenceBase++
|
||||||
|
mb.counter++
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mb *MessageBuffer) Len() int {
|
||||||
|
return int(mb.counter)
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mb *MessageBuffer) Seal(producerId int32,
|
||||||
|
producerEpoch int32,
|
||||||
|
segmentId int32,
|
||||||
|
flags int32) {
|
||||||
|
mb.isSealed = true
|
||||||
|
mb.bb.BuildMessageBatch(producerId, producerEpoch, segmentId, flags)
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mb *MessageBuffer) Bytes() []byte {
|
||||||
|
if !mb.isSealed {
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
return mb.bb.GetBytes()
|
||||||
|
}
|
32
weed/mq/messages/message_buffer_mover.go
Normal file
32
weed/mq/messages/message_buffer_mover.go
Normal file
|
@ -0,0 +1,32 @@
|
||||||
|
package messages
|
||||||
|
|
||||||
|
import "fmt"
|
||||||
|
|
||||||
|
type MessageBufferMover interface {
|
||||||
|
Setup()
|
||||||
|
TearDown()
|
||||||
|
MoveBuffer(buffer *MessageBuffer) (MessageBufferReference, error) // should be thread-safe
|
||||||
|
}
|
||||||
|
type MessageBufferReference struct {
|
||||||
|
sequence int64
|
||||||
|
fileId string
|
||||||
|
}
|
||||||
|
|
||||||
|
var _ = MessageBufferMover(&EmptyMover{})
|
||||||
|
|
||||||
|
type EmptyMover struct {
|
||||||
|
}
|
||||||
|
|
||||||
|
func (e EmptyMover) Setup() {
|
||||||
|
}
|
||||||
|
|
||||||
|
func (e EmptyMover) TearDown() {
|
||||||
|
}
|
||||||
|
|
||||||
|
func (e EmptyMover) MoveBuffer(buffer *MessageBuffer) (MessageBufferReference, error) {
|
||||||
|
println("moving", buffer.sequenceBase)
|
||||||
|
return MessageBufferReference{
|
||||||
|
sequence: buffer.sequenceBase,
|
||||||
|
fileId: fmt.Sprintf("buffer %d", buffer.sequenceBase),
|
||||||
|
}, nil
|
||||||
|
}
|
161
weed/mq/messages/message_pipeline.go
Normal file
161
weed/mq/messages/message_pipeline.go
Normal file
|
@ -0,0 +1,161 @@
|
||||||
|
package messages
|
||||||
|
|
||||||
|
import (
|
||||||
|
"github.com/seaweedfs/seaweedfs/weed/util"
|
||||||
|
"google.golang.org/grpc"
|
||||||
|
"log"
|
||||||
|
"sync"
|
||||||
|
"sync/atomic"
|
||||||
|
"time"
|
||||||
|
)
|
||||||
|
|
||||||
|
type OnMessageFunc func(message *Message)
|
||||||
|
|
||||||
|
type MessagePipeline struct {
|
||||||
|
// atomic status
|
||||||
|
atomicPipelineStatus int64 // -1: stop
|
||||||
|
|
||||||
|
// attributes
|
||||||
|
ProducerId int32
|
||||||
|
ProducerEpoch int32
|
||||||
|
grpcDialOption grpc.DialOption
|
||||||
|
|
||||||
|
emptyBuffersChan chan *MessageBuffer
|
||||||
|
sealedBuffersChan chan *MessageBuffer
|
||||||
|
movedBuffersChan chan MessageBufferReference
|
||||||
|
onMessageFn OnMessageFunc
|
||||||
|
mover MessageBufferMover
|
||||||
|
moverPool *util.LimitedConcurrentExecutor
|
||||||
|
|
||||||
|
// control pipeline
|
||||||
|
doneChan chan struct{}
|
||||||
|
batchSize int
|
||||||
|
timeout time.Duration
|
||||||
|
|
||||||
|
incomingMessageLock sync.Mutex
|
||||||
|
incomingMessageBuffer *MessageBuffer
|
||||||
|
|
||||||
|
messageSequence int64
|
||||||
|
}
|
||||||
|
|
||||||
|
func NewMessagePipeline(producerId int32, workerCount int, batchSize int, timeout time.Duration, mover MessageBufferMover) *MessagePipeline {
|
||||||
|
t := &MessagePipeline{
|
||||||
|
ProducerId: producerId,
|
||||||
|
emptyBuffersChan: make(chan *MessageBuffer, workerCount),
|
||||||
|
sealedBuffersChan: make(chan *MessageBuffer, workerCount),
|
||||||
|
movedBuffersChan: make(chan MessageBufferReference, workerCount),
|
||||||
|
doneChan: make(chan struct{}),
|
||||||
|
batchSize: batchSize,
|
||||||
|
timeout: timeout,
|
||||||
|
moverPool: util.NewLimitedConcurrentExecutor(workerCount),
|
||||||
|
mover: mover,
|
||||||
|
}
|
||||||
|
go t.doLoopUpload()
|
||||||
|
return t
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mp *MessagePipeline) OutputChan() chan MessageBufferReference {
|
||||||
|
return mp.movedBuffersChan
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mp *MessagePipeline) AddMessage(message *Message) {
|
||||||
|
mp.incomingMessageLock.Lock()
|
||||||
|
defer mp.incomingMessageLock.Unlock()
|
||||||
|
|
||||||
|
// get existing message buffer or create a new one
|
||||||
|
if mp.incomingMessageBuffer == nil {
|
||||||
|
select {
|
||||||
|
case mp.incomingMessageBuffer = <-mp.emptyBuffersChan:
|
||||||
|
default:
|
||||||
|
mp.incomingMessageBuffer = NewMessageBuffer()
|
||||||
|
}
|
||||||
|
mp.incomingMessageBuffer.Reset(mp.messageSequence)
|
||||||
|
}
|
||||||
|
|
||||||
|
// add one message
|
||||||
|
mp.incomingMessageBuffer.AddMessage(message)
|
||||||
|
mp.messageSequence++
|
||||||
|
|
||||||
|
// seal the message buffer if full
|
||||||
|
if mp.incomingMessageBuffer.Len() >= mp.batchSize {
|
||||||
|
mp.incomingMessageBuffer.Seal(mp.ProducerId, mp.ProducerEpoch, 0, 0)
|
||||||
|
mp.sealedBuffersChan <- mp.incomingMessageBuffer
|
||||||
|
mp.incomingMessageBuffer = nil
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mp *MessagePipeline) doLoopUpload() {
|
||||||
|
|
||||||
|
mp.mover.Setup()
|
||||||
|
defer mp.mover.TearDown()
|
||||||
|
|
||||||
|
ticker := time.NewTicker(mp.timeout)
|
||||||
|
for {
|
||||||
|
status := atomic.LoadInt64(&mp.atomicPipelineStatus)
|
||||||
|
if status == -100 {
|
||||||
|
return
|
||||||
|
} else if status == -1 {
|
||||||
|
// entering shutting down mode
|
||||||
|
atomic.StoreInt64(&mp.atomicPipelineStatus, -2)
|
||||||
|
mp.incomingMessageLock.Lock()
|
||||||
|
mp.doFlushIncomingMessages()
|
||||||
|
mp.incomingMessageLock.Unlock()
|
||||||
|
}
|
||||||
|
|
||||||
|
select {
|
||||||
|
case messageBuffer := <-mp.sealedBuffersChan:
|
||||||
|
ticker.Reset(mp.timeout)
|
||||||
|
mp.moverPool.Execute(func() {
|
||||||
|
util.RetryForever("message mover", func() error {
|
||||||
|
if messageReference, flushErr := mp.mover.MoveBuffer(messageBuffer); flushErr != nil {
|
||||||
|
return flushErr
|
||||||
|
} else {
|
||||||
|
mp.movedBuffersChan <- messageReference
|
||||||
|
}
|
||||||
|
return nil
|
||||||
|
}, func(err error) (shouldContinue bool) {
|
||||||
|
log.Printf("failed: %v", err)
|
||||||
|
return true
|
||||||
|
})
|
||||||
|
})
|
||||||
|
case <-ticker.C:
|
||||||
|
if atomic.LoadInt64(&mp.atomicPipelineStatus) == -2 {
|
||||||
|
atomic.StoreInt64(&mp.atomicPipelineStatus, -100)
|
||||||
|
return
|
||||||
|
}
|
||||||
|
mp.incomingMessageLock.Lock()
|
||||||
|
mp.doFlushIncomingMessages()
|
||||||
|
mp.incomingMessageLock.Unlock()
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
atomic.StoreInt64(&mp.atomicPipelineStatus, -100)
|
||||||
|
close(mp.movedBuffersChan)
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mp *MessagePipeline) doFlushIncomingMessages() {
|
||||||
|
if mp.incomingMessageBuffer == nil || mp.incomingMessageBuffer.Len() == 0 {
|
||||||
|
return
|
||||||
|
}
|
||||||
|
mp.incomingMessageBuffer.Seal(mp.ProducerId, mp.ProducerEpoch, 0, 0)
|
||||||
|
mp.sealedBuffersChan <- mp.incomingMessageBuffer
|
||||||
|
mp.incomingMessageBuffer = nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mp *MessagePipeline) ShutdownStart() {
|
||||||
|
if atomic.LoadInt64(&mp.atomicPipelineStatus) == 0 {
|
||||||
|
atomic.StoreInt64(&mp.atomicPipelineStatus, -1)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
func (mp *MessagePipeline) ShutdownWait() {
|
||||||
|
for atomic.LoadInt64(&mp.atomicPipelineStatus) != -100 {
|
||||||
|
time.Sleep(331 * time.Millisecond)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func (mp *MessagePipeline) ShutdownImmediate() {
|
||||||
|
if atomic.LoadInt64(&mp.atomicPipelineStatus) == 0 {
|
||||||
|
atomic.StoreInt64(&mp.atomicPipelineStatus, -100)
|
||||||
|
}
|
||||||
|
}
|
29
weed/mq/messages/message_pipeline_test.go
Normal file
29
weed/mq/messages/message_pipeline_test.go
Normal file
|
@ -0,0 +1,29 @@
|
||||||
|
package messages
|
||||||
|
|
||||||
|
import (
|
||||||
|
"testing"
|
||||||
|
"time"
|
||||||
|
)
|
||||||
|
|
||||||
|
func TestAddMessage(t *testing.T) {
|
||||||
|
mp := NewMessagePipeline(0, 3, 10, time.Second, &EmptyMover{})
|
||||||
|
go func() {
|
||||||
|
outChan := mp.OutputChan()
|
||||||
|
for mr := range outChan {
|
||||||
|
println(mr.sequence, mr.fileId)
|
||||||
|
}
|
||||||
|
}()
|
||||||
|
|
||||||
|
for i := 0; i < 100; i++ {
|
||||||
|
message := &Message{
|
||||||
|
Key: []byte("key"),
|
||||||
|
Content: []byte("data"),
|
||||||
|
Properties: nil,
|
||||||
|
Ts: time.Now(),
|
||||||
|
}
|
||||||
|
mp.AddMessage(message)
|
||||||
|
}
|
||||||
|
|
||||||
|
mp.ShutdownStart()
|
||||||
|
mp.ShutdownWait()
|
||||||
|
}
|
|
@ -7,10 +7,6 @@ import (
|
||||||
|
|
||||||
type MessageBatchBuilder struct {
|
type MessageBatchBuilder struct {
|
||||||
b *flatbuffers.Builder
|
b *flatbuffers.Builder
|
||||||
producerId int32
|
|
||||||
producerEpoch int32
|
|
||||||
segmentId int32
|
|
||||||
flags int32
|
|
||||||
messageOffsets []flatbuffers.UOffsetT
|
messageOffsets []flatbuffers.UOffsetT
|
||||||
segmentSeqBase int64
|
segmentSeqBase int64
|
||||||
segmentSeqLast int64
|
segmentSeqLast int64
|
||||||
|
@ -18,23 +14,19 @@ type MessageBatchBuilder struct {
|
||||||
tsMsLast int64
|
tsMsLast int64
|
||||||
}
|
}
|
||||||
|
|
||||||
func NewMessageBatchBuilder(b *flatbuffers.Builder,
|
func NewMessageBatchBuilder(b *flatbuffers.Builder) *MessageBatchBuilder {
|
||||||
producerId int32,
|
|
||||||
producerEpoch int32,
|
|
||||||
segmentId int32,
|
|
||||||
flags int32) *MessageBatchBuilder {
|
|
||||||
|
|
||||||
b.Reset()
|
b.Reset()
|
||||||
|
|
||||||
return &MessageBatchBuilder{
|
return &MessageBatchBuilder{
|
||||||
b: b,
|
b: b,
|
||||||
producerId: producerId,
|
|
||||||
producerEpoch: producerEpoch,
|
|
||||||
segmentId: segmentId,
|
|
||||||
flags: flags,
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func (builder *MessageBatchBuilder) Reset() {
|
||||||
|
builder.b.Reset()
|
||||||
|
}
|
||||||
|
|
||||||
func (builder *MessageBatchBuilder) AddMessage(segmentSeq int64, tsMs int64, properties map[string]string, key []byte, value []byte) {
|
func (builder *MessageBatchBuilder) AddMessage(segmentSeq int64, tsMs int64, properties map[string]string, key []byte, value []byte) {
|
||||||
if builder.segmentSeqBase == 0 {
|
if builder.segmentSeqBase == 0 {
|
||||||
builder.segmentSeqBase = segmentSeq
|
builder.segmentSeqBase = segmentSeq
|
||||||
|
@ -80,7 +72,10 @@ func (builder *MessageBatchBuilder) AddMessage(segmentSeq int64, tsMs int64, pro
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
func (builder *MessageBatchBuilder) BuildMessageBatch() {
|
func (builder *MessageBatchBuilder) BuildMessageBatch(producerId int32,
|
||||||
|
producerEpoch int32,
|
||||||
|
segmentId int32,
|
||||||
|
flags int32) {
|
||||||
message_fbs.MessageBatchStartMessagesVector(builder.b, len(builder.messageOffsets))
|
message_fbs.MessageBatchStartMessagesVector(builder.b, len(builder.messageOffsets))
|
||||||
for i := len(builder.messageOffsets) - 1; i >= 0; i-- {
|
for i := len(builder.messageOffsets) - 1; i >= 0; i-- {
|
||||||
builder.b.PrependUOffsetT(builder.messageOffsets[i])
|
builder.b.PrependUOffsetT(builder.messageOffsets[i])
|
||||||
|
@ -88,10 +83,10 @@ func (builder *MessageBatchBuilder) BuildMessageBatch() {
|
||||||
messagesOffset := builder.b.EndVector(len(builder.messageOffsets))
|
messagesOffset := builder.b.EndVector(len(builder.messageOffsets))
|
||||||
|
|
||||||
message_fbs.MessageBatchStart(builder.b)
|
message_fbs.MessageBatchStart(builder.b)
|
||||||
message_fbs.MessageBatchAddProducerId(builder.b, builder.producerId)
|
message_fbs.MessageBatchAddProducerId(builder.b, producerId)
|
||||||
message_fbs.MessageBatchAddProducerEpoch(builder.b, builder.producerEpoch)
|
message_fbs.MessageBatchAddProducerEpoch(builder.b, producerEpoch)
|
||||||
message_fbs.MessageBatchAddSegmentId(builder.b, builder.segmentId)
|
message_fbs.MessageBatchAddSegmentId(builder.b, segmentId)
|
||||||
message_fbs.MessageBatchAddFlags(builder.b, builder.flags)
|
message_fbs.MessageBatchAddFlags(builder.b, flags)
|
||||||
message_fbs.MessageBatchAddSegmentSeqBase(builder.b, builder.segmentSeqBase)
|
message_fbs.MessageBatchAddSegmentSeqBase(builder.b, builder.segmentSeqBase)
|
||||||
message_fbs.MessageBatchAddSegmentSeqMaxDelta(builder.b, int32(builder.segmentSeqLast-builder.segmentSeqBase))
|
message_fbs.MessageBatchAddSegmentSeqMaxDelta(builder.b, int32(builder.segmentSeqLast-builder.segmentSeqBase))
|
||||||
message_fbs.MessageBatchAddTsMsBase(builder.b, builder.tsMsBase)
|
message_fbs.MessageBatchAddTsMsBase(builder.b, builder.tsMsBase)
|
||||||
|
|
|
@ -14,11 +14,11 @@ func TestMessageSerde(t *testing.T) {
|
||||||
prop["n1"] = "v1"
|
prop["n1"] = "v1"
|
||||||
prop["n2"] = "v2"
|
prop["n2"] = "v2"
|
||||||
|
|
||||||
bb := NewMessageBatchBuilder(b, 1, 2, 3, 4)
|
bb := NewMessageBatchBuilder(b)
|
||||||
|
|
||||||
bb.AddMessage(5, 6, prop, []byte("the primary key"), []byte("body is here"))
|
bb.AddMessage(5, 6, prop, []byte("the primary key"), []byte("body is here"))
|
||||||
|
|
||||||
bb.BuildMessageBatch()
|
bb.BuildMessageBatch(1, 2, 3, 4)
|
||||||
|
|
||||||
buf := bb.GetBytes()
|
buf := bb.GetBytes()
|
||||||
|
|
||||||
|
|
Loading…
Reference in a new issue