Skip to content

Commit

Permalink
fixes #247: implement msg id function as pubsub option
Browse files Browse the repository at this point in the history
  • Loading branch information
protolambda committed Dec 16, 2019
1 parent 7269e41 commit 7981f9b
Show file tree
Hide file tree
Showing 6 changed files with 43 additions and 15 deletions.
2 changes: 2 additions & 0 deletions gossipsub.go
Original file line number Diff line number Diff line change
Expand Up @@ -75,6 +75,8 @@ func (gs *GossipSubRouter) Protocols() []protocol.ID {
func (gs *GossipSubRouter) Attach(p *PubSub) {
gs.p = p
gs.tracer = p.tracer
// start using the same msg ID function as PubSub for caching messages.
gs.mcache.ChangeMsgIdFn(p.msgID)
go gs.heartbeatTimer()
}

Expand Down
8 changes: 7 additions & 1 deletion mcache.go
Original file line number Diff line number Diff line change
Expand Up @@ -28,13 +28,19 @@ func NewMessageCache(gossip, history int) *MessageCache {
msgs: make(map[string]*pb.Message),
history: make([][]CacheEntry, history),
gossip: gossip,
msgID: DefaultMsgIdFn,
}
}

type MessageCache struct {
msgs map[string]*pb.Message
history [][]CacheEntry
gossip int
msgID MsgIdFunction
}

func (mc *MessageCache) ChangeMsgIdFn(msgID MsgIdFunction) {
mc.msgID = msgID
}

type CacheEntry struct {
Expand All @@ -43,7 +49,7 @@ type CacheEntry struct {
}

func (mc *MessageCache) Put(msg *pb.Message) {
mid := msgID(msg)
mid := mc.msgID(msg)
mc.msgs[mid] = msg
mc.history[0] = append(mc.history[0], CacheEntry{mid: mid, topics: msg.GetTopicIDs()})
}
Expand Down
1 change: 1 addition & 0 deletions mcache_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,7 @@ import (

func TestMessageCache(t *testing.T) {
mcache := NewMessageCache(3, 5)
msgID := DefaultMsgIdFn

msgs := make([]*pb.Message, 60)
for i := range msgs {
Expand Down
26 changes: 22 additions & 4 deletions pubsub.go
Original file line number Diff line number Diff line change
Expand Up @@ -117,6 +117,9 @@ type PubSub struct {
seenMessagesMx sync.Mutex
seenMessages *timecache.TimeCache

// function used to compute the ID for a message
msgID MsgIdFunction

// key for signing messages; nil when signing is disabled (default for now)
signKey crypto.PrivKey
// source ID for signed messages; corresponds to signKey
Expand Down Expand Up @@ -208,6 +211,7 @@ func NewPubSub(ctx context.Context, h host.Host, rt PubSubRouter, opts ...Option
blacklist: NewMapBlacklist(),
blacklistPeer: make(chan peer.ID),
seenMessages: timecache.NewTimeCache(TimeCacheDuration),
msgID: DefaultMsgIdFn,
counter: uint64(time.Now().UnixNano()),
}

Expand Down Expand Up @@ -240,6 +244,20 @@ func NewPubSub(ctx context.Context, h host.Host, rt PubSubRouter, opts ...Option
return ps, nil
}

// MsgIdFunction returns a unique ID for the passed Message, and PubSub can be customized to use any
// implementation of this function by configuring it with the Option from WithMessageIdFn.
type MsgIdFunction func(pmsg *pb.Message) string

// WithMessageIdFn is an option to customize the way a message ID is computed for a pubsub message.
// The default ID function is DefaultMsgIdFn (concatenate source and seq nr.),
// but it can be customized to e.g. the hash of the message.
func WithMessageIdFn(fn MsgIdFunction) Option {
return func(p *PubSub) error {
p.msgID = fn
return nil
}
}

// WithPeerOutboundQueueSize is an option to set the buffer size for outbound messages to a peer
// We start dropping messages to a peer if the outbound queue if full
func WithPeerOutboundQueueSize(size int) Option {
Expand Down Expand Up @@ -326,7 +344,7 @@ func WithDiscovery(d discovery.Discovery, opts ...DiscoverOpt) Option {
// WithEventTracer provides a tracer for the pubsub system
func WithEventTracer(tracer EventTracer) Option {
return func(p *PubSub) error {
p.tracer = &pubsubTracer{tracer: tracer, pid: p.host.ID()}
p.tracer = &pubsubTracer{tracer: tracer, pid: p.host.ID(), msgID: p.msgID}
return nil
}
}
Expand Down Expand Up @@ -730,8 +748,8 @@ func (p *PubSub) handleIncomingRPC(rpc *RPC) {
p.rt.HandleRPC(rpc)
}

// msgID returns a unique ID of the passed Message
func msgID(pmsg *pb.Message) string {
// DefaultMsgIdFn returns a unique ID of the passed Message
func DefaultMsgIdFn(pmsg *pb.Message) string {
return string(pmsg.GetFrom()) + string(pmsg.GetSeqno())
}

Expand Down Expand Up @@ -760,7 +778,7 @@ func (p *PubSub) pushMsg(msg *Message) {
}

// have we already seen and validated this message?
id := msgID(msg.Message)
id := p.msgID(msg.Message)
if p.seenMessage(id) {
p.tracer.DuplicateMessage(msg)
return
Expand Down
19 changes: 10 additions & 9 deletions trace.go
Original file line number Diff line number Diff line change
Expand Up @@ -18,6 +18,7 @@ type EventTracer interface {
type pubsubTracer struct {
tracer EventTracer
pid peer.ID
msgID MsgIdFunction
}

func (t *pubsubTracer) PublishMessage(msg *Message) {
Expand All @@ -31,7 +32,7 @@ func (t *pubsubTracer) PublishMessage(msg *Message) {
PeerID: []byte(t.pid),
Timestamp: &now,
PublishMessage: &pb.TraceEvent_PublishMessage{
MessageID: []byte(msgID(msg.Message)),
MessageID: []byte(t.msgID(msg.Message)),
Topics: msg.Message.TopicIDs,
},
}
Expand All @@ -50,7 +51,7 @@ func (t *pubsubTracer) RejectMessage(msg *Message, reason string) {
PeerID: []byte(t.pid),
Timestamp: &now,
RejectMessage: &pb.TraceEvent_RejectMessage{
MessageID: []byte(msgID(msg.Message)),
MessageID: []byte(t.msgID(msg.Message)),
ReceivedFrom: []byte(msg.ReceivedFrom),
Reason: &reason,
},
Expand All @@ -70,7 +71,7 @@ func (t *pubsubTracer) DuplicateMessage(msg *Message) {
PeerID: []byte(t.pid),
Timestamp: &now,
DuplicateMessage: &pb.TraceEvent_DuplicateMessage{
MessageID: []byte(msgID(msg.Message)),
MessageID: []byte(t.msgID(msg.Message)),
ReceivedFrom: []byte(msg.ReceivedFrom),
},
}
Expand All @@ -89,7 +90,7 @@ func (t *pubsubTracer) DeliverMessage(msg *Message) {
PeerID: []byte(t.pid),
Timestamp: &now,
DeliverMessage: &pb.TraceEvent_DeliverMessage{
MessageID: []byte(msgID(msg.Message)),
MessageID: []byte(t.msgID(msg.Message)),
},
}

Expand Down Expand Up @@ -146,7 +147,7 @@ func (t *pubsubTracer) RecvRPC(rpc *RPC) {
Timestamp: &now,
RecvRPC: &pb.TraceEvent_RecvRPC{
ReceivedFrom: []byte(rpc.from),
Meta: traceRPCMeta(rpc),
Meta: t.traceRPCMeta(rpc),
},
}

Expand All @@ -165,7 +166,7 @@ func (t *pubsubTracer) SendRPC(rpc *RPC, p peer.ID) {
Timestamp: &now,
SendRPC: &pb.TraceEvent_SendRPC{
SendTo: []byte(rpc.from),
Meta: traceRPCMeta(rpc),
Meta: t.traceRPCMeta(rpc),
},
}

Expand All @@ -184,20 +185,20 @@ func (t *pubsubTracer) DropRPC(rpc *RPC, p peer.ID) {
Timestamp: &now,
DropRPC: &pb.TraceEvent_DropRPC{
SendTo: []byte(rpc.from),
Meta: traceRPCMeta(rpc),
Meta: t.traceRPCMeta(rpc),
},
}

t.tracer.Trace(evt)
}

func traceRPCMeta(rpc *RPC) *pb.TraceEvent_RPCMeta {
func (t *pubsubTracer) traceRPCMeta(rpc *RPC) *pb.TraceEvent_RPCMeta {
rpcMeta := new(pb.TraceEvent_RPCMeta)

var msgs []*pb.TraceEvent_MessageMeta
for _, m := range rpc.Publish {
msgs = append(msgs, &pb.TraceEvent_MessageMeta{
MessageID: []byte(msgID(m)),
MessageID: []byte(t.msgID(m)),
Topics: m.TopicIDs,
})
}
Expand Down
2 changes: 1 addition & 1 deletion validation.go
Original file line number Diff line number Diff line change
Expand Up @@ -201,7 +201,7 @@ func (v *validation) validate(vals []*topicVal, src peer.ID, msg *Message) {

// we can mark the message as seen now that we have verified the signature
// and avoid invoking user validators more than once
id := msgID(msg.Message)
id := v.p.msgID(msg.Message)
if !v.p.markSeen(id) {
v.tracer.DuplicateMessage(msg)
return
Expand Down

0 comments on commit 7981f9b

Please sign in to comment.