123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477 |
- package networkdb
- import (
- "fmt"
- "net"
- "strings"
- "github.com/Sirupsen/logrus"
- "github.com/gogo/protobuf/proto"
- )
- type delegate struct {
- nDB *NetworkDB
- }
- func (d *delegate) NodeMeta(limit int) []byte {
- return []byte{}
- }
- func (nDB *NetworkDB) checkAndGetNode(nEvent *NodeEvent) *node {
- nDB.Lock()
- defer nDB.Unlock()
- for _, nodes := range []map[string]*node{
- nDB.failedNodes,
- nDB.leftNodes,
- nDB.nodes,
- } {
- if n, ok := nodes[nEvent.NodeName]; ok {
- if n.ltime >= nEvent.LTime {
- return nil
- }
- delete(nodes, n.Name)
- return n
- }
- }
- return nil
- }
- func (nDB *NetworkDB) purgeSameNode(n *node) {
- nDB.Lock()
- defer nDB.Unlock()
- prefix := strings.Split(n.Name, "-")[0]
- for _, nodes := range []map[string]*node{
- nDB.failedNodes,
- nDB.leftNodes,
- nDB.nodes,
- } {
- var nodeNames []string
- for name, node := range nodes {
- if strings.HasPrefix(name, prefix) && n.Addr.Equal(node.Addr) {
- nodeNames = append(nodeNames, name)
- }
- }
- for _, name := range nodeNames {
- delete(nodes, name)
- }
- }
- }
- func (nDB *NetworkDB) handleNodeEvent(nEvent *NodeEvent) bool {
- n := nDB.checkAndGetNode(nEvent)
- if n == nil {
- return false
- }
- nDB.purgeSameNode(n)
- n.ltime = nEvent.LTime
- switch nEvent.Type {
- case NodeEventTypeJoin:
- nDB.Lock()
- nDB.nodes[n.Name] = n
- nDB.Unlock()
- return true
- case NodeEventTypeLeave:
- nDB.Lock()
- nDB.leftNodes[n.Name] = n
- nDB.Unlock()
- return true
- }
- return false
- }
- func (nDB *NetworkDB) handleNetworkEvent(nEvent *NetworkEvent) bool {
- var flushEntries bool
- // Update our local clock if the received messages has newer
- // time.
- nDB.networkClock.Witness(nEvent.LTime)
- nDB.Lock()
- defer func() {
- nDB.Unlock()
- // When a node leaves a network on the last task removal cleanup the
- // local entries for this network & node combination. When the tasks
- // on a network are removed we could have missed the gossip updates.
- // Not doing this cleanup can leave stale entries because bulksyncs
- // from the node will no longer include this network state.
- //
- // deleteNodeNetworkEntries takes nDB lock.
- if flushEntries {
- nDB.deleteNodeNetworkEntries(nEvent.NetworkID, nEvent.NodeName)
- }
- }()
- if nEvent.NodeName == nDB.config.NodeName {
- return false
- }
- nodeNetworks, ok := nDB.networks[nEvent.NodeName]
- if !ok {
- // We haven't heard about this node at all. Ignore the leave
- if nEvent.Type == NetworkEventTypeLeave {
- return false
- }
- nodeNetworks = make(map[string]*network)
- nDB.networks[nEvent.NodeName] = nodeNetworks
- }
- if n, ok := nodeNetworks[nEvent.NetworkID]; ok {
- // We have the latest state. Ignore the event
- // since it is stale.
- if n.ltime >= nEvent.LTime {
- return false
- }
- n.ltime = nEvent.LTime
- n.leaving = nEvent.Type == NetworkEventTypeLeave
- if n.leaving {
- n.reapTime = reapInterval
- flushEntries = true
- }
- nDB.addNetworkNode(nEvent.NetworkID, nEvent.NodeName)
- return true
- }
- if nEvent.Type == NetworkEventTypeLeave {
- return false
- }
- // This remote network join is being seen the first time.
- nodeNetworks[nEvent.NetworkID] = &network{
- id: nEvent.NetworkID,
- ltime: nEvent.LTime,
- }
- nDB.addNetworkNode(nEvent.NetworkID, nEvent.NodeName)
- return true
- }
- func (nDB *NetworkDB) handleTableEvent(tEvent *TableEvent) bool {
- // Update our local clock if the received messages has newer
- // time.
- nDB.tableClock.Witness(tEvent.LTime)
- // Ignore the table events for networks that are in the process of going away
- nDB.RLock()
- networks := nDB.networks[nDB.config.NodeName]
- network, ok := networks[tEvent.NetworkID]
- nDB.RUnlock()
- if !ok || network.leaving {
- return true
- }
- e, err := nDB.getEntry(tEvent.TableName, tEvent.NetworkID, tEvent.Key)
- if err != nil && tEvent.Type == TableEventTypeDelete {
- // If it is a delete event and we don't have the entry here nothing to do.
- return false
- }
- if err == nil {
- // We have the latest state. Ignore the event
- // since it is stale.
- if e.ltime >= tEvent.LTime {
- return false
- }
- }
- e = &entry{
- ltime: tEvent.LTime,
- node: tEvent.NodeName,
- value: tEvent.Value,
- deleting: tEvent.Type == TableEventTypeDelete,
- }
- if e.deleting {
- e.reapTime = reapInterval
- }
- nDB.Lock()
- nDB.indexes[byTable].Insert(fmt.Sprintf("/%s/%s/%s", tEvent.TableName, tEvent.NetworkID, tEvent.Key), e)
- nDB.indexes[byNetwork].Insert(fmt.Sprintf("/%s/%s/%s", tEvent.NetworkID, tEvent.TableName, tEvent.Key), e)
- nDB.Unlock()
- var op opType
- switch tEvent.Type {
- case TableEventTypeCreate:
- op = opCreate
- case TableEventTypeUpdate:
- op = opUpdate
- case TableEventTypeDelete:
- op = opDelete
- }
- nDB.broadcaster.Write(makeEvent(op, tEvent.TableName, tEvent.NetworkID, tEvent.Key, tEvent.Value))
- return true
- }
- func (nDB *NetworkDB) handleCompound(buf []byte, isBulkSync bool) {
- // Decode the parts
- parts, err := decodeCompoundMessage(buf)
- if err != nil {
- logrus.Errorf("Failed to decode compound request: %v", err)
- return
- }
- // Handle each message
- for _, part := range parts {
- nDB.handleMessage(part, isBulkSync)
- }
- }
- func (nDB *NetworkDB) handleTableMessage(buf []byte, isBulkSync bool) {
- var tEvent TableEvent
- if err := proto.Unmarshal(buf, &tEvent); err != nil {
- logrus.Errorf("Error decoding table event message: %v", err)
- return
- }
- // Ignore messages that this node generated.
- if tEvent.NodeName == nDB.config.NodeName {
- return
- }
- // Do not rebroadcast a bulk sync
- if rebroadcast := nDB.handleTableEvent(&tEvent); rebroadcast && !isBulkSync {
- var err error
- buf, err = encodeRawMessage(MessageTypeTableEvent, buf)
- if err != nil {
- logrus.Errorf("Error marshalling gossip message for network event rebroadcast: %v", err)
- return
- }
- nDB.RLock()
- n, ok := nDB.networks[nDB.config.NodeName][tEvent.NetworkID]
- nDB.RUnlock()
- if !ok {
- return
- }
- broadcastQ := n.tableBroadcasts
- if broadcastQ == nil {
- return
- }
- broadcastQ.QueueBroadcast(&tableEventMessage{
- msg: buf,
- id: tEvent.NetworkID,
- tname: tEvent.TableName,
- key: tEvent.Key,
- node: nDB.config.NodeName,
- })
- }
- }
- func (nDB *NetworkDB) handleNodeMessage(buf []byte) {
- var nEvent NodeEvent
- if err := proto.Unmarshal(buf, &nEvent); err != nil {
- logrus.Errorf("Error decoding node event message: %v", err)
- return
- }
- if rebroadcast := nDB.handleNodeEvent(&nEvent); rebroadcast {
- var err error
- buf, err = encodeRawMessage(MessageTypeNodeEvent, buf)
- if err != nil {
- logrus.Errorf("Error marshalling gossip message for node event rebroadcast: %v", err)
- return
- }
- nDB.nodeBroadcasts.QueueBroadcast(&nodeEventMessage{
- msg: buf,
- })
- }
- }
- func (nDB *NetworkDB) handleNetworkMessage(buf []byte) {
- var nEvent NetworkEvent
- if err := proto.Unmarshal(buf, &nEvent); err != nil {
- logrus.Errorf("Error decoding network event message: %v", err)
- return
- }
- if rebroadcast := nDB.handleNetworkEvent(&nEvent); rebroadcast {
- var err error
- buf, err = encodeRawMessage(MessageTypeNetworkEvent, buf)
- if err != nil {
- logrus.Errorf("Error marshalling gossip message for network event rebroadcast: %v", err)
- return
- }
- nDB.networkBroadcasts.QueueBroadcast(&networkEventMessage{
- msg: buf,
- id: nEvent.NetworkID,
- node: nEvent.NodeName,
- })
- }
- }
- func (nDB *NetworkDB) handleBulkSync(buf []byte) {
- var bsm BulkSyncMessage
- if err := proto.Unmarshal(buf, &bsm); err != nil {
- logrus.Errorf("Error decoding bulk sync message: %v", err)
- return
- }
- if bsm.LTime > 0 {
- nDB.tableClock.Witness(bsm.LTime)
- }
- nDB.handleMessage(bsm.Payload, true)
- // Don't respond to a bulk sync which was not unsolicited
- if !bsm.Unsolicited {
- nDB.Lock()
- ch, ok := nDB.bulkSyncAckTbl[bsm.NodeName]
- if ok {
- close(ch)
- delete(nDB.bulkSyncAckTbl, bsm.NodeName)
- }
- nDB.Unlock()
- return
- }
- var nodeAddr net.IP
- nDB.RLock()
- if node, ok := nDB.nodes[bsm.NodeName]; ok {
- nodeAddr = node.Addr
- }
- nDB.RUnlock()
- if err := nDB.bulkSyncNode(bsm.Networks, bsm.NodeName, false); err != nil {
- logrus.Errorf("Error in responding to bulk sync from node %s: %v", nodeAddr, err)
- }
- }
- func (nDB *NetworkDB) handleMessage(buf []byte, isBulkSync bool) {
- mType, data, err := decodeMessage(buf)
- if err != nil {
- logrus.Errorf("Error decoding gossip message to get message type: %v", err)
- return
- }
- switch mType {
- case MessageTypeNodeEvent:
- nDB.handleNodeMessage(data)
- case MessageTypeNetworkEvent:
- nDB.handleNetworkMessage(data)
- case MessageTypeTableEvent:
- nDB.handleTableMessage(data, isBulkSync)
- case MessageTypeBulkSync:
- nDB.handleBulkSync(data)
- case MessageTypeCompound:
- nDB.handleCompound(data, isBulkSync)
- default:
- logrus.Errorf("%s: unknown message type %d", nDB.config.NodeName, mType)
- }
- }
- func (d *delegate) NotifyMsg(buf []byte) {
- if len(buf) == 0 {
- return
- }
- d.nDB.handleMessage(buf, false)
- }
- func (d *delegate) GetBroadcasts(overhead, limit int) [][]byte {
- msgs := d.nDB.networkBroadcasts.GetBroadcasts(overhead, limit)
- msgs = append(msgs, d.nDB.nodeBroadcasts.GetBroadcasts(overhead, limit)...)
- return msgs
- }
- func (d *delegate) LocalState(join bool) []byte {
- if join {
- // Update all the local node/network state to a new time to
- // force update on the node we are trying to rejoin, just in
- // case that node has these in leaving state still. This is
- // facilitate fast convergence after recovering from a gossip
- // failure.
- d.nDB.updateLocalNetworkTime()
- }
- d.nDB.RLock()
- defer d.nDB.RUnlock()
- pp := NetworkPushPull{
- LTime: d.nDB.networkClock.Time(),
- NodeName: d.nDB.config.NodeName,
- }
- for name, nn := range d.nDB.networks {
- for _, n := range nn {
- pp.Networks = append(pp.Networks, &NetworkEntry{
- LTime: n.ltime,
- NetworkID: n.id,
- NodeName: name,
- Leaving: n.leaving,
- })
- }
- }
- buf, err := encodeMessage(MessageTypePushPull, &pp)
- if err != nil {
- logrus.Errorf("Failed to encode local network state: %v", err)
- return nil
- }
- return buf
- }
- func (d *delegate) MergeRemoteState(buf []byte, isJoin bool) {
- if len(buf) == 0 {
- logrus.Error("zero byte remote network state received")
- return
- }
- var gMsg GossipMessage
- err := proto.Unmarshal(buf, &gMsg)
- if err != nil {
- logrus.Errorf("Error unmarshalling push pull messsage: %v", err)
- return
- }
- if gMsg.Type != MessageTypePushPull {
- logrus.Errorf("Invalid message type %v received from remote", buf[0])
- }
- pp := NetworkPushPull{}
- if err := proto.Unmarshal(gMsg.Data, &pp); err != nil {
- logrus.Errorf("Failed to decode remote network state: %v", err)
- return
- }
- nodeEvent := &NodeEvent{
- LTime: pp.LTime,
- NodeName: pp.NodeName,
- Type: NodeEventTypeJoin,
- }
- d.nDB.handleNodeEvent(nodeEvent)
- for _, n := range pp.Networks {
- nEvent := &NetworkEvent{
- LTime: n.LTime,
- NodeName: n.NodeName,
- NetworkID: n.NetworkID,
- Type: NetworkEventTypeJoin,
- }
- if n.Leaving {
- nEvent.Type = NetworkEventTypeLeave
- }
- d.nDB.handleNetworkEvent(nEvent)
- }
- }
|