7 years ago · 55e4cc7262
--- a/libnetwork/networkdb/broadcast.go
+++ b/libnetwork/networkdb/broadcast.go
@@ -110,7 +110,6 @@ type tableEventMessage struct {
 
				 	tname string
			
 
				 	key   string
			
 
				 	msg   []byte
			
 
				-	node  string
			
 
				 }
			
 
				 
			
 
				 func (m *tableEventMessage) Invalidates(other memberlist.Broadcast) bool {
			
@@ -168,7 +167,6 @@ func (nDB *NetworkDB) sendTableEvent(event TableEvent_Type, nid string, tname st
 
				 		id:    nid,
			
 
				 		tname: tname,
			
 
				 		key:   key,
			
 
				-		node:  nDB.config.NodeID,
			
 
				 	})
			
 
				 	return nil
			
 
				 }
			
--- a/libnetwork/networkdb/cluster.go
+++ b/libnetwork/networkdb/cluster.go
@@ -24,6 +24,9 @@ const (
 
				 	retryInterval         = 1 * time.Second
			
 
				 	nodeReapInterval      = 24 * time.Hour
			
 
				 	nodeReapPeriod        = 2 * time.Hour
			
 
				+	// considering a cluster with > 20 nodes and a drain speed of 100 msg/s
			
 
				+	// the following is roughly 1 minute
			
 
				+	maxQueueLenBroadcastOnSync = 500
			
 
				 )
			
 
				 
			
 
				 type logWriter struct{}
			
@@ -572,6 +575,7 @@ func (nDB *NetworkDB) bulkSync(nodes []string, all bool) ([]string, error) {
 
				 
			
 
				 	var err error
			
 
				 	var networks []string
			
 
				+	var success bool
			
 
				 	for _, node := range nodes {
			
 
				 		if node == nDB.config.NodeID {
			
 
				 			continue
			
@@ -579,21 +583,25 @@ func (nDB *NetworkDB) bulkSync(nodes []string, all bool) ([]string, error) {
 
				 		logrus.Debugf("%v(%v): Initiating bulk sync with node %v", nDB.config.Hostname, nDB.config.NodeID, node)
			
 
				 		networks = nDB.findCommonNetworks(node)
			
 
				 		err = nDB.bulkSyncNode(networks, node, true)
			
 
				-		// if its periodic bulksync stop after the first successful sync
			
 
				-		if !all && err == nil {
			
 
				-			break
			
 
				-		}
			
 
				 		if err != nil {
			
 
				 			err = fmt.Errorf("bulk sync to node %s failed: %v", node, err)
			
 
				 			logrus.Warn(err.Error())
			
 
				+		} else {
			
 
				+			// bulk sync succeeded
			
 
				+			success = true
			
 
				+			// if its periodic bulksync stop after the first successful sync
			
 
				+			if !all {
			
 
				+				break
			
 
				+			}
			
 
				 		}
			
 
				 	}
			
 
				 
			
 
				-	if err != nil {
			
 
				-		return nil, err
			
 
				+	if success {
			
 
				+		// if at least one node sync succeeded
			
 
				+		return networks, nil
			
 
				 	}
			
 
				 
			
 
				-	return networks, nil
			
 
				+	return nil, err
			
 
				 }
			
 
				 
			
 
				 // Bulk sync all the table entries belonging to a set of networks to a
			
--- a/libnetwork/networkdb/delegate.go
+++ b/libnetwork/networkdb/delegate.go
@@ -142,7 +142,7 @@ func (nDB *NetworkDB) handleNetworkEvent(nEvent *NetworkEvent) bool {
 
				 	return true
			
 
				 }
			
 
				 
			
 
				-func (nDB *NetworkDB) handleTableEvent(tEvent *TableEvent) bool {
			
 
				+func (nDB *NetworkDB) handleTableEvent(tEvent *TableEvent, isBulkSync bool) bool {
			
 
				 	// Update our local clock if the received messages has newer time.
			
 
				 	nDB.tableClock.Witness(tEvent.LTime)
			
 
				 
			
@@ -175,6 +175,14 @@ func (nDB *NetworkDB) handleTableEvent(tEvent *TableEvent) bool {
 
				 			nDB.Unlock()
			
 
				 			return false
			
 
				 		}
			
 
				+	} else if tEvent.Type == TableEventTypeDelete && !isBulkSync {
			
 
				+		nDB.Unlock()
			
 
				+		// We don't know the entry, the entry is being deleted and the message is an async message
			
 
				+		// In this case the safest approach is to ignore it, it is possible that the queue grew so much to
			
 
				+		// exceed the garbage collection time (the residual reap time that is in the message is not being
			
 
				+		// updated, to avoid inserting too many messages in the queue).
			
 
				+		// Instead the messages coming from TCP bulk sync are safe with the latest value for the garbage collection time
			
 
				+		return false
			
 
				 	}
			
 
				 
			
 
				 	e = &entry{
			
@@ -197,11 +205,17 @@ func (nDB *NetworkDB) handleTableEvent(tEvent *TableEvent) bool {
 
				 	nDB.Unlock()
			
 
				 
			
 
				 	if err != nil && tEvent.Type == TableEventTypeDelete {
			
 
				-		// If it is a delete event and we did not have a state for it, don't propagate to the application
			
 
				+		// Again we don't know the entry but this is coming from a TCP sync so the message body is up to date.
			
 
				+		// We had saved the state so to speed up convergence and be able to avoid accepting create events.
			
 
				+		// Now we will rebroadcast the message if 2 conditions are met:
			
 
				+		// 1) we had already synced this network (during the network join)
			
 
				+		// 2) the residual reapTime is higher than 1/6 of the total reapTime.
			
 
				 		// If the residual reapTime is lower or equal to 1/6 of the total reapTime don't bother broadcasting it around
			
 
				-		// most likely the cluster is already aware of it, if not who will sync with this node will catch the state too.
			
 
				-		// This also avoids that deletion of entries close to their garbage collection ends up circuling around forever
			
 
				-		return e.reapTime > nDB.config.reapEntryInterval/6
			
 
				+		// most likely the cluster is already aware of it
			
 
				+		// This also reduce the possibility that deletion of entries close to their garbage collection ends up circuling around
			
 
				+		// forever
			
 
				+		//logrus.Infof("exiting on delete not knowing the obj with rebroadcast:%t", network.inSync)
			
 
				+		return network.inSync && e.reapTime > nDB.config.reapEntryInterval/6
			
 
				 	}
			
 
				 
			
 
				 	var op opType
			
@@ -215,7 +229,7 @@ func (nDB *NetworkDB) handleTableEvent(tEvent *TableEvent) bool {
 
				 	}
			
 
				 
			
 
				 	nDB.broadcaster.Write(makeEvent(op, tEvent.TableName, tEvent.NetworkID, tEvent.Key, tEvent.Value))
			
 
				-	return true
			
 
				+	return network.inSync
			
 
				 }
			
 
				 
			
 
				 func (nDB *NetworkDB) handleCompound(buf []byte, isBulkSync bool) {
			
@@ -244,7 +258,7 @@ func (nDB *NetworkDB) handleTableMessage(buf []byte, isBulkSync bool) {
 
				 		return
			
 
				 	}
			
 
				 
			
 
				-	if rebroadcast := nDB.handleTableEvent(&tEvent); rebroadcast {
			
 
				+	if rebroadcast := nDB.handleTableEvent(&tEvent, isBulkSync); rebroadcast {
			
 
				 		var err error
			
 
				 		buf, err = encodeRawMessage(MessageTypeTableEvent, buf)
			
 
				 		if err != nil {
			
@@ -261,12 +275,16 @@ func (nDB *NetworkDB) handleTableMessage(buf []byte, isBulkSync bool) {
 
				 			return
			
 
				 		}
			
 
				 
			
 
				+		// if the queue is over the threshold, avoid distributing information coming from TCP sync
			
 
				+		if isBulkSync && n.tableBroadcasts.NumQueued() > maxQueueLenBroadcastOnSync {
			
 
				+			return
			
 
				+		}
			
 
				+
			
 
				 		n.tableBroadcasts.QueueBroadcast(&tableEventMessage{
			
 
				 			msg:   buf,
			
 
				 			id:    tEvent.NetworkID,
			
 
				 			tname: tEvent.TableName,
			
 
				 			key:   tEvent.Key,
			
 
				-			node:  tEvent.NodeName,
			
 
				 		})
			
 
				 	}
			
 
				 }
			
--- a/libnetwork/networkdb/networkdb.go
+++ b/libnetwork/networkdb/networkdb.go
@@ -130,6 +130,9 @@ type network struct {
 
				 	// Lamport time for the latest state of the entry.
			
 
				 	ltime serf.LamportTime
			
 
				 
			
 
				+	// Gets set to true after the first bulk sync happens
			
 
				+	inSync bool
			
 
				+
			
 
				 	// Node leave is in progress.
			
 
				 	leaving bool
			
 
				 
			
@@ -616,6 +619,7 @@ func (nDB *NetworkDB) JoinNetwork(nid string) error {
 
				 	}
			
 
				 	nDB.addNetworkNode(nid, nDB.config.NodeID)
			
 
				 	networkNodes := nDB.networkNodes[nid]
			
 
				+	n = nodeNetworks[nid]
			
 
				 	nDB.Unlock()
			
 
				 
			
 
				 	if err := nDB.sendNetworkEvent(nid, NetworkEventTypeJoin, ltime); err != nil {
			
@@ -627,6 +631,12 @@ func (nDB *NetworkDB) JoinNetwork(nid string) error {
 
				 		logrus.Errorf("Error bulk syncing while joining network %s: %v", nid, err)
			
 
				 	}
			
 
				 
			
 
				+	// Mark the network as being synced
			
 
				+	// note this is a best effort, we are not checking the result of the bulk sync
			
 
				+	nDB.Lock()
			
 
				+	n.inSync = true
			
 
				+	nDB.Unlock()
			
 
				+
			
 
				 	return nil
			
 
				 }