delegate.go 6.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315
  1. package networkdb
  2. import (
  3. "fmt"
  4. "time"
  5. "github.com/Sirupsen/logrus"
  6. "github.com/hashicorp/serf/serf"
  7. )
  8. type networkData struct {
  9. LTime serf.LamportTime
  10. ID string
  11. NodeName string
  12. Leaving bool
  13. }
  14. type networkPushPull struct {
  15. LTime serf.LamportTime
  16. Networks []networkData
  17. }
  18. type delegate struct {
  19. nDB *NetworkDB
  20. }
  21. func (d *delegate) NodeMeta(limit int) []byte {
  22. return []byte{}
  23. }
  24. func (nDB *NetworkDB) handleNetworkEvent(nEvent *networkEventData) bool {
  25. // Update our local clock if the received messages has newer
  26. // time.
  27. nDB.networkClock.Witness(nEvent.LTime)
  28. nDB.Lock()
  29. defer nDB.Unlock()
  30. nodeNetworks, ok := nDB.networks[nEvent.NodeName]
  31. if !ok {
  32. // We haven't heard about this node at all. Ignore the leave
  33. if nEvent.Event == networkLeave {
  34. return false
  35. }
  36. nodeNetworks = make(map[string]*network)
  37. nDB.networks[nEvent.NodeName] = nodeNetworks
  38. }
  39. if n, ok := nodeNetworks[nEvent.NetworkID]; ok {
  40. // We have the latest state. Ignore the event
  41. // since it is stale.
  42. if n.ltime >= nEvent.LTime {
  43. return false
  44. }
  45. n.ltime = nEvent.LTime
  46. n.leaving = nEvent.Event == networkLeave
  47. if n.leaving {
  48. n.leaveTime = time.Now()
  49. }
  50. return true
  51. }
  52. if nEvent.Event == networkLeave {
  53. return false
  54. }
  55. // This remote network join is being seen the first time.
  56. nodeNetworks[nEvent.NetworkID] = &network{
  57. id: nEvent.NetworkID,
  58. ltime: nEvent.LTime,
  59. }
  60. nDB.networkNodes[nEvent.NetworkID] = append(nDB.networkNodes[nEvent.NetworkID], nEvent.NodeName)
  61. return true
  62. }
  63. func (nDB *NetworkDB) handleTableEvent(tEvent *tableEventData) bool {
  64. // Update our local clock if the received messages has newer
  65. // time.
  66. nDB.tableClock.Witness(tEvent.LTime)
  67. if entry, err := nDB.getEntry(tEvent.TableName, tEvent.NetworkID, tEvent.Key); err == nil {
  68. // We have the latest state. Ignore the event
  69. // since it is stale.
  70. if entry.ltime >= tEvent.LTime {
  71. return false
  72. }
  73. }
  74. entry := &entry{
  75. ltime: tEvent.LTime,
  76. node: tEvent.NodeName,
  77. value: tEvent.Value,
  78. deleting: tEvent.Event == tableEntryDelete,
  79. }
  80. if entry.deleting {
  81. entry.deleteTime = time.Now()
  82. }
  83. nDB.Lock()
  84. nDB.indexes[byTable].Insert(fmt.Sprintf("/%s/%s/%s", tEvent.TableName, tEvent.NetworkID, tEvent.Key), entry)
  85. nDB.indexes[byNetwork].Insert(fmt.Sprintf("/%s/%s/%s", tEvent.NetworkID, tEvent.TableName, tEvent.Key), entry)
  86. nDB.Unlock()
  87. var op opType
  88. switch tEvent.Event {
  89. case tableEntryCreate:
  90. op = opCreate
  91. case tableEntryUpdate:
  92. op = opUpdate
  93. case tableEntryDelete:
  94. op = opDelete
  95. }
  96. nDB.broadcaster.Write(makeEvent(op, tEvent.TableName, tEvent.NetworkID, tEvent.Key, tEvent.Value))
  97. return true
  98. }
  99. func (nDB *NetworkDB) handleCompound(buf []byte) {
  100. // Decode the parts
  101. trunc, parts, err := decodeCompoundMessage(buf[1:])
  102. if err != nil {
  103. logrus.Errorf("Failed to decode compound request: %v", err)
  104. return
  105. }
  106. // Log any truncation
  107. if trunc > 0 {
  108. logrus.Warnf("Compound request had %d truncated messages", trunc)
  109. }
  110. // Handle each message
  111. for _, part := range parts {
  112. nDB.handleMessage(part)
  113. }
  114. }
  115. func (nDB *NetworkDB) handleTableMessage(buf []byte) {
  116. var tEvent tableEventData
  117. if err := decodeMessage(buf[1:], &tEvent); err != nil {
  118. logrus.Errorf("Error decoding table event message: %v", err)
  119. return
  120. }
  121. if rebroadcast := nDB.handleTableEvent(&tEvent); rebroadcast {
  122. // Copy the buffer since we cannot rely on the slice not changing
  123. newBuf := make([]byte, len(buf))
  124. copy(newBuf, buf)
  125. nDB.RLock()
  126. n, ok := nDB.networks[nDB.config.NodeName][tEvent.NetworkID]
  127. nDB.RUnlock()
  128. if !ok {
  129. return
  130. }
  131. broadcastQ := n.tableBroadcasts
  132. broadcastQ.QueueBroadcast(&tableEventMessage{
  133. msg: newBuf,
  134. id: tEvent.NetworkID,
  135. tname: tEvent.TableName,
  136. key: tEvent.Key,
  137. node: nDB.config.NodeName,
  138. })
  139. }
  140. }
  141. func (nDB *NetworkDB) handleNetworkMessage(buf []byte) {
  142. var nEvent networkEventData
  143. if err := decodeMessage(buf[1:], &nEvent); err != nil {
  144. logrus.Errorf("Error decoding network event message: %v", err)
  145. return
  146. }
  147. if rebroadcast := nDB.handleNetworkEvent(&nEvent); rebroadcast {
  148. // Copy the buffer since it we cannot rely on the slice not changing
  149. newBuf := make([]byte, len(buf))
  150. copy(newBuf, buf)
  151. nDB.networkBroadcasts.QueueBroadcast(&networkEventMessage{
  152. msg: newBuf,
  153. id: nEvent.NetworkID,
  154. node: nEvent.NodeName,
  155. })
  156. }
  157. }
  158. func (nDB *NetworkDB) handleBulkSync(buf []byte) {
  159. var bsm bulkSyncMessage
  160. if err := decodeMessage(buf[1:], &bsm); err != nil {
  161. logrus.Errorf("Error decoding bulk sync message: %v", err)
  162. return
  163. }
  164. if bsm.LTime > 0 {
  165. nDB.tableClock.Witness(bsm.LTime)
  166. }
  167. nDB.handleMessage(bsm.Payload)
  168. // Don't respond to a bulk sync which was not unsolicited
  169. if !bsm.Unsolicited {
  170. nDB.RLock()
  171. ch, ok := nDB.bulkSyncAckTbl[bsm.NodeName]
  172. nDB.RUnlock()
  173. if ok {
  174. close(ch)
  175. }
  176. return
  177. }
  178. if err := nDB.bulkSyncNode(bsm.Networks, bsm.NodeName, false); err != nil {
  179. logrus.Errorf("Error in responding to bulk sync from node %s: %v", nDB.nodes[bsm.NodeName].Addr, err)
  180. }
  181. }
  182. func (nDB *NetworkDB) handleMessage(buf []byte) {
  183. msgType := messageType(buf[0])
  184. switch msgType {
  185. case networkEventMsg:
  186. nDB.handleNetworkMessage(buf)
  187. case tableEventMsg:
  188. nDB.handleTableMessage(buf)
  189. case compoundMsg:
  190. nDB.handleCompound(buf)
  191. case bulkSyncMsg:
  192. nDB.handleBulkSync(buf)
  193. default:
  194. logrus.Errorf("%s: unknown message type %d payload = %v", nDB.config.NodeName, msgType, buf[:8])
  195. }
  196. }
  197. func (d *delegate) NotifyMsg(buf []byte) {
  198. if len(buf) == 0 {
  199. return
  200. }
  201. d.nDB.handleMessage(buf)
  202. }
  203. func (d *delegate) GetBroadcasts(overhead, limit int) [][]byte {
  204. return d.nDB.networkBroadcasts.GetBroadcasts(overhead, limit)
  205. }
  206. func (d *delegate) LocalState(join bool) []byte {
  207. d.nDB.RLock()
  208. defer d.nDB.RUnlock()
  209. pp := networkPushPull{
  210. LTime: d.nDB.networkClock.Time(),
  211. }
  212. for name, nn := range d.nDB.networks {
  213. for _, n := range nn {
  214. pp.Networks = append(pp.Networks, networkData{
  215. LTime: n.ltime,
  216. ID: n.id,
  217. NodeName: name,
  218. Leaving: n.leaving,
  219. })
  220. }
  221. }
  222. buf, err := encodeMessage(networkPushPullMsg, &pp)
  223. if err != nil {
  224. logrus.Errorf("Failed to encode local network state: %v", err)
  225. return nil
  226. }
  227. return buf
  228. }
  229. func (d *delegate) MergeRemoteState(buf []byte, isJoin bool) {
  230. if len(buf) == 0 {
  231. logrus.Error("zero byte remote network state received")
  232. return
  233. }
  234. if messageType(buf[0]) != networkPushPullMsg {
  235. logrus.Errorf("Invalid message type %v received from remote", buf[0])
  236. }
  237. pp := networkPushPull{}
  238. if err := decodeMessage(buf[1:], &pp); err != nil {
  239. logrus.Errorf("Failed to decode remote network state: %v", err)
  240. return
  241. }
  242. if pp.LTime > 0 {
  243. d.nDB.networkClock.Witness(pp.LTime)
  244. }
  245. for _, n := range pp.Networks {
  246. nEvent := &networkEventData{
  247. LTime: n.LTime,
  248. NodeName: n.NodeName,
  249. NetworkID: n.ID,
  250. Event: networkJoin,
  251. }
  252. if n.Leaving {
  253. nEvent.Event = networkLeave
  254. }
  255. d.nDB.handleNetworkEvent(nEvent)
  256. }
  257. }