nodemgmt.go 3.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121
  1. package networkdb
  2. import (
  3. "context"
  4. "fmt"
  5. "github.com/containerd/log"
  6. "github.com/hashicorp/memberlist"
  7. )
  8. type nodeState int
  9. const (
  10. nodeNotFound nodeState = -1
  11. nodeActiveState nodeState = 0
  12. nodeLeftState nodeState = 1
  13. nodeFailedState nodeState = 2
  14. )
  15. var nodeStateName = map[nodeState]string{
  16. -1: "NodeNotFound",
  17. 0: "NodeActive",
  18. 1: "NodeLeft",
  19. 2: "NodeFailed",
  20. }
  21. // findNode search the node into the 3 node lists and returns the node pointer and the list
  22. // where it got found
  23. func (nDB *NetworkDB) findNode(nodeName string) (*node, nodeState, map[string]*node) {
  24. for i, nodes := range []map[string]*node{
  25. nDB.nodes,
  26. nDB.leftNodes,
  27. nDB.failedNodes,
  28. } {
  29. if n, ok := nodes[nodeName]; ok {
  30. return n, nodeState(i), nodes
  31. }
  32. }
  33. return nil, nodeNotFound, nil
  34. }
  35. // changeNodeState changes the state of the node specified, returns true if the node was moved,
  36. // false if there was no need to change the node state. Error will be returned if the node does not
  37. // exists
  38. func (nDB *NetworkDB) changeNodeState(nodeName string, newState nodeState) (bool, error) {
  39. n, currState, m := nDB.findNode(nodeName)
  40. if n == nil {
  41. return false, fmt.Errorf("node %s not found", nodeName)
  42. }
  43. switch newState {
  44. case nodeActiveState:
  45. if currState == nodeActiveState {
  46. return false, nil
  47. }
  48. delete(m, nodeName)
  49. // reset the node reap time
  50. n.reapTime = 0
  51. nDB.nodes[nodeName] = n
  52. case nodeLeftState:
  53. if currState == nodeLeftState {
  54. return false, nil
  55. }
  56. delete(m, nodeName)
  57. nDB.leftNodes[nodeName] = n
  58. case nodeFailedState:
  59. if currState == nodeFailedState {
  60. return false, nil
  61. }
  62. delete(m, nodeName)
  63. nDB.failedNodes[nodeName] = n
  64. }
  65. log.G(context.TODO()).Infof("Node %s change state %s --> %s", nodeName, nodeStateName[currState], nodeStateName[newState])
  66. if newState == nodeLeftState || newState == nodeFailedState {
  67. // set the node reap time, if not already set
  68. // It is possible that a node passes from failed to left and the reaptime was already set so keep that value
  69. if n.reapTime == 0 {
  70. n.reapTime = nodeReapInterval
  71. }
  72. // The node leave or fails, delete all the entries created by it.
  73. // If the node was temporary down, deleting the entries will guarantee that the CREATE events will be accepted
  74. // If the node instead left because was going down, then it makes sense to just delete all its state
  75. nDB.deleteNodeFromNetworks(n.Name)
  76. nDB.deleteNodeTableEntries(n.Name)
  77. }
  78. return true, nil
  79. }
  80. func (nDB *NetworkDB) purgeReincarnation(mn *memberlist.Node) bool {
  81. for name, node := range nDB.nodes {
  82. if node.Addr.Equal(mn.Addr) && node.Port == mn.Port && mn.Name != name {
  83. log.G(context.TODO()).Infof("Node %s/%s, is the new incarnation of the active node %s/%s", mn.Name, mn.Addr, name, node.Addr)
  84. nDB.changeNodeState(name, nodeLeftState)
  85. return true
  86. }
  87. }
  88. for name, node := range nDB.failedNodes {
  89. if node.Addr.Equal(mn.Addr) && node.Port == mn.Port && mn.Name != name {
  90. log.G(context.TODO()).Infof("Node %s/%s, is the new incarnation of the failed node %s/%s", mn.Name, mn.Addr, name, node.Addr)
  91. nDB.changeNodeState(name, nodeLeftState)
  92. return true
  93. }
  94. }
  95. for name, node := range nDB.leftNodes {
  96. if node.Addr.Equal(mn.Addr) && node.Port == mn.Port && mn.Name != name {
  97. log.G(context.TODO()).Infof("Node %s/%s, is the new incarnation of the shutdown node %s/%s", mn.Name, mn.Addr, name, node.Addr)
  98. nDB.changeNodeState(name, nodeLeftState)
  99. return true
  100. }
  101. }
  102. return false
  103. }