docker_api_swarm_test.go 35 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084
  1. // +build !windows
  2. package main
  3. import (
  4. "fmt"
  5. "net/http"
  6. "os"
  7. "path/filepath"
  8. "strconv"
  9. "strings"
  10. "sync"
  11. "syscall"
  12. "time"
  13. "github.com/docker/docker/pkg/integration/checker"
  14. "github.com/docker/engine-api/types/swarm"
  15. "github.com/go-check/check"
  16. )
  17. var defaultReconciliationTimeout = 30 * time.Second
  18. func (s *DockerSwarmSuite) TestApiSwarmInit(c *check.C) {
  19. testRequires(c, Network)
  20. // todo: should find a better way to verify that components are running than /info
  21. d1 := s.AddDaemon(c, true, true)
  22. info, err := d1.info()
  23. c.Assert(err, checker.IsNil)
  24. c.Assert(info.ControlAvailable, checker.True)
  25. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  26. d2 := s.AddDaemon(c, true, false)
  27. info, err = d2.info()
  28. c.Assert(err, checker.IsNil)
  29. c.Assert(info.ControlAvailable, checker.False)
  30. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  31. // Leaving cluster
  32. c.Assert(d2.Leave(false), checker.IsNil)
  33. info, err = d2.info()
  34. c.Assert(err, checker.IsNil)
  35. c.Assert(info.ControlAvailable, checker.False)
  36. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  37. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: d1.joinTokens(c).Worker, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  38. info, err = d2.info()
  39. c.Assert(err, checker.IsNil)
  40. c.Assert(info.ControlAvailable, checker.False)
  41. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  42. // Current state restoring after restarts
  43. err = d1.Stop()
  44. c.Assert(err, checker.IsNil)
  45. err = d2.Stop()
  46. c.Assert(err, checker.IsNil)
  47. err = d1.Start()
  48. c.Assert(err, checker.IsNil)
  49. err = d2.Start()
  50. c.Assert(err, checker.IsNil)
  51. info, err = d1.info()
  52. c.Assert(err, checker.IsNil)
  53. c.Assert(info.ControlAvailable, checker.True)
  54. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  55. info, err = d2.info()
  56. c.Assert(err, checker.IsNil)
  57. c.Assert(info.ControlAvailable, checker.False)
  58. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  59. }
  60. func (s *DockerSwarmSuite) TestApiSwarmJoinToken(c *check.C) {
  61. testRequires(c, Network)
  62. d1 := s.AddDaemon(c, false, false)
  63. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  64. d2 := s.AddDaemon(c, false, false)
  65. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  66. c.Assert(err, checker.NotNil)
  67. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  68. info, err := d2.info()
  69. c.Assert(err, checker.IsNil)
  70. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  71. err = d2.Join(swarm.JoinRequest{JoinToken: "foobaz", RemoteAddrs: []string{d1.listenAddr}})
  72. c.Assert(err, checker.NotNil)
  73. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  74. info, err = d2.info()
  75. c.Assert(err, checker.IsNil)
  76. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  77. workerToken := d1.joinTokens(c).Worker
  78. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  79. info, err = d2.info()
  80. c.Assert(err, checker.IsNil)
  81. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  82. c.Assert(d2.Leave(false), checker.IsNil)
  83. info, err = d2.info()
  84. c.Assert(err, checker.IsNil)
  85. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  86. // change tokens
  87. d1.rotateTokens(c)
  88. err = d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}})
  89. c.Assert(err, checker.NotNil)
  90. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  91. info, err = d2.info()
  92. c.Assert(err, checker.IsNil)
  93. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  94. workerToken = d1.joinTokens(c).Worker
  95. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  96. info, err = d2.info()
  97. c.Assert(err, checker.IsNil)
  98. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  99. c.Assert(d2.Leave(false), checker.IsNil)
  100. info, err = d2.info()
  101. c.Assert(err, checker.IsNil)
  102. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  103. // change spec, don't change tokens
  104. d1.updateSwarm(c, func(s *swarm.Spec) {})
  105. err = d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  106. c.Assert(err, checker.NotNil)
  107. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  108. info, err = d2.info()
  109. c.Assert(err, checker.IsNil)
  110. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  111. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  112. info, err = d2.info()
  113. c.Assert(err, checker.IsNil)
  114. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  115. c.Assert(d2.Leave(false), checker.IsNil)
  116. info, err = d2.info()
  117. c.Assert(err, checker.IsNil)
  118. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  119. }
  120. func (s *DockerSwarmSuite) TestApiSwarmCAHash(c *check.C) {
  121. testRequires(c, Network)
  122. d1 := s.AddDaemon(c, true, true)
  123. d2 := s.AddDaemon(c, false, false)
  124. splitToken := strings.Split(d1.joinTokens(c).Worker, "-")
  125. splitToken[2] = "1kxftv4ofnc6mt30lmgipg6ngf9luhwqopfk1tz6bdmnkubg0e"
  126. replacementToken := strings.Join(splitToken, "-")
  127. err := d2.Join(swarm.JoinRequest{JoinToken: replacementToken, RemoteAddrs: []string{d1.listenAddr}})
  128. c.Assert(err, checker.NotNil)
  129. c.Assert(err.Error(), checker.Contains, "remote CA does not match fingerprint")
  130. }
  131. func (s *DockerSwarmSuite) TestApiSwarmPromoteDemote(c *check.C) {
  132. testRequires(c, Network)
  133. d1 := s.AddDaemon(c, false, false)
  134. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  135. d2 := s.AddDaemon(c, true, false)
  136. info, err := d2.info()
  137. c.Assert(err, checker.IsNil)
  138. c.Assert(info.ControlAvailable, checker.False)
  139. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  140. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  141. n.Spec.Role = swarm.NodeRoleManager
  142. })
  143. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  144. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  145. n.Spec.Role = swarm.NodeRoleWorker
  146. })
  147. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.False)
  148. // Demoting last node should fail
  149. node := d1.getNode(c, d1.NodeID)
  150. node.Spec.Role = swarm.NodeRoleWorker
  151. url := fmt.Sprintf("/nodes/%s/update?version=%d", node.ID, node.Version.Index)
  152. status, out, err := d1.SockRequest("POST", url, node.Spec)
  153. c.Assert(err, checker.IsNil)
  154. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("output: %q", string(out)))
  155. c.Assert(string(out), checker.Contains, "last manager of the swarm")
  156. info, err = d1.info()
  157. c.Assert(err, checker.IsNil)
  158. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  159. c.Assert(info.ControlAvailable, checker.True)
  160. // Promote already demoted node
  161. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  162. n.Spec.Role = swarm.NodeRoleManager
  163. })
  164. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  165. }
  166. func (s *DockerSwarmSuite) TestApiSwarmServicesEmptyList(c *check.C) {
  167. testRequires(c, Network)
  168. d := s.AddDaemon(c, true, true)
  169. services := d.listServices(c)
  170. c.Assert(services, checker.NotNil)
  171. c.Assert(len(services), checker.Equals, 0, check.Commentf("services: %#v", services))
  172. }
  173. func (s *DockerSwarmSuite) TestApiSwarmServicesCreate(c *check.C) {
  174. testRequires(c, Network)
  175. d := s.AddDaemon(c, true, true)
  176. instances := 2
  177. id := d.createService(c, simpleTestService, setInstances(instances))
  178. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  179. service := d.getService(c, id)
  180. instances = 5
  181. d.updateService(c, service, setInstances(instances))
  182. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  183. d.removeService(c, service.ID)
  184. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 0)
  185. }
  186. func (s *DockerSwarmSuite) TestApiSwarmServicesMultipleAgents(c *check.C) {
  187. testRequires(c, Network)
  188. d1 := s.AddDaemon(c, true, true)
  189. d2 := s.AddDaemon(c, true, false)
  190. d3 := s.AddDaemon(c, true, false)
  191. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  192. instances := 9
  193. id := d1.createService(c, simpleTestService, setInstances(instances))
  194. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  195. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  196. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.GreaterThan, 0)
  197. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  198. // reconciliation on d2 node down
  199. c.Assert(d2.Stop(), checker.IsNil)
  200. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  201. // test downscaling
  202. instances = 5
  203. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  204. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  205. }
  206. func (s *DockerSwarmSuite) TestApiSwarmServicesCreateGlobal(c *check.C) {
  207. testRequires(c, Network)
  208. d1 := s.AddDaemon(c, true, true)
  209. d2 := s.AddDaemon(c, true, false)
  210. d3 := s.AddDaemon(c, true, false)
  211. d1.createService(c, simpleTestService, setGlobalMode)
  212. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, 1)
  213. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  214. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.Equals, 1)
  215. d4 := s.AddDaemon(c, true, false)
  216. d5 := s.AddDaemon(c, true, false)
  217. waitAndAssert(c, defaultReconciliationTimeout, d4.checkActiveContainerCount, checker.Equals, 1)
  218. waitAndAssert(c, defaultReconciliationTimeout, d5.checkActiveContainerCount, checker.Equals, 1)
  219. }
  220. func (s *DockerSwarmSuite) TestApiSwarmServicesUpdate(c *check.C) {
  221. const nodeCount = 3
  222. var daemons [nodeCount]*SwarmDaemon
  223. for i := 0; i < nodeCount; i++ {
  224. daemons[i] = s.AddDaemon(c, true, i == 0)
  225. }
  226. // wait for nodes ready
  227. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  228. // service image at start
  229. image1 := "busybox:latest"
  230. // target image in update
  231. image2 := "busybox:test"
  232. // create a different tag
  233. for _, d := range daemons {
  234. out, err := d.Cmd("tag", image1, image2)
  235. c.Assert(err, checker.IsNil, check.Commentf(out))
  236. }
  237. // create service
  238. instances := 5
  239. parallelism := 2
  240. id := daemons[0].createService(c, serviceForUpdate, setInstances(instances))
  241. // wait for tasks ready
  242. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  243. map[string]int{image1: instances})
  244. // issue service update
  245. service := daemons[0].getService(c, id)
  246. daemons[0].updateService(c, service, setImage(image2))
  247. // first batch
  248. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  249. map[string]int{image1: instances - parallelism, image2: parallelism})
  250. // 2nd batch
  251. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  252. map[string]int{image1: instances - 2*parallelism, image2: 2 * parallelism})
  253. // 3nd batch
  254. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  255. map[string]int{image2: instances})
  256. }
  257. func (s *DockerSwarmSuite) TestApiSwarmServiceConstraintRole(c *check.C) {
  258. const nodeCount = 3
  259. var daemons [nodeCount]*SwarmDaemon
  260. for i := 0; i < nodeCount; i++ {
  261. daemons[i] = s.AddDaemon(c, true, i == 0)
  262. }
  263. // wait for nodes ready
  264. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  265. // create service
  266. constraints := []string{"node.role==worker"}
  267. instances := 3
  268. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  269. // wait for tasks ready
  270. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(c, id), checker.Equals, instances)
  271. // validate tasks are running on worker nodes
  272. tasks := daemons[0].getServiceTasks(c, id)
  273. for _, task := range tasks {
  274. node := daemons[0].getNode(c, task.NodeID)
  275. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleWorker)
  276. }
  277. //remove service
  278. daemons[0].removeService(c, id)
  279. // create service
  280. constraints = []string{"node.role!=worker"}
  281. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  282. // wait for tasks ready
  283. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(c, id), checker.Equals, instances)
  284. tasks = daemons[0].getServiceTasks(c, id)
  285. // validate tasks are running on manager nodes
  286. for _, task := range tasks {
  287. node := daemons[0].getNode(c, task.NodeID)
  288. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleManager)
  289. }
  290. //remove service
  291. daemons[0].removeService(c, id)
  292. // create service
  293. constraints = []string{"node.role==nosuchrole"}
  294. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  295. // wait for tasks created
  296. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(c, id), checker.Equals, instances)
  297. // let scheduler try
  298. time.Sleep(250 * time.Millisecond)
  299. // validate tasks are not assigned to any node
  300. tasks = daemons[0].getServiceTasks(c, id)
  301. for _, task := range tasks {
  302. c.Assert(task.NodeID, checker.Equals, "")
  303. }
  304. }
  305. func (s *DockerSwarmSuite) TestApiSwarmServiceConstraintLabel(c *check.C) {
  306. const nodeCount = 3
  307. var daemons [nodeCount]*SwarmDaemon
  308. for i := 0; i < nodeCount; i++ {
  309. daemons[i] = s.AddDaemon(c, true, i == 0)
  310. }
  311. // wait for nodes ready
  312. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  313. nodes := daemons[0].listNodes(c)
  314. c.Assert(len(nodes), checker.Equals, nodeCount)
  315. // add labels to nodes
  316. daemons[0].updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  317. n.Spec.Annotations.Labels = map[string]string{
  318. "security": "high",
  319. }
  320. })
  321. for i := 1; i < nodeCount; i++ {
  322. daemons[0].updateNode(c, nodes[i].ID, func(n *swarm.Node) {
  323. n.Spec.Annotations.Labels = map[string]string{
  324. "security": "low",
  325. }
  326. })
  327. }
  328. // create service
  329. instances := 3
  330. constraints := []string{"node.labels.security==high"}
  331. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  332. // wait for tasks ready
  333. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(c, id), checker.Equals, instances)
  334. tasks := daemons[0].getServiceTasks(c, id)
  335. // validate all tasks are running on nodes[0]
  336. for _, task := range tasks {
  337. c.Assert(task.NodeID, checker.Equals, nodes[0].ID)
  338. }
  339. //remove service
  340. daemons[0].removeService(c, id)
  341. // create service
  342. constraints = []string{"node.labels.security!=high"}
  343. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  344. // wait for tasks ready
  345. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(c, id), checker.Equals, instances)
  346. tasks = daemons[0].getServiceTasks(c, id)
  347. // validate all tasks are NOT running on nodes[0]
  348. for _, task := range tasks {
  349. c.Assert(task.NodeID, checker.Not(checker.Equals), nodes[0].ID)
  350. }
  351. //remove service
  352. daemons[0].removeService(c, id)
  353. constraints = []string{"node.labels.security==medium"}
  354. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  355. // wait for tasks created
  356. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(c, id), checker.Equals, instances)
  357. // let scheduler try
  358. time.Sleep(250 * time.Millisecond)
  359. tasks = daemons[0].getServiceTasks(c, id)
  360. // validate tasks are not assigned
  361. for _, task := range tasks {
  362. c.Assert(task.NodeID, checker.Equals, "")
  363. }
  364. //remove service
  365. daemons[0].removeService(c, id)
  366. // multiple constraints
  367. constraints = []string{
  368. "node.labels.security==high",
  369. fmt.Sprintf("node.id==%s", nodes[1].ID),
  370. }
  371. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  372. // wait for tasks created
  373. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(c, id), checker.Equals, instances)
  374. // let scheduler try
  375. time.Sleep(250 * time.Millisecond)
  376. tasks = daemons[0].getServiceTasks(c, id)
  377. // validate tasks are not assigned
  378. for _, task := range tasks {
  379. c.Assert(task.NodeID, checker.Equals, "")
  380. }
  381. // make nodes[1] fulfills the constraints
  382. daemons[0].updateNode(c, nodes[1].ID, func(n *swarm.Node) {
  383. n.Spec.Annotations.Labels = map[string]string{
  384. "security": "high",
  385. }
  386. })
  387. // wait for tasks ready
  388. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(c, id), checker.Equals, instances)
  389. tasks = daemons[0].getServiceTasks(c, id)
  390. for _, task := range tasks {
  391. c.Assert(task.NodeID, checker.Equals, nodes[1].ID)
  392. }
  393. }
  394. func (s *DockerSwarmSuite) TestApiSwarmServicesStateReporting(c *check.C) {
  395. testRequires(c, Network)
  396. testRequires(c, SameHostDaemon)
  397. testRequires(c, DaemonIsLinux)
  398. d1 := s.AddDaemon(c, true, true)
  399. d2 := s.AddDaemon(c, true, true)
  400. d3 := s.AddDaemon(c, true, false)
  401. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept
  402. instances := 9
  403. d1.createService(c, simpleTestService, setInstances(instances))
  404. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  405. getContainers := func() map[string]*SwarmDaemon {
  406. m := make(map[string]*SwarmDaemon)
  407. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  408. for _, id := range d.activeContainers() {
  409. m[id] = d
  410. }
  411. }
  412. return m
  413. }
  414. containers := getContainers()
  415. c.Assert(containers, checker.HasLen, instances)
  416. var toRemove string
  417. for i := range containers {
  418. toRemove = i
  419. }
  420. _, err := containers[toRemove].Cmd("stop", toRemove)
  421. c.Assert(err, checker.IsNil)
  422. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  423. containers2 := getContainers()
  424. c.Assert(containers2, checker.HasLen, instances)
  425. for i := range containers {
  426. if i == toRemove {
  427. c.Assert(containers2[i], checker.IsNil)
  428. } else {
  429. c.Assert(containers2[i], checker.NotNil)
  430. }
  431. }
  432. containers = containers2
  433. for i := range containers {
  434. toRemove = i
  435. }
  436. // try with killing process outside of docker
  437. pidStr, err := containers[toRemove].Cmd("inspect", "-f", "{{.State.Pid}}", toRemove)
  438. c.Assert(err, checker.IsNil)
  439. pid, err := strconv.Atoi(strings.TrimSpace(pidStr))
  440. c.Assert(err, checker.IsNil)
  441. c.Assert(syscall.Kill(pid, syscall.SIGKILL), checker.IsNil)
  442. time.Sleep(time.Second) // give some time to handle the signal
  443. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  444. containers2 = getContainers()
  445. c.Assert(containers2, checker.HasLen, instances)
  446. for i := range containers {
  447. if i == toRemove {
  448. c.Assert(containers2[i], checker.IsNil)
  449. } else {
  450. c.Assert(containers2[i], checker.NotNil)
  451. }
  452. }
  453. }
  454. func (s *DockerSwarmSuite) TestApiSwarmLeaderProxy(c *check.C) {
  455. // add three managers, one of these is leader
  456. d1 := s.AddDaemon(c, true, true)
  457. d2 := s.AddDaemon(c, true, true)
  458. d3 := s.AddDaemon(c, true, true)
  459. // start a service by hitting each of the 3 managers
  460. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  461. s.Spec.Name = "test1"
  462. })
  463. d2.createService(c, simpleTestService, func(s *swarm.Service) {
  464. s.Spec.Name = "test2"
  465. })
  466. d3.createService(c, simpleTestService, func(s *swarm.Service) {
  467. s.Spec.Name = "test3"
  468. })
  469. // 3 services should be started now, because the requests were proxied to leader
  470. // query each node and make sure it returns 3 services
  471. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  472. services := d.listServices(c)
  473. c.Assert(services, checker.HasLen, 3)
  474. }
  475. }
  476. func (s *DockerSwarmSuite) TestApiSwarmLeaderElection(c *check.C) {
  477. // Create 3 nodes
  478. d1 := s.AddDaemon(c, true, true)
  479. d2 := s.AddDaemon(c, true, true)
  480. d3 := s.AddDaemon(c, true, true)
  481. // assert that the first node we made is the leader, and the other two are followers
  482. c.Assert(d1.getNode(c, d1.NodeID).ManagerStatus.Leader, checker.True)
  483. c.Assert(d1.getNode(c, d2.NodeID).ManagerStatus.Leader, checker.False)
  484. c.Assert(d1.getNode(c, d3.NodeID).ManagerStatus.Leader, checker.False)
  485. leader := d1
  486. // stop the leader
  487. leader.Stop()
  488. // wait for an election to occur
  489. var newleader *SwarmDaemon
  490. for _, d := range []*SwarmDaemon{d2, d3} {
  491. if d.getNode(c, d.NodeID).ManagerStatus.Leader {
  492. newleader = d
  493. break
  494. }
  495. }
  496. // assert that we have a new leader
  497. c.Assert(newleader, checker.NotNil)
  498. // add the old leader back
  499. leader.Start()
  500. // clear leader and reinit the followers list
  501. followers := make([]*SwarmDaemon, 0, 3)
  502. // pick out the leader and the followers again
  503. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  504. if d1.getNode(c, d.NodeID).ManagerStatus.Leader {
  505. leader = d
  506. } else {
  507. followers = append(followers, d)
  508. }
  509. }
  510. // verify that we still only have 1 leader and 2 followers
  511. c.Assert(leader, checker.NotNil)
  512. c.Assert(followers, checker.HasLen, 2)
  513. // and that after we added d1 back, the leader hasn't changed
  514. c.Assert(leader.NodeID, checker.Equals, newleader.NodeID)
  515. }
  516. func (s *DockerSwarmSuite) TestApiSwarmRaftQuorum(c *check.C) {
  517. testRequires(c, Network)
  518. d1 := s.AddDaemon(c, true, true)
  519. d2 := s.AddDaemon(c, true, true)
  520. d3 := s.AddDaemon(c, true, true)
  521. d1.createService(c, simpleTestService)
  522. c.Assert(d2.Stop(), checker.IsNil)
  523. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  524. s.Spec.Name = "top1"
  525. })
  526. c.Assert(d3.Stop(), checker.IsNil)
  527. var service swarm.Service
  528. simpleTestService(&service)
  529. service.Spec.Name = "top2"
  530. status, out, err := d1.SockRequest("POST", "/services/create", service.Spec)
  531. c.Assert(err, checker.IsNil)
  532. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("deadline exceeded", string(out)))
  533. c.Assert(d2.Start(), checker.IsNil)
  534. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  535. s.Spec.Name = "top3"
  536. })
  537. }
  538. func (s *DockerSwarmSuite) TestApiSwarmListNodes(c *check.C) {
  539. testRequires(c, Network)
  540. d1 := s.AddDaemon(c, true, true)
  541. d2 := s.AddDaemon(c, true, false)
  542. d3 := s.AddDaemon(c, true, false)
  543. nodes := d1.listNodes(c)
  544. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  545. loop0:
  546. for _, n := range nodes {
  547. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  548. if n.ID == d.NodeID {
  549. continue loop0
  550. }
  551. }
  552. c.Errorf("unknown nodeID %v", n.ID)
  553. }
  554. }
  555. func (s *DockerSwarmSuite) TestApiSwarmNodeUpdate(c *check.C) {
  556. testRequires(c, Network)
  557. d := s.AddDaemon(c, true, true)
  558. nodes := d.listNodes(c)
  559. d.updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  560. n.Spec.Availability = swarm.NodeAvailabilityPause
  561. })
  562. n := d.getNode(c, nodes[0].ID)
  563. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityPause)
  564. }
  565. func (s *DockerSwarmSuite) TestApiSwarmNodeDrainPause(c *check.C) {
  566. testRequires(c, Network)
  567. d1 := s.AddDaemon(c, true, true)
  568. d2 := s.AddDaemon(c, true, false)
  569. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  570. // start a service, expect balanced distribution
  571. instances := 8
  572. id := d1.createService(c, simpleTestService, setInstances(instances))
  573. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  574. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  575. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  576. // drain d2, all containers should move to d1
  577. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  578. n.Spec.Availability = swarm.NodeAvailabilityDrain
  579. })
  580. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  581. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  582. // set d2 back to active
  583. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  584. n.Spec.Availability = swarm.NodeAvailabilityActive
  585. })
  586. instances = 1
  587. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  588. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  589. instances = 8
  590. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  591. // drained node first so we don't get any old containers
  592. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  593. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  594. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  595. d2ContainerCount := len(d2.activeContainers())
  596. // set d2 to paused, scale service up, only d1 gets new tasks
  597. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  598. n.Spec.Availability = swarm.NodeAvailabilityPause
  599. })
  600. instances = 14
  601. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  602. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances-d2ContainerCount)
  603. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, d2ContainerCount)
  604. }
  605. func (s *DockerSwarmSuite) TestApiSwarmLeaveRemovesContainer(c *check.C) {
  606. testRequires(c, Network)
  607. d := s.AddDaemon(c, true, true)
  608. instances := 2
  609. d.createService(c, simpleTestService, setInstances(instances))
  610. id, err := d.Cmd("run", "-d", "busybox", "top")
  611. c.Assert(err, checker.IsNil)
  612. id = strings.TrimSpace(id)
  613. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances+1)
  614. c.Assert(d.Leave(false), checker.NotNil)
  615. c.Assert(d.Leave(true), checker.IsNil)
  616. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 1)
  617. id2, err := d.Cmd("ps", "-q")
  618. c.Assert(err, checker.IsNil)
  619. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  620. }
  621. // #23629
  622. func (s *DockerSwarmSuite) TestApiSwarmLeaveOnPendingJoin(c *check.C) {
  623. s.AddDaemon(c, true, true)
  624. d2 := s.AddDaemon(c, false, false)
  625. id, err := d2.Cmd("run", "-d", "busybox", "top")
  626. c.Assert(err, checker.IsNil)
  627. id = strings.TrimSpace(id)
  628. go d2.Join(swarm.JoinRequest{
  629. RemoteAddrs: []string{"nosuchhost:1234"},
  630. }) // will block on pending state
  631. waitAndAssert(c, defaultReconciliationTimeout, d2.checkLocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  632. c.Assert(d2.Leave(true), checker.IsNil)
  633. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  634. id2, err := d2.Cmd("ps", "-q")
  635. c.Assert(err, checker.IsNil)
  636. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  637. }
  638. // #23705
  639. func (s *DockerSwarmSuite) TestApiSwarmRestoreOnPendingJoin(c *check.C) {
  640. d := s.AddDaemon(c, false, false)
  641. go d.Join(swarm.JoinRequest{
  642. RemoteAddrs: []string{"nosuchhost:1234"},
  643. }) // will block on pending state
  644. waitAndAssert(c, defaultReconciliationTimeout, d.checkLocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  645. c.Assert(d.Stop(), checker.IsNil)
  646. c.Assert(d.Start(), checker.IsNil)
  647. info, err := d.info()
  648. c.Assert(err, checker.IsNil)
  649. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  650. }
  651. func (s *DockerSwarmSuite) TestApiSwarmManagerRestore(c *check.C) {
  652. testRequires(c, Network)
  653. d1 := s.AddDaemon(c, true, true)
  654. instances := 2
  655. id := d1.createService(c, simpleTestService, setInstances(instances))
  656. d1.getService(c, id)
  657. d1.Stop()
  658. d1.Start()
  659. d1.getService(c, id)
  660. d2 := s.AddDaemon(c, true, true)
  661. d2.getService(c, id)
  662. d2.Stop()
  663. d2.Start()
  664. d2.getService(c, id)
  665. d3 := s.AddDaemon(c, true, true)
  666. d3.getService(c, id)
  667. d3.Stop()
  668. d3.Start()
  669. d3.getService(c, id)
  670. d3.Kill()
  671. time.Sleep(1 * time.Second) // time to handle signal
  672. d3.Start()
  673. d3.getService(c, id)
  674. }
  675. func (s *DockerSwarmSuite) TestApiSwarmScaleNoRollingUpdate(c *check.C) {
  676. testRequires(c, Network)
  677. d := s.AddDaemon(c, true, true)
  678. instances := 2
  679. id := d.createService(c, simpleTestService, setInstances(instances))
  680. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  681. containers := d.activeContainers()
  682. instances = 4
  683. d.updateService(c, d.getService(c, id), setInstances(instances))
  684. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  685. containers2 := d.activeContainers()
  686. loop0:
  687. for _, c1 := range containers {
  688. for _, c2 := range containers2 {
  689. if c1 == c2 {
  690. continue loop0
  691. }
  692. }
  693. c.Errorf("container %v not found in new set %#v", c1, containers2)
  694. }
  695. }
  696. func (s *DockerSwarmSuite) TestApiSwarmInvalidAddress(c *check.C) {
  697. d := s.AddDaemon(c, false, false)
  698. req := swarm.InitRequest{
  699. ListenAddr: "",
  700. }
  701. status, _, err := d.SockRequest("POST", "/swarm/init", req)
  702. c.Assert(err, checker.IsNil)
  703. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  704. req2 := swarm.JoinRequest{
  705. ListenAddr: "0.0.0.0:2377",
  706. RemoteAddrs: []string{""},
  707. }
  708. status, _, err = d.SockRequest("POST", "/swarm/join", req2)
  709. c.Assert(err, checker.IsNil)
  710. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  711. }
  712. func (s *DockerSwarmSuite) TestApiSwarmForceNewCluster(c *check.C) {
  713. d1 := s.AddDaemon(c, true, true)
  714. d2 := s.AddDaemon(c, true, true)
  715. instances := 2
  716. id := d1.createService(c, simpleTestService, setInstances(instances))
  717. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  718. c.Assert(d2.Stop(), checker.IsNil)
  719. time.Sleep(5 * time.Second)
  720. c.Assert(d1.Init(swarm.InitRequest{
  721. ForceNewCluster: true,
  722. Spec: swarm.Spec{},
  723. }), checker.IsNil)
  724. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  725. d3 := s.AddDaemon(c, true, true)
  726. info, err := d3.info()
  727. c.Assert(err, checker.IsNil)
  728. c.Assert(info.ControlAvailable, checker.True)
  729. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  730. instances = 4
  731. d3.updateService(c, d3.getService(c, id), setInstances(instances))
  732. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  733. }
  734. func simpleTestService(s *swarm.Service) {
  735. var ureplicas uint64
  736. ureplicas = 1
  737. s.Spec = swarm.ServiceSpec{
  738. TaskTemplate: swarm.TaskSpec{
  739. ContainerSpec: swarm.ContainerSpec{
  740. Image: "busybox:latest",
  741. Command: []string{"/bin/top"},
  742. },
  743. },
  744. Mode: swarm.ServiceMode{
  745. Replicated: &swarm.ReplicatedService{
  746. Replicas: &ureplicas,
  747. },
  748. },
  749. }
  750. s.Spec.Name = "top"
  751. }
  752. func serviceForUpdate(s *swarm.Service) {
  753. var ureplicas uint64
  754. ureplicas = 1
  755. s.Spec = swarm.ServiceSpec{
  756. TaskTemplate: swarm.TaskSpec{
  757. ContainerSpec: swarm.ContainerSpec{
  758. Image: "busybox:latest",
  759. Command: []string{"/bin/top"},
  760. },
  761. },
  762. Mode: swarm.ServiceMode{
  763. Replicated: &swarm.ReplicatedService{
  764. Replicas: &ureplicas,
  765. },
  766. },
  767. UpdateConfig: &swarm.UpdateConfig{
  768. Parallelism: 2,
  769. Delay: 8 * time.Second,
  770. },
  771. }
  772. s.Spec.Name = "updatetest"
  773. }
  774. func setInstances(replicas int) serviceConstructor {
  775. ureplicas := uint64(replicas)
  776. return func(s *swarm.Service) {
  777. s.Spec.Mode = swarm.ServiceMode{
  778. Replicated: &swarm.ReplicatedService{
  779. Replicas: &ureplicas,
  780. },
  781. }
  782. }
  783. }
  784. func setImage(image string) serviceConstructor {
  785. return func(s *swarm.Service) {
  786. s.Spec.TaskTemplate.ContainerSpec.Image = image
  787. }
  788. }
  789. func setConstraints(constraints []string) serviceConstructor {
  790. return func(s *swarm.Service) {
  791. if s.Spec.TaskTemplate.Placement == nil {
  792. s.Spec.TaskTemplate.Placement = &swarm.Placement{}
  793. }
  794. s.Spec.TaskTemplate.Placement.Constraints = constraints
  795. }
  796. }
  797. func setGlobalMode(s *swarm.Service) {
  798. s.Spec.Mode = swarm.ServiceMode{
  799. Global: &swarm.GlobalService{},
  800. }
  801. }
  802. func checkClusterHealth(c *check.C, cl []*SwarmDaemon, managerCount, workerCount int) {
  803. var totalMCount, totalWCount int
  804. for _, d := range cl {
  805. info, err := d.info()
  806. c.Assert(err, check.IsNil)
  807. if !info.ControlAvailable {
  808. totalWCount++
  809. continue
  810. }
  811. var leaderFound bool
  812. totalMCount++
  813. var mCount, wCount int
  814. for _, n := range d.listNodes(c) {
  815. c.Assert(n.Status.State, checker.Equals, swarm.NodeStateReady, check.Commentf("state of node %s, reported by %s", n.ID, d.Info.NodeID))
  816. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityActive, check.Commentf("availability of node %s, reported by %s", n.ID, d.Info.NodeID))
  817. if n.Spec.Role == swarm.NodeRoleManager {
  818. c.Assert(n.ManagerStatus, checker.NotNil, check.Commentf("manager status of node %s (manager), reported by %s", n.ID, d.Info.NodeID))
  819. if n.ManagerStatus.Leader {
  820. leaderFound = true
  821. }
  822. mCount++
  823. } else {
  824. c.Assert(n.ManagerStatus, checker.IsNil, check.Commentf("manager status of node %s (worker), reported by %s", n.ID, d.Info.NodeID))
  825. wCount++
  826. }
  827. }
  828. c.Assert(leaderFound, checker.True, check.Commentf("lack of leader reported by node %s", info.NodeID))
  829. c.Assert(mCount, checker.Equals, managerCount, check.Commentf("managers count reported by node %s", info.NodeID))
  830. c.Assert(wCount, checker.Equals, workerCount, check.Commentf("workers count reported by node %s", info.NodeID))
  831. }
  832. c.Assert(totalMCount, checker.Equals, managerCount)
  833. c.Assert(totalWCount, checker.Equals, workerCount)
  834. }
  835. func (s *DockerSwarmSuite) TestApiSwarmRestartCluster(c *check.C) {
  836. mCount, wCount := 5, 1
  837. var nodes []*SwarmDaemon
  838. for i := 0; i < mCount; i++ {
  839. manager := s.AddDaemon(c, true, true)
  840. info, err := manager.info()
  841. c.Assert(err, checker.IsNil)
  842. c.Assert(info.ControlAvailable, checker.True)
  843. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  844. nodes = append(nodes, manager)
  845. }
  846. for i := 0; i < wCount; i++ {
  847. worker := s.AddDaemon(c, true, false)
  848. info, err := worker.info()
  849. c.Assert(err, checker.IsNil)
  850. c.Assert(info.ControlAvailable, checker.False)
  851. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  852. nodes = append(nodes, worker)
  853. }
  854. // stop whole cluster
  855. {
  856. var wg sync.WaitGroup
  857. wg.Add(len(nodes))
  858. errs := make(chan error, len(nodes))
  859. for _, d := range nodes {
  860. go func(daemon *SwarmDaemon) {
  861. defer wg.Done()
  862. if err := daemon.Stop(); err != nil {
  863. errs <- err
  864. }
  865. if root := os.Getenv("DOCKER_REMAP_ROOT"); root != "" {
  866. daemon.root = filepath.Dir(daemon.root)
  867. }
  868. }(d)
  869. }
  870. wg.Wait()
  871. close(errs)
  872. for err := range errs {
  873. c.Assert(err, check.IsNil)
  874. }
  875. }
  876. // start whole cluster
  877. {
  878. var wg sync.WaitGroup
  879. wg.Add(len(nodes))
  880. errs := make(chan error, len(nodes))
  881. for _, d := range nodes {
  882. go func(daemon *SwarmDaemon) {
  883. defer wg.Done()
  884. if err := daemon.Start("--iptables=false"); err != nil {
  885. errs <- err
  886. }
  887. }(d)
  888. }
  889. wg.Wait()
  890. close(errs)
  891. for err := range errs {
  892. c.Assert(err, check.IsNil)
  893. }
  894. }
  895. checkClusterHealth(c, nodes, mCount, wCount)
  896. }