docker_api_swarm_test.go 43 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798991001011021031041051061071081091101111121131141151161171181191201211221231241251261271281291301311321331341351361371381391401411421431441451461471481491501511521531541551561571581591601611621631641651661671681691701711721731741751761771781791801811821831841851861871881891901911921931941951961971981992002012022032042052062072082092102112122132142152162172182192202212222232242252262272282292302312322332342352362372382392402412422432442452462472482492502512522532542552562572582592602612622632642652662672682692702712722732742752762772782792802812822832842852862872882892902912922932942952962972982993003013023033043053063073083093103113123133143153163173183193203213223233243253263273283293303313323333343353363373383393403413423433443453463473483493503513523533543553563573583593603613623633643653663673683693703713723733743753763773783793803813823833843853863873883893903913923933943953963973983994004014024034044054064074084094104114124134144154164174184194204214224234244254264274284294304314324334344354364374384394404414424434444454464474484494504514524534544554564574584594604614624634644654664674684694704714724734744754764774784794804814824834844854864874884894904914924934944954964974984995005015025035045055065075085095105115125135145155165175185195205215225235245255265275285295305315325335345355365375385395405415425435445455465475485495505515525535545555565575585595605615625635645655665675685695705715725735745755765775785795805815825835845855865875885895905915925935945955965975985996006016026036046056066076086096106116126136146156166176186196206216226236246256266276286296306316326336346356366376386396406416426436446456466476486496506516526536546556566576586596606616626636646656666676686696706716726736746756766776786796806816826836846856866876886896906916926936946956966976986997007017027037047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127712781279128012811282128312841285128612871288128912901291129212931294129512961297129812991300130113021303130413051306130713081309131013111312
  1. // +build !windows
  2. package main
  3. import (
  4. "fmt"
  5. "net/http"
  6. "os"
  7. "path/filepath"
  8. "strconv"
  9. "strings"
  10. "sync"
  11. "syscall"
  12. "time"
  13. "github.com/docker/docker/api/types/swarm"
  14. "github.com/docker/docker/pkg/integration/checker"
  15. "github.com/go-check/check"
  16. )
  17. var defaultReconciliationTimeout = 30 * time.Second
  18. func (s *DockerSwarmSuite) TestAPISwarmInit(c *check.C) {
  19. // todo: should find a better way to verify that components are running than /info
  20. d1 := s.AddDaemon(c, true, true)
  21. info, err := d1.info()
  22. c.Assert(err, checker.IsNil)
  23. c.Assert(info.ControlAvailable, checker.True)
  24. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  25. d2 := s.AddDaemon(c, true, false)
  26. info, err = d2.info()
  27. c.Assert(err, checker.IsNil)
  28. c.Assert(info.ControlAvailable, checker.False)
  29. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  30. // Leaving cluster
  31. c.Assert(d2.Leave(false), checker.IsNil)
  32. info, err = d2.info()
  33. c.Assert(err, checker.IsNil)
  34. c.Assert(info.ControlAvailable, checker.False)
  35. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  36. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: d1.joinTokens(c).Worker, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  37. info, err = d2.info()
  38. c.Assert(err, checker.IsNil)
  39. c.Assert(info.ControlAvailable, checker.False)
  40. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  41. // Current state restoring after restarts
  42. err = d1.Stop()
  43. c.Assert(err, checker.IsNil)
  44. err = d2.Stop()
  45. c.Assert(err, checker.IsNil)
  46. err = d1.Start()
  47. c.Assert(err, checker.IsNil)
  48. err = d2.Start()
  49. c.Assert(err, checker.IsNil)
  50. info, err = d1.info()
  51. c.Assert(err, checker.IsNil)
  52. c.Assert(info.ControlAvailable, checker.True)
  53. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  54. info, err = d2.info()
  55. c.Assert(err, checker.IsNil)
  56. c.Assert(info.ControlAvailable, checker.False)
  57. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  58. }
  59. func (s *DockerSwarmSuite) TestAPISwarmJoinToken(c *check.C) {
  60. d1 := s.AddDaemon(c, false, false)
  61. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  62. d2 := s.AddDaemon(c, false, false)
  63. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  64. c.Assert(err, checker.NotNil)
  65. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  66. info, err := d2.info()
  67. c.Assert(err, checker.IsNil)
  68. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  69. err = d2.Join(swarm.JoinRequest{JoinToken: "foobaz", RemoteAddrs: []string{d1.listenAddr}})
  70. c.Assert(err, checker.NotNil)
  71. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  72. info, err = d2.info()
  73. c.Assert(err, checker.IsNil)
  74. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  75. workerToken := d1.joinTokens(c).Worker
  76. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  77. info, err = d2.info()
  78. c.Assert(err, checker.IsNil)
  79. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  80. c.Assert(d2.Leave(false), checker.IsNil)
  81. info, err = d2.info()
  82. c.Assert(err, checker.IsNil)
  83. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  84. // change tokens
  85. d1.rotateTokens(c)
  86. err = d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}})
  87. c.Assert(err, checker.NotNil)
  88. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  89. info, err = d2.info()
  90. c.Assert(err, checker.IsNil)
  91. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  92. workerToken = d1.joinTokens(c).Worker
  93. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  94. info, err = d2.info()
  95. c.Assert(err, checker.IsNil)
  96. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  97. c.Assert(d2.Leave(false), checker.IsNil)
  98. info, err = d2.info()
  99. c.Assert(err, checker.IsNil)
  100. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  101. // change spec, don't change tokens
  102. d1.updateSwarm(c, func(s *swarm.Spec) {})
  103. err = d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  104. c.Assert(err, checker.NotNil)
  105. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  106. info, err = d2.info()
  107. c.Assert(err, checker.IsNil)
  108. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  109. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  110. info, err = d2.info()
  111. c.Assert(err, checker.IsNil)
  112. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  113. c.Assert(d2.Leave(false), checker.IsNil)
  114. info, err = d2.info()
  115. c.Assert(err, checker.IsNil)
  116. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  117. }
  118. func (s *DockerSwarmSuite) TestAPISwarmCAHash(c *check.C) {
  119. d1 := s.AddDaemon(c, true, true)
  120. d2 := s.AddDaemon(c, false, false)
  121. splitToken := strings.Split(d1.joinTokens(c).Worker, "-")
  122. splitToken[2] = "1kxftv4ofnc6mt30lmgipg6ngf9luhwqopfk1tz6bdmnkubg0e"
  123. replacementToken := strings.Join(splitToken, "-")
  124. err := d2.Join(swarm.JoinRequest{JoinToken: replacementToken, RemoteAddrs: []string{d1.listenAddr}})
  125. c.Assert(err, checker.NotNil)
  126. c.Assert(err.Error(), checker.Contains, "remote CA does not match fingerprint")
  127. }
  128. func (s *DockerSwarmSuite) TestAPISwarmPromoteDemote(c *check.C) {
  129. d1 := s.AddDaemon(c, false, false)
  130. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  131. d2 := s.AddDaemon(c, true, false)
  132. info, err := d2.info()
  133. c.Assert(err, checker.IsNil)
  134. c.Assert(info.ControlAvailable, checker.False)
  135. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  136. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  137. n.Spec.Role = swarm.NodeRoleManager
  138. })
  139. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  140. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  141. n.Spec.Role = swarm.NodeRoleWorker
  142. })
  143. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.False)
  144. // Demoting last node should fail
  145. node := d1.getNode(c, d1.NodeID)
  146. node.Spec.Role = swarm.NodeRoleWorker
  147. url := fmt.Sprintf("/nodes/%s/update?version=%d", node.ID, node.Version.Index)
  148. status, out, err := d1.SockRequest("POST", url, node.Spec)
  149. c.Assert(err, checker.IsNil)
  150. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("output: %q", string(out)))
  151. c.Assert(string(out), checker.Contains, "last manager of the swarm")
  152. info, err = d1.info()
  153. c.Assert(err, checker.IsNil)
  154. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  155. c.Assert(info.ControlAvailable, checker.True)
  156. // Promote already demoted node
  157. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  158. n.Spec.Role = swarm.NodeRoleManager
  159. })
  160. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  161. }
  162. func (s *DockerSwarmSuite) TestAPISwarmServicesEmptyList(c *check.C) {
  163. d := s.AddDaemon(c, true, true)
  164. services := d.listServices(c)
  165. c.Assert(services, checker.NotNil)
  166. c.Assert(len(services), checker.Equals, 0, check.Commentf("services: %#v", services))
  167. }
  168. func (s *DockerSwarmSuite) TestAPISwarmServicesCreate(c *check.C) {
  169. d := s.AddDaemon(c, true, true)
  170. instances := 2
  171. id := d.createService(c, simpleTestService, setInstances(instances))
  172. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  173. service := d.getService(c, id)
  174. instances = 5
  175. d.updateService(c, service, setInstances(instances))
  176. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  177. d.removeService(c, service.ID)
  178. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 0)
  179. }
  180. func (s *DockerSwarmSuite) TestAPISwarmServicesMultipleAgents(c *check.C) {
  181. d1 := s.AddDaemon(c, true, true)
  182. d2 := s.AddDaemon(c, true, false)
  183. d3 := s.AddDaemon(c, true, false)
  184. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  185. instances := 9
  186. id := d1.createService(c, simpleTestService, setInstances(instances))
  187. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  188. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  189. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.GreaterThan, 0)
  190. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  191. // reconciliation on d2 node down
  192. c.Assert(d2.Stop(), checker.IsNil)
  193. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  194. // test downscaling
  195. instances = 5
  196. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  197. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  198. }
  199. func (s *DockerSwarmSuite) TestAPISwarmServicesCreateGlobal(c *check.C) {
  200. d1 := s.AddDaemon(c, true, true)
  201. d2 := s.AddDaemon(c, true, false)
  202. d3 := s.AddDaemon(c, true, false)
  203. d1.createService(c, simpleTestService, setGlobalMode)
  204. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, 1)
  205. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  206. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.Equals, 1)
  207. d4 := s.AddDaemon(c, true, false)
  208. d5 := s.AddDaemon(c, true, false)
  209. waitAndAssert(c, defaultReconciliationTimeout, d4.checkActiveContainerCount, checker.Equals, 1)
  210. waitAndAssert(c, defaultReconciliationTimeout, d5.checkActiveContainerCount, checker.Equals, 1)
  211. }
  212. func (s *DockerSwarmSuite) TestAPISwarmServicesUpdate(c *check.C) {
  213. const nodeCount = 3
  214. var daemons [nodeCount]*SwarmDaemon
  215. for i := 0; i < nodeCount; i++ {
  216. daemons[i] = s.AddDaemon(c, true, i == 0)
  217. }
  218. // wait for nodes ready
  219. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  220. // service image at start
  221. image1 := "busybox:latest"
  222. // target image in update
  223. image2 := "busybox:test"
  224. // create a different tag
  225. for _, d := range daemons {
  226. out, err := d.Cmd("tag", image1, image2)
  227. c.Assert(err, checker.IsNil, check.Commentf(out))
  228. }
  229. // create service
  230. instances := 5
  231. parallelism := 2
  232. id := daemons[0].createService(c, serviceForUpdate, setInstances(instances))
  233. // wait for tasks ready
  234. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  235. map[string]int{image1: instances})
  236. // issue service update
  237. service := daemons[0].getService(c, id)
  238. daemons[0].updateService(c, service, setImage(image2))
  239. // first batch
  240. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  241. map[string]int{image1: instances - parallelism, image2: parallelism})
  242. // 2nd batch
  243. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  244. map[string]int{image1: instances - 2*parallelism, image2: 2 * parallelism})
  245. // 3nd batch
  246. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  247. map[string]int{image2: instances})
  248. // Roll back to the previous version. This uses the CLI because
  249. // rollback is a client-side operation.
  250. out, err := daemons[0].Cmd("service", "update", "--rollback", id)
  251. c.Assert(err, checker.IsNil, check.Commentf(out))
  252. // first batch
  253. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  254. map[string]int{image2: instances - parallelism, image1: parallelism})
  255. // 2nd batch
  256. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  257. map[string]int{image2: instances - 2*parallelism, image1: 2 * parallelism})
  258. // 3nd batch
  259. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  260. map[string]int{image1: instances})
  261. }
  262. func (s *DockerSwarmSuite) TestAPISwarmServicesFailedUpdate(c *check.C) {
  263. const nodeCount = 3
  264. var daemons [nodeCount]*SwarmDaemon
  265. for i := 0; i < nodeCount; i++ {
  266. daemons[i] = s.AddDaemon(c, true, i == 0)
  267. }
  268. // wait for nodes ready
  269. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  270. // service image at start
  271. image1 := "busybox:latest"
  272. // target image in update
  273. image2 := "busybox:badtag"
  274. // create service
  275. instances := 5
  276. id := daemons[0].createService(c, serviceForUpdate, setInstances(instances))
  277. // wait for tasks ready
  278. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  279. map[string]int{image1: instances})
  280. // issue service update
  281. service := daemons[0].getService(c, id)
  282. daemons[0].updateService(c, service, setImage(image2), setFailureAction(swarm.UpdateFailureActionPause), setMaxFailureRatio(0.25), setParallelism(1))
  283. // should update 2 tasks and then pause
  284. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceUpdateState(id), checker.Equals, swarm.UpdateStatePaused)
  285. v, _ := daemons[0].checkServiceRunningTasks(id)(c)
  286. c.Assert(v, checker.Equals, instances-2)
  287. // Roll back to the previous version. This uses the CLI because
  288. // rollback is a client-side operation.
  289. out, err := daemons[0].Cmd("service", "update", "--rollback", id)
  290. c.Assert(err, checker.IsNil, check.Commentf(out))
  291. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  292. map[string]int{image1: instances})
  293. }
  294. func (s *DockerSwarmSuite) TestAPISwarmServiceConstraintRole(c *check.C) {
  295. const nodeCount = 3
  296. var daemons [nodeCount]*SwarmDaemon
  297. for i := 0; i < nodeCount; i++ {
  298. daemons[i] = s.AddDaemon(c, true, i == 0)
  299. }
  300. // wait for nodes ready
  301. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  302. // create service
  303. constraints := []string{"node.role==worker"}
  304. instances := 3
  305. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  306. // wait for tasks ready
  307. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  308. // validate tasks are running on worker nodes
  309. tasks := daemons[0].getServiceTasks(c, id)
  310. for _, task := range tasks {
  311. node := daemons[0].getNode(c, task.NodeID)
  312. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleWorker)
  313. }
  314. //remove service
  315. daemons[0].removeService(c, id)
  316. // create service
  317. constraints = []string{"node.role!=worker"}
  318. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  319. // wait for tasks ready
  320. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  321. tasks = daemons[0].getServiceTasks(c, id)
  322. // validate tasks are running on manager nodes
  323. for _, task := range tasks {
  324. node := daemons[0].getNode(c, task.NodeID)
  325. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleManager)
  326. }
  327. //remove service
  328. daemons[0].removeService(c, id)
  329. // create service
  330. constraints = []string{"node.role==nosuchrole"}
  331. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  332. // wait for tasks created
  333. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  334. // let scheduler try
  335. time.Sleep(250 * time.Millisecond)
  336. // validate tasks are not assigned to any node
  337. tasks = daemons[0].getServiceTasks(c, id)
  338. for _, task := range tasks {
  339. c.Assert(task.NodeID, checker.Equals, "")
  340. }
  341. }
  342. func (s *DockerSwarmSuite) TestAPISwarmServiceConstraintLabel(c *check.C) {
  343. const nodeCount = 3
  344. var daemons [nodeCount]*SwarmDaemon
  345. for i := 0; i < nodeCount; i++ {
  346. daemons[i] = s.AddDaemon(c, true, i == 0)
  347. }
  348. // wait for nodes ready
  349. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  350. nodes := daemons[0].listNodes(c)
  351. c.Assert(len(nodes), checker.Equals, nodeCount)
  352. // add labels to nodes
  353. daemons[0].updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  354. n.Spec.Annotations.Labels = map[string]string{
  355. "security": "high",
  356. }
  357. })
  358. for i := 1; i < nodeCount; i++ {
  359. daemons[0].updateNode(c, nodes[i].ID, func(n *swarm.Node) {
  360. n.Spec.Annotations.Labels = map[string]string{
  361. "security": "low",
  362. }
  363. })
  364. }
  365. // create service
  366. instances := 3
  367. constraints := []string{"node.labels.security==high"}
  368. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  369. // wait for tasks ready
  370. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  371. tasks := daemons[0].getServiceTasks(c, id)
  372. // validate all tasks are running on nodes[0]
  373. for _, task := range tasks {
  374. c.Assert(task.NodeID, checker.Equals, nodes[0].ID)
  375. }
  376. //remove service
  377. daemons[0].removeService(c, id)
  378. // create service
  379. constraints = []string{"node.labels.security!=high"}
  380. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  381. // wait for tasks ready
  382. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  383. tasks = daemons[0].getServiceTasks(c, id)
  384. // validate all tasks are NOT running on nodes[0]
  385. for _, task := range tasks {
  386. c.Assert(task.NodeID, checker.Not(checker.Equals), nodes[0].ID)
  387. }
  388. //remove service
  389. daemons[0].removeService(c, id)
  390. constraints = []string{"node.labels.security==medium"}
  391. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  392. // wait for tasks created
  393. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  394. // let scheduler try
  395. time.Sleep(250 * time.Millisecond)
  396. tasks = daemons[0].getServiceTasks(c, id)
  397. // validate tasks are not assigned
  398. for _, task := range tasks {
  399. c.Assert(task.NodeID, checker.Equals, "")
  400. }
  401. //remove service
  402. daemons[0].removeService(c, id)
  403. // multiple constraints
  404. constraints = []string{
  405. "node.labels.security==high",
  406. fmt.Sprintf("node.id==%s", nodes[1].ID),
  407. }
  408. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  409. // wait for tasks created
  410. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  411. // let scheduler try
  412. time.Sleep(250 * time.Millisecond)
  413. tasks = daemons[0].getServiceTasks(c, id)
  414. // validate tasks are not assigned
  415. for _, task := range tasks {
  416. c.Assert(task.NodeID, checker.Equals, "")
  417. }
  418. // make nodes[1] fulfills the constraints
  419. daemons[0].updateNode(c, nodes[1].ID, func(n *swarm.Node) {
  420. n.Spec.Annotations.Labels = map[string]string{
  421. "security": "high",
  422. }
  423. })
  424. // wait for tasks ready
  425. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  426. tasks = daemons[0].getServiceTasks(c, id)
  427. for _, task := range tasks {
  428. c.Assert(task.NodeID, checker.Equals, nodes[1].ID)
  429. }
  430. }
  431. func (s *DockerSwarmSuite) TestAPISwarmServicesStateReporting(c *check.C) {
  432. testRequires(c, SameHostDaemon)
  433. testRequires(c, DaemonIsLinux)
  434. d1 := s.AddDaemon(c, true, true)
  435. d2 := s.AddDaemon(c, true, true)
  436. d3 := s.AddDaemon(c, true, false)
  437. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept
  438. instances := 9
  439. d1.createService(c, simpleTestService, setInstances(instances))
  440. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  441. getContainers := func() map[string]*SwarmDaemon {
  442. m := make(map[string]*SwarmDaemon)
  443. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  444. for _, id := range d.activeContainers() {
  445. m[id] = d
  446. }
  447. }
  448. return m
  449. }
  450. containers := getContainers()
  451. c.Assert(containers, checker.HasLen, instances)
  452. var toRemove string
  453. for i := range containers {
  454. toRemove = i
  455. }
  456. _, err := containers[toRemove].Cmd("stop", toRemove)
  457. c.Assert(err, checker.IsNil)
  458. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  459. containers2 := getContainers()
  460. c.Assert(containers2, checker.HasLen, instances)
  461. for i := range containers {
  462. if i == toRemove {
  463. c.Assert(containers2[i], checker.IsNil)
  464. } else {
  465. c.Assert(containers2[i], checker.NotNil)
  466. }
  467. }
  468. containers = containers2
  469. for i := range containers {
  470. toRemove = i
  471. }
  472. // try with killing process outside of docker
  473. pidStr, err := containers[toRemove].Cmd("inspect", "-f", "{{.State.Pid}}", toRemove)
  474. c.Assert(err, checker.IsNil)
  475. pid, err := strconv.Atoi(strings.TrimSpace(pidStr))
  476. c.Assert(err, checker.IsNil)
  477. c.Assert(syscall.Kill(pid, syscall.SIGKILL), checker.IsNil)
  478. time.Sleep(time.Second) // give some time to handle the signal
  479. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  480. containers2 = getContainers()
  481. c.Assert(containers2, checker.HasLen, instances)
  482. for i := range containers {
  483. if i == toRemove {
  484. c.Assert(containers2[i], checker.IsNil)
  485. } else {
  486. c.Assert(containers2[i], checker.NotNil)
  487. }
  488. }
  489. }
  490. func (s *DockerSwarmSuite) TestAPISwarmLeaderProxy(c *check.C) {
  491. // add three managers, one of these is leader
  492. d1 := s.AddDaemon(c, true, true)
  493. d2 := s.AddDaemon(c, true, true)
  494. d3 := s.AddDaemon(c, true, true)
  495. // start a service by hitting each of the 3 managers
  496. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  497. s.Spec.Name = "test1"
  498. })
  499. d2.createService(c, simpleTestService, func(s *swarm.Service) {
  500. s.Spec.Name = "test2"
  501. })
  502. d3.createService(c, simpleTestService, func(s *swarm.Service) {
  503. s.Spec.Name = "test3"
  504. })
  505. // 3 services should be started now, because the requests were proxied to leader
  506. // query each node and make sure it returns 3 services
  507. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  508. services := d.listServices(c)
  509. c.Assert(services, checker.HasLen, 3)
  510. }
  511. }
  512. func (s *DockerSwarmSuite) TestAPISwarmLeaderElection(c *check.C) {
  513. // Create 3 nodes
  514. d1 := s.AddDaemon(c, true, true)
  515. d2 := s.AddDaemon(c, true, true)
  516. d3 := s.AddDaemon(c, true, true)
  517. // assert that the first node we made is the leader, and the other two are followers
  518. c.Assert(d1.getNode(c, d1.NodeID).ManagerStatus.Leader, checker.True)
  519. c.Assert(d1.getNode(c, d2.NodeID).ManagerStatus.Leader, checker.False)
  520. c.Assert(d1.getNode(c, d3.NodeID).ManagerStatus.Leader, checker.False)
  521. d1.Stop() // stop the leader
  522. var (
  523. leader *SwarmDaemon // keep track of leader
  524. followers []*SwarmDaemon // keep track of followers
  525. )
  526. checkLeader := func(nodes ...*SwarmDaemon) checkF {
  527. return func(c *check.C) (interface{}, check.CommentInterface) {
  528. // clear these out before each run
  529. leader = nil
  530. followers = nil
  531. for _, d := range nodes {
  532. if d.getNode(c, d.NodeID).ManagerStatus.Leader {
  533. leader = d
  534. } else {
  535. followers = append(followers, d)
  536. }
  537. }
  538. if leader == nil {
  539. return false, check.Commentf("no leader elected")
  540. }
  541. return true, check.Commentf("elected %v", leader.id)
  542. }
  543. }
  544. // wait for an election to occur
  545. waitAndAssert(c, defaultReconciliationTimeout, checkLeader(d2, d3), checker.True)
  546. // assert that we have a new leader
  547. c.Assert(leader, checker.NotNil)
  548. // Keep track of the current leader, since we want that to be chosen.
  549. stableleader := leader
  550. // add the d1, the initial leader, back
  551. d1.Start()
  552. // TODO(stevvooe): may need to wait for rejoin here
  553. // wait for possible election
  554. waitAndAssert(c, defaultReconciliationTimeout, checkLeader(d1, d2, d3), checker.True)
  555. // pick out the leader and the followers again
  556. // verify that we still only have 1 leader and 2 followers
  557. c.Assert(leader, checker.NotNil)
  558. c.Assert(followers, checker.HasLen, 2)
  559. // and that after we added d1 back, the leader hasn't changed
  560. c.Assert(leader.NodeID, checker.Equals, stableleader.NodeID)
  561. }
  562. func (s *DockerSwarmSuite) TestAPISwarmRaftQuorum(c *check.C) {
  563. d1 := s.AddDaemon(c, true, true)
  564. d2 := s.AddDaemon(c, true, true)
  565. d3 := s.AddDaemon(c, true, true)
  566. d1.createService(c, simpleTestService)
  567. c.Assert(d2.Stop(), checker.IsNil)
  568. // make sure there is a leader
  569. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  570. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  571. s.Spec.Name = "top1"
  572. })
  573. c.Assert(d3.Stop(), checker.IsNil)
  574. // make sure there is a leader
  575. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  576. var service swarm.Service
  577. simpleTestService(&service)
  578. service.Spec.Name = "top2"
  579. status, out, err := d1.SockRequest("POST", "/services/create", service.Spec)
  580. c.Assert(err, checker.IsNil)
  581. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("deadline exceeded", string(out)))
  582. c.Assert(d2.Start(), checker.IsNil)
  583. // make sure there is a leader
  584. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  585. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  586. s.Spec.Name = "top3"
  587. })
  588. }
  589. func (s *DockerSwarmSuite) TestAPISwarmListNodes(c *check.C) {
  590. d1 := s.AddDaemon(c, true, true)
  591. d2 := s.AddDaemon(c, true, false)
  592. d3 := s.AddDaemon(c, true, false)
  593. nodes := d1.listNodes(c)
  594. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  595. loop0:
  596. for _, n := range nodes {
  597. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  598. if n.ID == d.NodeID {
  599. continue loop0
  600. }
  601. }
  602. c.Errorf("unknown nodeID %v", n.ID)
  603. }
  604. }
  605. func (s *DockerSwarmSuite) TestAPISwarmNodeUpdate(c *check.C) {
  606. d := s.AddDaemon(c, true, true)
  607. nodes := d.listNodes(c)
  608. d.updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  609. n.Spec.Availability = swarm.NodeAvailabilityPause
  610. })
  611. n := d.getNode(c, nodes[0].ID)
  612. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityPause)
  613. }
  614. func (s *DockerSwarmSuite) TestAPISwarmNodeRemove(c *check.C) {
  615. testRequires(c, Network)
  616. d1 := s.AddDaemon(c, true, true)
  617. d2 := s.AddDaemon(c, true, false)
  618. _ = s.AddDaemon(c, true, false)
  619. nodes := d1.listNodes(c)
  620. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  621. // Getting the info so we can take the NodeID
  622. d2Info, err := d2.info()
  623. c.Assert(err, checker.IsNil)
  624. // forceful removal of d2 should work
  625. d1.removeNode(c, d2Info.NodeID, true)
  626. nodes = d1.listNodes(c)
  627. c.Assert(len(nodes), checker.Equals, 2, check.Commentf("nodes: %#v", nodes))
  628. // Restart the node that was removed
  629. err = d2.Restart()
  630. c.Assert(err, checker.IsNil)
  631. // Give some time for the node to rejoin
  632. time.Sleep(1 * time.Second)
  633. // Make sure the node didn't rejoin
  634. nodes = d1.listNodes(c)
  635. c.Assert(len(nodes), checker.Equals, 2, check.Commentf("nodes: %#v", nodes))
  636. }
  637. func (s *DockerSwarmSuite) TestAPISwarmNodeDrainPause(c *check.C) {
  638. d1 := s.AddDaemon(c, true, true)
  639. d2 := s.AddDaemon(c, true, false)
  640. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  641. // start a service, expect balanced distribution
  642. instances := 8
  643. id := d1.createService(c, simpleTestService, setInstances(instances))
  644. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  645. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  646. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  647. // drain d2, all containers should move to d1
  648. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  649. n.Spec.Availability = swarm.NodeAvailabilityDrain
  650. })
  651. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  652. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  653. // set d2 back to active
  654. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  655. n.Spec.Availability = swarm.NodeAvailabilityActive
  656. })
  657. instances = 1
  658. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  659. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  660. instances = 8
  661. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  662. // drained node first so we don't get any old containers
  663. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  664. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  665. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  666. d2ContainerCount := len(d2.activeContainers())
  667. // set d2 to paused, scale service up, only d1 gets new tasks
  668. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  669. n.Spec.Availability = swarm.NodeAvailabilityPause
  670. })
  671. instances = 14
  672. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  673. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances-d2ContainerCount)
  674. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, d2ContainerCount)
  675. }
  676. func (s *DockerSwarmSuite) TestAPISwarmLeaveRemovesContainer(c *check.C) {
  677. d := s.AddDaemon(c, true, true)
  678. instances := 2
  679. d.createService(c, simpleTestService, setInstances(instances))
  680. id, err := d.Cmd("run", "-d", "busybox", "top")
  681. c.Assert(err, checker.IsNil)
  682. id = strings.TrimSpace(id)
  683. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances+1)
  684. c.Assert(d.Leave(false), checker.NotNil)
  685. c.Assert(d.Leave(true), checker.IsNil)
  686. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 1)
  687. id2, err := d.Cmd("ps", "-q")
  688. c.Assert(err, checker.IsNil)
  689. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  690. }
  691. // #23629
  692. func (s *DockerSwarmSuite) TestAPISwarmLeaveOnPendingJoin(c *check.C) {
  693. testRequires(c, Network)
  694. s.AddDaemon(c, true, true)
  695. d2 := s.AddDaemon(c, false, false)
  696. id, err := d2.Cmd("run", "-d", "busybox", "top")
  697. c.Assert(err, checker.IsNil)
  698. id = strings.TrimSpace(id)
  699. err = d2.Join(swarm.JoinRequest{
  700. RemoteAddrs: []string{"123.123.123.123:1234"},
  701. })
  702. c.Assert(err, check.NotNil)
  703. c.Assert(err.Error(), checker.Contains, "Timeout was reached")
  704. info, err := d2.info()
  705. c.Assert(err, checker.IsNil)
  706. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  707. c.Assert(d2.Leave(true), checker.IsNil)
  708. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  709. id2, err := d2.Cmd("ps", "-q")
  710. c.Assert(err, checker.IsNil)
  711. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  712. }
  713. // #23705
  714. func (s *DockerSwarmSuite) TestAPISwarmRestoreOnPendingJoin(c *check.C) {
  715. testRequires(c, Network)
  716. d := s.AddDaemon(c, false, false)
  717. err := d.Join(swarm.JoinRequest{
  718. RemoteAddrs: []string{"123.123.123.123:1234"},
  719. })
  720. c.Assert(err, check.NotNil)
  721. c.Assert(err.Error(), checker.Contains, "Timeout was reached")
  722. waitAndAssert(c, defaultReconciliationTimeout, d.checkLocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  723. c.Assert(d.Stop(), checker.IsNil)
  724. c.Assert(d.Start(), checker.IsNil)
  725. info, err := d.info()
  726. c.Assert(err, checker.IsNil)
  727. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  728. }
  729. func (s *DockerSwarmSuite) TestAPISwarmManagerRestore(c *check.C) {
  730. d1 := s.AddDaemon(c, true, true)
  731. instances := 2
  732. id := d1.createService(c, simpleTestService, setInstances(instances))
  733. d1.getService(c, id)
  734. d1.Stop()
  735. d1.Start()
  736. d1.getService(c, id)
  737. d2 := s.AddDaemon(c, true, true)
  738. d2.getService(c, id)
  739. d2.Stop()
  740. d2.Start()
  741. d2.getService(c, id)
  742. d3 := s.AddDaemon(c, true, true)
  743. d3.getService(c, id)
  744. d3.Stop()
  745. d3.Start()
  746. d3.getService(c, id)
  747. d3.Kill()
  748. time.Sleep(1 * time.Second) // time to handle signal
  749. d3.Start()
  750. d3.getService(c, id)
  751. }
  752. func (s *DockerSwarmSuite) TestAPISwarmScaleNoRollingUpdate(c *check.C) {
  753. d := s.AddDaemon(c, true, true)
  754. instances := 2
  755. id := d.createService(c, simpleTestService, setInstances(instances))
  756. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  757. containers := d.activeContainers()
  758. instances = 4
  759. d.updateService(c, d.getService(c, id), setInstances(instances))
  760. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  761. containers2 := d.activeContainers()
  762. loop0:
  763. for _, c1 := range containers {
  764. for _, c2 := range containers2 {
  765. if c1 == c2 {
  766. continue loop0
  767. }
  768. }
  769. c.Errorf("container %v not found in new set %#v", c1, containers2)
  770. }
  771. }
  772. func (s *DockerSwarmSuite) TestAPISwarmInvalidAddress(c *check.C) {
  773. d := s.AddDaemon(c, false, false)
  774. req := swarm.InitRequest{
  775. ListenAddr: "",
  776. }
  777. status, _, err := d.SockRequest("POST", "/swarm/init", req)
  778. c.Assert(err, checker.IsNil)
  779. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  780. req2 := swarm.JoinRequest{
  781. ListenAddr: "0.0.0.0:2377",
  782. RemoteAddrs: []string{""},
  783. }
  784. status, _, err = d.SockRequest("POST", "/swarm/join", req2)
  785. c.Assert(err, checker.IsNil)
  786. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  787. }
  788. func (s *DockerSwarmSuite) TestAPISwarmForceNewCluster(c *check.C) {
  789. d1 := s.AddDaemon(c, true, true)
  790. d2 := s.AddDaemon(c, true, true)
  791. instances := 2
  792. id := d1.createService(c, simpleTestService, setInstances(instances))
  793. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  794. // drain d2, all containers should move to d1
  795. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  796. n.Spec.Availability = swarm.NodeAvailabilityDrain
  797. })
  798. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  799. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  800. c.Assert(d2.Stop(), checker.IsNil)
  801. c.Assert(d1.Init(swarm.InitRequest{
  802. ForceNewCluster: true,
  803. Spec: swarm.Spec{},
  804. }), checker.IsNil)
  805. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  806. d3 := s.AddDaemon(c, true, true)
  807. info, err := d3.info()
  808. c.Assert(err, checker.IsNil)
  809. c.Assert(info.ControlAvailable, checker.True)
  810. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  811. instances = 4
  812. d3.updateService(c, d3.getService(c, id), setInstances(instances))
  813. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  814. }
  815. func simpleTestService(s *swarm.Service) {
  816. ureplicas := uint64(1)
  817. restartDelay := time.Duration(100 * time.Millisecond)
  818. s.Spec = swarm.ServiceSpec{
  819. TaskTemplate: swarm.TaskSpec{
  820. ContainerSpec: swarm.ContainerSpec{
  821. Image: "busybox:latest",
  822. Command: []string{"/bin/top"},
  823. },
  824. RestartPolicy: &swarm.RestartPolicy{
  825. Delay: &restartDelay,
  826. },
  827. },
  828. Mode: swarm.ServiceMode{
  829. Replicated: &swarm.ReplicatedService{
  830. Replicas: &ureplicas,
  831. },
  832. },
  833. }
  834. s.Spec.Name = "top"
  835. }
  836. func serviceForUpdate(s *swarm.Service) {
  837. ureplicas := uint64(1)
  838. restartDelay := time.Duration(100 * time.Millisecond)
  839. s.Spec = swarm.ServiceSpec{
  840. TaskTemplate: swarm.TaskSpec{
  841. ContainerSpec: swarm.ContainerSpec{
  842. Image: "busybox:latest",
  843. Command: []string{"/bin/top"},
  844. },
  845. RestartPolicy: &swarm.RestartPolicy{
  846. Delay: &restartDelay,
  847. },
  848. },
  849. Mode: swarm.ServiceMode{
  850. Replicated: &swarm.ReplicatedService{
  851. Replicas: &ureplicas,
  852. },
  853. },
  854. UpdateConfig: &swarm.UpdateConfig{
  855. Parallelism: 2,
  856. Delay: 4 * time.Second,
  857. FailureAction: swarm.UpdateFailureActionContinue,
  858. },
  859. }
  860. s.Spec.Name = "updatetest"
  861. }
  862. func setInstances(replicas int) serviceConstructor {
  863. ureplicas := uint64(replicas)
  864. return func(s *swarm.Service) {
  865. s.Spec.Mode = swarm.ServiceMode{
  866. Replicated: &swarm.ReplicatedService{
  867. Replicas: &ureplicas,
  868. },
  869. }
  870. }
  871. }
  872. func setImage(image string) serviceConstructor {
  873. return func(s *swarm.Service) {
  874. s.Spec.TaskTemplate.ContainerSpec.Image = image
  875. }
  876. }
  877. func setFailureAction(failureAction string) serviceConstructor {
  878. return func(s *swarm.Service) {
  879. s.Spec.UpdateConfig.FailureAction = failureAction
  880. }
  881. }
  882. func setMaxFailureRatio(maxFailureRatio float32) serviceConstructor {
  883. return func(s *swarm.Service) {
  884. s.Spec.UpdateConfig.MaxFailureRatio = maxFailureRatio
  885. }
  886. }
  887. func setParallelism(parallelism uint64) serviceConstructor {
  888. return func(s *swarm.Service) {
  889. s.Spec.UpdateConfig.Parallelism = parallelism
  890. }
  891. }
  892. func setConstraints(constraints []string) serviceConstructor {
  893. return func(s *swarm.Service) {
  894. if s.Spec.TaskTemplate.Placement == nil {
  895. s.Spec.TaskTemplate.Placement = &swarm.Placement{}
  896. }
  897. s.Spec.TaskTemplate.Placement.Constraints = constraints
  898. }
  899. }
  900. func setGlobalMode(s *swarm.Service) {
  901. s.Spec.Mode = swarm.ServiceMode{
  902. Global: &swarm.GlobalService{},
  903. }
  904. }
  905. func checkClusterHealth(c *check.C, cl []*SwarmDaemon, managerCount, workerCount int) {
  906. var totalMCount, totalWCount int
  907. for _, d := range cl {
  908. var (
  909. info swarm.Info
  910. err error
  911. )
  912. // check info in a waitAndAssert, because if the cluster doesn't have a leader, `info` will return an error
  913. checkInfo := func(c *check.C) (interface{}, check.CommentInterface) {
  914. info, err = d.info()
  915. return err, check.Commentf("cluster not ready in time")
  916. }
  917. waitAndAssert(c, defaultReconciliationTimeout, checkInfo, checker.IsNil)
  918. if !info.ControlAvailable {
  919. totalWCount++
  920. continue
  921. }
  922. var leaderFound bool
  923. totalMCount++
  924. var mCount, wCount int
  925. for _, n := range d.listNodes(c) {
  926. waitReady := func(c *check.C) (interface{}, check.CommentInterface) {
  927. if n.Status.State == swarm.NodeStateReady {
  928. return true, nil
  929. }
  930. nn := d.getNode(c, n.ID)
  931. n = *nn
  932. return n.Status.State == swarm.NodeStateReady, check.Commentf("state of node %s, reported by %s", n.ID, d.Info.NodeID)
  933. }
  934. waitAndAssert(c, defaultReconciliationTimeout, waitReady, checker.True)
  935. waitActive := func(c *check.C) (interface{}, check.CommentInterface) {
  936. if n.Spec.Availability == swarm.NodeAvailabilityActive {
  937. return true, nil
  938. }
  939. nn := d.getNode(c, n.ID)
  940. n = *nn
  941. return n.Spec.Availability == swarm.NodeAvailabilityActive, check.Commentf("availability of node %s, reported by %s", n.ID, d.Info.NodeID)
  942. }
  943. waitAndAssert(c, defaultReconciliationTimeout, waitActive, checker.True)
  944. if n.Spec.Role == swarm.NodeRoleManager {
  945. c.Assert(n.ManagerStatus, checker.NotNil, check.Commentf("manager status of node %s (manager), reported by %s", n.ID, d.Info.NodeID))
  946. if n.ManagerStatus.Leader {
  947. leaderFound = true
  948. }
  949. mCount++
  950. } else {
  951. c.Assert(n.ManagerStatus, checker.IsNil, check.Commentf("manager status of node %s (worker), reported by %s", n.ID, d.Info.NodeID))
  952. wCount++
  953. }
  954. }
  955. c.Assert(leaderFound, checker.True, check.Commentf("lack of leader reported by node %s", info.NodeID))
  956. c.Assert(mCount, checker.Equals, managerCount, check.Commentf("managers count reported by node %s", info.NodeID))
  957. c.Assert(wCount, checker.Equals, workerCount, check.Commentf("workers count reported by node %s", info.NodeID))
  958. }
  959. c.Assert(totalMCount, checker.Equals, managerCount)
  960. c.Assert(totalWCount, checker.Equals, workerCount)
  961. }
  962. func (s *DockerSwarmSuite) TestAPISwarmRestartCluster(c *check.C) {
  963. mCount, wCount := 5, 1
  964. var nodes []*SwarmDaemon
  965. for i := 0; i < mCount; i++ {
  966. manager := s.AddDaemon(c, true, true)
  967. info, err := manager.info()
  968. c.Assert(err, checker.IsNil)
  969. c.Assert(info.ControlAvailable, checker.True)
  970. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  971. nodes = append(nodes, manager)
  972. }
  973. for i := 0; i < wCount; i++ {
  974. worker := s.AddDaemon(c, true, false)
  975. info, err := worker.info()
  976. c.Assert(err, checker.IsNil)
  977. c.Assert(info.ControlAvailable, checker.False)
  978. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  979. nodes = append(nodes, worker)
  980. }
  981. // stop whole cluster
  982. {
  983. var wg sync.WaitGroup
  984. wg.Add(len(nodes))
  985. errs := make(chan error, len(nodes))
  986. for _, d := range nodes {
  987. go func(daemon *SwarmDaemon) {
  988. defer wg.Done()
  989. if err := daemon.Stop(); err != nil {
  990. errs <- err
  991. }
  992. if root := os.Getenv("DOCKER_REMAP_ROOT"); root != "" {
  993. daemon.root = filepath.Dir(daemon.root)
  994. }
  995. }(d)
  996. }
  997. wg.Wait()
  998. close(errs)
  999. for err := range errs {
  1000. c.Assert(err, check.IsNil)
  1001. }
  1002. }
  1003. // start whole cluster
  1004. {
  1005. var wg sync.WaitGroup
  1006. wg.Add(len(nodes))
  1007. errs := make(chan error, len(nodes))
  1008. for _, d := range nodes {
  1009. go func(daemon *SwarmDaemon) {
  1010. defer wg.Done()
  1011. if err := daemon.Start("--iptables=false"); err != nil {
  1012. errs <- err
  1013. }
  1014. }(d)
  1015. }
  1016. wg.Wait()
  1017. close(errs)
  1018. for err := range errs {
  1019. c.Assert(err, check.IsNil)
  1020. }
  1021. }
  1022. checkClusterHealth(c, nodes, mCount, wCount)
  1023. }
  1024. func (s *DockerSwarmSuite) TestAPISwarmServicesUpdateWithName(c *check.C) {
  1025. d := s.AddDaemon(c, true, true)
  1026. instances := 2
  1027. id := d.createService(c, simpleTestService, setInstances(instances))
  1028. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  1029. service := d.getService(c, id)
  1030. instances = 5
  1031. setInstances(instances)(service)
  1032. url := fmt.Sprintf("/services/%s/update?version=%d", service.Spec.Name, service.Version.Index)
  1033. status, out, err := d.SockRequest("POST", url, service.Spec)
  1034. c.Assert(err, checker.IsNil)
  1035. c.Assert(status, checker.Equals, http.StatusOK, check.Commentf("output: %q", string(out)))
  1036. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  1037. }
  1038. func (s *DockerSwarmSuite) TestAPISwarmSecretsEmptyList(c *check.C) {
  1039. d := s.AddDaemon(c, true, true)
  1040. secrets := d.listSecrets(c)
  1041. c.Assert(secrets, checker.NotNil)
  1042. c.Assert(len(secrets), checker.Equals, 0, check.Commentf("secrets: %#v", secrets))
  1043. }
  1044. func (s *DockerSwarmSuite) TestAPISwarmSecretsCreate(c *check.C) {
  1045. d := s.AddDaemon(c, true, true)
  1046. testName := "test_secret"
  1047. id := d.createSecret(c, swarm.SecretSpec{
  1048. swarm.Annotations{
  1049. Name: testName,
  1050. },
  1051. []byte("TESTINGDATA"),
  1052. })
  1053. c.Assert(id, checker.Not(checker.Equals), "", check.Commentf("secrets: %s", id))
  1054. secrets := d.listSecrets(c)
  1055. c.Assert(len(secrets), checker.Equals, 1, check.Commentf("secrets: %#v", secrets))
  1056. name := secrets[0].Spec.Annotations.Name
  1057. c.Assert(name, checker.Equals, testName, check.Commentf("secret: %s", name))
  1058. }
  1059. func (s *DockerSwarmSuite) TestAPISwarmSecretsDelete(c *check.C) {
  1060. d := s.AddDaemon(c, true, true)
  1061. testName := "test_secret"
  1062. id := d.createSecret(c, swarm.SecretSpec{
  1063. swarm.Annotations{
  1064. Name: testName,
  1065. },
  1066. []byte("TESTINGDATA"),
  1067. })
  1068. c.Assert(id, checker.Not(checker.Equals), "", check.Commentf("secrets: %s", id))
  1069. secret := d.getSecret(c, id)
  1070. c.Assert(secret.ID, checker.Equals, id, check.Commentf("secret: %v", secret))
  1071. d.deleteSecret(c, secret.ID)
  1072. status, out, err := d.SockRequest("GET", "/secrets/"+id, nil)
  1073. c.Assert(err, checker.IsNil)
  1074. c.Assert(status, checker.Equals, http.StatusNotFound, check.Commentf("secret delete: %s", string(out)))
  1075. }