docker_api_swarm_test.go 46 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391
  1. // +build !windows
  2. package main
  3. import (
  4. "encoding/json"
  5. "fmt"
  6. "net/http"
  7. "os"
  8. "path/filepath"
  9. "strconv"
  10. "strings"
  11. "sync"
  12. "syscall"
  13. "time"
  14. "github.com/docker/docker/api/types"
  15. "github.com/docker/docker/api/types/container"
  16. "github.com/docker/docker/api/types/swarm"
  17. "github.com/docker/docker/pkg/integration/checker"
  18. "github.com/go-check/check"
  19. )
  // defaultReconciliationTimeout is the timeout the swarm tests in this file
  // hand to waitAndAssert when polling for the cluster to reach a state.
  var defaultReconciliationTimeout = time.Second * 30
  21. func (s *DockerSwarmSuite) TestAPISwarmInit(c *check.C) {
  22. // todo: should find a better way to verify that components are running than /info
  23. d1 := s.AddDaemon(c, true, true)
  24. info, err := d1.info()
  25. c.Assert(err, checker.IsNil)
  26. c.Assert(info.ControlAvailable, checker.True)
  27. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  28. d2 := s.AddDaemon(c, true, false)
  29. info, err = d2.info()
  30. c.Assert(err, checker.IsNil)
  31. c.Assert(info.ControlAvailable, checker.False)
  32. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  33. // Leaving cluster
  34. c.Assert(d2.Leave(false), checker.IsNil)
  35. info, err = d2.info()
  36. c.Assert(err, checker.IsNil)
  37. c.Assert(info.ControlAvailable, checker.False)
  38. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  39. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: d1.joinTokens(c).Worker, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  40. info, err = d2.info()
  41. c.Assert(err, checker.IsNil)
  42. c.Assert(info.ControlAvailable, checker.False)
  43. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  44. // Current state restoring after restarts
  45. err = d1.Stop()
  46. c.Assert(err, checker.IsNil)
  47. err = d2.Stop()
  48. c.Assert(err, checker.IsNil)
  49. err = d1.Start()
  50. c.Assert(err, checker.IsNil)
  51. err = d2.Start()
  52. c.Assert(err, checker.IsNil)
  53. info, err = d1.info()
  54. c.Assert(err, checker.IsNil)
  55. c.Assert(info.ControlAvailable, checker.True)
  56. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  57. info, err = d2.info()
  58. c.Assert(err, checker.IsNil)
  59. c.Assert(info.ControlAvailable, checker.False)
  60. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  61. }
  62. func (s *DockerSwarmSuite) TestAPISwarmJoinToken(c *check.C) {
  63. d1 := s.AddDaemon(c, false, false)
  64. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  65. d2 := s.AddDaemon(c, false, false)
  66. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  67. c.Assert(err, checker.NotNil)
  68. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  69. info, err := d2.info()
  70. c.Assert(err, checker.IsNil)
  71. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  72. err = d2.Join(swarm.JoinRequest{JoinToken: "foobaz", RemoteAddrs: []string{d1.listenAddr}})
  73. c.Assert(err, checker.NotNil)
  74. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  75. info, err = d2.info()
  76. c.Assert(err, checker.IsNil)
  77. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  78. workerToken := d1.joinTokens(c).Worker
  79. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  80. info, err = d2.info()
  81. c.Assert(err, checker.IsNil)
  82. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  83. c.Assert(d2.Leave(false), checker.IsNil)
  84. info, err = d2.info()
  85. c.Assert(err, checker.IsNil)
  86. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  87. // change tokens
  88. d1.rotateTokens(c)
  89. err = d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}})
  90. c.Assert(err, checker.NotNil)
  91. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  92. info, err = d2.info()
  93. c.Assert(err, checker.IsNil)
  94. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  95. workerToken = d1.joinTokens(c).Worker
  96. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  97. info, err = d2.info()
  98. c.Assert(err, checker.IsNil)
  99. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  100. c.Assert(d2.Leave(false), checker.IsNil)
  101. info, err = d2.info()
  102. c.Assert(err, checker.IsNil)
  103. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  104. // change spec, don't change tokens
  105. d1.updateSwarm(c, func(s *swarm.Spec) {})
  106. err = d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  107. c.Assert(err, checker.NotNil)
  108. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  109. info, err = d2.info()
  110. c.Assert(err, checker.IsNil)
  111. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  112. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  113. info, err = d2.info()
  114. c.Assert(err, checker.IsNil)
  115. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  116. c.Assert(d2.Leave(false), checker.IsNil)
  117. info, err = d2.info()
  118. c.Assert(err, checker.IsNil)
  119. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  120. }
  121. func (s *DockerSwarmSuite) TestAPISwarmCAHash(c *check.C) {
  122. d1 := s.AddDaemon(c, true, true)
  123. d2 := s.AddDaemon(c, false, false)
  124. splitToken := strings.Split(d1.joinTokens(c).Worker, "-")
  125. splitToken[2] = "1kxftv4ofnc6mt30lmgipg6ngf9luhwqopfk1tz6bdmnkubg0e"
  126. replacementToken := strings.Join(splitToken, "-")
  127. err := d2.Join(swarm.JoinRequest{JoinToken: replacementToken, RemoteAddrs: []string{d1.listenAddr}})
  128. c.Assert(err, checker.NotNil)
  129. c.Assert(err.Error(), checker.Contains, "remote CA does not match fingerprint")
  130. }
  131. func (s *DockerSwarmSuite) TestAPISwarmPromoteDemote(c *check.C) {
  132. d1 := s.AddDaemon(c, false, false)
  133. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  134. d2 := s.AddDaemon(c, true, false)
  135. info, err := d2.info()
  136. c.Assert(err, checker.IsNil)
  137. c.Assert(info.ControlAvailable, checker.False)
  138. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  139. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  140. n.Spec.Role = swarm.NodeRoleManager
  141. })
  142. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  143. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  144. n.Spec.Role = swarm.NodeRoleWorker
  145. })
  146. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.False)
  147. // Demoting last node should fail
  148. node := d1.getNode(c, d1.NodeID)
  149. node.Spec.Role = swarm.NodeRoleWorker
  150. url := fmt.Sprintf("/nodes/%s/update?version=%d", node.ID, node.Version.Index)
  151. status, out, err := d1.SockRequest("POST", url, node.Spec)
  152. c.Assert(err, checker.IsNil)
  153. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("output: %q", string(out)))
  154. c.Assert(string(out), checker.Contains, "last manager of the swarm")
  155. info, err = d1.info()
  156. c.Assert(err, checker.IsNil)
  157. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  158. c.Assert(info.ControlAvailable, checker.True)
  159. // Promote already demoted node
  160. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  161. n.Spec.Role = swarm.NodeRoleManager
  162. })
  163. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  164. }
  165. func (s *DockerSwarmSuite) TestAPISwarmServicesEmptyList(c *check.C) {
  166. d := s.AddDaemon(c, true, true)
  167. services := d.listServices(c)
  168. c.Assert(services, checker.NotNil)
  169. c.Assert(len(services), checker.Equals, 0, check.Commentf("services: %#v", services))
  170. }
  171. func (s *DockerSwarmSuite) TestAPISwarmServicesCreate(c *check.C) {
  172. d := s.AddDaemon(c, true, true)
  173. instances := 2
  174. id := d.createService(c, simpleTestService, setInstances(instances))
  175. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  176. service := d.getService(c, id)
  177. instances = 5
  178. d.updateService(c, service, setInstances(instances))
  179. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  180. d.removeService(c, service.ID)
  181. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 0)
  182. }
  183. func (s *DockerSwarmSuite) TestAPISwarmServicesMultipleAgents(c *check.C) {
  184. d1 := s.AddDaemon(c, true, true)
  185. d2 := s.AddDaemon(c, true, false)
  186. d3 := s.AddDaemon(c, true, false)
  187. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  188. instances := 9
  189. id := d1.createService(c, simpleTestService, setInstances(instances))
  190. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  191. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  192. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.GreaterThan, 0)
  193. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  194. // reconciliation on d2 node down
  195. c.Assert(d2.Stop(), checker.IsNil)
  196. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  197. // test downscaling
  198. instances = 5
  199. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  200. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  201. }
  202. func (s *DockerSwarmSuite) TestAPISwarmServicesCreateGlobal(c *check.C) {
  203. d1 := s.AddDaemon(c, true, true)
  204. d2 := s.AddDaemon(c, true, false)
  205. d3 := s.AddDaemon(c, true, false)
  206. d1.createService(c, simpleTestService, setGlobalMode)
  207. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, 1)
  208. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  209. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.Equals, 1)
  210. d4 := s.AddDaemon(c, true, false)
  211. d5 := s.AddDaemon(c, true, false)
  212. waitAndAssert(c, defaultReconciliationTimeout, d4.checkActiveContainerCount, checker.Equals, 1)
  213. waitAndAssert(c, defaultReconciliationTimeout, d5.checkActiveContainerCount, checker.Equals, 1)
  214. }
  215. func (s *DockerSwarmSuite) TestAPISwarmServicesUpdate(c *check.C) {
  216. const nodeCount = 3
  217. var daemons [nodeCount]*SwarmDaemon
  218. for i := 0; i < nodeCount; i++ {
  219. daemons[i] = s.AddDaemon(c, true, i == 0)
  220. }
  221. // wait for nodes ready
  222. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  223. // service image at start
  224. image1 := "busybox:latest"
  225. // target image in update
  226. image2 := "busybox:test"
  227. // create a different tag
  228. for _, d := range daemons {
  229. out, err := d.Cmd("tag", image1, image2)
  230. c.Assert(err, checker.IsNil, check.Commentf(out))
  231. }
  232. // create service
  233. instances := 5
  234. parallelism := 2
  235. id := daemons[0].createService(c, serviceForUpdate, setInstances(instances))
  236. // wait for tasks ready
  237. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  238. map[string]int{image1: instances})
  239. // issue service update
  240. service := daemons[0].getService(c, id)
  241. daemons[0].updateService(c, service, setImage(image2))
  242. // first batch
  243. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  244. map[string]int{image1: instances - parallelism, image2: parallelism})
  245. // 2nd batch
  246. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  247. map[string]int{image1: instances - 2*parallelism, image2: 2 * parallelism})
  248. // 3nd batch
  249. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  250. map[string]int{image2: instances})
  251. // Roll back to the previous version. This uses the CLI because
  252. // rollback is a client-side operation.
  253. out, err := daemons[0].Cmd("service", "update", "--rollback", id)
  254. c.Assert(err, checker.IsNil, check.Commentf(out))
  255. // first batch
  256. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  257. map[string]int{image2: instances - parallelism, image1: parallelism})
  258. // 2nd batch
  259. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  260. map[string]int{image2: instances - 2*parallelism, image1: 2 * parallelism})
  261. // 3nd batch
  262. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  263. map[string]int{image1: instances})
  264. }
  265. func (s *DockerSwarmSuite) TestAPISwarmServicesFailedUpdate(c *check.C) {
  266. const nodeCount = 3
  267. var daemons [nodeCount]*SwarmDaemon
  268. for i := 0; i < nodeCount; i++ {
  269. daemons[i] = s.AddDaemon(c, true, i == 0)
  270. }
  271. // wait for nodes ready
  272. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  273. // service image at start
  274. image1 := "busybox:latest"
  275. // target image in update
  276. image2 := "busybox:badtag"
  277. // create service
  278. instances := 5
  279. id := daemons[0].createService(c, serviceForUpdate, setInstances(instances))
  280. // wait for tasks ready
  281. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  282. map[string]int{image1: instances})
  283. // issue service update
  284. service := daemons[0].getService(c, id)
  285. daemons[0].updateService(c, service, setImage(image2), setFailureAction(swarm.UpdateFailureActionPause), setMaxFailureRatio(0.25), setParallelism(1))
  286. // should update 2 tasks and then pause
  287. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceUpdateState(id), checker.Equals, swarm.UpdateStatePaused)
  288. v, _ := daemons[0].checkServiceRunningTasks(id)(c)
  289. c.Assert(v, checker.Equals, instances-2)
  290. // Roll back to the previous version. This uses the CLI because
  291. // rollback is a client-side operation.
  292. out, err := daemons[0].Cmd("service", "update", "--rollback", id)
  293. c.Assert(err, checker.IsNil, check.Commentf(out))
  294. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  295. map[string]int{image1: instances})
  296. }
  297. func (s *DockerSwarmSuite) TestAPISwarmServiceConstraintRole(c *check.C) {
  298. const nodeCount = 3
  299. var daemons [nodeCount]*SwarmDaemon
  300. for i := 0; i < nodeCount; i++ {
  301. daemons[i] = s.AddDaemon(c, true, i == 0)
  302. }
  303. // wait for nodes ready
  304. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  305. // create service
  306. constraints := []string{"node.role==worker"}
  307. instances := 3
  308. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  309. // wait for tasks ready
  310. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  311. // validate tasks are running on worker nodes
  312. tasks := daemons[0].getServiceTasks(c, id)
  313. for _, task := range tasks {
  314. node := daemons[0].getNode(c, task.NodeID)
  315. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleWorker)
  316. }
  317. //remove service
  318. daemons[0].removeService(c, id)
  319. // create service
  320. constraints = []string{"node.role!=worker"}
  321. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  322. // wait for tasks ready
  323. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  324. tasks = daemons[0].getServiceTasks(c, id)
  325. // validate tasks are running on manager nodes
  326. for _, task := range tasks {
  327. node := daemons[0].getNode(c, task.NodeID)
  328. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleManager)
  329. }
  330. //remove service
  331. daemons[0].removeService(c, id)
  332. // create service
  333. constraints = []string{"node.role==nosuchrole"}
  334. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  335. // wait for tasks created
  336. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  337. // let scheduler try
  338. time.Sleep(250 * time.Millisecond)
  339. // validate tasks are not assigned to any node
  340. tasks = daemons[0].getServiceTasks(c, id)
  341. for _, task := range tasks {
  342. c.Assert(task.NodeID, checker.Equals, "")
  343. }
  344. }
  345. func (s *DockerSwarmSuite) TestAPISwarmServiceConstraintLabel(c *check.C) {
  346. const nodeCount = 3
  347. var daemons [nodeCount]*SwarmDaemon
  348. for i := 0; i < nodeCount; i++ {
  349. daemons[i] = s.AddDaemon(c, true, i == 0)
  350. }
  351. // wait for nodes ready
  352. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  353. nodes := daemons[0].listNodes(c)
  354. c.Assert(len(nodes), checker.Equals, nodeCount)
  355. // add labels to nodes
  356. daemons[0].updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  357. n.Spec.Annotations.Labels = map[string]string{
  358. "security": "high",
  359. }
  360. })
  361. for i := 1; i < nodeCount; i++ {
  362. daemons[0].updateNode(c, nodes[i].ID, func(n *swarm.Node) {
  363. n.Spec.Annotations.Labels = map[string]string{
  364. "security": "low",
  365. }
  366. })
  367. }
  368. // create service
  369. instances := 3
  370. constraints := []string{"node.labels.security==high"}
  371. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  372. // wait for tasks ready
  373. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  374. tasks := daemons[0].getServiceTasks(c, id)
  375. // validate all tasks are running on nodes[0]
  376. for _, task := range tasks {
  377. c.Assert(task.NodeID, checker.Equals, nodes[0].ID)
  378. }
  379. //remove service
  380. daemons[0].removeService(c, id)
  381. // create service
  382. constraints = []string{"node.labels.security!=high"}
  383. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  384. // wait for tasks ready
  385. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  386. tasks = daemons[0].getServiceTasks(c, id)
  387. // validate all tasks are NOT running on nodes[0]
  388. for _, task := range tasks {
  389. c.Assert(task.NodeID, checker.Not(checker.Equals), nodes[0].ID)
  390. }
  391. //remove service
  392. daemons[0].removeService(c, id)
  393. constraints = []string{"node.labels.security==medium"}
  394. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  395. // wait for tasks created
  396. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  397. // let scheduler try
  398. time.Sleep(250 * time.Millisecond)
  399. tasks = daemons[0].getServiceTasks(c, id)
  400. // validate tasks are not assigned
  401. for _, task := range tasks {
  402. c.Assert(task.NodeID, checker.Equals, "")
  403. }
  404. //remove service
  405. daemons[0].removeService(c, id)
  406. // multiple constraints
  407. constraints = []string{
  408. "node.labels.security==high",
  409. fmt.Sprintf("node.id==%s", nodes[1].ID),
  410. }
  411. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  412. // wait for tasks created
  413. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  414. // let scheduler try
  415. time.Sleep(250 * time.Millisecond)
  416. tasks = daemons[0].getServiceTasks(c, id)
  417. // validate tasks are not assigned
  418. for _, task := range tasks {
  419. c.Assert(task.NodeID, checker.Equals, "")
  420. }
  421. // make nodes[1] fulfills the constraints
  422. daemons[0].updateNode(c, nodes[1].ID, func(n *swarm.Node) {
  423. n.Spec.Annotations.Labels = map[string]string{
  424. "security": "high",
  425. }
  426. })
  427. // wait for tasks ready
  428. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  429. tasks = daemons[0].getServiceTasks(c, id)
  430. for _, task := range tasks {
  431. c.Assert(task.NodeID, checker.Equals, nodes[1].ID)
  432. }
  433. }
  434. func (s *DockerSwarmSuite) TestAPISwarmServicesStateReporting(c *check.C) {
  435. testRequires(c, SameHostDaemon)
  436. testRequires(c, DaemonIsLinux)
  437. d1 := s.AddDaemon(c, true, true)
  438. d2 := s.AddDaemon(c, true, true)
  439. d3 := s.AddDaemon(c, true, false)
  440. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept
  441. instances := 9
  442. d1.createService(c, simpleTestService, setInstances(instances))
  443. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  444. getContainers := func() map[string]*SwarmDaemon {
  445. m := make(map[string]*SwarmDaemon)
  446. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  447. for _, id := range d.activeContainers() {
  448. m[id] = d
  449. }
  450. }
  451. return m
  452. }
  453. containers := getContainers()
  454. c.Assert(containers, checker.HasLen, instances)
  455. var toRemove string
  456. for i := range containers {
  457. toRemove = i
  458. }
  459. _, err := containers[toRemove].Cmd("stop", toRemove)
  460. c.Assert(err, checker.IsNil)
  461. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  462. containers2 := getContainers()
  463. c.Assert(containers2, checker.HasLen, instances)
  464. for i := range containers {
  465. if i == toRemove {
  466. c.Assert(containers2[i], checker.IsNil)
  467. } else {
  468. c.Assert(containers2[i], checker.NotNil)
  469. }
  470. }
  471. containers = containers2
  472. for i := range containers {
  473. toRemove = i
  474. }
  475. // try with killing process outside of docker
  476. pidStr, err := containers[toRemove].Cmd("inspect", "-f", "{{.State.Pid}}", toRemove)
  477. c.Assert(err, checker.IsNil)
  478. pid, err := strconv.Atoi(strings.TrimSpace(pidStr))
  479. c.Assert(err, checker.IsNil)
  480. c.Assert(syscall.Kill(pid, syscall.SIGKILL), checker.IsNil)
  481. time.Sleep(time.Second) // give some time to handle the signal
  482. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  483. containers2 = getContainers()
  484. c.Assert(containers2, checker.HasLen, instances)
  485. for i := range containers {
  486. if i == toRemove {
  487. c.Assert(containers2[i], checker.IsNil)
  488. } else {
  489. c.Assert(containers2[i], checker.NotNil)
  490. }
  491. }
  492. }
  493. func (s *DockerSwarmSuite) TestAPISwarmLeaderProxy(c *check.C) {
  494. // add three managers, one of these is leader
  495. d1 := s.AddDaemon(c, true, true)
  496. d2 := s.AddDaemon(c, true, true)
  497. d3 := s.AddDaemon(c, true, true)
  498. // start a service by hitting each of the 3 managers
  499. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  500. s.Spec.Name = "test1"
  501. })
  502. d2.createService(c, simpleTestService, func(s *swarm.Service) {
  503. s.Spec.Name = "test2"
  504. })
  505. d3.createService(c, simpleTestService, func(s *swarm.Service) {
  506. s.Spec.Name = "test3"
  507. })
  508. // 3 services should be started now, because the requests were proxied to leader
  509. // query each node and make sure it returns 3 services
  510. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  511. services := d.listServices(c)
  512. c.Assert(services, checker.HasLen, 3)
  513. }
  514. }
  515. func (s *DockerSwarmSuite) TestAPISwarmLeaderElection(c *check.C) {
  516. // Create 3 nodes
  517. d1 := s.AddDaemon(c, true, true)
  518. d2 := s.AddDaemon(c, true, true)
  519. d3 := s.AddDaemon(c, true, true)
  520. // assert that the first node we made is the leader, and the other two are followers
  521. c.Assert(d1.getNode(c, d1.NodeID).ManagerStatus.Leader, checker.True)
  522. c.Assert(d1.getNode(c, d2.NodeID).ManagerStatus.Leader, checker.False)
  523. c.Assert(d1.getNode(c, d3.NodeID).ManagerStatus.Leader, checker.False)
  524. d1.Stop() // stop the leader
  525. var (
  526. leader *SwarmDaemon // keep track of leader
  527. followers []*SwarmDaemon // keep track of followers
  528. )
  529. checkLeader := func(nodes ...*SwarmDaemon) checkF {
  530. return func(c *check.C) (interface{}, check.CommentInterface) {
  531. // clear these out before each run
  532. leader = nil
  533. followers = nil
  534. for _, d := range nodes {
  535. if d.getNode(c, d.NodeID).ManagerStatus.Leader {
  536. leader = d
  537. } else {
  538. followers = append(followers, d)
  539. }
  540. }
  541. if leader == nil {
  542. return false, check.Commentf("no leader elected")
  543. }
  544. return true, check.Commentf("elected %v", leader.id)
  545. }
  546. }
  547. // wait for an election to occur
  548. waitAndAssert(c, defaultReconciliationTimeout, checkLeader(d2, d3), checker.True)
  549. // assert that we have a new leader
  550. c.Assert(leader, checker.NotNil)
  551. // Keep track of the current leader, since we want that to be chosen.
  552. stableleader := leader
  553. // add the d1, the initial leader, back
  554. d1.Start()
  555. // TODO(stevvooe): may need to wait for rejoin here
  556. // wait for possible election
  557. waitAndAssert(c, defaultReconciliationTimeout, checkLeader(d1, d2, d3), checker.True)
  558. // pick out the leader and the followers again
  559. // verify that we still only have 1 leader and 2 followers
  560. c.Assert(leader, checker.NotNil)
  561. c.Assert(followers, checker.HasLen, 2)
  562. // and that after we added d1 back, the leader hasn't changed
  563. c.Assert(leader.NodeID, checker.Equals, stableleader.NodeID)
  564. }
  565. func (s *DockerSwarmSuite) TestAPISwarmRaftQuorum(c *check.C) {
  566. d1 := s.AddDaemon(c, true, true)
  567. d2 := s.AddDaemon(c, true, true)
  568. d3 := s.AddDaemon(c, true, true)
  569. d1.createService(c, simpleTestService)
  570. c.Assert(d2.Stop(), checker.IsNil)
  571. // make sure there is a leader
  572. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  573. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  574. s.Spec.Name = "top1"
  575. })
  576. c.Assert(d3.Stop(), checker.IsNil)
  577. // make sure there is a leader
  578. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  579. var service swarm.Service
  580. simpleTestService(&service)
  581. service.Spec.Name = "top2"
  582. status, out, err := d1.SockRequest("POST", "/services/create", service.Spec)
  583. c.Assert(err, checker.IsNil)
  584. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("deadline exceeded", string(out)))
  585. c.Assert(d2.Start(), checker.IsNil)
  586. // make sure there is a leader
  587. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  588. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  589. s.Spec.Name = "top3"
  590. })
  591. }
  592. func (s *DockerSwarmSuite) TestAPISwarmListNodes(c *check.C) {
  593. d1 := s.AddDaemon(c, true, true)
  594. d2 := s.AddDaemon(c, true, false)
  595. d3 := s.AddDaemon(c, true, false)
  596. nodes := d1.listNodes(c)
  597. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  598. loop0:
  599. for _, n := range nodes {
  600. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  601. if n.ID == d.NodeID {
  602. continue loop0
  603. }
  604. }
  605. c.Errorf("unknown nodeID %v", n.ID)
  606. }
  607. }
  608. func (s *DockerSwarmSuite) TestAPISwarmNodeUpdate(c *check.C) {
  609. d := s.AddDaemon(c, true, true)
  610. nodes := d.listNodes(c)
  611. d.updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  612. n.Spec.Availability = swarm.NodeAvailabilityPause
  613. })
  614. n := d.getNode(c, nodes[0].ID)
  615. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityPause)
  616. }
  617. func (s *DockerSwarmSuite) TestAPISwarmNodeRemove(c *check.C) {
  618. testRequires(c, Network)
  619. d1 := s.AddDaemon(c, true, true)
  620. d2 := s.AddDaemon(c, true, false)
  621. _ = s.AddDaemon(c, true, false)
  622. nodes := d1.listNodes(c)
  623. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  624. // Getting the info so we can take the NodeID
  625. d2Info, err := d2.info()
  626. c.Assert(err, checker.IsNil)
  627. // forceful removal of d2 should work
  628. d1.removeNode(c, d2Info.NodeID, true)
  629. nodes = d1.listNodes(c)
  630. c.Assert(len(nodes), checker.Equals, 2, check.Commentf("nodes: %#v", nodes))
  631. // Restart the node that was removed
  632. err = d2.Restart()
  633. c.Assert(err, checker.IsNil)
  634. // Give some time for the node to rejoin
  635. time.Sleep(1 * time.Second)
  636. // Make sure the node didn't rejoin
  637. nodes = d1.listNodes(c)
  638. c.Assert(len(nodes), checker.Equals, 2, check.Commentf("nodes: %#v", nodes))
  639. }
  640. func (s *DockerSwarmSuite) TestAPISwarmNodeDrainPause(c *check.C) {
  641. d1 := s.AddDaemon(c, true, true)
  642. d2 := s.AddDaemon(c, true, false)
  643. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  644. // start a service, expect balanced distribution
  645. instances := 8
  646. id := d1.createService(c, simpleTestService, setInstances(instances))
  647. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  648. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  649. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  650. // drain d2, all containers should move to d1
  651. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  652. n.Spec.Availability = swarm.NodeAvailabilityDrain
  653. })
  654. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  655. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  656. // set d2 back to active
  657. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  658. n.Spec.Availability = swarm.NodeAvailabilityActive
  659. })
  660. instances = 1
  661. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  662. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  663. instances = 8
  664. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  665. // drained node first so we don't get any old containers
  666. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  667. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  668. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  669. d2ContainerCount := len(d2.activeContainers())
  670. // set d2 to paused, scale service up, only d1 gets new tasks
  671. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  672. n.Spec.Availability = swarm.NodeAvailabilityPause
  673. })
  674. instances = 14
  675. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  676. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances-d2ContainerCount)
  677. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, d2ContainerCount)
  678. }
  679. func (s *DockerSwarmSuite) TestAPISwarmLeaveRemovesContainer(c *check.C) {
  680. d := s.AddDaemon(c, true, true)
  681. instances := 2
  682. d.createService(c, simpleTestService, setInstances(instances))
  683. id, err := d.Cmd("run", "-d", "busybox", "top")
  684. c.Assert(err, checker.IsNil)
  685. id = strings.TrimSpace(id)
  686. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances+1)
  687. c.Assert(d.Leave(false), checker.NotNil)
  688. c.Assert(d.Leave(true), checker.IsNil)
  689. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 1)
  690. id2, err := d.Cmd("ps", "-q")
  691. c.Assert(err, checker.IsNil)
  692. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  693. }
  694. // #23629
  695. func (s *DockerSwarmSuite) TestAPISwarmLeaveOnPendingJoin(c *check.C) {
  696. testRequires(c, Network)
  697. s.AddDaemon(c, true, true)
  698. d2 := s.AddDaemon(c, false, false)
  699. id, err := d2.Cmd("run", "-d", "busybox", "top")
  700. c.Assert(err, checker.IsNil)
  701. id = strings.TrimSpace(id)
  702. err = d2.Join(swarm.JoinRequest{
  703. RemoteAddrs: []string{"123.123.123.123:1234"},
  704. })
  705. c.Assert(err, check.NotNil)
  706. c.Assert(err.Error(), checker.Contains, "Timeout was reached")
  707. info, err := d2.info()
  708. c.Assert(err, checker.IsNil)
  709. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  710. c.Assert(d2.Leave(true), checker.IsNil)
  711. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  712. id2, err := d2.Cmd("ps", "-q")
  713. c.Assert(err, checker.IsNil)
  714. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  715. }
  716. // #23705
  717. func (s *DockerSwarmSuite) TestAPISwarmRestoreOnPendingJoin(c *check.C) {
  718. testRequires(c, Network)
  719. d := s.AddDaemon(c, false, false)
  720. err := d.Join(swarm.JoinRequest{
  721. RemoteAddrs: []string{"123.123.123.123:1234"},
  722. })
  723. c.Assert(err, check.NotNil)
  724. c.Assert(err.Error(), checker.Contains, "Timeout was reached")
  725. waitAndAssert(c, defaultReconciliationTimeout, d.checkLocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  726. c.Assert(d.Stop(), checker.IsNil)
  727. c.Assert(d.Start(), checker.IsNil)
  728. info, err := d.info()
  729. c.Assert(err, checker.IsNil)
  730. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  731. }
  732. func (s *DockerSwarmSuite) TestAPISwarmManagerRestore(c *check.C) {
  733. d1 := s.AddDaemon(c, true, true)
  734. instances := 2
  735. id := d1.createService(c, simpleTestService, setInstances(instances))
  736. d1.getService(c, id)
  737. d1.Stop()
  738. d1.Start()
  739. d1.getService(c, id)
  740. d2 := s.AddDaemon(c, true, true)
  741. d2.getService(c, id)
  742. d2.Stop()
  743. d2.Start()
  744. d2.getService(c, id)
  745. d3 := s.AddDaemon(c, true, true)
  746. d3.getService(c, id)
  747. d3.Stop()
  748. d3.Start()
  749. d3.getService(c, id)
  750. d3.Kill()
  751. time.Sleep(1 * time.Second) // time to handle signal
  752. d3.Start()
  753. d3.getService(c, id)
  754. }
  755. func (s *DockerSwarmSuite) TestAPISwarmScaleNoRollingUpdate(c *check.C) {
  756. d := s.AddDaemon(c, true, true)
  757. instances := 2
  758. id := d.createService(c, simpleTestService, setInstances(instances))
  759. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  760. containers := d.activeContainers()
  761. instances = 4
  762. d.updateService(c, d.getService(c, id), setInstances(instances))
  763. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  764. containers2 := d.activeContainers()
  765. loop0:
  766. for _, c1 := range containers {
  767. for _, c2 := range containers2 {
  768. if c1 == c2 {
  769. continue loop0
  770. }
  771. }
  772. c.Errorf("container %v not found in new set %#v", c1, containers2)
  773. }
  774. }
  775. func (s *DockerSwarmSuite) TestAPISwarmInvalidAddress(c *check.C) {
  776. d := s.AddDaemon(c, false, false)
  777. req := swarm.InitRequest{
  778. ListenAddr: "",
  779. }
  780. status, _, err := d.SockRequest("POST", "/swarm/init", req)
  781. c.Assert(err, checker.IsNil)
  782. c.Assert(status, checker.Equals, http.StatusBadRequest)
  783. req2 := swarm.JoinRequest{
  784. ListenAddr: "0.0.0.0:2377",
  785. RemoteAddrs: []string{""},
  786. }
  787. status, _, err = d.SockRequest("POST", "/swarm/join", req2)
  788. c.Assert(err, checker.IsNil)
  789. c.Assert(status, checker.Equals, http.StatusBadRequest)
  790. }
  791. func (s *DockerSwarmSuite) TestAPISwarmForceNewCluster(c *check.C) {
  792. d1 := s.AddDaemon(c, true, true)
  793. d2 := s.AddDaemon(c, true, true)
  794. instances := 2
  795. id := d1.createService(c, simpleTestService, setInstances(instances))
  796. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  797. // drain d2, all containers should move to d1
  798. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  799. n.Spec.Availability = swarm.NodeAvailabilityDrain
  800. })
  801. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  802. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  803. c.Assert(d2.Stop(), checker.IsNil)
  804. c.Assert(d1.Init(swarm.InitRequest{
  805. ForceNewCluster: true,
  806. Spec: swarm.Spec{},
  807. }), checker.IsNil)
  808. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  809. d3 := s.AddDaemon(c, true, true)
  810. info, err := d3.info()
  811. c.Assert(err, checker.IsNil)
  812. c.Assert(info.ControlAvailable, checker.True)
  813. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  814. instances = 4
  815. d3.updateService(c, d3.getService(c, id), setInstances(instances))
  816. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  817. }
  818. func simpleTestService(s *swarm.Service) {
  819. ureplicas := uint64(1)
  820. restartDelay := time.Duration(100 * time.Millisecond)
  821. s.Spec = swarm.ServiceSpec{
  822. TaskTemplate: swarm.TaskSpec{
  823. ContainerSpec: swarm.ContainerSpec{
  824. Image: "busybox:latest",
  825. Command: []string{"/bin/top"},
  826. },
  827. RestartPolicy: &swarm.RestartPolicy{
  828. Delay: &restartDelay,
  829. },
  830. },
  831. Mode: swarm.ServiceMode{
  832. Replicated: &swarm.ReplicatedService{
  833. Replicas: &ureplicas,
  834. },
  835. },
  836. }
  837. s.Spec.Name = "top"
  838. }
  839. func serviceForUpdate(s *swarm.Service) {
  840. ureplicas := uint64(1)
  841. restartDelay := time.Duration(100 * time.Millisecond)
  842. s.Spec = swarm.ServiceSpec{
  843. TaskTemplate: swarm.TaskSpec{
  844. ContainerSpec: swarm.ContainerSpec{
  845. Image: "busybox:latest",
  846. Command: []string{"/bin/top"},
  847. },
  848. RestartPolicy: &swarm.RestartPolicy{
  849. Delay: &restartDelay,
  850. },
  851. },
  852. Mode: swarm.ServiceMode{
  853. Replicated: &swarm.ReplicatedService{
  854. Replicas: &ureplicas,
  855. },
  856. },
  857. UpdateConfig: &swarm.UpdateConfig{
  858. Parallelism: 2,
  859. Delay: 4 * time.Second,
  860. FailureAction: swarm.UpdateFailureActionContinue,
  861. },
  862. }
  863. s.Spec.Name = "updatetest"
  864. }
  865. func setInstances(replicas int) serviceConstructor {
  866. ureplicas := uint64(replicas)
  867. return func(s *swarm.Service) {
  868. s.Spec.Mode = swarm.ServiceMode{
  869. Replicated: &swarm.ReplicatedService{
  870. Replicas: &ureplicas,
  871. },
  872. }
  873. }
  874. }
  875. func setImage(image string) serviceConstructor {
  876. return func(s *swarm.Service) {
  877. s.Spec.TaskTemplate.ContainerSpec.Image = image
  878. }
  879. }
  880. func setFailureAction(failureAction string) serviceConstructor {
  881. return func(s *swarm.Service) {
  882. s.Spec.UpdateConfig.FailureAction = failureAction
  883. }
  884. }
  885. func setMaxFailureRatio(maxFailureRatio float32) serviceConstructor {
  886. return func(s *swarm.Service) {
  887. s.Spec.UpdateConfig.MaxFailureRatio = maxFailureRatio
  888. }
  889. }
  890. func setParallelism(parallelism uint64) serviceConstructor {
  891. return func(s *swarm.Service) {
  892. s.Spec.UpdateConfig.Parallelism = parallelism
  893. }
  894. }
  895. func setConstraints(constraints []string) serviceConstructor {
  896. return func(s *swarm.Service) {
  897. if s.Spec.TaskTemplate.Placement == nil {
  898. s.Spec.TaskTemplate.Placement = &swarm.Placement{}
  899. }
  900. s.Spec.TaskTemplate.Placement.Constraints = constraints
  901. }
  902. }
  903. func setGlobalMode(s *swarm.Service) {
  904. s.Spec.Mode = swarm.ServiceMode{
  905. Global: &swarm.GlobalService{},
  906. }
  907. }
  908. func checkClusterHealth(c *check.C, cl []*SwarmDaemon, managerCount, workerCount int) {
  909. var totalMCount, totalWCount int
  910. for _, d := range cl {
  911. var (
  912. info swarm.Info
  913. err error
  914. )
  915. // check info in a waitAndAssert, because if the cluster doesn't have a leader, `info` will return an error
  916. checkInfo := func(c *check.C) (interface{}, check.CommentInterface) {
  917. info, err = d.info()
  918. return err, check.Commentf("cluster not ready in time")
  919. }
  920. waitAndAssert(c, defaultReconciliationTimeout, checkInfo, checker.IsNil)
  921. if !info.ControlAvailable {
  922. totalWCount++
  923. continue
  924. }
  925. var leaderFound bool
  926. totalMCount++
  927. var mCount, wCount int
  928. for _, n := range d.listNodes(c) {
  929. waitReady := func(c *check.C) (interface{}, check.CommentInterface) {
  930. if n.Status.State == swarm.NodeStateReady {
  931. return true, nil
  932. }
  933. nn := d.getNode(c, n.ID)
  934. n = *nn
  935. return n.Status.State == swarm.NodeStateReady, check.Commentf("state of node %s, reported by %s", n.ID, d.Info.NodeID)
  936. }
  937. waitAndAssert(c, defaultReconciliationTimeout, waitReady, checker.True)
  938. waitActive := func(c *check.C) (interface{}, check.CommentInterface) {
  939. if n.Spec.Availability == swarm.NodeAvailabilityActive {
  940. return true, nil
  941. }
  942. nn := d.getNode(c, n.ID)
  943. n = *nn
  944. return n.Spec.Availability == swarm.NodeAvailabilityActive, check.Commentf("availability of node %s, reported by %s", n.ID, d.Info.NodeID)
  945. }
  946. waitAndAssert(c, defaultReconciliationTimeout, waitActive, checker.True)
  947. if n.Spec.Role == swarm.NodeRoleManager {
  948. c.Assert(n.ManagerStatus, checker.NotNil, check.Commentf("manager status of node %s (manager), reported by %s", n.ID, d.Info.NodeID))
  949. if n.ManagerStatus.Leader {
  950. leaderFound = true
  951. }
  952. mCount++
  953. } else {
  954. c.Assert(n.ManagerStatus, checker.IsNil, check.Commentf("manager status of node %s (worker), reported by %s", n.ID, d.Info.NodeID))
  955. wCount++
  956. }
  957. }
  958. c.Assert(leaderFound, checker.True, check.Commentf("lack of leader reported by node %s", info.NodeID))
  959. c.Assert(mCount, checker.Equals, managerCount, check.Commentf("managers count reported by node %s", info.NodeID))
  960. c.Assert(wCount, checker.Equals, workerCount, check.Commentf("workers count reported by node %s", info.NodeID))
  961. }
  962. c.Assert(totalMCount, checker.Equals, managerCount)
  963. c.Assert(totalWCount, checker.Equals, workerCount)
  964. }
  965. func (s *DockerSwarmSuite) TestAPISwarmRestartCluster(c *check.C) {
  966. mCount, wCount := 5, 1
  967. var nodes []*SwarmDaemon
  968. for i := 0; i < mCount; i++ {
  969. manager := s.AddDaemon(c, true, true)
  970. info, err := manager.info()
  971. c.Assert(err, checker.IsNil)
  972. c.Assert(info.ControlAvailable, checker.True)
  973. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  974. nodes = append(nodes, manager)
  975. }
  976. for i := 0; i < wCount; i++ {
  977. worker := s.AddDaemon(c, true, false)
  978. info, err := worker.info()
  979. c.Assert(err, checker.IsNil)
  980. c.Assert(info.ControlAvailable, checker.False)
  981. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  982. nodes = append(nodes, worker)
  983. }
  984. // stop whole cluster
  985. {
  986. var wg sync.WaitGroup
  987. wg.Add(len(nodes))
  988. errs := make(chan error, len(nodes))
  989. for _, d := range nodes {
  990. go func(daemon *SwarmDaemon) {
  991. defer wg.Done()
  992. if err := daemon.Stop(); err != nil {
  993. errs <- err
  994. }
  995. if root := os.Getenv("DOCKER_REMAP_ROOT"); root != "" {
  996. daemon.root = filepath.Dir(daemon.root)
  997. }
  998. }(d)
  999. }
  1000. wg.Wait()
  1001. close(errs)
  1002. for err := range errs {
  1003. c.Assert(err, check.IsNil)
  1004. }
  1005. }
  1006. // start whole cluster
  1007. {
  1008. var wg sync.WaitGroup
  1009. wg.Add(len(nodes))
  1010. errs := make(chan error, len(nodes))
  1011. for _, d := range nodes {
  1012. go func(daemon *SwarmDaemon) {
  1013. defer wg.Done()
  1014. if err := daemon.Start("--iptables=false"); err != nil {
  1015. errs <- err
  1016. }
  1017. }(d)
  1018. }
  1019. wg.Wait()
  1020. close(errs)
  1021. for err := range errs {
  1022. c.Assert(err, check.IsNil)
  1023. }
  1024. }
  1025. checkClusterHealth(c, nodes, mCount, wCount)
  1026. }
  1027. func (s *DockerSwarmSuite) TestAPISwarmServicesUpdateWithName(c *check.C) {
  1028. d := s.AddDaemon(c, true, true)
  1029. instances := 2
  1030. id := d.createService(c, simpleTestService, setInstances(instances))
  1031. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  1032. service := d.getService(c, id)
  1033. instances = 5
  1034. setInstances(instances)(service)
  1035. url := fmt.Sprintf("/services/%s/update?version=%d", service.Spec.Name, service.Version.Index)
  1036. status, out, err := d.SockRequest("POST", url, service.Spec)
  1037. c.Assert(err, checker.IsNil)
  1038. c.Assert(status, checker.Equals, http.StatusOK, check.Commentf("output: %q", string(out)))
  1039. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  1040. }
  1041. func (s *DockerSwarmSuite) TestAPISwarmSecretsEmptyList(c *check.C) {
  1042. d := s.AddDaemon(c, true, true)
  1043. secrets := d.listSecrets(c)
  1044. c.Assert(secrets, checker.NotNil)
  1045. c.Assert(len(secrets), checker.Equals, 0, check.Commentf("secrets: %#v", secrets))
  1046. }
  1047. func (s *DockerSwarmSuite) TestAPISwarmSecretsCreate(c *check.C) {
  1048. d := s.AddDaemon(c, true, true)
  1049. testName := "test_secret"
  1050. id := d.createSecret(c, swarm.SecretSpec{
  1051. swarm.Annotations{
  1052. Name: testName,
  1053. },
  1054. []byte("TESTINGDATA"),
  1055. })
  1056. c.Assert(id, checker.Not(checker.Equals), "", check.Commentf("secrets: %s", id))
  1057. secrets := d.listSecrets(c)
  1058. c.Assert(len(secrets), checker.Equals, 1, check.Commentf("secrets: %#v", secrets))
  1059. name := secrets[0].Spec.Annotations.Name
  1060. c.Assert(name, checker.Equals, testName, check.Commentf("secret: %s", name))
  1061. }
  1062. func (s *DockerSwarmSuite) TestAPISwarmSecretsDelete(c *check.C) {
  1063. d := s.AddDaemon(c, true, true)
  1064. testName := "test_secret"
  1065. id := d.createSecret(c, swarm.SecretSpec{
  1066. swarm.Annotations{
  1067. Name: testName,
  1068. },
  1069. []byte("TESTINGDATA"),
  1070. })
  1071. c.Assert(id, checker.Not(checker.Equals), "", check.Commentf("secrets: %s", id))
  1072. secret := d.getSecret(c, id)
  1073. c.Assert(secret.ID, checker.Equals, id, check.Commentf("secret: %v", secret))
  1074. d.deleteSecret(c, secret.ID)
  1075. status, out, err := d.SockRequest("GET", "/secrets/"+id, nil)
  1076. c.Assert(err, checker.IsNil)
  1077. c.Assert(status, checker.Equals, http.StatusNotFound, check.Commentf("secret delete: %s", string(out)))
  1078. }
  1079. // Test case for 30242, where duplicate networks, with different drivers `bridge` and `overlay`,
  1080. // caused both scopes to be `swarm` for `docker network inspect` and `docker network ls`.
  1081. // This test makes sure the fixes correctly output scopes instead.
  1082. func (s *DockerSwarmSuite) TestAPIDuplicateNetworks(c *check.C) {
  1083. d := s.AddDaemon(c, true, true)
  1084. name := "foo"
  1085. networkCreateRequest := types.NetworkCreateRequest{
  1086. Name: name,
  1087. NetworkCreate: types.NetworkCreate{
  1088. CheckDuplicate: false,
  1089. },
  1090. }
  1091. var n1 types.NetworkCreateResponse
  1092. networkCreateRequest.NetworkCreate.Driver = "bridge"
  1093. status, out, err := d.SockRequest("POST", "/networks/create", networkCreateRequest)
  1094. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1095. c.Assert(status, checker.Equals, http.StatusCreated, check.Commentf(string(out)))
  1096. c.Assert(json.Unmarshal(out, &n1), checker.IsNil)
  1097. var n2 types.NetworkCreateResponse
  1098. networkCreateRequest.NetworkCreate.Driver = "overlay"
  1099. status, out, err = d.SockRequest("POST", "/networks/create", networkCreateRequest)
  1100. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1101. c.Assert(status, checker.Equals, http.StatusCreated, check.Commentf(string(out)))
  1102. c.Assert(json.Unmarshal(out, &n2), checker.IsNil)
  1103. var r1 types.NetworkResource
  1104. status, out, err = d.SockRequest("GET", "/networks/"+n1.ID, nil)
  1105. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1106. c.Assert(status, checker.Equals, http.StatusOK, check.Commentf(string(out)))
  1107. c.Assert(json.Unmarshal(out, &r1), checker.IsNil)
  1108. c.Assert(r1.Scope, checker.Equals, "local")
  1109. var r2 types.NetworkResource
  1110. status, out, err = d.SockRequest("GET", "/networks/"+n2.ID, nil)
  1111. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1112. c.Assert(status, checker.Equals, http.StatusOK, check.Commentf(string(out)))
  1113. c.Assert(json.Unmarshal(out, &r2), checker.IsNil)
  1114. c.Assert(r2.Scope, checker.Equals, "swarm")
  1115. }
  1116. // Test case for 30178
  1117. func (s *DockerSwarmSuite) TestAPISwarmHealthcheckNone(c *check.C) {
  1118. d := s.AddDaemon(c, true, true)
  1119. out, err := d.Cmd("network", "create", "-d", "overlay", "lb")
  1120. c.Assert(err, checker.IsNil, check.Commentf(out))
  1121. instances := 1
  1122. d.createService(c, simpleTestService, setInstances(instances), func(s *swarm.Service) {
  1123. s.Spec.TaskTemplate.ContainerSpec.Healthcheck = &container.HealthConfig{}
  1124. s.Spec.TaskTemplate.Networks = []swarm.NetworkAttachmentConfig{
  1125. {Target: "lb"},
  1126. }
  1127. })
  1128. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  1129. containers := d.activeContainers()
  1130. out, err = d.Cmd("exec", containers[0], "ping", "-c1", "-W3", "top")
  1131. c.Assert(err, checker.IsNil, check.Commentf(out))
  1132. }