docker_api_swarm_test.go 45 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367
  1. // +build !windows
  2. package main
  3. import (
  4. "encoding/json"
  5. "fmt"
  6. "net/http"
  7. "os"
  8. "path/filepath"
  9. "strconv"
  10. "strings"
  11. "sync"
  12. "syscall"
  13. "time"
  14. "github.com/docker/docker/api/types"
  15. "github.com/docker/docker/api/types/swarm"
  16. "github.com/docker/docker/pkg/integration/checker"
  17. "github.com/go-check/check"
  18. )
  // defaultReconciliationTimeout is the timeout the tests in this file hand to
  // waitAndAssert while polling for the swarm to reach an expected state.
  var defaultReconciliationTimeout = time.Second * 30
  20. func (s *DockerSwarmSuite) TestAPISwarmInit(c *check.C) {
  21. // todo: should find a better way to verify that components are running than /info
  22. d1 := s.AddDaemon(c, true, true)
  23. info, err := d1.info()
  24. c.Assert(err, checker.IsNil)
  25. c.Assert(info.ControlAvailable, checker.True)
  26. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  27. d2 := s.AddDaemon(c, true, false)
  28. info, err = d2.info()
  29. c.Assert(err, checker.IsNil)
  30. c.Assert(info.ControlAvailable, checker.False)
  31. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  32. // Leaving cluster
  33. c.Assert(d2.Leave(false), checker.IsNil)
  34. info, err = d2.info()
  35. c.Assert(err, checker.IsNil)
  36. c.Assert(info.ControlAvailable, checker.False)
  37. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  38. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: d1.joinTokens(c).Worker, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  39. info, err = d2.info()
  40. c.Assert(err, checker.IsNil)
  41. c.Assert(info.ControlAvailable, checker.False)
  42. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  43. // Current state restoring after restarts
  44. err = d1.Stop()
  45. c.Assert(err, checker.IsNil)
  46. err = d2.Stop()
  47. c.Assert(err, checker.IsNil)
  48. err = d1.Start()
  49. c.Assert(err, checker.IsNil)
  50. err = d2.Start()
  51. c.Assert(err, checker.IsNil)
  52. info, err = d1.info()
  53. c.Assert(err, checker.IsNil)
  54. c.Assert(info.ControlAvailable, checker.True)
  55. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  56. info, err = d2.info()
  57. c.Assert(err, checker.IsNil)
  58. c.Assert(info.ControlAvailable, checker.False)
  59. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  60. }
  61. func (s *DockerSwarmSuite) TestAPISwarmJoinToken(c *check.C) {
  62. d1 := s.AddDaemon(c, false, false)
  63. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  64. d2 := s.AddDaemon(c, false, false)
  65. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  66. c.Assert(err, checker.NotNil)
  67. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  68. info, err := d2.info()
  69. c.Assert(err, checker.IsNil)
  70. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  71. err = d2.Join(swarm.JoinRequest{JoinToken: "foobaz", RemoteAddrs: []string{d1.listenAddr}})
  72. c.Assert(err, checker.NotNil)
  73. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  74. info, err = d2.info()
  75. c.Assert(err, checker.IsNil)
  76. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  77. workerToken := d1.joinTokens(c).Worker
  78. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  79. info, err = d2.info()
  80. c.Assert(err, checker.IsNil)
  81. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  82. c.Assert(d2.Leave(false), checker.IsNil)
  83. info, err = d2.info()
  84. c.Assert(err, checker.IsNil)
  85. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  86. // change tokens
  87. d1.rotateTokens(c)
  88. err = d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}})
  89. c.Assert(err, checker.NotNil)
  90. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  91. info, err = d2.info()
  92. c.Assert(err, checker.IsNil)
  93. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  94. workerToken = d1.joinTokens(c).Worker
  95. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  96. info, err = d2.info()
  97. c.Assert(err, checker.IsNil)
  98. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  99. c.Assert(d2.Leave(false), checker.IsNil)
  100. info, err = d2.info()
  101. c.Assert(err, checker.IsNil)
  102. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  103. // change spec, don't change tokens
  104. d1.updateSwarm(c, func(s *swarm.Spec) {})
  105. err = d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  106. c.Assert(err, checker.NotNil)
  107. c.Assert(err.Error(), checker.Contains, "join token is necessary")
  108. info, err = d2.info()
  109. c.Assert(err, checker.IsNil)
  110. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  111. c.Assert(d2.Join(swarm.JoinRequest{JoinToken: workerToken, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  112. info, err = d2.info()
  113. c.Assert(err, checker.IsNil)
  114. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  115. c.Assert(d2.Leave(false), checker.IsNil)
  116. info, err = d2.info()
  117. c.Assert(err, checker.IsNil)
  118. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  119. }
  120. func (s *DockerSwarmSuite) TestAPISwarmCAHash(c *check.C) {
  121. d1 := s.AddDaemon(c, true, true)
  122. d2 := s.AddDaemon(c, false, false)
  123. splitToken := strings.Split(d1.joinTokens(c).Worker, "-")
  124. splitToken[2] = "1kxftv4ofnc6mt30lmgipg6ngf9luhwqopfk1tz6bdmnkubg0e"
  125. replacementToken := strings.Join(splitToken, "-")
  126. err := d2.Join(swarm.JoinRequest{JoinToken: replacementToken, RemoteAddrs: []string{d1.listenAddr}})
  127. c.Assert(err, checker.NotNil)
  128. c.Assert(err.Error(), checker.Contains, "remote CA does not match fingerprint")
  129. }
  130. func (s *DockerSwarmSuite) TestAPISwarmPromoteDemote(c *check.C) {
  131. d1 := s.AddDaemon(c, false, false)
  132. c.Assert(d1.Init(swarm.InitRequest{}), checker.IsNil)
  133. d2 := s.AddDaemon(c, true, false)
  134. info, err := d2.info()
  135. c.Assert(err, checker.IsNil)
  136. c.Assert(info.ControlAvailable, checker.False)
  137. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  138. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  139. n.Spec.Role = swarm.NodeRoleManager
  140. })
  141. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  142. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  143. n.Spec.Role = swarm.NodeRoleWorker
  144. })
  145. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.False)
  146. // Demoting last node should fail
  147. node := d1.getNode(c, d1.NodeID)
  148. node.Spec.Role = swarm.NodeRoleWorker
  149. url := fmt.Sprintf("/nodes/%s/update?version=%d", node.ID, node.Version.Index)
  150. status, out, err := d1.SockRequest("POST", url, node.Spec)
  151. c.Assert(err, checker.IsNil)
  152. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("output: %q", string(out)))
  153. c.Assert(string(out), checker.Contains, "last manager of the swarm")
  154. info, err = d1.info()
  155. c.Assert(err, checker.IsNil)
  156. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  157. c.Assert(info.ControlAvailable, checker.True)
  158. // Promote already demoted node
  159. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  160. n.Spec.Role = swarm.NodeRoleManager
  161. })
  162. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  163. }
  164. func (s *DockerSwarmSuite) TestAPISwarmServicesEmptyList(c *check.C) {
  165. d := s.AddDaemon(c, true, true)
  166. services := d.listServices(c)
  167. c.Assert(services, checker.NotNil)
  168. c.Assert(len(services), checker.Equals, 0, check.Commentf("services: %#v", services))
  169. }
  170. func (s *DockerSwarmSuite) TestAPISwarmServicesCreate(c *check.C) {
  171. d := s.AddDaemon(c, true, true)
  172. instances := 2
  173. id := d.createService(c, simpleTestService, setInstances(instances))
  174. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  175. service := d.getService(c, id)
  176. instances = 5
  177. d.updateService(c, service, setInstances(instances))
  178. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  179. d.removeService(c, service.ID)
  180. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 0)
  181. }
  182. func (s *DockerSwarmSuite) TestAPISwarmServicesMultipleAgents(c *check.C) {
  183. d1 := s.AddDaemon(c, true, true)
  184. d2 := s.AddDaemon(c, true, false)
  185. d3 := s.AddDaemon(c, true, false)
  186. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  187. instances := 9
  188. id := d1.createService(c, simpleTestService, setInstances(instances))
  189. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  190. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  191. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.GreaterThan, 0)
  192. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  193. // reconciliation on d2 node down
  194. c.Assert(d2.Stop(), checker.IsNil)
  195. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  196. // test downscaling
  197. instances = 5
  198. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  199. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  200. }
  201. func (s *DockerSwarmSuite) TestAPISwarmServicesCreateGlobal(c *check.C) {
  202. d1 := s.AddDaemon(c, true, true)
  203. d2 := s.AddDaemon(c, true, false)
  204. d3 := s.AddDaemon(c, true, false)
  205. d1.createService(c, simpleTestService, setGlobalMode)
  206. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, 1)
  207. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  208. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.Equals, 1)
  209. d4 := s.AddDaemon(c, true, false)
  210. d5 := s.AddDaemon(c, true, false)
  211. waitAndAssert(c, defaultReconciliationTimeout, d4.checkActiveContainerCount, checker.Equals, 1)
  212. waitAndAssert(c, defaultReconciliationTimeout, d5.checkActiveContainerCount, checker.Equals, 1)
  213. }
  214. func (s *DockerSwarmSuite) TestAPISwarmServicesUpdate(c *check.C) {
  215. const nodeCount = 3
  216. var daemons [nodeCount]*SwarmDaemon
  217. for i := 0; i < nodeCount; i++ {
  218. daemons[i] = s.AddDaemon(c, true, i == 0)
  219. }
  220. // wait for nodes ready
  221. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  222. // service image at start
  223. image1 := "busybox:latest"
  224. // target image in update
  225. image2 := "busybox:test"
  226. // create a different tag
  227. for _, d := range daemons {
  228. out, err := d.Cmd("tag", image1, image2)
  229. c.Assert(err, checker.IsNil, check.Commentf(out))
  230. }
  231. // create service
  232. instances := 5
  233. parallelism := 2
  234. id := daemons[0].createService(c, serviceForUpdate, setInstances(instances))
  235. // wait for tasks ready
  236. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  237. map[string]int{image1: instances})
  238. // issue service update
  239. service := daemons[0].getService(c, id)
  240. daemons[0].updateService(c, service, setImage(image2))
  241. // first batch
  242. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  243. map[string]int{image1: instances - parallelism, image2: parallelism})
  244. // 2nd batch
  245. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  246. map[string]int{image1: instances - 2*parallelism, image2: 2 * parallelism})
  247. // 3nd batch
  248. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  249. map[string]int{image2: instances})
  250. // Roll back to the previous version. This uses the CLI because
  251. // rollback is a client-side operation.
  252. out, err := daemons[0].Cmd("service", "update", "--rollback", id)
  253. c.Assert(err, checker.IsNil, check.Commentf(out))
  254. // first batch
  255. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  256. map[string]int{image2: instances - parallelism, image1: parallelism})
  257. // 2nd batch
  258. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  259. map[string]int{image2: instances - 2*parallelism, image1: 2 * parallelism})
  260. // 3nd batch
  261. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  262. map[string]int{image1: instances})
  263. }
  264. func (s *DockerSwarmSuite) TestAPISwarmServicesFailedUpdate(c *check.C) {
  265. const nodeCount = 3
  266. var daemons [nodeCount]*SwarmDaemon
  267. for i := 0; i < nodeCount; i++ {
  268. daemons[i] = s.AddDaemon(c, true, i == 0)
  269. }
  270. // wait for nodes ready
  271. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  272. // service image at start
  273. image1 := "busybox:latest"
  274. // target image in update
  275. image2 := "busybox:badtag"
  276. // create service
  277. instances := 5
  278. id := daemons[0].createService(c, serviceForUpdate, setInstances(instances))
  279. // wait for tasks ready
  280. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  281. map[string]int{image1: instances})
  282. // issue service update
  283. service := daemons[0].getService(c, id)
  284. daemons[0].updateService(c, service, setImage(image2), setFailureAction(swarm.UpdateFailureActionPause), setMaxFailureRatio(0.25), setParallelism(1))
  285. // should update 2 tasks and then pause
  286. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceUpdateState(id), checker.Equals, swarm.UpdateStatePaused)
  287. v, _ := daemons[0].checkServiceRunningTasks(id)(c)
  288. c.Assert(v, checker.Equals, instances-2)
  289. // Roll back to the previous version. This uses the CLI because
  290. // rollback is a client-side operation.
  291. out, err := daemons[0].Cmd("service", "update", "--rollback", id)
  292. c.Assert(err, checker.IsNil, check.Commentf(out))
  293. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkRunningTaskImages, checker.DeepEquals,
  294. map[string]int{image1: instances})
  295. }
  296. func (s *DockerSwarmSuite) TestAPISwarmServiceConstraintRole(c *check.C) {
  297. const nodeCount = 3
  298. var daemons [nodeCount]*SwarmDaemon
  299. for i := 0; i < nodeCount; i++ {
  300. daemons[i] = s.AddDaemon(c, true, i == 0)
  301. }
  302. // wait for nodes ready
  303. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  304. // create service
  305. constraints := []string{"node.role==worker"}
  306. instances := 3
  307. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  308. // wait for tasks ready
  309. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  310. // validate tasks are running on worker nodes
  311. tasks := daemons[0].getServiceTasks(c, id)
  312. for _, task := range tasks {
  313. node := daemons[0].getNode(c, task.NodeID)
  314. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleWorker)
  315. }
  316. //remove service
  317. daemons[0].removeService(c, id)
  318. // create service
  319. constraints = []string{"node.role!=worker"}
  320. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  321. // wait for tasks ready
  322. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  323. tasks = daemons[0].getServiceTasks(c, id)
  324. // validate tasks are running on manager nodes
  325. for _, task := range tasks {
  326. node := daemons[0].getNode(c, task.NodeID)
  327. c.Assert(node.Spec.Role, checker.Equals, swarm.NodeRoleManager)
  328. }
  329. //remove service
  330. daemons[0].removeService(c, id)
  331. // create service
  332. constraints = []string{"node.role==nosuchrole"}
  333. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  334. // wait for tasks created
  335. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  336. // let scheduler try
  337. time.Sleep(250 * time.Millisecond)
  338. // validate tasks are not assigned to any node
  339. tasks = daemons[0].getServiceTasks(c, id)
  340. for _, task := range tasks {
  341. c.Assert(task.NodeID, checker.Equals, "")
  342. }
  343. }
  344. func (s *DockerSwarmSuite) TestAPISwarmServiceConstraintLabel(c *check.C) {
  345. const nodeCount = 3
  346. var daemons [nodeCount]*SwarmDaemon
  347. for i := 0; i < nodeCount; i++ {
  348. daemons[i] = s.AddDaemon(c, true, i == 0)
  349. }
  350. // wait for nodes ready
  351. waitAndAssert(c, 5*time.Second, daemons[0].checkNodeReadyCount, checker.Equals, nodeCount)
  352. nodes := daemons[0].listNodes(c)
  353. c.Assert(len(nodes), checker.Equals, nodeCount)
  354. // add labels to nodes
  355. daemons[0].updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  356. n.Spec.Annotations.Labels = map[string]string{
  357. "security": "high",
  358. }
  359. })
  360. for i := 1; i < nodeCount; i++ {
  361. daemons[0].updateNode(c, nodes[i].ID, func(n *swarm.Node) {
  362. n.Spec.Annotations.Labels = map[string]string{
  363. "security": "low",
  364. }
  365. })
  366. }
  367. // create service
  368. instances := 3
  369. constraints := []string{"node.labels.security==high"}
  370. id := daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  371. // wait for tasks ready
  372. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  373. tasks := daemons[0].getServiceTasks(c, id)
  374. // validate all tasks are running on nodes[0]
  375. for _, task := range tasks {
  376. c.Assert(task.NodeID, checker.Equals, nodes[0].ID)
  377. }
  378. //remove service
  379. daemons[0].removeService(c, id)
  380. // create service
  381. constraints = []string{"node.labels.security!=high"}
  382. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  383. // wait for tasks ready
  384. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  385. tasks = daemons[0].getServiceTasks(c, id)
  386. // validate all tasks are NOT running on nodes[0]
  387. for _, task := range tasks {
  388. c.Assert(task.NodeID, checker.Not(checker.Equals), nodes[0].ID)
  389. }
  390. //remove service
  391. daemons[0].removeService(c, id)
  392. constraints = []string{"node.labels.security==medium"}
  393. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  394. // wait for tasks created
  395. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  396. // let scheduler try
  397. time.Sleep(250 * time.Millisecond)
  398. tasks = daemons[0].getServiceTasks(c, id)
  399. // validate tasks are not assigned
  400. for _, task := range tasks {
  401. c.Assert(task.NodeID, checker.Equals, "")
  402. }
  403. //remove service
  404. daemons[0].removeService(c, id)
  405. // multiple constraints
  406. constraints = []string{
  407. "node.labels.security==high",
  408. fmt.Sprintf("node.id==%s", nodes[1].ID),
  409. }
  410. id = daemons[0].createService(c, simpleTestService, setConstraints(constraints), setInstances(instances))
  411. // wait for tasks created
  412. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceTasks(id), checker.Equals, instances)
  413. // let scheduler try
  414. time.Sleep(250 * time.Millisecond)
  415. tasks = daemons[0].getServiceTasks(c, id)
  416. // validate tasks are not assigned
  417. for _, task := range tasks {
  418. c.Assert(task.NodeID, checker.Equals, "")
  419. }
  420. // make nodes[1] fulfills the constraints
  421. daemons[0].updateNode(c, nodes[1].ID, func(n *swarm.Node) {
  422. n.Spec.Annotations.Labels = map[string]string{
  423. "security": "high",
  424. }
  425. })
  426. // wait for tasks ready
  427. waitAndAssert(c, defaultReconciliationTimeout, daemons[0].checkServiceRunningTasks(id), checker.Equals, instances)
  428. tasks = daemons[0].getServiceTasks(c, id)
  429. for _, task := range tasks {
  430. c.Assert(task.NodeID, checker.Equals, nodes[1].ID)
  431. }
  432. }
  433. func (s *DockerSwarmSuite) TestAPISwarmServicesStateReporting(c *check.C) {
  434. testRequires(c, SameHostDaemon)
  435. testRequires(c, DaemonIsLinux)
  436. d1 := s.AddDaemon(c, true, true)
  437. d2 := s.AddDaemon(c, true, true)
  438. d3 := s.AddDaemon(c, true, false)
  439. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept
  440. instances := 9
  441. d1.createService(c, simpleTestService, setInstances(instances))
  442. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  443. getContainers := func() map[string]*SwarmDaemon {
  444. m := make(map[string]*SwarmDaemon)
  445. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  446. for _, id := range d.activeContainers() {
  447. m[id] = d
  448. }
  449. }
  450. return m
  451. }
  452. containers := getContainers()
  453. c.Assert(containers, checker.HasLen, instances)
  454. var toRemove string
  455. for i := range containers {
  456. toRemove = i
  457. }
  458. _, err := containers[toRemove].Cmd("stop", toRemove)
  459. c.Assert(err, checker.IsNil)
  460. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  461. containers2 := getContainers()
  462. c.Assert(containers2, checker.HasLen, instances)
  463. for i := range containers {
  464. if i == toRemove {
  465. c.Assert(containers2[i], checker.IsNil)
  466. } else {
  467. c.Assert(containers2[i], checker.NotNil)
  468. }
  469. }
  470. containers = containers2
  471. for i := range containers {
  472. toRemove = i
  473. }
  474. // try with killing process outside of docker
  475. pidStr, err := containers[toRemove].Cmd("inspect", "-f", "{{.State.Pid}}", toRemove)
  476. c.Assert(err, checker.IsNil)
  477. pid, err := strconv.Atoi(strings.TrimSpace(pidStr))
  478. c.Assert(err, checker.IsNil)
  479. c.Assert(syscall.Kill(pid, syscall.SIGKILL), checker.IsNil)
  480. time.Sleep(time.Second) // give some time to handle the signal
  481. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  482. containers2 = getContainers()
  483. c.Assert(containers2, checker.HasLen, instances)
  484. for i := range containers {
  485. if i == toRemove {
  486. c.Assert(containers2[i], checker.IsNil)
  487. } else {
  488. c.Assert(containers2[i], checker.NotNil)
  489. }
  490. }
  491. }
  492. func (s *DockerSwarmSuite) TestAPISwarmLeaderProxy(c *check.C) {
  493. // add three managers, one of these is leader
  494. d1 := s.AddDaemon(c, true, true)
  495. d2 := s.AddDaemon(c, true, true)
  496. d3 := s.AddDaemon(c, true, true)
  497. // start a service by hitting each of the 3 managers
  498. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  499. s.Spec.Name = "test1"
  500. })
  501. d2.createService(c, simpleTestService, func(s *swarm.Service) {
  502. s.Spec.Name = "test2"
  503. })
  504. d3.createService(c, simpleTestService, func(s *swarm.Service) {
  505. s.Spec.Name = "test3"
  506. })
  507. // 3 services should be started now, because the requests were proxied to leader
  508. // query each node and make sure it returns 3 services
  509. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  510. services := d.listServices(c)
  511. c.Assert(services, checker.HasLen, 3)
  512. }
  513. }
  514. func (s *DockerSwarmSuite) TestAPISwarmLeaderElection(c *check.C) {
  515. // Create 3 nodes
  516. d1 := s.AddDaemon(c, true, true)
  517. d2 := s.AddDaemon(c, true, true)
  518. d3 := s.AddDaemon(c, true, true)
  519. // assert that the first node we made is the leader, and the other two are followers
  520. c.Assert(d1.getNode(c, d1.NodeID).ManagerStatus.Leader, checker.True)
  521. c.Assert(d1.getNode(c, d2.NodeID).ManagerStatus.Leader, checker.False)
  522. c.Assert(d1.getNode(c, d3.NodeID).ManagerStatus.Leader, checker.False)
  523. d1.Stop() // stop the leader
  524. var (
  525. leader *SwarmDaemon // keep track of leader
  526. followers []*SwarmDaemon // keep track of followers
  527. )
  528. checkLeader := func(nodes ...*SwarmDaemon) checkF {
  529. return func(c *check.C) (interface{}, check.CommentInterface) {
  530. // clear these out before each run
  531. leader = nil
  532. followers = nil
  533. for _, d := range nodes {
  534. if d.getNode(c, d.NodeID).ManagerStatus.Leader {
  535. leader = d
  536. } else {
  537. followers = append(followers, d)
  538. }
  539. }
  540. if leader == nil {
  541. return false, check.Commentf("no leader elected")
  542. }
  543. return true, check.Commentf("elected %v", leader.id)
  544. }
  545. }
  546. // wait for an election to occur
  547. waitAndAssert(c, defaultReconciliationTimeout, checkLeader(d2, d3), checker.True)
  548. // assert that we have a new leader
  549. c.Assert(leader, checker.NotNil)
  550. // Keep track of the current leader, since we want that to be chosen.
  551. stableleader := leader
  552. // add the d1, the initial leader, back
  553. d1.Start()
  554. // TODO(stevvooe): may need to wait for rejoin here
  555. // wait for possible election
  556. waitAndAssert(c, defaultReconciliationTimeout, checkLeader(d1, d2, d3), checker.True)
  557. // pick out the leader and the followers again
  558. // verify that we still only have 1 leader and 2 followers
  559. c.Assert(leader, checker.NotNil)
  560. c.Assert(followers, checker.HasLen, 2)
  561. // and that after we added d1 back, the leader hasn't changed
  562. c.Assert(leader.NodeID, checker.Equals, stableleader.NodeID)
  563. }
  564. func (s *DockerSwarmSuite) TestAPISwarmRaftQuorum(c *check.C) {
  565. d1 := s.AddDaemon(c, true, true)
  566. d2 := s.AddDaemon(c, true, true)
  567. d3 := s.AddDaemon(c, true, true)
  568. d1.createService(c, simpleTestService)
  569. c.Assert(d2.Stop(), checker.IsNil)
  570. // make sure there is a leader
  571. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  572. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  573. s.Spec.Name = "top1"
  574. })
  575. c.Assert(d3.Stop(), checker.IsNil)
  576. // make sure there is a leader
  577. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  578. var service swarm.Service
  579. simpleTestService(&service)
  580. service.Spec.Name = "top2"
  581. status, out, err := d1.SockRequest("POST", "/services/create", service.Spec)
  582. c.Assert(err, checker.IsNil)
  583. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("deadline exceeded", string(out)))
  584. c.Assert(d2.Start(), checker.IsNil)
  585. // make sure there is a leader
  586. waitAndAssert(c, defaultReconciliationTimeout, d1.checkLeader, checker.IsNil)
  587. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  588. s.Spec.Name = "top3"
  589. })
  590. }
  591. func (s *DockerSwarmSuite) TestAPISwarmListNodes(c *check.C) {
  592. d1 := s.AddDaemon(c, true, true)
  593. d2 := s.AddDaemon(c, true, false)
  594. d3 := s.AddDaemon(c, true, false)
  595. nodes := d1.listNodes(c)
  596. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  597. loop0:
  598. for _, n := range nodes {
  599. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  600. if n.ID == d.NodeID {
  601. continue loop0
  602. }
  603. }
  604. c.Errorf("unknown nodeID %v", n.ID)
  605. }
  606. }
  607. func (s *DockerSwarmSuite) TestAPISwarmNodeUpdate(c *check.C) {
  608. d := s.AddDaemon(c, true, true)
  609. nodes := d.listNodes(c)
  610. d.updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  611. n.Spec.Availability = swarm.NodeAvailabilityPause
  612. })
  613. n := d.getNode(c, nodes[0].ID)
  614. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityPause)
  615. }
  616. func (s *DockerSwarmSuite) TestAPISwarmNodeRemove(c *check.C) {
  617. testRequires(c, Network)
  618. d1 := s.AddDaemon(c, true, true)
  619. d2 := s.AddDaemon(c, true, false)
  620. _ = s.AddDaemon(c, true, false)
  621. nodes := d1.listNodes(c)
  622. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  623. // Getting the info so we can take the NodeID
  624. d2Info, err := d2.info()
  625. c.Assert(err, checker.IsNil)
  626. // forceful removal of d2 should work
  627. d1.removeNode(c, d2Info.NodeID, true)
  628. nodes = d1.listNodes(c)
  629. c.Assert(len(nodes), checker.Equals, 2, check.Commentf("nodes: %#v", nodes))
  630. // Restart the node that was removed
  631. err = d2.Restart()
  632. c.Assert(err, checker.IsNil)
  633. // Give some time for the node to rejoin
  634. time.Sleep(1 * time.Second)
  635. // Make sure the node didn't rejoin
  636. nodes = d1.listNodes(c)
  637. c.Assert(len(nodes), checker.Equals, 2, check.Commentf("nodes: %#v", nodes))
  638. }
  639. func (s *DockerSwarmSuite) TestAPISwarmNodeDrainPause(c *check.C) {
  640. d1 := s.AddDaemon(c, true, true)
  641. d2 := s.AddDaemon(c, true, false)
  642. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  643. // start a service, expect balanced distribution
  644. instances := 8
  645. id := d1.createService(c, simpleTestService, setInstances(instances))
  646. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  647. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  648. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  649. // drain d2, all containers should move to d1
  650. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  651. n.Spec.Availability = swarm.NodeAvailabilityDrain
  652. })
  653. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  654. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  655. // set d2 back to active
  656. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  657. n.Spec.Availability = swarm.NodeAvailabilityActive
  658. })
  659. instances = 1
  660. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  661. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  662. instances = 8
  663. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  664. // drained node first so we don't get any old containers
  665. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  666. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  667. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  668. d2ContainerCount := len(d2.activeContainers())
  669. // set d2 to paused, scale service up, only d1 gets new tasks
  670. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  671. n.Spec.Availability = swarm.NodeAvailabilityPause
  672. })
  673. instances = 14
  674. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  675. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances-d2ContainerCount)
  676. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, d2ContainerCount)
  677. }
  678. func (s *DockerSwarmSuite) TestAPISwarmLeaveRemovesContainer(c *check.C) {
  679. d := s.AddDaemon(c, true, true)
  680. instances := 2
  681. d.createService(c, simpleTestService, setInstances(instances))
  682. id, err := d.Cmd("run", "-d", "busybox", "top")
  683. c.Assert(err, checker.IsNil)
  684. id = strings.TrimSpace(id)
  685. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances+1)
  686. c.Assert(d.Leave(false), checker.NotNil)
  687. c.Assert(d.Leave(true), checker.IsNil)
  688. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 1)
  689. id2, err := d.Cmd("ps", "-q")
  690. c.Assert(err, checker.IsNil)
  691. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  692. }
  693. // #23629
  694. func (s *DockerSwarmSuite) TestAPISwarmLeaveOnPendingJoin(c *check.C) {
  695. testRequires(c, Network)
  696. s.AddDaemon(c, true, true)
  697. d2 := s.AddDaemon(c, false, false)
  698. id, err := d2.Cmd("run", "-d", "busybox", "top")
  699. c.Assert(err, checker.IsNil)
  700. id = strings.TrimSpace(id)
  701. err = d2.Join(swarm.JoinRequest{
  702. RemoteAddrs: []string{"123.123.123.123:1234"},
  703. })
  704. c.Assert(err, check.NotNil)
  705. c.Assert(err.Error(), checker.Contains, "Timeout was reached")
  706. info, err := d2.info()
  707. c.Assert(err, checker.IsNil)
  708. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  709. c.Assert(d2.Leave(true), checker.IsNil)
  710. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  711. id2, err := d2.Cmd("ps", "-q")
  712. c.Assert(err, checker.IsNil)
  713. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  714. }
  715. // #23705
  716. func (s *DockerSwarmSuite) TestAPISwarmRestoreOnPendingJoin(c *check.C) {
  717. testRequires(c, Network)
  718. d := s.AddDaemon(c, false, false)
  719. err := d.Join(swarm.JoinRequest{
  720. RemoteAddrs: []string{"123.123.123.123:1234"},
  721. })
  722. c.Assert(err, check.NotNil)
  723. c.Assert(err.Error(), checker.Contains, "Timeout was reached")
  724. waitAndAssert(c, defaultReconciliationTimeout, d.checkLocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  725. c.Assert(d.Stop(), checker.IsNil)
  726. c.Assert(d.Start(), checker.IsNil)
  727. info, err := d.info()
  728. c.Assert(err, checker.IsNil)
  729. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  730. }
  731. func (s *DockerSwarmSuite) TestAPISwarmManagerRestore(c *check.C) {
  732. d1 := s.AddDaemon(c, true, true)
  733. instances := 2
  734. id := d1.createService(c, simpleTestService, setInstances(instances))
  735. d1.getService(c, id)
  736. d1.Stop()
  737. d1.Start()
  738. d1.getService(c, id)
  739. d2 := s.AddDaemon(c, true, true)
  740. d2.getService(c, id)
  741. d2.Stop()
  742. d2.Start()
  743. d2.getService(c, id)
  744. d3 := s.AddDaemon(c, true, true)
  745. d3.getService(c, id)
  746. d3.Stop()
  747. d3.Start()
  748. d3.getService(c, id)
  749. d3.Kill()
  750. time.Sleep(1 * time.Second) // time to handle signal
  751. d3.Start()
  752. d3.getService(c, id)
  753. }
  754. func (s *DockerSwarmSuite) TestAPISwarmScaleNoRollingUpdate(c *check.C) {
  755. d := s.AddDaemon(c, true, true)
  756. instances := 2
  757. id := d.createService(c, simpleTestService, setInstances(instances))
  758. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  759. containers := d.activeContainers()
  760. instances = 4
  761. d.updateService(c, d.getService(c, id), setInstances(instances))
  762. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  763. containers2 := d.activeContainers()
  764. loop0:
  765. for _, c1 := range containers {
  766. for _, c2 := range containers2 {
  767. if c1 == c2 {
  768. continue loop0
  769. }
  770. }
  771. c.Errorf("container %v not found in new set %#v", c1, containers2)
  772. }
  773. }
  774. func (s *DockerSwarmSuite) TestAPISwarmInvalidAddress(c *check.C) {
  775. d := s.AddDaemon(c, false, false)
  776. req := swarm.InitRequest{
  777. ListenAddr: "",
  778. }
  779. status, _, err := d.SockRequest("POST", "/swarm/init", req)
  780. c.Assert(err, checker.IsNil)
  781. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  782. req2 := swarm.JoinRequest{
  783. ListenAddr: "0.0.0.0:2377",
  784. RemoteAddrs: []string{""},
  785. }
  786. status, _, err = d.SockRequest("POST", "/swarm/join", req2)
  787. c.Assert(err, checker.IsNil)
  788. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  789. }
  790. func (s *DockerSwarmSuite) TestAPISwarmForceNewCluster(c *check.C) {
  791. d1 := s.AddDaemon(c, true, true)
  792. d2 := s.AddDaemon(c, true, true)
  793. instances := 2
  794. id := d1.createService(c, simpleTestService, setInstances(instances))
  795. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  796. // drain d2, all containers should move to d1
  797. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  798. n.Spec.Availability = swarm.NodeAvailabilityDrain
  799. })
  800. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  801. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  802. c.Assert(d2.Stop(), checker.IsNil)
  803. c.Assert(d1.Init(swarm.InitRequest{
  804. ForceNewCluster: true,
  805. Spec: swarm.Spec{},
  806. }), checker.IsNil)
  807. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  808. d3 := s.AddDaemon(c, true, true)
  809. info, err := d3.info()
  810. c.Assert(err, checker.IsNil)
  811. c.Assert(info.ControlAvailable, checker.True)
  812. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  813. instances = 4
  814. d3.updateService(c, d3.getService(c, id), setInstances(instances))
  815. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  816. }
  817. func simpleTestService(s *swarm.Service) {
  818. ureplicas := uint64(1)
  819. restartDelay := time.Duration(100 * time.Millisecond)
  820. s.Spec = swarm.ServiceSpec{
  821. TaskTemplate: swarm.TaskSpec{
  822. ContainerSpec: swarm.ContainerSpec{
  823. Image: "busybox:latest",
  824. Command: []string{"/bin/top"},
  825. },
  826. RestartPolicy: &swarm.RestartPolicy{
  827. Delay: &restartDelay,
  828. },
  829. },
  830. Mode: swarm.ServiceMode{
  831. Replicated: &swarm.ReplicatedService{
  832. Replicas: &ureplicas,
  833. },
  834. },
  835. }
  836. s.Spec.Name = "top"
  837. }
  838. func serviceForUpdate(s *swarm.Service) {
  839. ureplicas := uint64(1)
  840. restartDelay := time.Duration(100 * time.Millisecond)
  841. s.Spec = swarm.ServiceSpec{
  842. TaskTemplate: swarm.TaskSpec{
  843. ContainerSpec: swarm.ContainerSpec{
  844. Image: "busybox:latest",
  845. Command: []string{"/bin/top"},
  846. },
  847. RestartPolicy: &swarm.RestartPolicy{
  848. Delay: &restartDelay,
  849. },
  850. },
  851. Mode: swarm.ServiceMode{
  852. Replicated: &swarm.ReplicatedService{
  853. Replicas: &ureplicas,
  854. },
  855. },
  856. UpdateConfig: &swarm.UpdateConfig{
  857. Parallelism: 2,
  858. Delay: 4 * time.Second,
  859. FailureAction: swarm.UpdateFailureActionContinue,
  860. },
  861. }
  862. s.Spec.Name = "updatetest"
  863. }
  864. func setInstances(replicas int) serviceConstructor {
  865. ureplicas := uint64(replicas)
  866. return func(s *swarm.Service) {
  867. s.Spec.Mode = swarm.ServiceMode{
  868. Replicated: &swarm.ReplicatedService{
  869. Replicas: &ureplicas,
  870. },
  871. }
  872. }
  873. }
  874. func setImage(image string) serviceConstructor {
  875. return func(s *swarm.Service) {
  876. s.Spec.TaskTemplate.ContainerSpec.Image = image
  877. }
  878. }
  879. func setFailureAction(failureAction string) serviceConstructor {
  880. return func(s *swarm.Service) {
  881. s.Spec.UpdateConfig.FailureAction = failureAction
  882. }
  883. }
  884. func setMaxFailureRatio(maxFailureRatio float32) serviceConstructor {
  885. return func(s *swarm.Service) {
  886. s.Spec.UpdateConfig.MaxFailureRatio = maxFailureRatio
  887. }
  888. }
  889. func setParallelism(parallelism uint64) serviceConstructor {
  890. return func(s *swarm.Service) {
  891. s.Spec.UpdateConfig.Parallelism = parallelism
  892. }
  893. }
  894. func setConstraints(constraints []string) serviceConstructor {
  895. return func(s *swarm.Service) {
  896. if s.Spec.TaskTemplate.Placement == nil {
  897. s.Spec.TaskTemplate.Placement = &swarm.Placement{}
  898. }
  899. s.Spec.TaskTemplate.Placement.Constraints = constraints
  900. }
  901. }
  902. func setGlobalMode(s *swarm.Service) {
  903. s.Spec.Mode = swarm.ServiceMode{
  904. Global: &swarm.GlobalService{},
  905. }
  906. }
  907. func checkClusterHealth(c *check.C, cl []*SwarmDaemon, managerCount, workerCount int) {
  908. var totalMCount, totalWCount int
  909. for _, d := range cl {
  910. var (
  911. info swarm.Info
  912. err error
  913. )
  914. // check info in a waitAndAssert, because if the cluster doesn't have a leader, `info` will return an error
  915. checkInfo := func(c *check.C) (interface{}, check.CommentInterface) {
  916. info, err = d.info()
  917. return err, check.Commentf("cluster not ready in time")
  918. }
  919. waitAndAssert(c, defaultReconciliationTimeout, checkInfo, checker.IsNil)
  920. if !info.ControlAvailable {
  921. totalWCount++
  922. continue
  923. }
  924. var leaderFound bool
  925. totalMCount++
  926. var mCount, wCount int
  927. for _, n := range d.listNodes(c) {
  928. waitReady := func(c *check.C) (interface{}, check.CommentInterface) {
  929. if n.Status.State == swarm.NodeStateReady {
  930. return true, nil
  931. }
  932. nn := d.getNode(c, n.ID)
  933. n = *nn
  934. return n.Status.State == swarm.NodeStateReady, check.Commentf("state of node %s, reported by %s", n.ID, d.Info.NodeID)
  935. }
  936. waitAndAssert(c, defaultReconciliationTimeout, waitReady, checker.True)
  937. waitActive := func(c *check.C) (interface{}, check.CommentInterface) {
  938. if n.Spec.Availability == swarm.NodeAvailabilityActive {
  939. return true, nil
  940. }
  941. nn := d.getNode(c, n.ID)
  942. n = *nn
  943. return n.Spec.Availability == swarm.NodeAvailabilityActive, check.Commentf("availability of node %s, reported by %s", n.ID, d.Info.NodeID)
  944. }
  945. waitAndAssert(c, defaultReconciliationTimeout, waitActive, checker.True)
  946. if n.Spec.Role == swarm.NodeRoleManager {
  947. c.Assert(n.ManagerStatus, checker.NotNil, check.Commentf("manager status of node %s (manager), reported by %s", n.ID, d.Info.NodeID))
  948. if n.ManagerStatus.Leader {
  949. leaderFound = true
  950. }
  951. mCount++
  952. } else {
  953. c.Assert(n.ManagerStatus, checker.IsNil, check.Commentf("manager status of node %s (worker), reported by %s", n.ID, d.Info.NodeID))
  954. wCount++
  955. }
  956. }
  957. c.Assert(leaderFound, checker.True, check.Commentf("lack of leader reported by node %s", info.NodeID))
  958. c.Assert(mCount, checker.Equals, managerCount, check.Commentf("managers count reported by node %s", info.NodeID))
  959. c.Assert(wCount, checker.Equals, workerCount, check.Commentf("workers count reported by node %s", info.NodeID))
  960. }
  961. c.Assert(totalMCount, checker.Equals, managerCount)
  962. c.Assert(totalWCount, checker.Equals, workerCount)
  963. }
  964. func (s *DockerSwarmSuite) TestAPISwarmRestartCluster(c *check.C) {
  965. mCount, wCount := 5, 1
  966. var nodes []*SwarmDaemon
  967. for i := 0; i < mCount; i++ {
  968. manager := s.AddDaemon(c, true, true)
  969. info, err := manager.info()
  970. c.Assert(err, checker.IsNil)
  971. c.Assert(info.ControlAvailable, checker.True)
  972. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  973. nodes = append(nodes, manager)
  974. }
  975. for i := 0; i < wCount; i++ {
  976. worker := s.AddDaemon(c, true, false)
  977. info, err := worker.info()
  978. c.Assert(err, checker.IsNil)
  979. c.Assert(info.ControlAvailable, checker.False)
  980. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  981. nodes = append(nodes, worker)
  982. }
  983. // stop whole cluster
  984. {
  985. var wg sync.WaitGroup
  986. wg.Add(len(nodes))
  987. errs := make(chan error, len(nodes))
  988. for _, d := range nodes {
  989. go func(daemon *SwarmDaemon) {
  990. defer wg.Done()
  991. if err := daemon.Stop(); err != nil {
  992. errs <- err
  993. }
  994. if root := os.Getenv("DOCKER_REMAP_ROOT"); root != "" {
  995. daemon.root = filepath.Dir(daemon.root)
  996. }
  997. }(d)
  998. }
  999. wg.Wait()
  1000. close(errs)
  1001. for err := range errs {
  1002. c.Assert(err, check.IsNil)
  1003. }
  1004. }
  1005. // start whole cluster
  1006. {
  1007. var wg sync.WaitGroup
  1008. wg.Add(len(nodes))
  1009. errs := make(chan error, len(nodes))
  1010. for _, d := range nodes {
  1011. go func(daemon *SwarmDaemon) {
  1012. defer wg.Done()
  1013. if err := daemon.Start("--iptables=false"); err != nil {
  1014. errs <- err
  1015. }
  1016. }(d)
  1017. }
  1018. wg.Wait()
  1019. close(errs)
  1020. for err := range errs {
  1021. c.Assert(err, check.IsNil)
  1022. }
  1023. }
  1024. checkClusterHealth(c, nodes, mCount, wCount)
  1025. }
  1026. func (s *DockerSwarmSuite) TestAPISwarmServicesUpdateWithName(c *check.C) {
  1027. d := s.AddDaemon(c, true, true)
  1028. instances := 2
  1029. id := d.createService(c, simpleTestService, setInstances(instances))
  1030. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  1031. service := d.getService(c, id)
  1032. instances = 5
  1033. setInstances(instances)(service)
  1034. url := fmt.Sprintf("/services/%s/update?version=%d", service.Spec.Name, service.Version.Index)
  1035. status, out, err := d.SockRequest("POST", url, service.Spec)
  1036. c.Assert(err, checker.IsNil)
  1037. c.Assert(status, checker.Equals, http.StatusOK, check.Commentf("output: %q", string(out)))
  1038. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  1039. }
  1040. func (s *DockerSwarmSuite) TestAPISwarmSecretsEmptyList(c *check.C) {
  1041. d := s.AddDaemon(c, true, true)
  1042. secrets := d.listSecrets(c)
  1043. c.Assert(secrets, checker.NotNil)
  1044. c.Assert(len(secrets), checker.Equals, 0, check.Commentf("secrets: %#v", secrets))
  1045. }
  1046. func (s *DockerSwarmSuite) TestAPISwarmSecretsCreate(c *check.C) {
  1047. d := s.AddDaemon(c, true, true)
  1048. testName := "test_secret"
  1049. id := d.createSecret(c, swarm.SecretSpec{
  1050. swarm.Annotations{
  1051. Name: testName,
  1052. },
  1053. []byte("TESTINGDATA"),
  1054. })
  1055. c.Assert(id, checker.Not(checker.Equals), "", check.Commentf("secrets: %s", id))
  1056. secrets := d.listSecrets(c)
  1057. c.Assert(len(secrets), checker.Equals, 1, check.Commentf("secrets: %#v", secrets))
  1058. name := secrets[0].Spec.Annotations.Name
  1059. c.Assert(name, checker.Equals, testName, check.Commentf("secret: %s", name))
  1060. }
  1061. func (s *DockerSwarmSuite) TestAPISwarmSecretsDelete(c *check.C) {
  1062. d := s.AddDaemon(c, true, true)
  1063. testName := "test_secret"
  1064. id := d.createSecret(c, swarm.SecretSpec{
  1065. swarm.Annotations{
  1066. Name: testName,
  1067. },
  1068. []byte("TESTINGDATA"),
  1069. })
  1070. c.Assert(id, checker.Not(checker.Equals), "", check.Commentf("secrets: %s", id))
  1071. secret := d.getSecret(c, id)
  1072. c.Assert(secret.ID, checker.Equals, id, check.Commentf("secret: %v", secret))
  1073. d.deleteSecret(c, secret.ID)
  1074. status, out, err := d.SockRequest("GET", "/secrets/"+id, nil)
  1075. c.Assert(err, checker.IsNil)
  1076. c.Assert(status, checker.Equals, http.StatusNotFound, check.Commentf("secret delete: %s", string(out)))
  1077. }
  1078. // Test case for 30242, where duplicate networks, with different drivers `bridge` and `overlay`,
  1079. // caused both scopes to be `swarm` for `docker network inspect` and `docker network ls`.
  1080. // This test makes sure the fixes correctly output scopes instead.
  1081. func (s *DockerSwarmSuite) TestAPIDuplicateNetworks(c *check.C) {
  1082. d := s.AddDaemon(c, true, true)
  1083. name := "foo"
  1084. networkCreateRequest := types.NetworkCreateRequest{
  1085. Name: name,
  1086. NetworkCreate: types.NetworkCreate{
  1087. CheckDuplicate: false,
  1088. },
  1089. }
  1090. var n1 types.NetworkCreateResponse
  1091. networkCreateRequest.NetworkCreate.Driver = "bridge"
  1092. status, out, err := d.SockRequest("POST", "/networks/create", networkCreateRequest)
  1093. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1094. c.Assert(status, checker.Equals, http.StatusCreated, check.Commentf(string(out)))
  1095. c.Assert(json.Unmarshal(out, &n1), checker.IsNil)
  1096. var n2 types.NetworkCreateResponse
  1097. networkCreateRequest.NetworkCreate.Driver = "overlay"
  1098. status, out, err = d.SockRequest("POST", "/networks/create", networkCreateRequest)
  1099. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1100. c.Assert(status, checker.Equals, http.StatusCreated, check.Commentf(string(out)))
  1101. c.Assert(json.Unmarshal(out, &n2), checker.IsNil)
  1102. var r1 types.NetworkResource
  1103. status, out, err = d.SockRequest("GET", "/networks/"+n1.ID, nil)
  1104. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1105. c.Assert(status, checker.Equals, http.StatusOK, check.Commentf(string(out)))
  1106. c.Assert(json.Unmarshal(out, &r1), checker.IsNil)
  1107. c.Assert(r1.Scope, checker.Equals, "local")
  1108. var r2 types.NetworkResource
  1109. status, out, err = d.SockRequest("GET", "/networks/"+n2.ID, nil)
  1110. c.Assert(err, checker.IsNil, check.Commentf(string(out)))
  1111. c.Assert(status, checker.Equals, http.StatusOK, check.Commentf(string(out)))
  1112. c.Assert(json.Unmarshal(out, &r2), checker.IsNil)
  1113. c.Assert(r2.Scope, checker.Equals, "swarm")
  1114. }