docker_api_swarm_test.go 26 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806
  1. // +build !windows
  2. package main
  3. import (
  4. "fmt"
  5. "net/http"
  6. "strconv"
  7. "strings"
  8. "syscall"
  9. "time"
  10. "github.com/docker/docker/pkg/integration/checker"
  11. "github.com/docker/engine-api/types/swarm"
  12. "github.com/go-check/check"
  13. )
  // defaultReconciliationTimeout is the timeout handed to waitAndAssert by the
  // tests in this file while they wait for an expected condition to hold.
  var defaultReconciliationTimeout = time.Second * 30
  15. func (s *DockerSwarmSuite) TestApiSwarmInit(c *check.C) {
  16. // todo: should find a better way to verify that components are running than /info
  17. d1 := s.AddDaemon(c, true, true)
  18. info, err := d1.info()
  19. c.Assert(err, checker.IsNil)
  20. c.Assert(info.ControlAvailable, checker.Equals, true)
  21. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  22. d2 := s.AddDaemon(c, true, false)
  23. info, err = d2.info()
  24. c.Assert(err, checker.IsNil)
  25. c.Assert(info.ControlAvailable, checker.Equals, false)
  26. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  27. // Leaving cluster
  28. c.Assert(d2.Leave(false), checker.IsNil)
  29. info, err = d2.info()
  30. c.Assert(err, checker.IsNil)
  31. c.Assert(info.ControlAvailable, checker.Equals, false)
  32. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  33. c.Assert(d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  34. info, err = d2.info()
  35. c.Assert(err, checker.IsNil)
  36. c.Assert(info.ControlAvailable, checker.Equals, false)
  37. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  38. // Current state restoring after restarts
  39. err = d1.Stop()
  40. c.Assert(err, checker.IsNil)
  41. err = d2.Stop()
  42. c.Assert(err, checker.IsNil)
  43. err = d1.Start()
  44. c.Assert(err, checker.IsNil)
  45. err = d2.Start()
  46. c.Assert(err, checker.IsNil)
  47. info, err = d1.info()
  48. c.Assert(err, checker.IsNil)
  49. c.Assert(info.ControlAvailable, checker.Equals, true)
  50. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  51. info, err = d2.info()
  52. c.Assert(err, checker.IsNil)
  53. c.Assert(info.ControlAvailable, checker.Equals, false)
  54. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  55. }
  56. func (s *DockerSwarmSuite) TestApiSwarmManualAcceptance(c *check.C) {
  57. s.testAPISwarmManualAcceptance(c, "")
  58. }
  59. func (s *DockerSwarmSuite) TestApiSwarmManualAcceptanceSecret(c *check.C) {
  60. s.testAPISwarmManualAcceptance(c, "foobaz")
  61. }
  62. func (s *DockerSwarmSuite) testAPISwarmManualAcceptance(c *check.C, secret string) {
  63. d1 := s.AddDaemon(c, false, false)
  64. c.Assert(d1.Init(swarm.InitRequest{
  65. Spec: swarm.Spec{
  66. AcceptancePolicy: swarm.AcceptancePolicy{
  67. Policies: []swarm.Policy{
  68. {Role: swarm.NodeRoleWorker, Secret: &secret},
  69. {Role: swarm.NodeRoleManager, Secret: &secret},
  70. },
  71. },
  72. },
  73. }), checker.IsNil)
  74. d2 := s.AddDaemon(c, false, false)
  75. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  76. c.Assert(err, checker.NotNil)
  77. if secret == "" {
  78. c.Assert(err.Error(), checker.Contains, "needs to be accepted")
  79. info, err := d2.info()
  80. c.Assert(err, checker.IsNil)
  81. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  82. c.Assert(d2.Leave(false), checker.IsNil)
  83. info, err = d2.info()
  84. c.Assert(err, checker.IsNil)
  85. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  86. } else {
  87. c.Assert(err.Error(), checker.Contains, "valid secret token is necessary")
  88. info, err := d2.info()
  89. c.Assert(err, checker.IsNil)
  90. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  91. }
  92. d3 := s.AddDaemon(c, false, false)
  93. c.Assert(d3.Join(swarm.JoinRequest{Secret: secret, RemoteAddrs: []string{d1.listenAddr}}), checker.NotNil)
  94. info, err := d3.info()
  95. c.Assert(err, checker.IsNil)
  96. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  97. c.Assert(len(info.NodeID), checker.GreaterThan, 5)
  98. d1.updateNode(c, info.NodeID, func(n *swarm.Node) {
  99. n.Spec.Membership = swarm.NodeMembershipAccepted
  100. })
  101. for i := 0; ; i++ {
  102. info, err := d3.info()
  103. c.Assert(err, checker.IsNil)
  104. if info.LocalNodeState == swarm.LocalNodeStateActive {
  105. break
  106. }
  107. if i > 100 {
  108. c.Fatalf("node did not become active")
  109. }
  110. time.Sleep(200 * time.Millisecond)
  111. }
  112. }
  113. func (s *DockerSwarmSuite) TestApiSwarmSecretAcceptance(c *check.C) {
  114. d1 := s.AddDaemon(c, false, false)
  115. secret := "foobar"
  116. c.Assert(d1.Init(swarm.InitRequest{
  117. Spec: swarm.Spec{
  118. AcceptancePolicy: swarm.AcceptancePolicy{
  119. Policies: []swarm.Policy{
  120. {Role: swarm.NodeRoleWorker, Autoaccept: true, Secret: &secret},
  121. {Role: swarm.NodeRoleManager, Secret: &secret},
  122. },
  123. },
  124. },
  125. }), checker.IsNil)
  126. d2 := s.AddDaemon(c, false, false)
  127. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  128. c.Assert(err, checker.NotNil)
  129. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  130. info, err := d2.info()
  131. c.Assert(err, checker.IsNil)
  132. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  133. err = d2.Join(swarm.JoinRequest{Secret: "foobaz", RemoteAddrs: []string{d1.listenAddr}})
  134. c.Assert(err, checker.NotNil)
  135. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  136. info, err = d2.info()
  137. c.Assert(err, checker.IsNil)
  138. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  139. c.Assert(d2.Join(swarm.JoinRequest{Secret: "foobar", RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  140. info, err = d2.info()
  141. c.Assert(err, checker.IsNil)
  142. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  143. c.Assert(d2.Leave(false), checker.IsNil)
  144. info, err = d2.info()
  145. c.Assert(err, checker.IsNil)
  146. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  147. // change secret
  148. d1.updateSwarm(c, func(s *swarm.Spec) {
  149. for i := range s.AcceptancePolicy.Policies {
  150. p := "foobaz"
  151. s.AcceptancePolicy.Policies[i].Secret = &p
  152. }
  153. })
  154. err = d2.Join(swarm.JoinRequest{Secret: "foobar", RemoteAddrs: []string{d1.listenAddr}})
  155. c.Assert(err, checker.NotNil)
  156. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  157. info, err = d2.info()
  158. c.Assert(err, checker.IsNil)
  159. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  160. c.Assert(d2.Join(swarm.JoinRequest{Secret: "foobaz", RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  161. info, err = d2.info()
  162. c.Assert(err, checker.IsNil)
  163. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  164. c.Assert(d2.Leave(false), checker.IsNil)
  165. info, err = d2.info()
  166. c.Assert(err, checker.IsNil)
  167. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  168. // change policy, don't change secret
  169. d1.updateSwarm(c, func(s *swarm.Spec) {
  170. for i, p := range s.AcceptancePolicy.Policies {
  171. if p.Role == swarm.NodeRoleManager {
  172. s.AcceptancePolicy.Policies[i].Autoaccept = false
  173. }
  174. s.AcceptancePolicy.Policies[i].Secret = nil
  175. }
  176. })
  177. err = d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  178. c.Assert(err, checker.NotNil)
  179. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  180. info, err = d2.info()
  181. c.Assert(err, checker.IsNil)
  182. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  183. c.Assert(d2.Join(swarm.JoinRequest{Secret: "foobaz", RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  184. info, err = d2.info()
  185. c.Assert(err, checker.IsNil)
  186. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  187. c.Assert(d2.Leave(false), checker.IsNil)
  188. info, err = d2.info()
  189. c.Assert(err, checker.IsNil)
  190. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  191. // clear secret
  192. d1.updateSwarm(c, func(s *swarm.Spec) {
  193. for i := range s.AcceptancePolicy.Policies {
  194. p := ""
  195. s.AcceptancePolicy.Policies[i].Secret = &p
  196. }
  197. })
  198. c.Assert(d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  199. info, err = d2.info()
  200. c.Assert(err, checker.IsNil)
  201. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  202. c.Assert(d2.Leave(false), checker.IsNil)
  203. info, err = d2.info()
  204. c.Assert(err, checker.IsNil)
  205. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  206. }
  207. func (s *DockerSwarmSuite) TestApiSwarmCAHash(c *check.C) {
  208. d1 := s.AddDaemon(c, true, true)
  209. d2 := s.AddDaemon(c, false, false)
  210. err := d2.Join(swarm.JoinRequest{CACertHash: "foobar", RemoteAddrs: []string{d1.listenAddr}})
  211. c.Assert(err, checker.NotNil)
  212. c.Assert(err.Error(), checker.Contains, "invalid checksum digest format")
  213. c.Assert(len(d1.CACertHash), checker.GreaterThan, 0)
  214. c.Assert(d2.Join(swarm.JoinRequest{CACertHash: d1.CACertHash, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  215. }
  216. func (s *DockerSwarmSuite) TestApiSwarmPromoteDemote(c *check.C) {
  217. d1 := s.AddDaemon(c, false, false)
  218. c.Assert(d1.Init(swarm.InitRequest{
  219. Spec: swarm.Spec{
  220. AcceptancePolicy: swarm.AcceptancePolicy{
  221. Policies: []swarm.Policy{
  222. {Role: swarm.NodeRoleWorker, Autoaccept: true},
  223. {Role: swarm.NodeRoleManager},
  224. },
  225. },
  226. },
  227. }), checker.IsNil)
  228. d2 := s.AddDaemon(c, true, false)
  229. info, err := d2.info()
  230. c.Assert(err, checker.IsNil)
  231. c.Assert(info.ControlAvailable, checker.Equals, false)
  232. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  233. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  234. n.Spec.Role = swarm.NodeRoleManager
  235. })
  236. for i := 0; ; i++ {
  237. info, err := d2.info()
  238. c.Assert(err, checker.IsNil)
  239. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  240. if info.ControlAvailable {
  241. break
  242. }
  243. if i > 100 {
  244. c.Errorf("node did not turn into manager")
  245. }
  246. time.Sleep(100 * time.Millisecond)
  247. }
  248. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  249. n.Spec.Role = swarm.NodeRoleWorker
  250. })
  251. for i := 0; ; i++ {
  252. info, err := d2.info()
  253. c.Assert(err, checker.IsNil)
  254. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  255. if !info.ControlAvailable {
  256. break
  257. }
  258. if i > 100 {
  259. c.Errorf("node did not turn into worker")
  260. }
  261. time.Sleep(100 * time.Millisecond)
  262. }
  263. // Demoting last node should fail
  264. node := d1.getNode(c, d1.NodeID)
  265. node.Spec.Role = swarm.NodeRoleWorker
  266. url := fmt.Sprintf("/nodes/%s/update?version=%d", node.ID, node.Version.Index)
  267. status, out, err := d1.SockRequest("POST", url, node.Spec)
  268. c.Assert(err, checker.IsNil)
  269. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("output: %q", string(out)))
  270. c.Assert(string(out), checker.Contains, "last manager of the swarm")
  271. info, err = d1.info()
  272. c.Assert(err, checker.IsNil)
  273. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  274. c.Assert(info.ControlAvailable, checker.Equals, true)
  275. // Promote already demoted node
  276. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  277. n.Spec.Role = swarm.NodeRoleManager
  278. })
  279. for i := 0; ; i++ {
  280. info, err := d2.info()
  281. c.Assert(err, checker.IsNil)
  282. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  283. if info.ControlAvailable {
  284. break
  285. }
  286. if i > 100 {
  287. c.Errorf("node did not turn into manager")
  288. }
  289. time.Sleep(100 * time.Millisecond)
  290. }
  291. }
  292. func (s *DockerSwarmSuite) TestApiSwarmServicesCreate(c *check.C) {
  293. d := s.AddDaemon(c, true, true)
  294. instances := 2
  295. id := d.createService(c, simpleTestService, setInstances(instances))
  296. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  297. service := d.getService(c, id)
  298. instances = 5
  299. d.updateService(c, service, setInstances(instances))
  300. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  301. d.removeService(c, service.ID)
  302. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 0)
  303. }
  304. func (s *DockerSwarmSuite) TestApiSwarmServicesMultipleAgents(c *check.C) {
  305. d1 := s.AddDaemon(c, true, true)
  306. d2 := s.AddDaemon(c, true, false)
  307. d3 := s.AddDaemon(c, true, false)
  308. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  309. instances := 9
  310. id := d1.createService(c, simpleTestService, setInstances(instances))
  311. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  312. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  313. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.GreaterThan, 0)
  314. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  315. // reconciliation on d2 node down
  316. c.Assert(d2.Stop(), checker.IsNil)
  317. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  318. // test downscaling
  319. instances = 5
  320. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  321. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  322. }
  323. func (s *DockerSwarmSuite) TestApiSwarmServicesCreateGlobal(c *check.C) {
  324. d1 := s.AddDaemon(c, true, true)
  325. d2 := s.AddDaemon(c, true, false)
  326. d3 := s.AddDaemon(c, true, false)
  327. d1.createService(c, simpleTestService, setGlobalMode)
  328. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, 1)
  329. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  330. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.Equals, 1)
  331. d4 := s.AddDaemon(c, true, false)
  332. d5 := s.AddDaemon(c, true, false)
  333. waitAndAssert(c, defaultReconciliationTimeout, d4.checkActiveContainerCount, checker.Equals, 1)
  334. waitAndAssert(c, defaultReconciliationTimeout, d5.checkActiveContainerCount, checker.Equals, 1)
  335. }
  336. func (s *DockerSwarmSuite) TestApiSwarmServicesStateReporting(c *check.C) {
  337. testRequires(c, SameHostDaemon)
  338. testRequires(c, DaemonIsLinux)
  339. d1 := s.AddDaemon(c, true, true)
  340. d2 := s.AddDaemon(c, true, true)
  341. d3 := s.AddDaemon(c, true, false)
  342. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept
  343. instances := 9
  344. d1.createService(c, simpleTestService, setInstances(instances))
  345. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  346. getContainers := func() map[string]*SwarmDaemon {
  347. m := make(map[string]*SwarmDaemon)
  348. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  349. for _, id := range d.activeContainers() {
  350. m[id] = d
  351. }
  352. }
  353. return m
  354. }
  355. containers := getContainers()
  356. c.Assert(containers, checker.HasLen, instances)
  357. var toRemove string
  358. for i := range containers {
  359. toRemove = i
  360. }
  361. _, err := containers[toRemove].Cmd("stop", toRemove)
  362. c.Assert(err, checker.IsNil)
  363. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  364. containers2 := getContainers()
  365. c.Assert(containers2, checker.HasLen, instances)
  366. for i := range containers {
  367. if i == toRemove {
  368. c.Assert(containers2[i], checker.IsNil)
  369. } else {
  370. c.Assert(containers2[i], checker.NotNil)
  371. }
  372. }
  373. containers = containers2
  374. for i := range containers {
  375. toRemove = i
  376. }
  377. // try with killing process outside of docker
  378. pidStr, err := containers[toRemove].Cmd("inspect", "-f", "{{.State.Pid}}", toRemove)
  379. c.Assert(err, checker.IsNil)
  380. pid, err := strconv.Atoi(strings.TrimSpace(pidStr))
  381. c.Assert(err, checker.IsNil)
  382. c.Assert(syscall.Kill(pid, syscall.SIGKILL), checker.IsNil)
  383. time.Sleep(time.Second) // give some time to handle the signal
  384. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  385. containers2 = getContainers()
  386. c.Assert(containers2, checker.HasLen, instances)
  387. for i := range containers {
  388. if i == toRemove {
  389. c.Assert(containers2[i], checker.IsNil)
  390. } else {
  391. c.Assert(containers2[i], checker.NotNil)
  392. }
  393. }
  394. }
  395. func (s *DockerSwarmSuite) TestApiSwarmRaftQuorum(c *check.C) {
  396. d1 := s.AddDaemon(c, true, true)
  397. d2 := s.AddDaemon(c, true, true)
  398. d3 := s.AddDaemon(c, true, true)
  399. d1.createService(c, simpleTestService)
  400. c.Assert(d2.Stop(), checker.IsNil)
  401. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  402. s.Spec.Name = "top1"
  403. })
  404. c.Assert(d3.Stop(), checker.IsNil)
  405. var service swarm.Service
  406. simpleTestService(&service)
  407. service.Spec.Name = "top2"
  408. status, out, err := d1.SockRequest("POST", "/services/create", service.Spec)
  409. c.Assert(err, checker.IsNil)
  410. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("deadline exceeded", string(out)))
  411. c.Assert(d2.Start(), checker.IsNil)
  412. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  413. s.Spec.Name = "top3"
  414. })
  415. }
  416. func (s *DockerSwarmSuite) TestApiSwarmListNodes(c *check.C) {
  417. d1 := s.AddDaemon(c, true, true)
  418. d2 := s.AddDaemon(c, true, false)
  419. d3 := s.AddDaemon(c, true, false)
  420. nodes := d1.listNodes(c)
  421. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  422. loop0:
  423. for _, n := range nodes {
  424. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  425. if n.ID == d.NodeID {
  426. continue loop0
  427. }
  428. }
  429. c.Errorf("unknown nodeID %v", n.ID)
  430. }
  431. }
  432. func (s *DockerSwarmSuite) TestApiSwarmNodeUpdate(c *check.C) {
  433. d := s.AddDaemon(c, true, true)
  434. nodes := d.listNodes(c)
  435. d.updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  436. n.Spec.Availability = swarm.NodeAvailabilityPause
  437. })
  438. n := d.getNode(c, nodes[0].ID)
  439. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityPause)
  440. }
  441. func (s *DockerSwarmSuite) TestApiSwarmNodeDrainPause(c *check.C) {
  442. d1 := s.AddDaemon(c, true, true)
  443. d2 := s.AddDaemon(c, true, false)
  444. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  445. // start a service, expect balanced distribution
  446. instances := 8
  447. id := d1.createService(c, simpleTestService, setInstances(instances))
  448. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  449. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  450. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  451. // drain d2, all containers should move to d1
  452. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  453. n.Spec.Availability = swarm.NodeAvailabilityDrain
  454. })
  455. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  456. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  457. // set d2 back to active
  458. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  459. n.Spec.Availability = swarm.NodeAvailabilityActive
  460. })
  461. instances = 1
  462. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  463. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  464. instances = 8
  465. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  466. // drained node first so we don't get any old containers
  467. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  468. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  469. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  470. d2ContainerCount := len(d2.activeContainers())
  471. // set d2 to paused, scale service up, only d1 gets new tasks
  472. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  473. n.Spec.Availability = swarm.NodeAvailabilityPause
  474. })
  475. instances = 14
  476. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  477. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances-d2ContainerCount)
  478. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, d2ContainerCount)
  479. }
  480. func (s *DockerSwarmSuite) TestApiSwarmLeaveRemovesContainer(c *check.C) {
  481. d := s.AddDaemon(c, true, true)
  482. instances := 2
  483. d.createService(c, simpleTestService, setInstances(instances))
  484. id, err := d.Cmd("run", "-d", "busybox", "top")
  485. c.Assert(err, checker.IsNil)
  486. id = strings.TrimSpace(id)
  487. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances+1)
  488. c.Assert(d.Leave(false), checker.NotNil)
  489. c.Assert(d.Leave(true), checker.IsNil)
  490. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 1)
  491. id2, err := d.Cmd("ps", "-q")
  492. c.Assert(err, checker.IsNil)
  493. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  494. }
  495. // #23629
  496. func (s *DockerSwarmSuite) TestApiSwarmLeaveOnPendingJoin(c *check.C) {
  497. s.AddDaemon(c, true, true)
  498. d2 := s.AddDaemon(c, false, false)
  499. id, err := d2.Cmd("run", "-d", "busybox", "top")
  500. c.Assert(err, checker.IsNil)
  501. id = strings.TrimSpace(id)
  502. go d2.Join(swarm.JoinRequest{
  503. RemoteAddrs: []string{"nosuchhost:1234"},
  504. }) // will block on pending state
  505. for i := 0; ; i++ {
  506. info, err := d2.info()
  507. c.Assert(err, checker.IsNil)
  508. if info.LocalNodeState == swarm.LocalNodeStatePending {
  509. break
  510. }
  511. if i > 100 {
  512. c.Fatalf("node did not go to pending state: %v", info.LocalNodeState)
  513. }
  514. time.Sleep(100 * time.Millisecond)
  515. }
  516. c.Assert(d2.Leave(true), checker.IsNil)
  517. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  518. id2, err := d2.Cmd("ps", "-q")
  519. c.Assert(err, checker.IsNil)
  520. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  521. }
  522. // #23705
  523. func (s *DockerSwarmSuite) TestApiSwarmRestoreOnPendingJoin(c *check.C) {
  524. d := s.AddDaemon(c, false, false)
  525. go d.Join(swarm.JoinRequest{
  526. RemoteAddrs: []string{"nosuchhost:1234"},
  527. }) // will block on pending state
  528. for i := 0; ; i++ {
  529. info, err := d.info()
  530. c.Assert(err, checker.IsNil)
  531. if info.LocalNodeState == swarm.LocalNodeStatePending {
  532. break
  533. }
  534. if i > 100 {
  535. c.Fatalf("node did not go to pending state: %v", info.LocalNodeState)
  536. }
  537. time.Sleep(100 * time.Millisecond)
  538. }
  539. c.Assert(d.Stop(), checker.IsNil)
  540. c.Assert(d.Start(), checker.IsNil)
  541. info, err := d.info()
  542. c.Assert(err, checker.IsNil)
  543. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  544. }
  545. func (s *DockerSwarmSuite) TestApiSwarmManagerRestore(c *check.C) {
  546. d1 := s.AddDaemon(c, true, true)
  547. instances := 2
  548. id := d1.createService(c, simpleTestService, setInstances(instances))
  549. d1.getService(c, id)
  550. d1.Stop()
  551. d1.Start()
  552. d1.getService(c, id)
  553. d2 := s.AddDaemon(c, true, true)
  554. d2.getService(c, id)
  555. d2.Stop()
  556. d2.Start()
  557. d2.getService(c, id)
  558. d3 := s.AddDaemon(c, true, true)
  559. d3.getService(c, id)
  560. d3.Stop()
  561. d3.Start()
  562. d3.getService(c, id)
  563. d3.Kill()
  564. time.Sleep(1 * time.Second) // time to handle signal
  565. d3.Start()
  566. d3.getService(c, id)
  567. }
  568. func (s *DockerSwarmSuite) TestApiSwarmScaleNoRollingUpdate(c *check.C) {
  569. d := s.AddDaemon(c, true, true)
  570. instances := 2
  571. id := d.createService(c, simpleTestService, setInstances(instances))
  572. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  573. containers := d.activeContainers()
  574. instances = 4
  575. d.updateService(c, d.getService(c, id), setInstances(instances))
  576. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  577. containers2 := d.activeContainers()
  578. loop0:
  579. for _, c1 := range containers {
  580. for _, c2 := range containers2 {
  581. if c1 == c2 {
  582. continue loop0
  583. }
  584. }
  585. c.Errorf("container %v not found in new set %#v", c1, containers2)
  586. }
  587. }
  588. func (s *DockerSwarmSuite) TestApiSwarmInvalidAddress(c *check.C) {
  589. d := s.AddDaemon(c, false, false)
  590. req := swarm.InitRequest{
  591. ListenAddr: "",
  592. }
  593. status, _, err := d.SockRequest("POST", "/swarm/init", req)
  594. c.Assert(err, checker.IsNil)
  595. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  596. req2 := swarm.JoinRequest{
  597. ListenAddr: "0.0.0.0:2377",
  598. RemoteAddrs: []string{""},
  599. }
  600. status, _, err = d.SockRequest("POST", "/swarm/join", req2)
  601. c.Assert(err, checker.IsNil)
  602. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  603. }
  604. func (s *DockerSwarmSuite) TestApiSwarmForceNewCluster(c *check.C) {
  605. d1 := s.AddDaemon(c, true, true)
  606. d2 := s.AddDaemon(c, true, true)
  607. instances := 2
  608. id := d1.createService(c, simpleTestService, setInstances(instances))
  609. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  610. c.Assert(d2.Stop(), checker.IsNil)
  611. time.Sleep(5 * time.Second)
  612. c.Assert(d1.Init(swarm.InitRequest{
  613. ForceNewCluster: true,
  614. Spec: swarm.Spec{
  615. AcceptancePolicy: autoAcceptPolicy,
  616. },
  617. }), checker.IsNil)
  618. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  619. d3 := s.AddDaemon(c, true, true)
  620. info, err := d3.info()
  621. c.Assert(err, checker.IsNil)
  622. c.Assert(info.ControlAvailable, checker.Equals, true)
  623. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  624. instances = 4
  625. d3.updateService(c, d3.getService(c, id), setInstances(instances))
  626. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  627. }
  628. func simpleTestService(s *swarm.Service) {
  629. var ureplicas uint64
  630. ureplicas = 1
  631. s.Spec = swarm.ServiceSpec{
  632. TaskTemplate: swarm.TaskSpec{
  633. ContainerSpec: swarm.ContainerSpec{
  634. Image: "busybox:latest",
  635. Command: []string{"/bin/top"},
  636. },
  637. },
  638. Mode: swarm.ServiceMode{
  639. Replicated: &swarm.ReplicatedService{
  640. Replicas: &ureplicas,
  641. },
  642. },
  643. }
  644. s.Spec.Name = "top"
  645. }
  646. func setInstances(replicas int) serviceConstructor {
  647. ureplicas := uint64(replicas)
  648. return func(s *swarm.Service) {
  649. s.Spec.Mode = swarm.ServiceMode{
  650. Replicated: &swarm.ReplicatedService{
  651. Replicas: &ureplicas,
  652. },
  653. }
  654. }
  655. }
  656. func setGlobalMode(s *swarm.Service) {
  657. s.Spec.Mode = swarm.ServiceMode{
  658. Global: &swarm.GlobalService{},
  659. }
  660. }