docker_api_swarm_test.go 31 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953
  1. // +build !windows
  2. package main
  3. import (
  4. "fmt"
  5. "net/http"
  6. "os"
  7. "path/filepath"
  8. "strconv"
  9. "strings"
  10. "sync"
  11. "syscall"
  12. "time"
  13. "github.com/docker/docker/pkg/integration/checker"
  14. "github.com/docker/engine-api/types/swarm"
  15. "github.com/go-check/check"
  16. )
  17. var defaultReconciliationTimeout = 30 * time.Second
  18. func (s *DockerSwarmSuite) TestApiSwarmInit(c *check.C) {
  19. testRequires(c, Network)
  20. // todo: should find a better way to verify that components are running than /info
  21. d1 := s.AddDaemon(c, true, true)
  22. info, err := d1.info()
  23. c.Assert(err, checker.IsNil)
  24. c.Assert(info.ControlAvailable, checker.True)
  25. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  26. d2 := s.AddDaemon(c, true, false)
  27. info, err = d2.info()
  28. c.Assert(err, checker.IsNil)
  29. c.Assert(info.ControlAvailable, checker.False)
  30. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  31. // Leaving cluster
  32. c.Assert(d2.Leave(false), checker.IsNil)
  33. info, err = d2.info()
  34. c.Assert(err, checker.IsNil)
  35. c.Assert(info.ControlAvailable, checker.False)
  36. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  37. c.Assert(d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  38. info, err = d2.info()
  39. c.Assert(err, checker.IsNil)
  40. c.Assert(info.ControlAvailable, checker.False)
  41. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  42. // Current state restoring after restarts
  43. err = d1.Stop()
  44. c.Assert(err, checker.IsNil)
  45. err = d2.Stop()
  46. c.Assert(err, checker.IsNil)
  47. err = d1.Start()
  48. c.Assert(err, checker.IsNil)
  49. err = d2.Start()
  50. c.Assert(err, checker.IsNil)
  51. info, err = d1.info()
  52. c.Assert(err, checker.IsNil)
  53. c.Assert(info.ControlAvailable, checker.True)
  54. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  55. info, err = d2.info()
  56. c.Assert(err, checker.IsNil)
  57. c.Assert(info.ControlAvailable, checker.False)
  58. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  59. }
  60. func (s *DockerSwarmSuite) TestApiSwarmManualAcceptance(c *check.C) {
  61. testRequires(c, Network)
  62. s.testAPISwarmManualAcceptance(c, "")
  63. }
  64. func (s *DockerSwarmSuite) TestApiSwarmManualAcceptanceSecret(c *check.C) {
  65. testRequires(c, Network)
  66. s.testAPISwarmManualAcceptance(c, "foobaz")
  67. }
  68. func (s *DockerSwarmSuite) testAPISwarmManualAcceptance(c *check.C, secret string) {
  69. d1 := s.AddDaemon(c, false, false)
  70. c.Assert(d1.Init(swarm.InitRequest{
  71. Spec: swarm.Spec{
  72. AcceptancePolicy: swarm.AcceptancePolicy{
  73. Policies: []swarm.Policy{
  74. {Role: swarm.NodeRoleWorker, Secret: &secret},
  75. {Role: swarm.NodeRoleManager, Secret: &secret},
  76. },
  77. },
  78. },
  79. }), checker.IsNil)
  80. d2 := s.AddDaemon(c, false, false)
  81. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  82. c.Assert(err, checker.NotNil)
  83. if secret == "" {
  84. c.Assert(err.Error(), checker.Contains, "needs to be accepted")
  85. info, err := d2.info()
  86. c.Assert(err, checker.IsNil)
  87. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  88. c.Assert(d2.Leave(false), checker.IsNil)
  89. info, err = d2.info()
  90. c.Assert(err, checker.IsNil)
  91. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  92. } else {
  93. c.Assert(err.Error(), checker.Contains, "valid secret token is necessary")
  94. info, err := d2.info()
  95. c.Assert(err, checker.IsNil)
  96. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  97. }
  98. d3 := s.AddDaemon(c, false, false)
  99. c.Assert(d3.Join(swarm.JoinRequest{Secret: secret, RemoteAddrs: []string{d1.listenAddr}}), checker.NotNil)
  100. info, err := d3.info()
  101. c.Assert(err, checker.IsNil)
  102. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  103. c.Assert(len(info.NodeID), checker.GreaterThan, 5)
  104. d1.updateNode(c, info.NodeID, func(n *swarm.Node) {
  105. n.Spec.Membership = swarm.NodeMembershipAccepted
  106. })
  107. waitAndAssert(c, defaultReconciliationTimeout, d3.checkLocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  108. }
  109. func (s *DockerSwarmSuite) TestApiSwarmSecretAcceptance(c *check.C) {
  110. testRequires(c, Network)
  111. d1 := s.AddDaemon(c, false, false)
  112. secret := "foobar"
  113. c.Assert(d1.Init(swarm.InitRequest{
  114. Spec: swarm.Spec{
  115. AcceptancePolicy: swarm.AcceptancePolicy{
  116. Policies: []swarm.Policy{
  117. {Role: swarm.NodeRoleWorker, Autoaccept: true, Secret: &secret},
  118. {Role: swarm.NodeRoleManager, Secret: &secret},
  119. },
  120. },
  121. },
  122. }), checker.IsNil)
  123. d2 := s.AddDaemon(c, false, false)
  124. err := d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  125. c.Assert(err, checker.NotNil)
  126. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  127. info, err := d2.info()
  128. c.Assert(err, checker.IsNil)
  129. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  130. err = d2.Join(swarm.JoinRequest{Secret: "foobaz", RemoteAddrs: []string{d1.listenAddr}})
  131. c.Assert(err, checker.NotNil)
  132. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  133. info, err = d2.info()
  134. c.Assert(err, checker.IsNil)
  135. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  136. c.Assert(d2.Join(swarm.JoinRequest{Secret: "foobar", RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  137. info, err = d2.info()
  138. c.Assert(err, checker.IsNil)
  139. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  140. c.Assert(d2.Leave(false), checker.IsNil)
  141. info, err = d2.info()
  142. c.Assert(err, checker.IsNil)
  143. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  144. // change secret
  145. d1.updateSwarm(c, func(s *swarm.Spec) {
  146. for i := range s.AcceptancePolicy.Policies {
  147. p := "foobaz"
  148. s.AcceptancePolicy.Policies[i].Secret = &p
  149. }
  150. })
  151. err = d2.Join(swarm.JoinRequest{Secret: "foobar", RemoteAddrs: []string{d1.listenAddr}})
  152. c.Assert(err, checker.NotNil)
  153. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  154. info, err = d2.info()
  155. c.Assert(err, checker.IsNil)
  156. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  157. c.Assert(d2.Join(swarm.JoinRequest{Secret: "foobaz", RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  158. info, err = d2.info()
  159. c.Assert(err, checker.IsNil)
  160. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  161. c.Assert(d2.Leave(false), checker.IsNil)
  162. info, err = d2.info()
  163. c.Assert(err, checker.IsNil)
  164. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  165. // change policy, don't change secret
  166. d1.updateSwarm(c, func(s *swarm.Spec) {
  167. for i, p := range s.AcceptancePolicy.Policies {
  168. if p.Role == swarm.NodeRoleManager {
  169. s.AcceptancePolicy.Policies[i].Autoaccept = false
  170. }
  171. s.AcceptancePolicy.Policies[i].Secret = nil
  172. }
  173. })
  174. err = d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}})
  175. c.Assert(err, checker.NotNil)
  176. c.Assert(err.Error(), checker.Contains, "secret token is necessary")
  177. info, err = d2.info()
  178. c.Assert(err, checker.IsNil)
  179. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  180. c.Assert(d2.Join(swarm.JoinRequest{Secret: "foobaz", RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  181. info, err = d2.info()
  182. c.Assert(err, checker.IsNil)
  183. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  184. c.Assert(d2.Leave(false), checker.IsNil)
  185. info, err = d2.info()
  186. c.Assert(err, checker.IsNil)
  187. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  188. // clear secret
  189. d1.updateSwarm(c, func(s *swarm.Spec) {
  190. for i := range s.AcceptancePolicy.Policies {
  191. p := ""
  192. s.AcceptancePolicy.Policies[i].Secret = &p
  193. }
  194. })
  195. c.Assert(d2.Join(swarm.JoinRequest{RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  196. info, err = d2.info()
  197. c.Assert(err, checker.IsNil)
  198. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  199. c.Assert(d2.Leave(false), checker.IsNil)
  200. info, err = d2.info()
  201. c.Assert(err, checker.IsNil)
  202. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  203. }
  204. func (s *DockerSwarmSuite) TestApiSwarmCAHash(c *check.C) {
  205. testRequires(c, Network)
  206. d1 := s.AddDaemon(c, true, true)
  207. d2 := s.AddDaemon(c, false, false)
  208. err := d2.Join(swarm.JoinRequest{CACertHash: "foobar", RemoteAddrs: []string{d1.listenAddr}})
  209. c.Assert(err, checker.NotNil)
  210. c.Assert(err.Error(), checker.Contains, "invalid checksum digest format")
  211. c.Assert(len(d1.CACertHash), checker.GreaterThan, 0)
  212. c.Assert(d2.Join(swarm.JoinRequest{CACertHash: d1.CACertHash, RemoteAddrs: []string{d1.listenAddr}}), checker.IsNil)
  213. }
  214. func (s *DockerSwarmSuite) TestApiSwarmPromoteDemote(c *check.C) {
  215. testRequires(c, Network)
  216. d1 := s.AddDaemon(c, false, false)
  217. c.Assert(d1.Init(swarm.InitRequest{
  218. Spec: swarm.Spec{
  219. AcceptancePolicy: swarm.AcceptancePolicy{
  220. Policies: []swarm.Policy{
  221. {Role: swarm.NodeRoleWorker, Autoaccept: true},
  222. {Role: swarm.NodeRoleManager},
  223. },
  224. },
  225. },
  226. }), checker.IsNil)
  227. d2 := s.AddDaemon(c, true, false)
  228. info, err := d2.info()
  229. c.Assert(err, checker.IsNil)
  230. c.Assert(info.ControlAvailable, checker.False)
  231. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  232. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  233. n.Spec.Role = swarm.NodeRoleManager
  234. })
  235. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  236. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  237. n.Spec.Role = swarm.NodeRoleWorker
  238. })
  239. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.False)
  240. // Demoting last node should fail
  241. node := d1.getNode(c, d1.NodeID)
  242. node.Spec.Role = swarm.NodeRoleWorker
  243. url := fmt.Sprintf("/nodes/%s/update?version=%d", node.ID, node.Version.Index)
  244. status, out, err := d1.SockRequest("POST", url, node.Spec)
  245. c.Assert(err, checker.IsNil)
  246. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("output: %q", string(out)))
  247. c.Assert(string(out), checker.Contains, "last manager of the swarm")
  248. info, err = d1.info()
  249. c.Assert(err, checker.IsNil)
  250. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  251. c.Assert(info.ControlAvailable, checker.True)
  252. // Promote already demoted node
  253. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  254. n.Spec.Role = swarm.NodeRoleManager
  255. })
  256. waitAndAssert(c, defaultReconciliationTimeout, d2.checkControlAvailable, checker.True)
  257. }
  258. func (s *DockerSwarmSuite) TestApiSwarmServicesEmptyList(c *check.C) {
  259. testRequires(c, Network)
  260. d := s.AddDaemon(c, true, true)
  261. services := d.listServices(c)
  262. c.Assert(services, checker.NotNil)
  263. c.Assert(len(services), checker.Equals, 0, check.Commentf("services: %#v", services))
  264. }
  265. func (s *DockerSwarmSuite) TestApiSwarmServicesCreate(c *check.C) {
  266. testRequires(c, Network)
  267. d := s.AddDaemon(c, true, true)
  268. instances := 2
  269. id := d.createService(c, simpleTestService, setInstances(instances))
  270. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  271. service := d.getService(c, id)
  272. instances = 5
  273. d.updateService(c, service, setInstances(instances))
  274. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  275. d.removeService(c, service.ID)
  276. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 0)
  277. }
  278. func (s *DockerSwarmSuite) TestApiSwarmServicesMultipleAgents(c *check.C) {
  279. testRequires(c, Network)
  280. d1 := s.AddDaemon(c, true, true)
  281. d2 := s.AddDaemon(c, true, false)
  282. d3 := s.AddDaemon(c, true, false)
  283. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  284. instances := 9
  285. id := d1.createService(c, simpleTestService, setInstances(instances))
  286. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  287. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  288. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.GreaterThan, 0)
  289. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  290. // reconciliation on d2 node down
  291. c.Assert(d2.Stop(), checker.IsNil)
  292. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  293. // test downscaling
  294. instances = 5
  295. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  296. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  297. }
  298. func (s *DockerSwarmSuite) TestApiSwarmServicesCreateGlobal(c *check.C) {
  299. testRequires(c, Network)
  300. d1 := s.AddDaemon(c, true, true)
  301. d2 := s.AddDaemon(c, true, false)
  302. d3 := s.AddDaemon(c, true, false)
  303. d1.createService(c, simpleTestService, setGlobalMode)
  304. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, 1)
  305. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  306. waitAndAssert(c, defaultReconciliationTimeout, d3.checkActiveContainerCount, checker.Equals, 1)
  307. d4 := s.AddDaemon(c, true, false)
  308. d5 := s.AddDaemon(c, true, false)
  309. waitAndAssert(c, defaultReconciliationTimeout, d4.checkActiveContainerCount, checker.Equals, 1)
  310. waitAndAssert(c, defaultReconciliationTimeout, d5.checkActiveContainerCount, checker.Equals, 1)
  311. }
  312. func (s *DockerSwarmSuite) TestApiSwarmServicesStateReporting(c *check.C) {
  313. testRequires(c, Network)
  314. testRequires(c, SameHostDaemon)
  315. testRequires(c, DaemonIsLinux)
  316. d1 := s.AddDaemon(c, true, true)
  317. d2 := s.AddDaemon(c, true, true)
  318. d3 := s.AddDaemon(c, true, false)
  319. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept
  320. instances := 9
  321. d1.createService(c, simpleTestService, setInstances(instances))
  322. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  323. getContainers := func() map[string]*SwarmDaemon {
  324. m := make(map[string]*SwarmDaemon)
  325. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  326. for _, id := range d.activeContainers() {
  327. m[id] = d
  328. }
  329. }
  330. return m
  331. }
  332. containers := getContainers()
  333. c.Assert(containers, checker.HasLen, instances)
  334. var toRemove string
  335. for i := range containers {
  336. toRemove = i
  337. }
  338. _, err := containers[toRemove].Cmd("stop", toRemove)
  339. c.Assert(err, checker.IsNil)
  340. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  341. containers2 := getContainers()
  342. c.Assert(containers2, checker.HasLen, instances)
  343. for i := range containers {
  344. if i == toRemove {
  345. c.Assert(containers2[i], checker.IsNil)
  346. } else {
  347. c.Assert(containers2[i], checker.NotNil)
  348. }
  349. }
  350. containers = containers2
  351. for i := range containers {
  352. toRemove = i
  353. }
  354. // try with killing process outside of docker
  355. pidStr, err := containers[toRemove].Cmd("inspect", "-f", "{{.State.Pid}}", toRemove)
  356. c.Assert(err, checker.IsNil)
  357. pid, err := strconv.Atoi(strings.TrimSpace(pidStr))
  358. c.Assert(err, checker.IsNil)
  359. c.Assert(syscall.Kill(pid, syscall.SIGKILL), checker.IsNil)
  360. time.Sleep(time.Second) // give some time to handle the signal
  361. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  362. containers2 = getContainers()
  363. c.Assert(containers2, checker.HasLen, instances)
  364. for i := range containers {
  365. if i == toRemove {
  366. c.Assert(containers2[i], checker.IsNil)
  367. } else {
  368. c.Assert(containers2[i], checker.NotNil)
  369. }
  370. }
  371. }
  372. func (s *DockerSwarmSuite) TestApiSwarmLeaderProxy(c *check.C) {
  373. // add three managers, one of these is leader
  374. d1 := s.AddDaemon(c, true, true)
  375. d2 := s.AddDaemon(c, true, true)
  376. d3 := s.AddDaemon(c, true, true)
  377. // start a service by hitting each of the 3 managers
  378. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  379. s.Spec.Name = "test1"
  380. })
  381. d2.createService(c, simpleTestService, func(s *swarm.Service) {
  382. s.Spec.Name = "test2"
  383. })
  384. d3.createService(c, simpleTestService, func(s *swarm.Service) {
  385. s.Spec.Name = "test3"
  386. })
  387. // 3 services should be started now, because the requests were proxied to leader
  388. // query each node and make sure it returns 3 services
  389. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  390. services := d.listServices(c)
  391. c.Assert(services, checker.HasLen, 3)
  392. }
  393. }
  394. func (s *DockerSwarmSuite) TestApiSwarmLeaderElection(c *check.C) {
  395. // Create 3 nodes
  396. d1 := s.AddDaemon(c, true, true)
  397. d2 := s.AddDaemon(c, true, true)
  398. d3 := s.AddDaemon(c, true, true)
  399. // assert that the first node we made is the leader, and the other two are followers
  400. c.Assert(d1.getNode(c, d1.NodeID).ManagerStatus.Leader, checker.True)
  401. c.Assert(d1.getNode(c, d2.NodeID).ManagerStatus.Leader, checker.False)
  402. c.Assert(d1.getNode(c, d3.NodeID).ManagerStatus.Leader, checker.False)
  403. leader := d1
  404. // stop the leader
  405. leader.Stop()
  406. // wait for an election to occur
  407. var newleader *SwarmDaemon
  408. for _, d := range []*SwarmDaemon{d2, d3} {
  409. if d.getNode(c, d.NodeID).ManagerStatus.Leader {
  410. newleader = d
  411. break
  412. }
  413. }
  414. // assert that we have a new leader
  415. c.Assert(newleader, checker.NotNil)
  416. // add the old leader back
  417. leader.Start()
  418. // clear leader and reinit the followers list
  419. followers := make([]*SwarmDaemon, 0, 3)
  420. // pick out the leader and the followers again
  421. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  422. if d1.getNode(c, d.NodeID).ManagerStatus.Leader {
  423. leader = d
  424. } else {
  425. followers = append(followers, d)
  426. }
  427. }
  428. // verify that we still only have 1 leader and 2 followers
  429. c.Assert(leader, checker.NotNil)
  430. c.Assert(followers, checker.HasLen, 2)
  431. // and that after we added d1 back, the leader hasn't changed
  432. c.Assert(leader.NodeID, checker.Equals, newleader.NodeID)
  433. }
  434. func (s *DockerSwarmSuite) TestApiSwarmRaftQuorum(c *check.C) {
  435. testRequires(c, Network)
  436. d1 := s.AddDaemon(c, true, true)
  437. d2 := s.AddDaemon(c, true, true)
  438. d3 := s.AddDaemon(c, true, true)
  439. d1.createService(c, simpleTestService)
  440. c.Assert(d2.Stop(), checker.IsNil)
  441. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  442. s.Spec.Name = "top1"
  443. })
  444. c.Assert(d3.Stop(), checker.IsNil)
  445. var service swarm.Service
  446. simpleTestService(&service)
  447. service.Spec.Name = "top2"
  448. status, out, err := d1.SockRequest("POST", "/services/create", service.Spec)
  449. c.Assert(err, checker.IsNil)
  450. c.Assert(status, checker.Equals, http.StatusInternalServerError, check.Commentf("deadline exceeded", string(out)))
  451. c.Assert(d2.Start(), checker.IsNil)
  452. d1.createService(c, simpleTestService, func(s *swarm.Service) {
  453. s.Spec.Name = "top3"
  454. })
  455. }
  456. func (s *DockerSwarmSuite) TestApiSwarmListNodes(c *check.C) {
  457. testRequires(c, Network)
  458. d1 := s.AddDaemon(c, true, true)
  459. d2 := s.AddDaemon(c, true, false)
  460. d3 := s.AddDaemon(c, true, false)
  461. nodes := d1.listNodes(c)
  462. c.Assert(len(nodes), checker.Equals, 3, check.Commentf("nodes: %#v", nodes))
  463. loop0:
  464. for _, n := range nodes {
  465. for _, d := range []*SwarmDaemon{d1, d2, d3} {
  466. if n.ID == d.NodeID {
  467. continue loop0
  468. }
  469. }
  470. c.Errorf("unknown nodeID %v", n.ID)
  471. }
  472. }
  473. func (s *DockerSwarmSuite) TestApiSwarmNodeUpdate(c *check.C) {
  474. testRequires(c, Network)
  475. d := s.AddDaemon(c, true, true)
  476. nodes := d.listNodes(c)
  477. d.updateNode(c, nodes[0].ID, func(n *swarm.Node) {
  478. n.Spec.Availability = swarm.NodeAvailabilityPause
  479. })
  480. n := d.getNode(c, nodes[0].ID)
  481. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityPause)
  482. }
  483. func (s *DockerSwarmSuite) TestApiSwarmNodeDrainPause(c *check.C) {
  484. testRequires(c, Network)
  485. d1 := s.AddDaemon(c, true, true)
  486. d2 := s.AddDaemon(c, true, false)
  487. time.Sleep(1 * time.Second) // make sure all daemons are ready to accept tasks
  488. // start a service, expect balanced distribution
  489. instances := 8
  490. id := d1.createService(c, simpleTestService, setInstances(instances))
  491. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  492. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  493. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  494. // drain d2, all containers should move to d1
  495. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  496. n.Spec.Availability = swarm.NodeAvailabilityDrain
  497. })
  498. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  499. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 0)
  500. // set d2 back to active
  501. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  502. n.Spec.Availability = swarm.NodeAvailabilityActive
  503. })
  504. instances = 1
  505. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  506. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  507. instances = 8
  508. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  509. // drained node first so we don't get any old containers
  510. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.GreaterThan, 0)
  511. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.GreaterThan, 0)
  512. waitAndAssert(c, defaultReconciliationTimeout*2, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  513. d2ContainerCount := len(d2.activeContainers())
  514. // set d2 to paused, scale service up, only d1 gets new tasks
  515. d1.updateNode(c, d2.NodeID, func(n *swarm.Node) {
  516. n.Spec.Availability = swarm.NodeAvailabilityPause
  517. })
  518. instances = 14
  519. d1.updateService(c, d1.getService(c, id), setInstances(instances))
  520. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances-d2ContainerCount)
  521. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, d2ContainerCount)
  522. }
  523. func (s *DockerSwarmSuite) TestApiSwarmLeaveRemovesContainer(c *check.C) {
  524. testRequires(c, Network)
  525. d := s.AddDaemon(c, true, true)
  526. instances := 2
  527. d.createService(c, simpleTestService, setInstances(instances))
  528. id, err := d.Cmd("run", "-d", "busybox", "top")
  529. c.Assert(err, checker.IsNil)
  530. id = strings.TrimSpace(id)
  531. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances+1)
  532. c.Assert(d.Leave(false), checker.NotNil)
  533. c.Assert(d.Leave(true), checker.IsNil)
  534. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, 1)
  535. id2, err := d.Cmd("ps", "-q")
  536. c.Assert(err, checker.IsNil)
  537. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  538. }
  539. // #23629
  540. func (s *DockerSwarmSuite) TestApiSwarmLeaveOnPendingJoin(c *check.C) {
  541. s.AddDaemon(c, true, true)
  542. d2 := s.AddDaemon(c, false, false)
  543. id, err := d2.Cmd("run", "-d", "busybox", "top")
  544. c.Assert(err, checker.IsNil)
  545. id = strings.TrimSpace(id)
  546. go d2.Join(swarm.JoinRequest{
  547. RemoteAddrs: []string{"nosuchhost:1234"},
  548. }) // will block on pending state
  549. waitAndAssert(c, defaultReconciliationTimeout, d2.checkLocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  550. c.Assert(d2.Leave(true), checker.IsNil)
  551. waitAndAssert(c, defaultReconciliationTimeout, d2.checkActiveContainerCount, checker.Equals, 1)
  552. id2, err := d2.Cmd("ps", "-q")
  553. c.Assert(err, checker.IsNil)
  554. c.Assert(id, checker.HasPrefix, strings.TrimSpace(id2))
  555. }
  556. // #23705
  557. func (s *DockerSwarmSuite) TestApiSwarmRestoreOnPendingJoin(c *check.C) {
  558. d := s.AddDaemon(c, false, false)
  559. go d.Join(swarm.JoinRequest{
  560. RemoteAddrs: []string{"nosuchhost:1234"},
  561. }) // will block on pending state
  562. waitAndAssert(c, defaultReconciliationTimeout, d.checkLocalNodeState, checker.Equals, swarm.LocalNodeStatePending)
  563. c.Assert(d.Stop(), checker.IsNil)
  564. c.Assert(d.Start(), checker.IsNil)
  565. info, err := d.info()
  566. c.Assert(err, checker.IsNil)
  567. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateInactive)
  568. }
  569. func (s *DockerSwarmSuite) TestApiSwarmManagerRestore(c *check.C) {
  570. testRequires(c, Network)
  571. d1 := s.AddDaemon(c, true, true)
  572. instances := 2
  573. id := d1.createService(c, simpleTestService, setInstances(instances))
  574. d1.getService(c, id)
  575. d1.Stop()
  576. d1.Start()
  577. d1.getService(c, id)
  578. d2 := s.AddDaemon(c, true, true)
  579. d2.getService(c, id)
  580. d2.Stop()
  581. d2.Start()
  582. d2.getService(c, id)
  583. d3 := s.AddDaemon(c, true, true)
  584. d3.getService(c, id)
  585. d3.Stop()
  586. d3.Start()
  587. d3.getService(c, id)
  588. d3.Kill()
  589. time.Sleep(1 * time.Second) // time to handle signal
  590. d3.Start()
  591. d3.getService(c, id)
  592. }
  593. func (s *DockerSwarmSuite) TestApiSwarmScaleNoRollingUpdate(c *check.C) {
  594. testRequires(c, Network)
  595. d := s.AddDaemon(c, true, true)
  596. instances := 2
  597. id := d.createService(c, simpleTestService, setInstances(instances))
  598. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  599. containers := d.activeContainers()
  600. instances = 4
  601. d.updateService(c, d.getService(c, id), setInstances(instances))
  602. waitAndAssert(c, defaultReconciliationTimeout, d.checkActiveContainerCount, checker.Equals, instances)
  603. containers2 := d.activeContainers()
  604. loop0:
  605. for _, c1 := range containers {
  606. for _, c2 := range containers2 {
  607. if c1 == c2 {
  608. continue loop0
  609. }
  610. }
  611. c.Errorf("container %v not found in new set %#v", c1, containers2)
  612. }
  613. }
  614. func (s *DockerSwarmSuite) TestApiSwarmInvalidAddress(c *check.C) {
  615. d := s.AddDaemon(c, false, false)
  616. req := swarm.InitRequest{
  617. ListenAddr: "",
  618. }
  619. status, _, err := d.SockRequest("POST", "/swarm/init", req)
  620. c.Assert(err, checker.IsNil)
  621. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  622. req2 := swarm.JoinRequest{
  623. ListenAddr: "0.0.0.0:2377",
  624. RemoteAddrs: []string{""},
  625. }
  626. status, _, err = d.SockRequest("POST", "/swarm/join", req2)
  627. c.Assert(err, checker.IsNil)
  628. c.Assert(status, checker.Equals, http.StatusInternalServerError)
  629. }
  630. func (s *DockerSwarmSuite) TestApiSwarmForceNewCluster(c *check.C) {
  631. d1 := s.AddDaemon(c, true, true)
  632. d2 := s.AddDaemon(c, true, true)
  633. instances := 2
  634. id := d1.createService(c, simpleTestService, setInstances(instances))
  635. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d2.checkActiveContainerCount), checker.Equals, instances)
  636. c.Assert(d2.Stop(), checker.IsNil)
  637. time.Sleep(5 * time.Second)
  638. c.Assert(d1.Init(swarm.InitRequest{
  639. ForceNewCluster: true,
  640. Spec: swarm.Spec{
  641. AcceptancePolicy: autoAcceptPolicy,
  642. },
  643. }), checker.IsNil)
  644. waitAndAssert(c, defaultReconciliationTimeout, d1.checkActiveContainerCount, checker.Equals, instances)
  645. d3 := s.AddDaemon(c, true, true)
  646. info, err := d3.info()
  647. c.Assert(err, checker.IsNil)
  648. c.Assert(info.ControlAvailable, checker.True)
  649. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  650. instances = 4
  651. d3.updateService(c, d3.getService(c, id), setInstances(instances))
  652. waitAndAssert(c, defaultReconciliationTimeout, reducedCheck(sumAsIntegers, d1.checkActiveContainerCount, d3.checkActiveContainerCount), checker.Equals, instances)
  653. }
  654. func simpleTestService(s *swarm.Service) {
  655. var ureplicas uint64
  656. ureplicas = 1
  657. s.Spec = swarm.ServiceSpec{
  658. TaskTemplate: swarm.TaskSpec{
  659. ContainerSpec: swarm.ContainerSpec{
  660. Image: "busybox:latest",
  661. Command: []string{"/bin/top"},
  662. },
  663. },
  664. Mode: swarm.ServiceMode{
  665. Replicated: &swarm.ReplicatedService{
  666. Replicas: &ureplicas,
  667. },
  668. },
  669. }
  670. s.Spec.Name = "top"
  671. }
  672. func setInstances(replicas int) serviceConstructor {
  673. ureplicas := uint64(replicas)
  674. return func(s *swarm.Service) {
  675. s.Spec.Mode = swarm.ServiceMode{
  676. Replicated: &swarm.ReplicatedService{
  677. Replicas: &ureplicas,
  678. },
  679. }
  680. }
  681. }
  682. func setGlobalMode(s *swarm.Service) {
  683. s.Spec.Mode = swarm.ServiceMode{
  684. Global: &swarm.GlobalService{},
  685. }
  686. }
  687. func checkClusterHealth(c *check.C, cl []*SwarmDaemon, managerCount, workerCount int) {
  688. var totalMCount, totalWCount int
  689. for _, d := range cl {
  690. info, err := d.info()
  691. c.Assert(err, check.IsNil)
  692. if !info.ControlAvailable {
  693. totalWCount++
  694. continue
  695. }
  696. var leaderFound bool
  697. totalMCount++
  698. var mCount, wCount int
  699. for _, n := range d.listNodes(c) {
  700. c.Assert(n.Status.State, checker.Equals, swarm.NodeStateReady, check.Commentf("state of node %s, reported by %s", n.ID, d.Info.NodeID))
  701. c.Assert(n.Spec.Availability, checker.Equals, swarm.NodeAvailabilityActive, check.Commentf("availability of node %s, reported by %s", n.ID, d.Info.NodeID))
  702. c.Assert(n.Spec.Membership, checker.Equals, swarm.NodeMembershipAccepted, check.Commentf("membership of node %s, reported by %s", n.ID, d.Info.NodeID))
  703. if n.Spec.Role == swarm.NodeRoleManager {
  704. c.Assert(n.ManagerStatus, checker.NotNil, check.Commentf("manager status of node %s (manager), reported by %s", n.ID, d.Info.NodeID))
  705. if n.ManagerStatus.Leader {
  706. leaderFound = true
  707. }
  708. mCount++
  709. } else {
  710. c.Assert(n.ManagerStatus, checker.IsNil, check.Commentf("manager status of node %s (worker), reported by %s", n.ID, d.Info.NodeID))
  711. wCount++
  712. }
  713. }
  714. c.Assert(leaderFound, checker.True, check.Commentf("lack of leader reported by node %s", info.NodeID))
  715. c.Assert(mCount, checker.Equals, managerCount, check.Commentf("managers count reported by node %s", info.NodeID))
  716. c.Assert(wCount, checker.Equals, workerCount, check.Commentf("workers count reported by node %s", info.NodeID))
  717. }
  718. c.Assert(totalMCount, checker.Equals, managerCount)
  719. c.Assert(totalWCount, checker.Equals, workerCount)
  720. }
  721. func (s *DockerSwarmSuite) TestApiSwarmRestartCluster(c *check.C) {
  722. mCount, wCount := 5, 1
  723. var nodes []*SwarmDaemon
  724. for i := 0; i < mCount; i++ {
  725. manager := s.AddDaemon(c, true, true)
  726. info, err := manager.info()
  727. c.Assert(err, checker.IsNil)
  728. c.Assert(info.ControlAvailable, checker.True)
  729. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  730. nodes = append(nodes, manager)
  731. }
  732. for i := 0; i < wCount; i++ {
  733. worker := s.AddDaemon(c, true, false)
  734. info, err := worker.info()
  735. c.Assert(err, checker.IsNil)
  736. c.Assert(info.ControlAvailable, checker.False)
  737. c.Assert(info.LocalNodeState, checker.Equals, swarm.LocalNodeStateActive)
  738. nodes = append(nodes, worker)
  739. }
  740. // stop whole cluster
  741. {
  742. var wg sync.WaitGroup
  743. wg.Add(len(nodes))
  744. errs := make(chan error, len(nodes))
  745. for _, d := range nodes {
  746. go func(daemon *SwarmDaemon) {
  747. defer wg.Done()
  748. if err := daemon.Stop(); err != nil {
  749. errs <- err
  750. }
  751. if root := os.Getenv("DOCKER_REMAP_ROOT"); root != "" {
  752. daemon.root = filepath.Dir(daemon.root)
  753. }
  754. }(d)
  755. }
  756. wg.Wait()
  757. close(errs)
  758. for err := range errs {
  759. c.Assert(err, check.IsNil)
  760. }
  761. }
  762. // start whole cluster
  763. {
  764. var wg sync.WaitGroup
  765. wg.Add(len(nodes))
  766. errs := make(chan error, len(nodes))
  767. for _, d := range nodes {
  768. go func(daemon *SwarmDaemon) {
  769. defer wg.Done()
  770. if err := daemon.Start("--iptables=false"); err != nil {
  771. errs <- err
  772. }
  773. }(d)
  774. }
  775. wg.Wait()
  776. close(errs)
  777. for err := range errs {
  778. c.Assert(err, check.IsNil)
  779. }
  780. }
  781. checkClusterHealth(c, nodes, mCount, wCount)
  782. }