docker_cli_service_health_test.go 6.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191
  1. // +build !windows
  2. package main
  3. import (
  4. "strconv"
  5. "strings"
  6. "github.com/docker/docker/daemon/cluster/executor/container"
  7. "github.com/docker/docker/pkg/integration/checker"
  8. "github.com/docker/engine-api/types/swarm"
  9. "github.com/go-check/check"
  10. )
  11. // start a service, and then make its task unhealthy during running
  12. // finally, unhealthy task should be detected and killed
  13. func (s *DockerSwarmSuite) TestServiceHealthRun(c *check.C) {
  14. testRequires(c, DaemonIsLinux) // busybox doesn't work on Windows
  15. d := s.AddDaemon(c, true, true)
  16. // build image with health-check
  17. // note: use `daemon.buildImageWithOut` to build, do not use `buildImage` to build
  18. imageName := "testhealth"
  19. _, _, err := d.buildImageWithOut(imageName,
  20. `FROM busybox
  21. RUN touch /status
  22. HEALTHCHECK --interval=1s --timeout=1s --retries=1\
  23. CMD cat /status`,
  24. true)
  25. c.Check(err, check.IsNil)
  26. serviceName := "healthServiceRun"
  27. out, err := d.Cmd("service", "create", "--name", serviceName, imageName, "top")
  28. c.Assert(err, checker.IsNil, check.Commentf(out))
  29. id := strings.TrimSpace(out)
  30. var tasks []swarm.Task
  31. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  32. tasks = d.getServiceTasks(c, id)
  33. return tasks, nil
  34. }, checker.HasLen, 1)
  35. task := tasks[0]
  36. // wait for task to start
  37. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  38. task = d.getTask(c, task.ID)
  39. return task.Status.State, nil
  40. }, checker.Equals, swarm.TaskStateStarting)
  41. containerID := task.Status.ContainerStatus.ContainerID
  42. // wait for container to be healthy
  43. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  44. out, _ := d.Cmd("inspect", "--format={{.State.Health.Status}}", containerID)
  45. return strings.TrimSpace(out), nil
  46. }, checker.Equals, "healthy")
  47. // make it fail
  48. d.Cmd("exec", containerID, "rm", "/status")
  49. // wait for container to be unhealthy
  50. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  51. out, _ := d.Cmd("inspect", "--format={{.State.Health.Status}}", containerID)
  52. return strings.TrimSpace(out), nil
  53. }, checker.Equals, "unhealthy")
  54. // Task should be terminated
  55. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  56. task = d.getTask(c, task.ID)
  57. return task.Status.State, nil
  58. }, checker.Equals, swarm.TaskStateFailed)
  59. if !strings.Contains(task.Status.Err, container.ErrContainerUnhealthy.Error()) {
  60. c.Fatal("unhealthy task exits because of other error")
  61. }
  62. }
  63. // start a service whose task is unhealthy at beginning
  64. // its tasks should be blocked in starting stage, until health check is passed
  65. func (s *DockerSwarmSuite) TestServiceHealthStart(c *check.C) {
  66. testRequires(c, DaemonIsLinux) // busybox doesn't work on Windows
  67. d := s.AddDaemon(c, true, true)
  68. // service started from this image won't pass health check
  69. imageName := "testhealth"
  70. _, _, err := d.buildImageWithOut(imageName,
  71. `FROM busybox
  72. HEALTHCHECK --interval=1s --timeout=1s --retries=1024\
  73. CMD cat /status`,
  74. true)
  75. c.Check(err, check.IsNil)
  76. serviceName := "healthServiceStart"
  77. out, err := d.Cmd("service", "create", "--name", serviceName, imageName, "top")
  78. c.Assert(err, checker.IsNil, check.Commentf(out))
  79. id := strings.TrimSpace(out)
  80. var tasks []swarm.Task
  81. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  82. tasks = d.getServiceTasks(c, id)
  83. return tasks, nil
  84. }, checker.HasLen, 1)
  85. task := tasks[0]
  86. // wait for task to start
  87. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  88. task = d.getTask(c, task.ID)
  89. return task.Status.State, nil
  90. }, checker.Equals, swarm.TaskStateStarting)
  91. containerID := task.Status.ContainerStatus.ContainerID
  92. // wait for health check to work
  93. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  94. out, _ := d.Cmd("inspect", "--format={{.State.Health.FailingStreak}}", containerID)
  95. failingStreak, _ := strconv.Atoi(strings.TrimSpace(out))
  96. return failingStreak, nil
  97. }, checker.GreaterThan, 0)
  98. // task should be blocked at starting status
  99. task = d.getTask(c, task.ID)
  100. c.Assert(task.Status.State, check.Equals, swarm.TaskStateStarting)
  101. // make it healthy
  102. d.Cmd("exec", containerID, "touch", "/status")
  103. // Task should be at running status
  104. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  105. task = d.getTask(c, task.ID)
  106. return task.Status.State, nil
  107. }, checker.Equals, swarm.TaskStateRunning)
  108. }
  109. // start a service whose task is unhealthy at beginning
  110. // its tasks should be blocked in starting stage, until health check is passed
  111. func (s *DockerSwarmSuite) TestServiceHealthUpdate(c *check.C) {
  112. testRequires(c, DaemonIsLinux) // busybox doesn't work on Windows
  113. d := s.AddDaemon(c, true, true)
  114. // service started from this image won't pass health check
  115. imageName := "testhealth"
  116. _, _, err := d.buildImageWithOut(imageName,
  117. `FROM busybox
  118. HEALTHCHECK --interval=1s --timeout=1s --retries=1024\
  119. CMD cat /status`,
  120. true)
  121. c.Check(err, check.IsNil)
  122. serviceName := "healthServiceStart"
  123. out, err := d.Cmd("service", "create", "--name", serviceName, imageName, "top")
  124. c.Assert(err, checker.IsNil, check.Commentf(out))
  125. id := strings.TrimSpace(out)
  126. var tasks []swarm.Task
  127. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  128. tasks = d.getServiceTasks(c, id)
  129. return tasks, nil
  130. }, checker.HasLen, 1)
  131. task := tasks[0]
  132. // wait for task to start
  133. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  134. task = d.getTask(c, task.ID)
  135. return task.Status.State, nil
  136. }, checker.Equals, swarm.TaskStateStarting)
  137. containerID := task.Status.ContainerStatus.ContainerID
  138. // wait for health check to work
  139. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  140. out, _ := d.Cmd("inspect", "--format={{.State.Health.FailingStreak}}", containerID)
  141. failingStreak, _ := strconv.Atoi(strings.TrimSpace(out))
  142. return failingStreak, nil
  143. }, checker.GreaterThan, 0)
  144. // task should be blocked at starting status
  145. task = d.getTask(c, task.ID)
  146. c.Assert(task.Status.State, check.Equals, swarm.TaskStateStarting)
  147. // make it healthy
  148. d.Cmd("exec", containerID, "touch", "/status")
  149. // Task should be at running status
  150. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  151. task = d.getTask(c, task.ID)
  152. return task.Status.State, nil
  153. }, checker.Equals, swarm.TaskStateRunning)
  154. }