docker_cli_service_health_test.go 4.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137
  1. // +build !windows
  2. package main
  3. import (
  4. "strconv"
  5. "strings"
  6. "github.com/docker/docker/api/types/swarm"
  7. "github.com/docker/docker/daemon/cluster/executor/container"
  8. "github.com/docker/docker/integration-cli/checker"
  9. "github.com/docker/docker/integration-cli/cli"
  10. "github.com/docker/docker/integration-cli/cli/build"
  11. "github.com/go-check/check"
  12. "gotest.tools/assert"
  13. "gotest.tools/icmd"
  14. )
  15. // start a service, and then make its task unhealthy during running
  16. // finally, unhealthy task should be detected and killed
  17. func (s *DockerSwarmSuite) TestServiceHealthRun(c *check.C) {
  18. testRequires(c, DaemonIsLinux) // busybox doesn't work on Windows
  19. d := s.AddDaemon(c, true, true)
  20. // build image with health-check
  21. imageName := "testhealth"
  22. result := cli.BuildCmd(c, imageName, cli.Daemon(d),
  23. build.WithDockerfile(`FROM busybox
  24. RUN touch /status
  25. HEALTHCHECK --interval=1s --timeout=5s --retries=1\
  26. CMD cat /status`),
  27. )
  28. result.Assert(c, icmd.Success)
  29. serviceName := "healthServiceRun"
  30. out, err := d.Cmd("service", "create", "--no-resolve-image", "--detach=true", "--name", serviceName, imageName, "top")
  31. assert.NilError(c, err, out)
  32. id := strings.TrimSpace(out)
  33. var tasks []swarm.Task
  34. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  35. tasks = d.GetServiceTasks(c, id)
  36. return tasks, nil
  37. }, checker.HasLen, 1)
  38. task := tasks[0]
  39. // wait for task to start
  40. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  41. task = d.GetTask(c, task.ID)
  42. return task.Status.State, nil
  43. }, checker.Equals, swarm.TaskStateRunning)
  44. containerID := task.Status.ContainerStatus.ContainerID
  45. // wait for container to be healthy
  46. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  47. out, _ := d.Cmd("inspect", "--format={{.State.Health.Status}}", containerID)
  48. return strings.TrimSpace(out), nil
  49. }, checker.Equals, "healthy")
  50. // make it fail
  51. d.Cmd("exec", containerID, "rm", "/status")
  52. // wait for container to be unhealthy
  53. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  54. out, _ := d.Cmd("inspect", "--format={{.State.Health.Status}}", containerID)
  55. return strings.TrimSpace(out), nil
  56. }, checker.Equals, "unhealthy")
  57. // Task should be terminated
  58. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  59. task = d.GetTask(c, task.ID)
  60. return task.Status.State, nil
  61. }, checker.Equals, swarm.TaskStateFailed)
  62. if !strings.Contains(task.Status.Err, container.ErrContainerUnhealthy.Error()) {
  63. c.Fatal("unhealthy task exits because of other error")
  64. }
  65. }
  66. // start a service whose task is unhealthy at beginning
  67. // its tasks should be blocked in starting stage, until health check is passed
  68. func (s *DockerSwarmSuite) TestServiceHealthStart(c *check.C) {
  69. testRequires(c, DaemonIsLinux) // busybox doesn't work on Windows
  70. d := s.AddDaemon(c, true, true)
  71. // service started from this image won't pass health check
  72. imageName := "testhealth"
  73. result := cli.BuildCmd(c, imageName, cli.Daemon(d),
  74. build.WithDockerfile(`FROM busybox
  75. HEALTHCHECK --interval=1s --timeout=1s --retries=1024\
  76. CMD cat /status`),
  77. )
  78. result.Assert(c, icmd.Success)
  79. serviceName := "healthServiceStart"
  80. out, err := d.Cmd("service", "create", "--no-resolve-image", "--detach=true", "--name", serviceName, imageName, "top")
  81. assert.NilError(c, err, out)
  82. id := strings.TrimSpace(out)
  83. var tasks []swarm.Task
  84. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  85. tasks = d.GetServiceTasks(c, id)
  86. return tasks, nil
  87. }, checker.HasLen, 1)
  88. task := tasks[0]
  89. // wait for task to start
  90. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  91. task = d.GetTask(c, task.ID)
  92. return task.Status.State, nil
  93. }, checker.Equals, swarm.TaskStateStarting)
  94. containerID := task.Status.ContainerStatus.ContainerID
  95. // wait for health check to work
  96. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  97. out, _ := d.Cmd("inspect", "--format={{.State.Health.FailingStreak}}", containerID)
  98. failingStreak, _ := strconv.Atoi(strings.TrimSpace(out))
  99. return failingStreak, nil
  100. }, checker.GreaterThan, 0)
  101. // task should be blocked at starting status
  102. task = d.GetTask(c, task.ID)
  103. assert.Assert(c, task.Status.State, check.Equals, swarm.TaskStateStarting)
  104. // make it healthy
  105. d.Cmd("exec", containerID, "touch", "/status")
  106. // Task should be at running status
  107. waitAndAssert(c, defaultReconciliationTimeout, func(c *check.C) (interface{}, check.CommentInterface) {
  108. task = d.GetTask(c, task.ID)
  109. return task.Status.State, nil
  110. }, checker.Equals, swarm.TaskStateRunning)
  111. }