service_windows.go 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387
  1. package main
  2. import (
  3. "bytes"
  4. "context"
  5. "errors"
  6. "fmt"
  7. "io"
  8. "os"
  9. "path/filepath"
  10. "time"
  11. "github.com/containerd/log"
  12. "github.com/spf13/pflag"
  13. "golang.org/x/sys/windows"
  14. "golang.org/x/sys/windows/svc"
  15. "golang.org/x/sys/windows/svc/debug"
  16. "golang.org/x/sys/windows/svc/eventlog"
  17. "golang.org/x/sys/windows/svc/mgr"
  18. )
var (
	// Command-line flag values; all four are populated by installServiceFlags.
	flServiceName       *string // --service-name: name used to create, open, run and log as the service
	flRegisterService   *bool   // --register-service: register the service and exit
	flUnregisterService *bool   // --unregister-service: unregister the service and exit
	flRunService        *bool   // --run-service: hidden flag that registerService puts first in the service's arguments

	// oldStderr is the STD_ERROR_HANDLE value saved by initPanicFile so that
	// removePanicFile can restore it.
	oldStderr windows.Handle
	// panicFile is the file opened by initPanicFile that stderr is redirected to.
	panicFile *os.File
	// service is the handler created by initService when running with --run-service.
	service *handler
)
const (
	// These should match the values in event_messages.mc.
	//
	// eventInfo, eventWarn and eventError share the same ID; Fire tells them
	// apart through the event type it passes to ReportEvent.
	eventInfo  = 1
	eventWarn  = 1
	eventError = 1
	eventDebug = 2
	eventPanic = 3
	eventFatal = 4

	// Fire adds this offset to the event ID whenever the log entry carries
	// data fields.
	eventExtraOffset = 10 // Add this to any event to get a string that supports extended data
)
  38. func installServiceFlags(flags *pflag.FlagSet) {
  39. flServiceName = flags.String("service-name", "docker", "Set the Windows service name")
  40. flRegisterService = flags.Bool("register-service", false, "Register the service and exit")
  41. flUnregisterService = flags.Bool("unregister-service", false, "Unregister the service and exit")
  42. flRunService = flags.Bool("run-service", false, "")
  43. _ = flags.MarkHidden("run-service")
  44. }
// handler connects the daemon to the Windows service control loop. Its
// Execute method is driven by svc.Run / debug.Run (see initService).
type handler struct {
	// tosvc carries a "failed" flag from the daemon to Execute: started sends
	// false, stopped sends true when it was given a non-nil error.
	tosvc chan bool
	// fromsvc carries results back from the service side: Execute sends nil to
	// unblock initService, and the goroutine started by initService sends the
	// result of svc.Run / debug.Run.
	fromsvc chan error
	// daemonCli is the daemon that is reloaded or stopped on service control
	// requests; its Config.Root is used to locate panic.log.
	daemonCli *DaemonCli
}
// etwHook is a logging hook that forwards log entries to the Windows event
// log via its Fire method.
//
// initService constructs it with a positional literal (&etwHook{eventLog}),
// so adding or reordering fields requires updating that literal.
type etwHook struct {
	// log is the event log to report to. When it is nil, Fire writes the
	// entry to os.Stderr instead.
	log *eventlog.Log
}
  53. func (h *etwHook) Levels() []log.Level {
  54. return []log.Level{
  55. log.PanicLevel,
  56. log.FatalLevel,
  57. log.ErrorLevel,
  58. log.WarnLevel,
  59. log.InfoLevel,
  60. log.DebugLevel,
  61. }
  62. }
  63. func (h *etwHook) Fire(e *log.Entry) error {
  64. var (
  65. etype uint16
  66. eid uint32
  67. )
  68. switch e.Level {
  69. case log.PanicLevel:
  70. etype = windows.EVENTLOG_ERROR_TYPE
  71. eid = eventPanic
  72. case log.FatalLevel:
  73. etype = windows.EVENTLOG_ERROR_TYPE
  74. eid = eventFatal
  75. case log.ErrorLevel:
  76. etype = windows.EVENTLOG_ERROR_TYPE
  77. eid = eventError
  78. case log.WarnLevel:
  79. etype = windows.EVENTLOG_WARNING_TYPE
  80. eid = eventWarn
  81. case log.InfoLevel:
  82. etype = windows.EVENTLOG_INFORMATION_TYPE
  83. eid = eventInfo
  84. case log.DebugLevel:
  85. etype = windows.EVENTLOG_INFORMATION_TYPE
  86. eid = eventDebug
  87. default:
  88. return errors.New("unknown level")
  89. }
  90. // If there is additional data, include it as a second string.
  91. exts := ""
  92. if len(e.Data) > 0 {
  93. fs := bytes.Buffer{}
  94. for k, v := range e.Data {
  95. fs.WriteString(k)
  96. fs.WriteByte('=')
  97. fmt.Fprint(&fs, v)
  98. fs.WriteByte(' ')
  99. }
  100. exts = fs.String()[:fs.Len()-1]
  101. eid += eventExtraOffset
  102. }
  103. if h.log == nil {
  104. fmt.Fprintf(os.Stderr, "%s [%s]\n", e.Message, exts)
  105. return nil
  106. }
  107. var (
  108. ss [2]*uint16
  109. err error
  110. )
  111. ss[0], err = windows.UTF16PtrFromString(e.Message)
  112. if err != nil {
  113. return err
  114. }
  115. count := uint16(1)
  116. if exts != "" {
  117. ss[1], err = windows.UTF16PtrFromString(exts)
  118. if err != nil {
  119. return err
  120. }
  121. count++
  122. }
  123. return windows.ReportEvent(h.log.Handle, etype, 0, eid, 0, count, 0, &ss[0], nil)
  124. }
  125. func registerService() error {
  126. p, err := os.Executable()
  127. if err != nil {
  128. return err
  129. }
  130. m, err := mgr.Connect()
  131. if err != nil {
  132. return err
  133. }
  134. defer m.Disconnect()
  135. c := mgr.Config{
  136. ServiceType: windows.SERVICE_WIN32_OWN_PROCESS,
  137. StartType: mgr.StartAutomatic,
  138. ErrorControl: mgr.ErrorNormal,
  139. Dependencies: []string{},
  140. DisplayName: "Docker Engine",
  141. }
  142. // Configure the service to launch with the arguments that were just passed.
  143. args := []string{"--run-service"}
  144. for _, a := range os.Args[1:] {
  145. if a != "--register-service" && a != "--unregister-service" {
  146. args = append(args, a)
  147. }
  148. }
  149. s, err := m.CreateService(*flServiceName, p, c, args...)
  150. if err != nil {
  151. return err
  152. }
  153. defer s.Close()
  154. err = s.SetRecoveryActions(
  155. []mgr.RecoveryAction{
  156. {Type: mgr.ServiceRestart, Delay: 15 * time.Second},
  157. {Type: mgr.ServiceRestart, Delay: 15 * time.Second},
  158. {Type: mgr.NoAction},
  159. },
  160. uint32(24*time.Hour/time.Second),
  161. )
  162. if err != nil {
  163. return err
  164. }
  165. return eventlog.Install(*flServiceName, p, false, eventlog.Info|eventlog.Warning|eventlog.Error)
  166. }
  167. func unregisterService() error {
  168. m, err := mgr.Connect()
  169. if err != nil {
  170. return err
  171. }
  172. defer m.Disconnect()
  173. s, err := m.OpenService(*flServiceName)
  174. if err != nil {
  175. return err
  176. }
  177. defer s.Close()
  178. eventlog.Remove(*flServiceName)
  179. err = s.Delete()
  180. if err != nil {
  181. return err
  182. }
  183. return nil
  184. }
  185. // initService is the entry point for running the daemon as a Windows
  186. // service. It returns an indication to stop (if registering/un-registering);
  187. // an indication of whether it is running as a service; and an error.
  188. func initService(daemonCli *DaemonCli) (bool, bool, error) {
  189. if *flUnregisterService {
  190. if *flRegisterService {
  191. return true, false, errors.New("--register-service and --unregister-service cannot be used together")
  192. }
  193. return true, false, unregisterService()
  194. }
  195. if *flRegisterService {
  196. return true, false, registerService()
  197. }
  198. if !*flRunService {
  199. return false, false, nil
  200. }
  201. // Check if we're running as a Windows service or interactively.
  202. isService, err := svc.IsWindowsService()
  203. if err != nil {
  204. return false, false, err
  205. }
  206. h := &handler{
  207. tosvc: make(chan bool),
  208. fromsvc: make(chan error),
  209. daemonCli: daemonCli,
  210. }
  211. var eventLog *eventlog.Log
  212. if isService {
  213. eventLog, err = eventlog.Open(*flServiceName)
  214. if err != nil {
  215. return false, false, err
  216. }
  217. }
  218. log.L.Logger.AddHook(&etwHook{eventLog})
  219. log.L.Logger.SetOutput(io.Discard)
  220. service = h
  221. go func() {
  222. if isService {
  223. err = svc.Run(*flServiceName, h)
  224. } else {
  225. err = debug.Run(*flServiceName, h)
  226. }
  227. h.fromsvc <- err
  228. }()
  229. // Wait for the first signal from the service handler.
  230. err = <-h.fromsvc
  231. if err != nil {
  232. return false, false, err
  233. }
  234. return false, true, nil
  235. }
  236. func (h *handler) started() error {
  237. // This must be delayed until daemonCli initializes Config.Root
  238. err := initPanicFile(filepath.Join(h.daemonCli.Config.Root, "panic.log"))
  239. if err != nil {
  240. return err
  241. }
  242. h.tosvc <- false
  243. return nil
  244. }
  245. func (h *handler) stopped(err error) {
  246. log.G(context.TODO()).Debugf("Stopping service: %v", err)
  247. h.tosvc <- err != nil
  248. <-h.fromsvc
  249. }
  250. func (h *handler) Execute(_ []string, r <-chan svc.ChangeRequest, s chan<- svc.Status) (bool, uint32) {
  251. s <- svc.Status{State: svc.StartPending, Accepts: 0}
  252. // Unblock initService()
  253. h.fromsvc <- nil
  254. // Wait for initialization to complete.
  255. failed := <-h.tosvc
  256. if failed {
  257. log.G(context.TODO()).Debug("Aborting service start due to failure during initialization")
  258. return true, 1
  259. }
  260. s <- svc.Status{State: svc.Running, Accepts: svc.AcceptStop | svc.AcceptShutdown | svc.Accepted(windows.SERVICE_ACCEPT_PARAMCHANGE)}
  261. log.G(context.TODO()).Debug("Service running")
  262. Loop:
  263. for {
  264. select {
  265. case failed = <-h.tosvc:
  266. break Loop
  267. case c := <-r:
  268. switch c.Cmd {
  269. case svc.Cmd(windows.SERVICE_CONTROL_PARAMCHANGE):
  270. h.daemonCli.reloadConfig()
  271. case svc.Interrogate:
  272. s <- c.CurrentStatus
  273. case svc.Stop, svc.Shutdown:
  274. s <- svc.Status{State: svc.StopPending, Accepts: 0}
  275. h.daemonCli.stop()
  276. }
  277. }
  278. }
  279. removePanicFile()
  280. if failed {
  281. return true, 1
  282. }
  283. return false, 0
  284. }
  285. func initPanicFile(path string) error {
  286. var err error
  287. panicFile, err = os.OpenFile(path, os.O_CREATE|os.O_WRONLY|os.O_APPEND, 0o200)
  288. if err != nil {
  289. return err
  290. }
  291. st, err := panicFile.Stat()
  292. if err != nil {
  293. return err
  294. }
  295. // If there are contents in the file already, move the file out of the way
  296. // and replace it.
  297. if st.Size() > 0 {
  298. panicFile.Close()
  299. os.Rename(path, path+".old")
  300. panicFile, err = os.Create(path)
  301. if err != nil {
  302. return err
  303. }
  304. }
  305. // Update STD_ERROR_HANDLE to point to the panic file so that Go writes to
  306. // it when it panics. Remember the old stderr to restore it before removing
  307. // the panic file.
  308. h, err := windows.GetStdHandle(windows.STD_ERROR_HANDLE)
  309. if err != nil {
  310. return err
  311. }
  312. oldStderr = h
  313. err = windows.SetStdHandle(windows.STD_ERROR_HANDLE, windows.Handle(panicFile.Fd()))
  314. if err != nil {
  315. return err
  316. }
  317. // Reset os.Stderr to the panic file (so fmt.Fprintf(os.Stderr,...) actually gets redirected)
  318. os.Stderr = os.NewFile(panicFile.Fd(), "/dev/stderr")
  319. // Force threads that panic to write to stderr (the panicFile handle now), otherwise it will go into the ether
  320. log.L.Logger.SetOutput(os.Stderr)
  321. return nil
  322. }
  323. func removePanicFile() {
  324. if st, err := panicFile.Stat(); err == nil {
  325. if st.Size() == 0 {
  326. windows.SetStdHandle(windows.STD_ERROR_HANDLE, oldStderr)
  327. panicFile.Close()
  328. os.Remove(panicFile.Name())
  329. }
  330. }
  331. }