services.go 19 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597
  1. package cluster
  2. import (
  3. "encoding/base64"
  4. "encoding/json"
  5. "fmt"
  6. "io"
  7. "os"
  8. "strconv"
  9. "strings"
  10. "time"
  11. "github.com/docker/distribution/reference"
  12. apitypes "github.com/docker/docker/api/types"
  13. "github.com/docker/docker/api/types/backend"
  14. types "github.com/docker/docker/api/types/swarm"
  15. timetypes "github.com/docker/docker/api/types/time"
  16. "github.com/docker/docker/daemon/cluster/convert"
  17. runconfigopts "github.com/docker/docker/runconfig/opts"
  18. swarmapi "github.com/docker/swarmkit/api"
  19. gogotypes "github.com/gogo/protobuf/types"
  20. "github.com/pkg/errors"
  21. "github.com/sirupsen/logrus"
  22. "golang.org/x/net/context"
  23. )
  24. // GetServices returns all services of a managed swarm cluster.
  25. func (c *Cluster) GetServices(options apitypes.ServiceListOptions) ([]types.Service, error) {
  26. c.mu.RLock()
  27. defer c.mu.RUnlock()
  28. state := c.currentNodeState()
  29. if !state.IsActiveManager() {
  30. return nil, c.errNoManager(state)
  31. }
  32. // We move the accepted filter check here as "mode" filter
  33. // is processed in the daemon, not in SwarmKit. So it might
  34. // be good to have accepted file check in the same file as
  35. // the filter processing (in the for loop below).
  36. accepted := map[string]bool{
  37. "name": true,
  38. "id": true,
  39. "label": true,
  40. "mode": true,
  41. "runtime": true,
  42. }
  43. if err := options.Filters.Validate(accepted); err != nil {
  44. return nil, err
  45. }
  46. if len(options.Filters.Get("runtime")) == 0 {
  47. // Default to using the container runtime filter
  48. options.Filters.Add("runtime", string(types.RuntimeContainer))
  49. }
  50. filters := &swarmapi.ListServicesRequest_Filters{
  51. NamePrefixes: options.Filters.Get("name"),
  52. IDPrefixes: options.Filters.Get("id"),
  53. Labels: runconfigopts.ConvertKVStringsToMap(options.Filters.Get("label")),
  54. Runtimes: options.Filters.Get("runtime"),
  55. }
  56. ctx, cancel := c.getRequestContext()
  57. defer cancel()
  58. r, err := state.controlClient.ListServices(
  59. ctx,
  60. &swarmapi.ListServicesRequest{Filters: filters})
  61. if err != nil {
  62. return nil, err
  63. }
  64. services := make([]types.Service, 0, len(r.Services))
  65. for _, service := range r.Services {
  66. if options.Filters.Include("mode") {
  67. var mode string
  68. switch service.Spec.GetMode().(type) {
  69. case *swarmapi.ServiceSpec_Global:
  70. mode = "global"
  71. case *swarmapi.ServiceSpec_Replicated:
  72. mode = "replicated"
  73. }
  74. if !options.Filters.ExactMatch("mode", mode) {
  75. continue
  76. }
  77. }
  78. svcs, err := convert.ServiceFromGRPC(*service)
  79. if err != nil {
  80. return nil, err
  81. }
  82. services = append(services, svcs)
  83. }
  84. return services, nil
  85. }
  86. // GetService returns a service based on an ID or name.
  87. func (c *Cluster) GetService(input string, insertDefaults bool) (types.Service, error) {
  88. var service *swarmapi.Service
  89. if err := c.lockedManagerAction(func(ctx context.Context, state nodeState) error {
  90. s, err := getService(ctx, state.controlClient, input, insertDefaults)
  91. if err != nil {
  92. return err
  93. }
  94. service = s
  95. return nil
  96. }); err != nil {
  97. return types.Service{}, err
  98. }
  99. svc, err := convert.ServiceFromGRPC(*service)
  100. if err != nil {
  101. return types.Service{}, err
  102. }
  103. return svc, nil
  104. }
  105. // CreateService creates a new service in a managed swarm cluster.
  106. func (c *Cluster) CreateService(s types.ServiceSpec, encodedAuth string, queryRegistry bool) (*apitypes.ServiceCreateResponse, error) {
  107. var resp *apitypes.ServiceCreateResponse
  108. err := c.lockedManagerAction(func(ctx context.Context, state nodeState) error {
  109. err := c.populateNetworkID(ctx, state.controlClient, &s)
  110. if err != nil {
  111. return err
  112. }
  113. serviceSpec, err := convert.ServiceSpecToGRPC(s)
  114. if err != nil {
  115. return convertError{err}
  116. }
  117. resp = &apitypes.ServiceCreateResponse{}
  118. switch serviceSpec.Task.Runtime.(type) {
  119. // handle other runtimes here
  120. case *swarmapi.TaskSpec_Generic:
  121. switch serviceSpec.Task.GetGeneric().Kind {
  122. case string(types.RuntimePlugin):
  123. info, _ := c.config.Backend.SystemInfo()
  124. if !info.ExperimentalBuild {
  125. return fmt.Errorf("runtime type %q only supported in experimental", types.RuntimePlugin)
  126. }
  127. if s.TaskTemplate.PluginSpec == nil {
  128. return errors.New("plugin spec must be set")
  129. }
  130. default:
  131. return fmt.Errorf("unsupported runtime type: %q", serviceSpec.Task.GetGeneric().Kind)
  132. }
  133. r, err := state.controlClient.CreateService(ctx, &swarmapi.CreateServiceRequest{Spec: &serviceSpec})
  134. if err != nil {
  135. return err
  136. }
  137. resp.ID = r.Service.ID
  138. case *swarmapi.TaskSpec_Container:
  139. ctnr := serviceSpec.Task.GetContainer()
  140. if ctnr == nil {
  141. return errors.New("service does not use container tasks")
  142. }
  143. if encodedAuth != "" {
  144. ctnr.PullOptions = &swarmapi.ContainerSpec_PullOptions{RegistryAuth: encodedAuth}
  145. }
  146. // retrieve auth config from encoded auth
  147. authConfig := &apitypes.AuthConfig{}
  148. if encodedAuth != "" {
  149. authReader := strings.NewReader(encodedAuth)
  150. dec := json.NewDecoder(base64.NewDecoder(base64.URLEncoding, authReader))
  151. if err := dec.Decode(authConfig); err != nil {
  152. logrus.Warnf("invalid authconfig: %v", err)
  153. }
  154. }
  155. // pin image by digest for API versions < 1.30
  156. // TODO(nishanttotla): The check on "DOCKER_SERVICE_PREFER_OFFLINE_IMAGE"
  157. // should be removed in the future. Since integration tests only use the
  158. // latest API version, so this is no longer required.
  159. if os.Getenv("DOCKER_SERVICE_PREFER_OFFLINE_IMAGE") != "1" && queryRegistry {
  160. digestImage, err := c.imageWithDigestString(ctx, ctnr.Image, authConfig)
  161. if err != nil {
  162. logrus.Warnf("unable to pin image %s to digest: %s", ctnr.Image, err.Error())
  163. // warning in the client response should be concise
  164. resp.Warnings = append(resp.Warnings, digestWarning(ctnr.Image))
  165. } else if ctnr.Image != digestImage {
  166. logrus.Debugf("pinning image %s by digest: %s", ctnr.Image, digestImage)
  167. ctnr.Image = digestImage
  168. } else {
  169. logrus.Debugf("creating service using supplied digest reference %s", ctnr.Image)
  170. }
  171. // Replace the context with a fresh one.
  172. // If we timed out while communicating with the
  173. // registry, then "ctx" will already be expired, which
  174. // would cause UpdateService below to fail. Reusing
  175. // "ctx" could make it impossible to create a service
  176. // if the registry is slow or unresponsive.
  177. var cancel func()
  178. ctx, cancel = c.getRequestContext()
  179. defer cancel()
  180. }
  181. r, err := state.controlClient.CreateService(ctx, &swarmapi.CreateServiceRequest{Spec: &serviceSpec})
  182. if err != nil {
  183. return err
  184. }
  185. resp.ID = r.Service.ID
  186. }
  187. return nil
  188. })
  189. return resp, err
  190. }
  191. // UpdateService updates existing service to match new properties.
  192. func (c *Cluster) UpdateService(serviceIDOrName string, version uint64, spec types.ServiceSpec, flags apitypes.ServiceUpdateOptions, queryRegistry bool) (*apitypes.ServiceUpdateResponse, error) {
  193. var resp *apitypes.ServiceUpdateResponse
  194. err := c.lockedManagerAction(func(ctx context.Context, state nodeState) error {
  195. err := c.populateNetworkID(ctx, state.controlClient, &spec)
  196. if err != nil {
  197. return err
  198. }
  199. serviceSpec, err := convert.ServiceSpecToGRPC(spec)
  200. if err != nil {
  201. return convertError{err}
  202. }
  203. currentService, err := getService(ctx, state.controlClient, serviceIDOrName, false)
  204. if err != nil {
  205. return err
  206. }
  207. resp = &apitypes.ServiceUpdateResponse{}
  208. switch serviceSpec.Task.Runtime.(type) {
  209. case *swarmapi.TaskSpec_Generic:
  210. switch serviceSpec.Task.GetGeneric().Kind {
  211. case string(types.RuntimePlugin):
  212. if spec.TaskTemplate.PluginSpec == nil {
  213. return errors.New("plugin spec must be set")
  214. }
  215. }
  216. case *swarmapi.TaskSpec_Container:
  217. newCtnr := serviceSpec.Task.GetContainer()
  218. if newCtnr == nil {
  219. return errors.New("service does not use container tasks")
  220. }
  221. encodedAuth := flags.EncodedRegistryAuth
  222. if encodedAuth != "" {
  223. newCtnr.PullOptions = &swarmapi.ContainerSpec_PullOptions{RegistryAuth: encodedAuth}
  224. } else {
  225. // this is needed because if the encodedAuth isn't being updated then we
  226. // shouldn't lose it, and continue to use the one that was already present
  227. var ctnr *swarmapi.ContainerSpec
  228. switch flags.RegistryAuthFrom {
  229. case apitypes.RegistryAuthFromSpec, "":
  230. ctnr = currentService.Spec.Task.GetContainer()
  231. case apitypes.RegistryAuthFromPreviousSpec:
  232. if currentService.PreviousSpec == nil {
  233. return errors.New("service does not have a previous spec")
  234. }
  235. ctnr = currentService.PreviousSpec.Task.GetContainer()
  236. default:
  237. return errors.New("unsupported registryAuthFrom value")
  238. }
  239. if ctnr == nil {
  240. return errors.New("service does not use container tasks")
  241. }
  242. newCtnr.PullOptions = ctnr.PullOptions
  243. // update encodedAuth so it can be used to pin image by digest
  244. if ctnr.PullOptions != nil {
  245. encodedAuth = ctnr.PullOptions.RegistryAuth
  246. }
  247. }
  248. // retrieve auth config from encoded auth
  249. authConfig := &apitypes.AuthConfig{}
  250. if encodedAuth != "" {
  251. if err := json.NewDecoder(base64.NewDecoder(base64.URLEncoding, strings.NewReader(encodedAuth))).Decode(authConfig); err != nil {
  252. logrus.Warnf("invalid authconfig: %v", err)
  253. }
  254. }
  255. // pin image by digest for API versions < 1.30
  256. // TODO(nishanttotla): The check on "DOCKER_SERVICE_PREFER_OFFLINE_IMAGE"
  257. // should be removed in the future. Since integration tests only use the
  258. // latest API version, so this is no longer required.
  259. if os.Getenv("DOCKER_SERVICE_PREFER_OFFLINE_IMAGE") != "1" && queryRegistry {
  260. digestImage, err := c.imageWithDigestString(ctx, newCtnr.Image, authConfig)
  261. if err != nil {
  262. logrus.Warnf("unable to pin image %s to digest: %s", newCtnr.Image, err.Error())
  263. // warning in the client response should be concise
  264. resp.Warnings = append(resp.Warnings, digestWarning(newCtnr.Image))
  265. } else if newCtnr.Image != digestImage {
  266. logrus.Debugf("pinning image %s by digest: %s", newCtnr.Image, digestImage)
  267. newCtnr.Image = digestImage
  268. } else {
  269. logrus.Debugf("updating service using supplied digest reference %s", newCtnr.Image)
  270. }
  271. // Replace the context with a fresh one.
  272. // If we timed out while communicating with the
  273. // registry, then "ctx" will already be expired, which
  274. // would cause UpdateService below to fail. Reusing
  275. // "ctx" could make it impossible to update a service
  276. // if the registry is slow or unresponsive.
  277. var cancel func()
  278. ctx, cancel = c.getRequestContext()
  279. defer cancel()
  280. }
  281. }
  282. var rollback swarmapi.UpdateServiceRequest_Rollback
  283. switch flags.Rollback {
  284. case "", "none":
  285. rollback = swarmapi.UpdateServiceRequest_NONE
  286. case "previous":
  287. rollback = swarmapi.UpdateServiceRequest_PREVIOUS
  288. default:
  289. return fmt.Errorf("unrecognized rollback option %s", flags.Rollback)
  290. }
  291. _, err = state.controlClient.UpdateService(
  292. ctx,
  293. &swarmapi.UpdateServiceRequest{
  294. ServiceID: currentService.ID,
  295. Spec: &serviceSpec,
  296. ServiceVersion: &swarmapi.Version{
  297. Index: version,
  298. },
  299. Rollback: rollback,
  300. },
  301. )
  302. return err
  303. })
  304. return resp, err
  305. }
  306. // RemoveService removes a service from a managed swarm cluster.
  307. func (c *Cluster) RemoveService(input string) error {
  308. return c.lockedManagerAction(func(ctx context.Context, state nodeState) error {
  309. service, err := getService(ctx, state.controlClient, input, false)
  310. if err != nil {
  311. return err
  312. }
  313. _, err = state.controlClient.RemoveService(ctx, &swarmapi.RemoveServiceRequest{ServiceID: service.ID})
  314. return err
  315. })
  316. }
  317. // ServiceLogs collects service logs and writes them back to `config.OutStream`
  318. func (c *Cluster) ServiceLogs(ctx context.Context, selector *backend.LogSelector, config *apitypes.ContainerLogsOptions) (<-chan *backend.LogMessage, error) {
  319. c.mu.RLock()
  320. defer c.mu.RUnlock()
  321. state := c.currentNodeState()
  322. if !state.IsActiveManager() {
  323. return nil, c.errNoManager(state)
  324. }
  325. swarmSelector, err := convertSelector(ctx, state.controlClient, selector)
  326. if err != nil {
  327. return nil, errors.Wrap(err, "error making log selector")
  328. }
  329. // set the streams we'll use
  330. stdStreams := []swarmapi.LogStream{}
  331. if config.ShowStdout {
  332. stdStreams = append(stdStreams, swarmapi.LogStreamStdout)
  333. }
  334. if config.ShowStderr {
  335. stdStreams = append(stdStreams, swarmapi.LogStreamStderr)
  336. }
  337. // Get tail value squared away - the number of previous log lines we look at
  338. var tail int64
  339. // in ContainerLogs, if the tail value is ANYTHING non-integer, we just set
  340. // it to -1 (all). i don't agree with that, but i also think no tail value
  341. // should be legitimate. if you don't pass tail, we assume you want "all"
  342. if config.Tail == "all" || config.Tail == "" {
  343. // tail of 0 means send all logs on the swarmkit side
  344. tail = 0
  345. } else {
  346. t, err := strconv.Atoi(config.Tail)
  347. if err != nil {
  348. return nil, errors.New("tail value must be a positive integer or \"all\"")
  349. }
  350. if t < 0 {
  351. return nil, errors.New("negative tail values not supported")
  352. }
  353. // we actually use negative tail in swarmkit to represent messages
  354. // backwards starting from the beginning. also, -1 means no logs. so,
  355. // basically, for api compat with docker container logs, add one and
  356. // flip the sign. we error above if you try to negative tail, which
  357. // isn't supported by docker (and would error deeper in the stack
  358. // anyway)
  359. //
  360. // See the logs protobuf for more information
  361. tail = int64(-(t + 1))
  362. }
  363. // get the since value - the time in the past we're looking at logs starting from
  364. var sinceProto *gogotypes.Timestamp
  365. if config.Since != "" {
  366. s, n, err := timetypes.ParseTimestamps(config.Since, 0)
  367. if err != nil {
  368. return nil, errors.Wrap(err, "could not parse since timestamp")
  369. }
  370. since := time.Unix(s, n)
  371. sinceProto, err = gogotypes.TimestampProto(since)
  372. if err != nil {
  373. return nil, errors.Wrap(err, "could not parse timestamp to proto")
  374. }
  375. }
  376. stream, err := state.logsClient.SubscribeLogs(ctx, &swarmapi.SubscribeLogsRequest{
  377. Selector: swarmSelector,
  378. Options: &swarmapi.LogSubscriptionOptions{
  379. Follow: config.Follow,
  380. Streams: stdStreams,
  381. Tail: tail,
  382. Since: sinceProto,
  383. },
  384. })
  385. if err != nil {
  386. return nil, err
  387. }
  388. messageChan := make(chan *backend.LogMessage, 1)
  389. go func() {
  390. defer close(messageChan)
  391. for {
  392. // Check the context before doing anything.
  393. select {
  394. case <-ctx.Done():
  395. return
  396. default:
  397. }
  398. subscribeMsg, err := stream.Recv()
  399. if err == io.EOF {
  400. return
  401. }
  402. // if we're not io.EOF, push the message in and return
  403. if err != nil {
  404. select {
  405. case <-ctx.Done():
  406. case messageChan <- &backend.LogMessage{Err: err}:
  407. }
  408. return
  409. }
  410. for _, msg := range subscribeMsg.Messages {
  411. // make a new message
  412. m := new(backend.LogMessage)
  413. m.Attrs = make([]backend.LogAttr, 0, len(msg.Attrs)+3)
  414. // add the timestamp, adding the error if it fails
  415. m.Timestamp, err = gogotypes.TimestampFromProto(msg.Timestamp)
  416. if err != nil {
  417. m.Err = err
  418. }
  419. nodeKey := contextPrefix + ".node.id"
  420. serviceKey := contextPrefix + ".service.id"
  421. taskKey := contextPrefix + ".task.id"
  422. // copy over all of the details
  423. for _, d := range msg.Attrs {
  424. switch d.Key {
  425. case nodeKey, serviceKey, taskKey:
  426. // we have the final say over context details (in case there
  427. // is a conflict (if the user added a detail with a context's
  428. // key for some reason))
  429. default:
  430. m.Attrs = append(m.Attrs, backend.LogAttr{Key: d.Key, Value: d.Value})
  431. }
  432. }
  433. m.Attrs = append(m.Attrs,
  434. backend.LogAttr{Key: nodeKey, Value: msg.Context.NodeID},
  435. backend.LogAttr{Key: serviceKey, Value: msg.Context.ServiceID},
  436. backend.LogAttr{Key: taskKey, Value: msg.Context.TaskID},
  437. )
  438. switch msg.Stream {
  439. case swarmapi.LogStreamStdout:
  440. m.Source = "stdout"
  441. case swarmapi.LogStreamStderr:
  442. m.Source = "stderr"
  443. }
  444. m.Line = msg.Data
  445. // there could be a case where the reader stops accepting
  446. // messages and the context is canceled. we need to check that
  447. // here, or otherwise we risk blocking forever on the message
  448. // send.
  449. select {
  450. case <-ctx.Done():
  451. return
  452. case messageChan <- m:
  453. }
  454. }
  455. }
  456. }()
  457. return messageChan, nil
  458. }
  459. // convertSelector takes a backend.LogSelector, which contains raw names that
  460. // may or may not be valid, and converts them to an api.LogSelector proto. It
  461. // returns an error if something fails
  462. func convertSelector(ctx context.Context, cc swarmapi.ControlClient, selector *backend.LogSelector) (*swarmapi.LogSelector, error) {
  463. // don't rely on swarmkit to resolve IDs, do it ourselves
  464. swarmSelector := &swarmapi.LogSelector{}
  465. for _, s := range selector.Services {
  466. service, err := getService(ctx, cc, s, false)
  467. if err != nil {
  468. return nil, err
  469. }
  470. c := service.Spec.Task.GetContainer()
  471. if c == nil {
  472. return nil, errors.New("logs only supported on container tasks")
  473. }
  474. swarmSelector.ServiceIDs = append(swarmSelector.ServiceIDs, service.ID)
  475. }
  476. for _, t := range selector.Tasks {
  477. task, err := getTask(ctx, cc, t)
  478. if err != nil {
  479. return nil, err
  480. }
  481. c := task.Spec.GetContainer()
  482. if c == nil {
  483. return nil, errors.New("logs only supported on container tasks")
  484. }
  485. swarmSelector.TaskIDs = append(swarmSelector.TaskIDs, task.ID)
  486. }
  487. return swarmSelector, nil
  488. }
  489. // imageWithDigestString takes an image such as name or name:tag
  490. // and returns the image pinned to a digest, such as name@sha256:34234
  491. func (c *Cluster) imageWithDigestString(ctx context.Context, image string, authConfig *apitypes.AuthConfig) (string, error) {
  492. ref, err := reference.ParseAnyReference(image)
  493. if err != nil {
  494. return "", err
  495. }
  496. namedRef, ok := ref.(reference.Named)
  497. if !ok {
  498. if _, ok := ref.(reference.Digested); ok {
  499. return image, nil
  500. }
  501. return "", errors.Errorf("unknown image reference format: %s", image)
  502. }
  503. // only query registry if not a canonical reference (i.e. with digest)
  504. if _, ok := namedRef.(reference.Canonical); !ok {
  505. namedRef = reference.TagNameOnly(namedRef)
  506. taggedRef, ok := namedRef.(reference.NamedTagged)
  507. if !ok {
  508. return "", errors.Errorf("image reference not tagged: %s", image)
  509. }
  510. repo, _, err := c.config.Backend.GetRepository(ctx, taggedRef, authConfig)
  511. if err != nil {
  512. return "", err
  513. }
  514. dscrptr, err := repo.Tags(ctx).Get(ctx, taggedRef.Tag())
  515. if err != nil {
  516. return "", err
  517. }
  518. namedDigestedRef, err := reference.WithDigest(taggedRef, dscrptr.Digest)
  519. if err != nil {
  520. return "", err
  521. }
  522. // return familiar form until interface updated to return type
  523. return reference.FamiliarString(namedDigestedRef), nil
  524. }
  525. // reference already contains a digest, so just return it
  526. return reference.FamiliarString(ref), nil
  527. }
  528. // digestWarning constructs a formatted warning string
  529. // using the image name that could not be pinned by digest. The
  530. // formatting is hardcoded, but could me made smarter in the future
  531. func digestWarning(image string) string {
  532. return fmt.Sprintf("image %s could not be accessed on a registry to record\nits digest. Each node will access %s independently,\npossibly leading to different nodes running different\nversions of the image.\n", image, image)
  533. }