cluster.go 9.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303
  1. package controlapi
  2. import (
  3. "context"
  4. "strings"
  5. "time"
  6. "github.com/docker/swarmkit/api"
  7. "github.com/docker/swarmkit/ca"
  8. "github.com/docker/swarmkit/log"
  9. "github.com/docker/swarmkit/manager/encryption"
  10. "github.com/docker/swarmkit/manager/state/store"
  11. gogotypes "github.com/gogo/protobuf/types"
  12. "google.golang.org/grpc/codes"
  13. "google.golang.org/grpc/status"
  14. )
  15. const (
  16. // expiredCertGrace is the amount of time to keep a node in the
  17. // blacklist beyond its certificate expiration timestamp.
  18. expiredCertGrace = 24 * time.Hour * 7
  19. // inbuilt default subnet size
  20. inbuiltSubnetSize = 24
  21. )
  22. var (
  23. // inbuilt default address pool
  24. inbuiltDefaultAddressPool = []string{"10.0.0.0/8"}
  25. )
  26. func validateClusterSpec(spec *api.ClusterSpec) error {
  27. if spec == nil {
  28. return status.Errorf(codes.InvalidArgument, errInvalidArgument.Error())
  29. }
  30. // Validate that expiry time being provided is valid, and over our minimum
  31. if spec.CAConfig.NodeCertExpiry != nil {
  32. expiry, err := gogotypes.DurationFromProto(spec.CAConfig.NodeCertExpiry)
  33. if err != nil {
  34. return status.Errorf(codes.InvalidArgument, errInvalidArgument.Error())
  35. }
  36. if expiry < ca.MinNodeCertExpiration {
  37. return status.Errorf(codes.InvalidArgument, "minimum certificate expiry time is: %s", ca.MinNodeCertExpiration)
  38. }
  39. }
  40. // Validate that AcceptancePolicies only include Secrets that are bcrypted
  41. // TODO(diogo): Add a global list of acceptance algorithms. We only support bcrypt for now.
  42. if len(spec.AcceptancePolicy.Policies) > 0 {
  43. for _, policy := range spec.AcceptancePolicy.Policies {
  44. if policy.Secret != nil && strings.ToLower(policy.Secret.Alg) != "bcrypt" {
  45. return status.Errorf(codes.InvalidArgument, "hashing algorithm is not supported: %s", policy.Secret.Alg)
  46. }
  47. }
  48. }
  49. // Validate that heartbeatPeriod time being provided is valid
  50. if spec.Dispatcher.HeartbeatPeriod != nil {
  51. heartbeatPeriod, err := gogotypes.DurationFromProto(spec.Dispatcher.HeartbeatPeriod)
  52. if err != nil {
  53. return status.Errorf(codes.InvalidArgument, errInvalidArgument.Error())
  54. }
  55. if heartbeatPeriod < 0 {
  56. return status.Errorf(codes.InvalidArgument, "heartbeat time period cannot be a negative duration")
  57. }
  58. }
  59. if spec.Annotations.Name != store.DefaultClusterName {
  60. return status.Errorf(codes.InvalidArgument, "modification of cluster name is not allowed")
  61. }
  62. return nil
  63. }
  64. // GetCluster returns a Cluster given a ClusterID.
  65. // - Returns `InvalidArgument` if ClusterID is not provided.
  66. // - Returns `NotFound` if the Cluster is not found.
  67. func (s *Server) GetCluster(ctx context.Context, request *api.GetClusterRequest) (*api.GetClusterResponse, error) {
  68. if request.ClusterID == "" {
  69. return nil, status.Errorf(codes.InvalidArgument, errInvalidArgument.Error())
  70. }
  71. var cluster *api.Cluster
  72. s.store.View(func(tx store.ReadTx) {
  73. cluster = store.GetCluster(tx, request.ClusterID)
  74. })
  75. if cluster == nil {
  76. return nil, status.Errorf(codes.NotFound, "cluster %s not found", request.ClusterID)
  77. }
  78. redactedClusters := redactClusters([]*api.Cluster{cluster})
  79. // WARN: we should never return cluster here. We need to redact the private fields first.
  80. return &api.GetClusterResponse{
  81. Cluster: redactedClusters[0],
  82. }, nil
  83. }
  84. // UpdateCluster updates a Cluster referenced by ClusterID with the given ClusterSpec.
  85. // - Returns `NotFound` if the Cluster is not found.
  86. // - Returns `InvalidArgument` if the ClusterSpec is malformed.
  87. // - Returns `Unimplemented` if the ClusterSpec references unimplemented features.
  88. // - Returns an error if the update fails.
  89. func (s *Server) UpdateCluster(ctx context.Context, request *api.UpdateClusterRequest) (*api.UpdateClusterResponse, error) {
  90. if request.ClusterID == "" || request.ClusterVersion == nil {
  91. return nil, status.Errorf(codes.InvalidArgument, errInvalidArgument.Error())
  92. }
  93. if err := validateClusterSpec(request.Spec); err != nil {
  94. return nil, err
  95. }
  96. var cluster *api.Cluster
  97. err := s.store.Update(func(tx store.Tx) error {
  98. cluster = store.GetCluster(tx, request.ClusterID)
  99. if cluster == nil {
  100. return status.Errorf(codes.NotFound, "cluster %s not found", request.ClusterID)
  101. }
  102. // This ensures that we have the current rootCA with which to generate tokens (expiration doesn't matter
  103. // for generating the tokens)
  104. rootCA, err := ca.RootCAFromAPI(ctx, &cluster.RootCA, ca.DefaultNodeCertExpiration)
  105. if err != nil {
  106. log.G(ctx).WithField(
  107. "method", "(*controlapi.Server).UpdateCluster").WithError(err).Error("invalid cluster root CA")
  108. return status.Errorf(codes.Internal, "error loading cluster rootCA for update")
  109. }
  110. cluster.Meta.Version = *request.ClusterVersion
  111. cluster.Spec = *request.Spec.Copy()
  112. expireBlacklistedCerts(cluster)
  113. if request.Rotation.WorkerJoinToken {
  114. cluster.RootCA.JoinTokens.Worker = ca.GenerateJoinToken(&rootCA, cluster.FIPS)
  115. }
  116. if request.Rotation.ManagerJoinToken {
  117. cluster.RootCA.JoinTokens.Manager = ca.GenerateJoinToken(&rootCA, cluster.FIPS)
  118. }
  119. updatedRootCA, err := validateCAConfig(ctx, s.securityConfig, cluster)
  120. if err != nil {
  121. return err
  122. }
  123. cluster.RootCA = *updatedRootCA
  124. var unlockKeys []*api.EncryptionKey
  125. var managerKey *api.EncryptionKey
  126. for _, eKey := range cluster.UnlockKeys {
  127. if eKey.Subsystem == ca.ManagerRole {
  128. if !cluster.Spec.EncryptionConfig.AutoLockManagers {
  129. continue
  130. }
  131. managerKey = eKey
  132. }
  133. unlockKeys = append(unlockKeys, eKey)
  134. }
  135. switch {
  136. case !cluster.Spec.EncryptionConfig.AutoLockManagers:
  137. break
  138. case managerKey == nil:
  139. unlockKeys = append(unlockKeys, &api.EncryptionKey{
  140. Subsystem: ca.ManagerRole,
  141. Key: encryption.GenerateSecretKey(),
  142. })
  143. case request.Rotation.ManagerUnlockKey:
  144. managerKey.Key = encryption.GenerateSecretKey()
  145. }
  146. cluster.UnlockKeys = unlockKeys
  147. return store.UpdateCluster(tx, cluster)
  148. })
  149. if err != nil {
  150. return nil, err
  151. }
  152. redactedClusters := redactClusters([]*api.Cluster{cluster})
  153. // WARN: we should never return cluster here. We need to redact the private fields first.
  154. return &api.UpdateClusterResponse{
  155. Cluster: redactedClusters[0],
  156. }, nil
  157. }
  158. func filterClusters(candidates []*api.Cluster, filters ...func(*api.Cluster) bool) []*api.Cluster {
  159. result := []*api.Cluster{}
  160. for _, c := range candidates {
  161. match := true
  162. for _, f := range filters {
  163. if !f(c) {
  164. match = false
  165. break
  166. }
  167. }
  168. if match {
  169. result = append(result, c)
  170. }
  171. }
  172. return result
  173. }
  174. // ListClusters returns a list of all clusters.
  175. func (s *Server) ListClusters(ctx context.Context, request *api.ListClustersRequest) (*api.ListClustersResponse, error) {
  176. var (
  177. clusters []*api.Cluster
  178. err error
  179. )
  180. s.store.View(func(tx store.ReadTx) {
  181. switch {
  182. case request.Filters != nil && len(request.Filters.Names) > 0:
  183. clusters, err = store.FindClusters(tx, buildFilters(store.ByName, request.Filters.Names))
  184. case request.Filters != nil && len(request.Filters.NamePrefixes) > 0:
  185. clusters, err = store.FindClusters(tx, buildFilters(store.ByNamePrefix, request.Filters.NamePrefixes))
  186. case request.Filters != nil && len(request.Filters.IDPrefixes) > 0:
  187. clusters, err = store.FindClusters(tx, buildFilters(store.ByIDPrefix, request.Filters.IDPrefixes))
  188. default:
  189. clusters, err = store.FindClusters(tx, store.All)
  190. }
  191. })
  192. if err != nil {
  193. return nil, err
  194. }
  195. if request.Filters != nil {
  196. clusters = filterClusters(clusters,
  197. func(e *api.Cluster) bool {
  198. return filterContains(e.Spec.Annotations.Name, request.Filters.Names)
  199. },
  200. func(e *api.Cluster) bool {
  201. return filterContainsPrefix(e.Spec.Annotations.Name, request.Filters.NamePrefixes)
  202. },
  203. func(e *api.Cluster) bool {
  204. return filterContainsPrefix(e.ID, request.Filters.IDPrefixes)
  205. },
  206. func(e *api.Cluster) bool {
  207. return filterMatchLabels(e.Spec.Annotations.Labels, request.Filters.Labels)
  208. },
  209. )
  210. }
  211. // WARN: we should never return cluster here. We need to redact the private fields first.
  212. return &api.ListClustersResponse{
  213. Clusters: redactClusters(clusters),
  214. }, nil
  215. }
  216. // redactClusters is a method that enforces a whitelist of fields that are ok to be
  217. // returned in the Cluster object. It should filter out all sensitive information.
  218. func redactClusters(clusters []*api.Cluster) []*api.Cluster {
  219. var redactedClusters []*api.Cluster
  220. // Only add public fields to the new clusters
  221. for _, cluster := range clusters {
  222. // Copy all the mandatory fields
  223. // Do not copy secret keys
  224. redactedSpec := cluster.Spec.Copy()
  225. redactedSpec.CAConfig.SigningCAKey = nil
  226. // the cert is not a secret, but if API users get the cluster spec and then update,
  227. // then because the cert is included but not the key, the user can get update errors
  228. // or unintended consequences (such as telling swarm to forget about the key so long
  229. // as there is a corresponding external CA)
  230. redactedSpec.CAConfig.SigningCACert = nil
  231. redactedRootCA := cluster.RootCA.Copy()
  232. redactedRootCA.CAKey = nil
  233. if r := redactedRootCA.RootRotation; r != nil {
  234. r.CAKey = nil
  235. }
  236. newCluster := &api.Cluster{
  237. ID: cluster.ID,
  238. Meta: cluster.Meta,
  239. Spec: *redactedSpec,
  240. RootCA: *redactedRootCA,
  241. BlacklistedCertificates: cluster.BlacklistedCertificates,
  242. DefaultAddressPool: cluster.DefaultAddressPool,
  243. SubnetSize: cluster.SubnetSize,
  244. }
  245. if newCluster.DefaultAddressPool == nil {
  246. // This is just for CLI display. Set the inbuilt default pool for
  247. // user reference.
  248. newCluster.DefaultAddressPool = inbuiltDefaultAddressPool
  249. newCluster.SubnetSize = inbuiltSubnetSize
  250. }
  251. redactedClusters = append(redactedClusters, newCluster)
  252. }
  253. return redactedClusters
  254. }
  255. func expireBlacklistedCerts(cluster *api.Cluster) {
  256. nowMinusGrace := time.Now().Add(-expiredCertGrace)
  257. for cn, blacklistedCert := range cluster.BlacklistedCertificates {
  258. if blacklistedCert.Expiry == nil {
  259. continue
  260. }
  261. expiry, err := gogotypes.TimestampFromProto(blacklistedCert.Expiry)
  262. if err == nil && nowMinusGrace.After(expiry) {
  263. delete(cluster.BlacklistedCertificates, cn)
  264. }
  265. }
  266. }