541fda8e90
This package was moved to a separate repository, using the steps below: # install filter-repo (https://github.com/newren/git-filter-repo/blob/main/INSTALL.md) brew install git-filter-repo cd ~/projects # create a temporary clone of docker git clone https://github.com/docker/docker.git moby_pubsub_temp cd moby_pubsub_temp # for reference git rev-parse HEAD # -->572ca799db
# remove all code, except for pkg/pubsub, license, and notice, and rename pkg/pubsub to / git filter-repo --path pkg/pubsub/ --path LICENSE --path NOTICE --path-rename pkg/pubsub/: # remove canonical imports git revert -s -S 585ff0ebbe6bc25b801a0e0087dd5353099cb72e # initialize module go mod init github.com/moby/pubsub go mod tidy Signed-off-by: Sebastiaan van Stijn <github@gone.nl> (cherry picked from commit 0249afc523)
Signed-off-by: Sebastiaan van Stijn <github@gone.nl>
153 lines
4.1 KiB
Go
153 lines
4.1 KiB
Go
package stats // import "github.com/docker/docker/daemon/stats"
|
|
|
|
import (
|
|
"bufio"
|
|
"sync"
|
|
"time"
|
|
|
|
"github.com/docker/docker/api/types"
|
|
"github.com/docker/docker/container"
|
|
"github.com/docker/docker/errdefs"
|
|
"github.com/moby/pubsub"
|
|
"github.com/sirupsen/logrus"
|
|
)
|
|
|
|
// Collector manages and provides container resource stats
|
|
type Collector struct {
|
|
m sync.Mutex
|
|
cond *sync.Cond
|
|
supervisor supervisor
|
|
interval time.Duration
|
|
publishers map[*container.Container]*pubsub.Publisher
|
|
bufReader *bufio.Reader
|
|
}
|
|
|
|
// NewCollector creates a stats collector that will poll the supervisor with the specified interval
|
|
func NewCollector(supervisor supervisor, interval time.Duration) *Collector {
|
|
s := &Collector{
|
|
interval: interval,
|
|
supervisor: supervisor,
|
|
publishers: make(map[*container.Container]*pubsub.Publisher),
|
|
bufReader: bufio.NewReaderSize(nil, 128),
|
|
}
|
|
s.cond = sync.NewCond(&s.m)
|
|
return s
|
|
}
|
|
|
|
type supervisor interface {
|
|
// GetContainerStats collects all the stats related to a container
|
|
GetContainerStats(container *container.Container) (*types.StatsJSON, error)
|
|
}
|
|
|
|
// Collect registers the container with the collector and adds it to
|
|
// the event loop for collection on the specified interval returning
|
|
// a channel for the subscriber to receive on.
|
|
func (s *Collector) Collect(c *container.Container) chan interface{} {
|
|
s.cond.L.Lock()
|
|
defer s.cond.L.Unlock()
|
|
|
|
publisher, exists := s.publishers[c]
|
|
if !exists {
|
|
publisher = pubsub.NewPublisher(100*time.Millisecond, 1024)
|
|
s.publishers[c] = publisher
|
|
}
|
|
|
|
s.cond.Broadcast()
|
|
return publisher.Subscribe()
|
|
}
|
|
|
|
// StopCollection closes the channels for all subscribers and removes
|
|
// the container from metrics collection.
|
|
func (s *Collector) StopCollection(c *container.Container) {
|
|
s.m.Lock()
|
|
if publisher, exists := s.publishers[c]; exists {
|
|
publisher.Close()
|
|
delete(s.publishers, c)
|
|
}
|
|
s.m.Unlock()
|
|
}
|
|
|
|
// Unsubscribe removes a specific subscriber from receiving updates for a container's stats.
|
|
func (s *Collector) Unsubscribe(c *container.Container, ch chan interface{}) {
|
|
s.m.Lock()
|
|
publisher := s.publishers[c]
|
|
if publisher != nil {
|
|
publisher.Evict(ch)
|
|
if publisher.Len() == 0 {
|
|
delete(s.publishers, c)
|
|
}
|
|
}
|
|
s.m.Unlock()
|
|
}
|
|
|
|
// Run starts the collectors and will indefinitely collect stats from the supervisor
|
|
func (s *Collector) Run() {
|
|
type publishersPair struct {
|
|
container *container.Container
|
|
publisher *pubsub.Publisher
|
|
}
|
|
// we cannot determine the capacity here.
|
|
// it will grow enough in first iteration
|
|
var pairs []publishersPair
|
|
|
|
for {
|
|
s.cond.L.Lock()
|
|
for len(s.publishers) == 0 {
|
|
s.cond.Wait()
|
|
}
|
|
|
|
// it does not make sense in the first iteration,
|
|
// but saves allocations in further iterations
|
|
pairs = pairs[:0]
|
|
|
|
for container, publisher := range s.publishers {
|
|
// copy pointers here to release the lock ASAP
|
|
pairs = append(pairs, publishersPair{container, publisher})
|
|
}
|
|
|
|
s.cond.L.Unlock()
|
|
|
|
onlineCPUs, err := s.getNumberOnlineCPUs()
|
|
if err != nil {
|
|
logrus.Errorf("collecting system online cpu count: %v", err)
|
|
continue
|
|
}
|
|
|
|
for _, pair := range pairs {
|
|
stats, err := s.supervisor.GetContainerStats(pair.container)
|
|
|
|
switch err.(type) {
|
|
case nil:
|
|
// Sample system CPU usage close to container usage to avoid
|
|
// noise in metric calculations.
|
|
systemUsage, err := s.getSystemCPUUsage()
|
|
if err != nil {
|
|
logrus.WithError(err).WithField("container_id", pair.container.ID).Errorf("collecting system cpu usage")
|
|
continue
|
|
}
|
|
|
|
// FIXME: move to containerd on Linux (not Windows)
|
|
stats.CPUStats.SystemUsage = systemUsage
|
|
stats.CPUStats.OnlineCPUs = onlineCPUs
|
|
|
|
pair.publisher.Publish(*stats)
|
|
|
|
case errdefs.ErrConflict, errdefs.ErrNotFound:
|
|
// publish empty stats containing only name and ID if not running or not found
|
|
pair.publisher.Publish(types.StatsJSON{
|
|
Name: pair.container.Name,
|
|
ID: pair.container.ID,
|
|
})
|
|
|
|
default:
|
|
logrus.Errorf("collecting stats for %s: %v", pair.container.ID, err)
|
|
pair.publisher.Publish(types.StatsJSON{
|
|
Name: pair.container.Name,
|
|
ID: pair.container.ID,
|
|
})
|
|
}
|
|
}
|
|
|
|
time.Sleep(s.interval)
|
|
}
|
|
}
|