618be9ff68
* properly update the time structure within event to ensure it works in time-machine * move LIVE and TIMEMACHINE to pkg/types : less code needs to import leakybucket package, and we avoid duplicating constants
383 lines
12 KiB
Go
383 lines
12 KiB
Go
package leakybucket
|
|
|
|
import (
|
|
"fmt"
|
|
"sync"
|
|
"sync/atomic"
|
|
"time"
|
|
|
|
"github.com/crowdsecurity/crowdsec/pkg/time/rate"
|
|
"github.com/crowdsecurity/crowdsec/pkg/types"
|
|
"github.com/davecgh/go-spew/spew"
|
|
"github.com/mohae/deepcopy"
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
log "github.com/sirupsen/logrus"
|
|
"gopkg.in/tomb.v2"
|
|
)
|
|
|
|
// those constants are now defined in types/constants
|
|
// const (
|
|
// LIVE = iota
|
|
// TIMEMACHINE
|
|
// )
|
|
|
|
// Leaky represents one instance of a bucket
|
|
type Leaky struct {
|
|
Name string
|
|
Mode int //LIVE or TIMEMACHINE
|
|
//the limiter is what holds the proper "leaky aspect", it determines when/if we can pour objects
|
|
Limiter rate.RateLimiter `json:"-"`
|
|
SerializedState rate.Lstate
|
|
//Queue is used to held the cache of objects in the bucket, it is used to know 'how many' objects we have in buffer.
|
|
Queue *Queue
|
|
//Leaky buckets are receiving message through a chan
|
|
In chan *types.Event `json:"-"`
|
|
//Leaky buckets are pushing their overflows through a chan
|
|
Out chan *Queue `json:"-"`
|
|
// shared for all buckets (the idea is to kill this afterwards)
|
|
AllOut chan types.Event `json:"-"`
|
|
//max capacity (for burst)
|
|
Capacity int
|
|
//CacheRatio is the number of elements that should be kept in memory (compared to capacity)
|
|
CacheSize int
|
|
//the unique identifier of the bucket (a hash)
|
|
Mapkey string
|
|
// chan for signaling
|
|
Signal chan bool `json:"-"`
|
|
Suicide chan bool `json:"-"`
|
|
Reprocess bool
|
|
Simulated bool
|
|
Uuid string
|
|
First_ts time.Time
|
|
Last_ts time.Time
|
|
Ovflw_ts time.Time
|
|
Total_count int
|
|
Leakspeed time.Duration
|
|
BucketConfig *BucketFactory
|
|
Duration time.Duration
|
|
Pour func(*Leaky, types.Event) `json:"-"`
|
|
//Profiling when set to true enables profiling of bucket
|
|
Profiling bool
|
|
timedOverflow bool
|
|
conditionalOverflow bool
|
|
logger *log.Entry
|
|
scopeType types.ScopeType
|
|
hash string
|
|
scenarioVersion string
|
|
tomb *tomb.Tomb
|
|
wgPour *sync.WaitGroup
|
|
wgDumpState *sync.WaitGroup
|
|
mutex *sync.Mutex //used only for TIMEMACHINE mode to allow garbage collection without races
|
|
}
|
|
|
|
var BucketsPour = prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Name: "cs_bucket_poured_total",
|
|
Help: "Total events were poured in bucket.",
|
|
},
|
|
[]string{"source", "type", "name"},
|
|
)
|
|
|
|
var BucketsOverflow = prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Name: "cs_bucket_overflowed_total",
|
|
Help: "Total buckets overflowed.",
|
|
},
|
|
[]string{"name"},
|
|
)
|
|
|
|
var BucketsCanceled = prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Name: "cs_bucket_canceled_total",
|
|
Help: "Total buckets canceled.",
|
|
},
|
|
[]string{"name"},
|
|
)
|
|
|
|
var BucketsUnderflow = prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Name: "cs_bucket_underflowed_total",
|
|
Help: "Total buckets underflowed.",
|
|
},
|
|
[]string{"name"},
|
|
)
|
|
|
|
var BucketsInstantiation = prometheus.NewCounterVec(
|
|
prometheus.CounterOpts{
|
|
Name: "cs_bucket_created_total",
|
|
Help: "Total buckets were instantiated.",
|
|
},
|
|
[]string{"name"},
|
|
)
|
|
|
|
var BucketsCurrentCount = prometheus.NewGaugeVec(
|
|
prometheus.GaugeOpts{
|
|
Name: "cs_buckets",
|
|
Help: "Number of buckets that currently exist.",
|
|
},
|
|
[]string{"name"},
|
|
)
|
|
|
|
var LeakyRoutineCount int64
|
|
|
|
// Newleaky creates a new leaky bucket from a BucketFactory
|
|
// Events created by the bucket (overflow, bucket empty) are sent to a chan defined by BucketFactory
|
|
// The leaky bucket implementation is based on rate limiter (see https://godoc.org/golang.org/x/time/rate)
|
|
// There's a trick to have an event said when the bucket gets empty to allow its destruction
|
|
func NewLeaky(bucketFactory BucketFactory) *Leaky {
|
|
bucketFactory.logger.Tracef("Instantiating live bucket %s", bucketFactory.Name)
|
|
return FromFactory(bucketFactory)
|
|
}
|
|
|
|
func FromFactory(bucketFactory BucketFactory) *Leaky {
|
|
var limiter rate.RateLimiter
|
|
//golang rate limiter. It's mainly intended for http rate limiter
|
|
Qsize := bucketFactory.Capacity
|
|
if bucketFactory.CacheSize > 0 {
|
|
//cache is smaller than actual capacity
|
|
if bucketFactory.CacheSize <= bucketFactory.Capacity {
|
|
Qsize = bucketFactory.CacheSize
|
|
//bucket might be counter (infinite size), allow cache limitation
|
|
} else if bucketFactory.Capacity == -1 {
|
|
Qsize = bucketFactory.CacheSize
|
|
}
|
|
}
|
|
if bucketFactory.Capacity == -1 {
|
|
//In this case we allow all events to pass.
|
|
//maybe in the future we could avoid using a limiter
|
|
limiter = &rate.AlwaysFull{}
|
|
} else {
|
|
limiter = rate.NewLimiter(rate.Every(bucketFactory.leakspeed), bucketFactory.Capacity)
|
|
}
|
|
BucketsInstantiation.With(prometheus.Labels{"name": bucketFactory.Name}).Inc()
|
|
|
|
//create the leaky bucket per se
|
|
l := &Leaky{
|
|
Name: bucketFactory.Name,
|
|
Limiter: limiter,
|
|
Uuid: seed.Generate(),
|
|
Queue: NewQueue(Qsize),
|
|
CacheSize: bucketFactory.CacheSize,
|
|
Out: make(chan *Queue, 1),
|
|
Suicide: make(chan bool, 1),
|
|
AllOut: bucketFactory.ret,
|
|
Capacity: bucketFactory.Capacity,
|
|
Leakspeed: bucketFactory.leakspeed,
|
|
BucketConfig: &bucketFactory,
|
|
Pour: Pour,
|
|
Reprocess: bucketFactory.Reprocess,
|
|
Profiling: bucketFactory.Profiling,
|
|
Mode: types.LIVE,
|
|
scopeType: bucketFactory.ScopeType,
|
|
scenarioVersion: bucketFactory.ScenarioVersion,
|
|
hash: bucketFactory.hash,
|
|
Simulated: bucketFactory.Simulated,
|
|
tomb: bucketFactory.tomb,
|
|
wgPour: bucketFactory.wgPour,
|
|
wgDumpState: bucketFactory.wgDumpState,
|
|
mutex: &sync.Mutex{},
|
|
}
|
|
if l.BucketConfig.Capacity > 0 && l.BucketConfig.leakspeed != time.Duration(0) {
|
|
l.Duration = time.Duration(l.BucketConfig.Capacity+1) * l.BucketConfig.leakspeed
|
|
}
|
|
if l.BucketConfig.duration != time.Duration(0) {
|
|
l.Duration = l.BucketConfig.duration
|
|
l.timedOverflow = true
|
|
}
|
|
|
|
if l.BucketConfig.Type == "conditional" {
|
|
l.conditionalOverflow = true
|
|
l.Duration = l.BucketConfig.leakspeed
|
|
}
|
|
return l
|
|
}
|
|
|
|
/* for now mimic a leak routine */
|
|
//LeakRoutine us the life of a bucket. It dies when the bucket underflows or overflows
|
|
func LeakRoutine(leaky *Leaky) error {
|
|
|
|
var (
|
|
durationTickerChan = make(<-chan time.Time)
|
|
durationTicker *time.Ticker
|
|
firstEvent = true
|
|
)
|
|
|
|
defer types.CatchPanic(fmt.Sprintf("crowdsec/LeakRoutine/%s", leaky.Name))
|
|
|
|
BucketsCurrentCount.With(prometheus.Labels{"name": leaky.Name}).Inc()
|
|
defer BucketsCurrentCount.With(prometheus.Labels{"name": leaky.Name}).Dec()
|
|
|
|
/*todo : we create a logger at runtime while we want leakroutine to be up asap, might not be a good idea*/
|
|
leaky.logger = leaky.BucketConfig.logger.WithFields(log.Fields{"capacity": leaky.Capacity, "partition": leaky.Mapkey, "bucket_id": leaky.Uuid})
|
|
|
|
//We copy the processors, as they are coming from the BucketFactory, and thus are shared between buckets
|
|
//If we don't copy, processors using local cache (such as Uniq) are subject to race conditions
|
|
//This can lead to creating buckets that will discard their first events, preventing the underflow ticker from being initialized
|
|
//and preventing them from being destroyed
|
|
processors := deepcopy.Copy(leaky.BucketConfig.processors).([]Processor)
|
|
|
|
leaky.Signal <- true
|
|
atomic.AddInt64(&LeakyRoutineCount, 1)
|
|
defer atomic.AddInt64(&LeakyRoutineCount, -1)
|
|
|
|
for _, f := range processors {
|
|
err := f.OnBucketInit(leaky.BucketConfig)
|
|
if err != nil {
|
|
leaky.logger.Errorf("Problem at bucket initializiation. Bail out %T : %v", f, err)
|
|
close(leaky.Signal)
|
|
return fmt.Errorf("Problem at bucket initializiation. Bail out %T : %v", f, err)
|
|
}
|
|
}
|
|
|
|
leaky.logger.Debugf("Leaky routine starting, lifetime : %s", leaky.Duration)
|
|
for {
|
|
select {
|
|
/*receiving an event*/
|
|
case msg := <-leaky.In:
|
|
/*the msg var use is confusing and is redeclared in a different type :/*/
|
|
for _, processor := range processors {
|
|
msg = processor.OnBucketPour(leaky.BucketConfig)(*msg, leaky)
|
|
// if &msg == nil we stop processing
|
|
if msg == nil {
|
|
goto End
|
|
}
|
|
}
|
|
if leaky.logger.Level >= log.TraceLevel {
|
|
leaky.logger.Tracef("Pour event: %s", spew.Sdump(msg))
|
|
}
|
|
BucketsPour.With(prometheus.Labels{"name": leaky.Name, "source": msg.Line.Src, "type": msg.Line.Module}).Inc()
|
|
|
|
leaky.Pour(leaky, *msg) // glue for now
|
|
|
|
for _, processor := range processors {
|
|
msg = processor.AfterBucketPour(leaky.BucketConfig)(*msg, leaky)
|
|
if msg == nil {
|
|
goto End
|
|
}
|
|
}
|
|
|
|
//Clear cache on behalf of pour
|
|
|
|
// if durationTicker isn't initialized, then we're pouring our first event
|
|
|
|
// reinitialize the durationTicker when it's not a counter bucket
|
|
if !leaky.timedOverflow || firstEvent {
|
|
if firstEvent {
|
|
durationTicker = time.NewTicker(leaky.Duration)
|
|
durationTickerChan = durationTicker.C
|
|
defer durationTicker.Stop()
|
|
} else {
|
|
durationTicker.Reset(leaky.Duration)
|
|
}
|
|
}
|
|
firstEvent = false
|
|
/*we overflowed*/
|
|
case ofw := <-leaky.Out:
|
|
leaky.overflow(ofw)
|
|
return nil
|
|
/*suiciiiide*/
|
|
case <-leaky.Suicide:
|
|
close(leaky.Signal)
|
|
BucketsCanceled.With(prometheus.Labels{"name": leaky.Name}).Inc()
|
|
leaky.logger.Debugf("Suicide triggered")
|
|
leaky.AllOut <- types.Event{Type: types.OVFLW, Overflow: types.RuntimeAlert{Mapkey: leaky.Mapkey}}
|
|
leaky.logger.Tracef("Returning from leaky routine.")
|
|
return nil
|
|
/*we underflow or reach bucket deadline (timers)*/
|
|
case <-durationTickerChan:
|
|
var (
|
|
alert types.RuntimeAlert
|
|
err error
|
|
)
|
|
leaky.Ovflw_ts = time.Now().UTC()
|
|
close(leaky.Signal)
|
|
ofw := leaky.Queue
|
|
alert = types.RuntimeAlert{Mapkey: leaky.Mapkey}
|
|
|
|
if leaky.timedOverflow {
|
|
BucketsOverflow.With(prometheus.Labels{"name": leaky.Name}).Inc()
|
|
|
|
alert, err = NewAlert(leaky, ofw)
|
|
if err != nil {
|
|
log.Errorf("%s", err)
|
|
}
|
|
for _, f := range leaky.BucketConfig.processors {
|
|
alert, ofw = f.OnBucketOverflow(leaky.BucketConfig)(leaky, alert, ofw)
|
|
if ofw == nil {
|
|
leaky.logger.Debugf("Overflow has been discarded (%T)", f)
|
|
break
|
|
}
|
|
}
|
|
leaky.logger.Infof("Timed Overflow")
|
|
} else {
|
|
leaky.logger.Debugf("bucket underflow, destroy")
|
|
BucketsUnderflow.With(prometheus.Labels{"name": leaky.Name}).Inc()
|
|
|
|
}
|
|
if leaky.logger.Level >= log.TraceLevel {
|
|
/*don't sdump if it's not going to printed, it's expensive*/
|
|
leaky.logger.Tracef("Overflow event: %s", spew.Sdump(types.Event{Overflow: alert}))
|
|
}
|
|
|
|
leaky.AllOut <- types.Event{Overflow: alert, Type: types.OVFLW}
|
|
leaky.logger.Tracef("Returning from leaky routine.")
|
|
return nil
|
|
case <-leaky.tomb.Dying():
|
|
leaky.logger.Debugf("Bucket externally killed, return")
|
|
for len(leaky.Out) > 0 {
|
|
ofw := <-leaky.Out
|
|
leaky.overflow(ofw)
|
|
}
|
|
leaky.AllOut <- types.Event{Type: types.OVFLW, Overflow: types.RuntimeAlert{Mapkey: leaky.Mapkey}}
|
|
return nil
|
|
|
|
}
|
|
End:
|
|
}
|
|
}
|
|
|
|
func Pour(leaky *Leaky, msg types.Event) {
|
|
leaky.wgDumpState.Wait()
|
|
leaky.wgPour.Add(1)
|
|
defer leaky.wgPour.Done()
|
|
|
|
leaky.Total_count += 1
|
|
if leaky.First_ts.IsZero() {
|
|
leaky.First_ts = time.Now().UTC()
|
|
}
|
|
leaky.Last_ts = time.Now().UTC()
|
|
|
|
if leaky.Limiter.Allow() || leaky.conditionalOverflow {
|
|
leaky.Queue.Add(msg)
|
|
} else {
|
|
leaky.Ovflw_ts = time.Now().UTC()
|
|
leaky.logger.Debugf("Last event to be poured, bucket overflow.")
|
|
leaky.Queue.Add(msg)
|
|
leaky.Out <- leaky.Queue
|
|
}
|
|
}
|
|
|
|
func (leaky *Leaky) overflow(ofw *Queue) {
|
|
close(leaky.Signal)
|
|
alert, err := NewAlert(leaky, ofw)
|
|
if err != nil {
|
|
log.Errorf("%s", err)
|
|
}
|
|
leaky.logger.Tracef("Overflow hooks time : %v", leaky.BucketConfig.processors)
|
|
for _, f := range leaky.BucketConfig.processors {
|
|
alert, ofw = f.OnBucketOverflow(leaky.BucketConfig)(leaky, alert, ofw)
|
|
if ofw == nil {
|
|
leaky.logger.Debugf("Overflow has been discarded (%T)", f)
|
|
break
|
|
}
|
|
}
|
|
if leaky.logger.Level >= log.TraceLevel {
|
|
leaky.logger.Tracef("Overflow event: %s", spew.Sdump(alert))
|
|
}
|
|
mt, _ := leaky.Ovflw_ts.MarshalText()
|
|
leaky.logger.Tracef("overflow time : %s", mt)
|
|
|
|
BucketsOverflow.With(prometheus.Labels{"name": leaky.Name}).Inc()
|
|
|
|
leaky.AllOut <- types.Event{Overflow: alert, Type: types.OVFLW, MarshaledTime: string(mt)}
|
|
}
|