tracker/stats/percentile.go

113 lines
2.5 KiB
Go
Raw Normal View History

package stats
import (
2014-07-22 14:57:36 -04:00
"encoding/json"
2014-07-22 12:26:31 -04:00
"math"
"sort"
2014-07-22 12:42:56 -04:00
"sync/atomic"
)
2014-07-22 15:02:47 -04:00
// Percentile implements an efficient percentile calculation of
// arbitrary float64 samples.
//
// Rather than storing every sample, it keeps a bounded, sorted window of
// samples around the requested percentile and publishes the current
// estimate through an atomically accessed word, so readers never touch
// the window itself.
type Percentile struct {
	// value holds the bits of the most recent estimate; these bits are
	// really a float64. It is read and written only through sync/atomic.
	//
	// It must stay the first field: on 32-bit platforms sync/atomic only
	// guarantees 64-bit alignment for the first word of an allocated
	// struct, and a misaligned 64-bit atomic access panics there.
	value uint64

	// percentile is the threshold; it is multiplied by the sample count to
	// locate the estimate (presumably a fraction in [0, 1] -- TODO confirm
	// against callers).
	percentile float64

	// samples is the total number of samples passed to AddSample.
	samples int64

	// offset counts the low samples that have been discarded from below
	// the window; index subtracts it to map a global rank into values.
	offset int64

	// values is the sorted window of retained samples. Its capacity is the
	// window size chosen at construction time.
	values []float64
}
// NewPercentile builds a Percentile for the given threshold using the
// default sample window.
func NewPercentile(percentile float64) *Percentile {
	// 256 samples is fast, and accurate for most distributions.
	const defaultWindow = 256

	p := new(Percentile)
	p.percentile = percentile
	p.values = make([]float64, 0, defaultWindow)
	return p
}
// NewPercentileWithWindow returns a Percentile with a given threshold
2014-07-22 15:02:47 -04:00
// and window size (accuracy).
func NewPercentileWithWindow(percentile float64, sampleWindow int) *Percentile {
return &Percentile{
percentile: percentile,
2014-07-22 12:47:17 -04:00
values: make([]float64, 0, sampleWindow),
}
}
2014-07-22 15:02:47 -04:00
// Value reports the most recently published estimate for the stored
// percentile. The estimate is loaded atomically, so Value is thread-safe
// and may run concurrently with AddSample.
func (p *Percentile) Value() float64 {
	return math.Float64frombits(atomic.LoadUint64(&p.value))
}
// AddSample adds a single float64 sample to the data set.
// It is not thread-safe, and not be called concurrently.
func (p *Percentile) AddSample(sample float64) {
2014-07-22 12:26:31 -04:00
p.samples++
if len(p.values) == cap(p.values) {
2014-07-22 12:26:31 -04:00
target := float64(p.samples)*p.percentile - float64(cap(p.values))/2
offset := round(math.Max(target, 0))
if sample > p.values[0] {
if offset > p.offset {
idx := sort.SearchFloat64s(p.values[1:], sample)
copy(p.values, p.values[1:idx+1])
p.values[idx] = sample
p.offset++
} else if sample < p.values[len(p.values)-1] {
idx := sort.SearchFloat64s(p.values, sample)
copy(p.values[idx+1:], p.values[idx:])
p.values[idx] = sample
}
} else {
if offset > p.offset {
p.offset++
} else {
copy(p.values[1:], p.values)
p.values[0] = sample
}
}
} else {
idx := sort.SearchFloat64s(p.values, sample)
p.values = p.values[:len(p.values)+1]
copy(p.values[idx+1:], p.values[idx:])
p.values[idx] = sample
}
2014-07-22 12:42:56 -04:00
2014-07-22 12:47:17 -04:00
bits := math.Float64bits(p.values[p.index()])
atomic.StoreUint64(&p.value, bits)
}
2014-07-22 12:26:31 -04:00
// index returns the position inside values that corresponds to the
// stored percentile: the rounded global rank (samples * percentile) minus
// the number of discarded low samples, capped at the last valid position.
func (p *Percentile) index() int64 {
	upper := int64(len(p.values) - 1)
	rank := round(float64(p.samples)*p.percentile - float64(p.offset))
	if rank <= upper {
		return rank
	}
	return upper
}
2014-07-22 14:57:36 -04:00
// MarshalJSON implements json.Marshaler by encoding the current
// percentile estimate, as returned by Value, as a bare JSON number.
func (p *Percentile) MarshalJSON() ([]byte, error) {
	current := p.Value()
	return json.Marshal(current)
}
// round returns value rounded to the nearest integer, with halfway cases
// rounded away from zero.
//
// The value is split into its integral and fractional parts instead of
// adding 0.5 and truncating: that addition is itself rounded, which turns
// inputs just below one half (0.49999999999999994) into 1 and shifts odd
// integers at or above 2^52 by one.
func round(value float64) int64 {
	// Modf gives both parts the sign of value, and the fractional part is
	// exact, so the comparisons below cannot be fooled by rounding.
	whole, frac := math.Modf(value)
	switch {
	case frac >= 0.5:
		whole++
	case frac <= -0.5:
		whole--
	}
	return int64(whole)
}