2014-07-22 02:41:39 -04:00
|
|
|
package stats
|
|
|
|
|
|
|
|
import (
|
2014-07-22 14:57:36 -04:00
|
|
|
"encoding/json"
|
2014-07-22 12:26:31 -04:00
|
|
|
"math"
|
2014-07-22 02:41:39 -04:00
|
|
|
"sort"
|
2014-07-22 12:42:56 -04:00
|
|
|
"sync/atomic"
|
2014-07-22 02:41:39 -04:00
|
|
|
)
|
|
|
|
|
2014-07-22 15:02:47 -04:00
|
|
|
// Percentile implements an efficient percentile calculation of
// arbitrary float64 samples.
//
// Instead of retaining every sample it keeps a sorted, fixed-capacity
// window of samples and tracks how many samples are counted as lying
// below that window.
type Percentile struct {
	// value holds the most recently published result; these bits are
	// really a float64. It is read and written with sync/atomic, so it
	// must remain the first field: on 32-bit platforms (386, ARM) only
	// the first word of an allocated struct is guaranteed to be 64-bit
	// aligned, and a misaligned 64-bit atomic access panics.
	value uint64

	// percentile is the requested rank, expressed as a fraction that is
	// multiplied by the sample count.
	percentile float64

	// samples is the total number of samples passed to AddSample.
	samples int64
	// offset is the number of samples counted as lying below values[0].
	offset int64

	// values is the sorted window of retained samples; its capacity is
	// the window size chosen at construction.
	values []float64
}
|
|
|
|
|
2014-07-22 23:13:59 -04:00
|
|
|
// NewPercentile returns a Percentile with a given threshold.
|
|
|
|
func NewPercentile(percentile float64) *Percentile {
|
|
|
|
return &Percentile{
|
|
|
|
percentile: percentile,
|
|
|
|
|
|
|
|
// 256 samples is fast, and accurate for most distributions.
|
|
|
|
values: make([]float64, 0, 256),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// NewPercentileWithWindow returns a Percentile with a given threshold
|
2014-07-22 15:02:47 -04:00
|
|
|
// and window size (accuracy).
|
2014-07-22 23:13:59 -04:00
|
|
|
func NewPercentileWithWindow(percentile float64, sampleWindow int) *Percentile {
|
2014-07-22 02:41:39 -04:00
|
|
|
return &Percentile{
|
|
|
|
percentile: percentile,
|
2014-07-22 12:47:17 -04:00
|
|
|
values: make([]float64, 0, sampleWindow),
|
2014-07-22 02:41:39 -04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-07-22 15:02:47 -04:00
|
|
|
// Value returns the current value at the stored percentile.
|
|
|
|
// It is thread-safe, and may be called concurrently with AddSample.
|
|
|
|
func (p *Percentile) Value() float64 {
|
|
|
|
bits := atomic.LoadUint64(&p.value)
|
|
|
|
return math.Float64frombits(bits)
|
|
|
|
}
|
|
|
|
|
|
|
|
// AddSample adds a single float64 sample to the data set.
|
|
|
|
// It is not thread-safe, and not be called concurrently.
|
2014-07-22 02:41:39 -04:00
|
|
|
func (p *Percentile) AddSample(sample float64) {
|
2014-07-22 12:26:31 -04:00
|
|
|
p.samples++
|
|
|
|
|
2014-07-22 23:00:12 -04:00
|
|
|
if len(p.values) == cap(p.values) {
|
2014-07-22 12:26:31 -04:00
|
|
|
target := float64(p.samples)*p.percentile - float64(cap(p.values))/2
|
|
|
|
offset := round(math.Max(target, 0))
|
|
|
|
|
|
|
|
if sample > p.values[0] {
|
|
|
|
if offset > p.offset {
|
|
|
|
idx := sort.SearchFloat64s(p.values[1:], sample)
|
|
|
|
copy(p.values, p.values[1:idx+1])
|
|
|
|
|
|
|
|
p.values[idx] = sample
|
|
|
|
p.offset++
|
|
|
|
} else if sample < p.values[len(p.values)-1] {
|
|
|
|
idx := sort.SearchFloat64s(p.values, sample)
|
|
|
|
copy(p.values[idx+1:], p.values[idx:])
|
|
|
|
|
|
|
|
p.values[idx] = sample
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
if offset > p.offset {
|
|
|
|
p.offset++
|
|
|
|
} else {
|
|
|
|
copy(p.values[1:], p.values)
|
|
|
|
p.values[0] = sample
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
idx := sort.SearchFloat64s(p.values, sample)
|
|
|
|
p.values = p.values[:len(p.values)+1]
|
|
|
|
copy(p.values[idx+1:], p.values[idx:])
|
|
|
|
p.values[idx] = sample
|
|
|
|
}
|
2014-07-22 12:42:56 -04:00
|
|
|
|
2014-07-22 12:47:17 -04:00
|
|
|
bits := math.Float64bits(p.values[p.index()])
|
|
|
|
atomic.StoreUint64(&p.value, bits)
|
2014-07-22 02:41:39 -04:00
|
|
|
}
|
|
|
|
|
2014-07-22 12:26:31 -04:00
|
|
|
func (p *Percentile) index() int64 {
|
|
|
|
idx := round(float64(p.samples)*p.percentile - float64(p.offset))
|
|
|
|
last := int64(len(p.values)) - 1
|
|
|
|
|
|
|
|
if idx > last {
|
|
|
|
return last
|
|
|
|
}
|
|
|
|
|
|
|
|
return idx
|
2014-07-22 02:41:39 -04:00
|
|
|
}
|
|
|
|
|
2014-07-22 14:57:36 -04:00
|
|
|
func (p *Percentile) MarshalJSON() ([]byte, error) {
|
|
|
|
return json.Marshal(p.Value())
|
|
|
|
}
|
|
|
|
|
2014-07-22 02:41:39 -04:00
|
|
|
// round converts value to an int64 by moving it half a unit away from
// zero and truncating, so halfway cases round away from zero.
func round(value float64) int64 {
	half := 0.5
	if value < 0.0 {
		half = -half
	}
	return int64(value + half)
}
|