8e5b17cf13
Signed-off-by: Mrunal Patel <mrunalp@gmail.com>
198 lines
5.5 KiB
Go
198 lines
5.5 KiB
Go
package stats
|
|
|
|
import (
|
|
"bytes"
|
|
"fmt"
|
|
"io"
|
|
"log"
|
|
"math"
|
|
"strconv"
|
|
"strings"
|
|
)
|
|
|
|
// Histogram accumulates values in the form of a histogram with
|
|
// exponentially increased bucket sizes.
|
|
type Histogram struct {
|
|
// Count is the total number of values added to the histogram.
|
|
Count int64
|
|
// Sum is the sum of all the values added to the histogram.
|
|
Sum int64
|
|
// SumOfSquares is the sum of squares of all values.
|
|
SumOfSquares int64
|
|
// Min is the minimum of all the values added to the histogram.
|
|
Min int64
|
|
// Max is the maximum of all the values added to the histogram.
|
|
Max int64
|
|
// Buckets contains all the buckets of the histogram.
|
|
Buckets []HistogramBucket
|
|
|
|
opts HistogramOptions
|
|
logBaseBucketSize float64
|
|
oneOverLogOnePlusGrowthFactor float64
|
|
}
|
|
|
|
// HistogramOptions contains the parameters that define the histogram's buckets.
|
|
// The first bucket of the created histogram (with index 0) contains [min, min+n)
|
|
// where n = BaseBucketSize, min = MinValue.
|
|
// Bucket i (i>=1) contains [min + n * m^(i-1), min + n * m^i), where m = 1+GrowthFactor.
|
|
// The type of the values is int64.
|
|
type HistogramOptions struct {
|
|
// NumBuckets is the number of buckets.
|
|
NumBuckets int
|
|
// GrowthFactor is the growth factor of the buckets. A value of 0.1
|
|
// indicates that bucket N+1 will be 10% larger than bucket N.
|
|
GrowthFactor float64
|
|
// BaseBucketSize is the size of the first bucket.
|
|
BaseBucketSize float64
|
|
// MinValue is the lower bound of the first bucket.
|
|
MinValue int64
|
|
}
|
|
|
|
// HistogramBucket represents one histogram bucket.
|
|
type HistogramBucket struct {
|
|
// LowBound is the lower bound of the bucket.
|
|
LowBound float64
|
|
// Count is the number of values in the bucket.
|
|
Count int64
|
|
}
|
|
|
|
// NewHistogram returns a pointer to a new Histogram object that was created
|
|
// with the provided options.
|
|
func NewHistogram(opts HistogramOptions) *Histogram {
|
|
if opts.NumBuckets == 0 {
|
|
opts.NumBuckets = 32
|
|
}
|
|
if opts.BaseBucketSize == 0.0 {
|
|
opts.BaseBucketSize = 1.0
|
|
}
|
|
h := Histogram{
|
|
Buckets: make([]HistogramBucket, opts.NumBuckets),
|
|
Min: math.MaxInt64,
|
|
Max: math.MinInt64,
|
|
|
|
opts: opts,
|
|
logBaseBucketSize: math.Log(opts.BaseBucketSize),
|
|
oneOverLogOnePlusGrowthFactor: 1 / math.Log(1+opts.GrowthFactor),
|
|
}
|
|
m := 1.0 + opts.GrowthFactor
|
|
delta := opts.BaseBucketSize
|
|
h.Buckets[0].LowBound = float64(opts.MinValue)
|
|
for i := 1; i < opts.NumBuckets; i++ {
|
|
h.Buckets[i].LowBound = float64(opts.MinValue) + delta
|
|
delta = delta * m
|
|
}
|
|
return &h
|
|
}
|
|
|
|
// Print writes textual output of the histogram values.
|
|
func (h *Histogram) Print(w io.Writer) {
|
|
avg := float64(h.Sum) / float64(h.Count)
|
|
fmt.Fprintf(w, "Count: %d Min: %d Max: %d Avg: %.2f\n", h.Count, h.Min, h.Max, avg)
|
|
fmt.Fprintf(w, "%s\n", strings.Repeat("-", 60))
|
|
if h.Count <= 0 {
|
|
return
|
|
}
|
|
|
|
maxBucketDigitLen := len(strconv.FormatFloat(h.Buckets[len(h.Buckets)-1].LowBound, 'f', 6, 64))
|
|
if maxBucketDigitLen < 3 {
|
|
// For "inf".
|
|
maxBucketDigitLen = 3
|
|
}
|
|
maxCountDigitLen := len(strconv.FormatInt(h.Count, 10))
|
|
percentMulti := 100 / float64(h.Count)
|
|
|
|
accCount := int64(0)
|
|
for i, b := range h.Buckets {
|
|
fmt.Fprintf(w, "[%*f, ", maxBucketDigitLen, b.LowBound)
|
|
if i+1 < len(h.Buckets) {
|
|
fmt.Fprintf(w, "%*f)", maxBucketDigitLen, h.Buckets[i+1].LowBound)
|
|
} else {
|
|
fmt.Fprintf(w, "%*s)", maxBucketDigitLen, "inf")
|
|
}
|
|
|
|
accCount += b.Count
|
|
fmt.Fprintf(w, " %*d %5.1f%% %5.1f%%", maxCountDigitLen, b.Count, float64(b.Count)*percentMulti, float64(accCount)*percentMulti)
|
|
|
|
const barScale = 0.1
|
|
barLength := int(float64(b.Count)*percentMulti*barScale + 0.5)
|
|
fmt.Fprintf(w, " %s\n", strings.Repeat("#", barLength))
|
|
}
|
|
}
|
|
|
|
// String returns the textual output of the histogram values as string.
|
|
func (h *Histogram) String() string {
|
|
var b bytes.Buffer
|
|
h.Print(&b)
|
|
return b.String()
|
|
}
|
|
|
|
// Clear resets all the content of histogram.
|
|
func (h *Histogram) Clear() {
|
|
h.Count = 0
|
|
h.Sum = 0
|
|
h.SumOfSquares = 0
|
|
h.Min = math.MaxInt64
|
|
h.Max = math.MinInt64
|
|
for i := range h.Buckets {
|
|
h.Buckets[i].Count = 0
|
|
}
|
|
}
|
|
|
|
// Opts returns a copy of the options used to create the Histogram.
|
|
func (h *Histogram) Opts() HistogramOptions {
|
|
return h.opts
|
|
}
|
|
|
|
// Add adds a value to the histogram.
|
|
func (h *Histogram) Add(value int64) error {
|
|
bucket, err := h.findBucket(value)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
h.Buckets[bucket].Count++
|
|
h.Count++
|
|
h.Sum += value
|
|
h.SumOfSquares += value * value
|
|
if value < h.Min {
|
|
h.Min = value
|
|
}
|
|
if value > h.Max {
|
|
h.Max = value
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func (h *Histogram) findBucket(value int64) (int, error) {
|
|
delta := float64(value - h.opts.MinValue)
|
|
var b int
|
|
if delta >= h.opts.BaseBucketSize {
|
|
// b = log_{1+growthFactor} (delta / baseBucketSize) + 1
|
|
// = log(delta / baseBucketSize) / log(1+growthFactor) + 1
|
|
// = (log(delta) - log(baseBucketSize)) * (1 / log(1+growthFactor)) + 1
|
|
b = int((math.Log(delta)-h.logBaseBucketSize)*h.oneOverLogOnePlusGrowthFactor + 1)
|
|
}
|
|
if b >= len(h.Buckets) {
|
|
return 0, fmt.Errorf("no bucket for value: %d", value)
|
|
}
|
|
return b, nil
|
|
}
|
|
|
|
// Merge takes another histogram h2, and merges its content into h.
|
|
// The two histograms must be created by equivalent HistogramOptions.
|
|
func (h *Histogram) Merge(h2 *Histogram) {
|
|
if h.opts != h2.opts {
|
|
log.Fatalf("failed to merge histograms, created by inequivalent options")
|
|
}
|
|
h.Count += h2.Count
|
|
h.Sum += h2.Sum
|
|
h.SumOfSquares += h2.SumOfSquares
|
|
if h2.Min < h.Min {
|
|
h.Min = h2.Min
|
|
}
|
|
if h2.Max > h.Max {
|
|
h.Max = h2.Max
|
|
}
|
|
for i, b := range h2.Buckets {
|
|
h.Buckets[i].Count += b.Count
|
|
}
|
|
}
|