benchstat/table.go - perf - Git at Google

 // Copyright 2017 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 package benchstat

 import (
 	"fmt"
 	"strings"

 	"golang.org/x/perf/internal/stats"
 )

 // A Table is a table for display in the benchstat output.
 // Tables builds one Table per unit in the collection and only returns
 // those that ended up with at least one row.
 type Table struct {
 	Metric      string   // metric name derived from the unit by metricOf
 	OldNewDelta bool     // is this an old-new-delta table?
 	Configs     []string // the collection's Configs (same slice, not a copy)
 	Groups      []string // the collection's Groups (same slice, not a copy)
 	Rows        []*Row   // rows of the table; addGeomean may append a "[Geo mean]" row last
 }

 // A Row is a table row for display in the benchstat output.
 // Tables creates one Row per benchmark within each group; addGeomean
 // creates a summary Row whose Benchmark is "[Geo mean]".
 type Row struct {
 	Benchmark string     // benchmark name
 	Group     string     // group name; Tables sets it only when there is more than one group
 	Scaler    Scaler     // formatter for stats means
 	Metrics   []*Metrics // columns of statistics, one per config (an empty Metrics where data is missing)
 	PctDelta  float64    // unformatted percent change; Tables leaves it 0 when it reports no change
 	Delta     string     // formatted percent change (e.g. "+1.23%"); Tables uses "~" when it reports no change
 	Note      string     // additional information
 	Change    int        // +1 better, -1 worse, 0 unchanged
 }

 // Tables returns tables comparing the benchmarks in the collection.
 //
 // One table is built per unit in c.Units, with one row per benchmark in
 // each group and one statistics column per config. Tables without any
 // rows are dropped. When the collection has exactly two configs the
 // table is an old-new-delta table: each row additionally carries the
 // result of the delta test (c.DeltaTest, or UTest when unset) judged
 // against the significance threshold c.Alpha (0.05 when unset), and
 // rows lacking a measurement for either config are omitted.
 func (c *Collection) Tables() []*Table {
 	// Fall back to the defaults when no test or threshold is configured.
 	test := c.DeltaTest
 	if test == nil {
 		test = UTest
 	}
 	threshold := c.Alpha
 	if threshold == 0 {
 		threshold = 0.05
 	}

 	// Refresh the statistics of every metric before they are read.
 	for _, m := range c.Metrics {
 		m.computeStats()
 	}

 	var (
 		result []*Table
 		key    Key
 	)
 	for _, unit := range c.Units {
 		key.Unit = unit
 		tbl := &Table{
 			Metric:      metricOf(unit),
 			OldNewDelta: len(c.Configs) == 2,
 			Configs:     c.Configs,
 			Groups:      c.Groups,
 		}

 		for _, group := range c.Groups {
 			key.Group = group
 			for _, bench := range c.Benchmarks[group] {
 				key.Benchmark = bench
 				row := &Row{Benchmark: bench}
 				if len(c.Groups) > 1 {
 					// Group headers are only shown when there are several groups.
 					row.Group = group
 				}

 				// One column per config; a missing measurement becomes an
 				// empty Metrics so that columns stay aligned.
 				for _, cfg := range c.Configs {
 					key.Config = cfg
 					if m := c.Metrics[key]; m != nil {
 						row.Metrics = append(row.Metrics, m)
 						if row.Scaler == nil {
 							// The first available column decides the row's scaling.
 							row.Scaler = NewScaler(m.Mean, m.Unit)
 						}
 					} else {
 						row.Metrics = append(row.Metrics, new(Metrics))
 					}
 				}

 				// With exactly two configs, compare them and record the delta.
 				if tbl.OldNewDelta {
 					oldKey, newKey := key, key
 					oldKey.Config = c.Configs[0]
 					newKey.Config = c.Configs[1]
 					before, after := c.Metrics[oldKey], c.Metrics[newKey]
 					// If one is missing, omit row entirely.
 					// TODO: Control this better.
 					if before == nil || after == nil {
 						continue
 					}

 					pval, testerr := test(before, after)
 					row.PctDelta = 0.00
 					row.Delta = "~"
 					switch {
 					case testerr == stats.ErrZeroVariance:
 						row.Note = "(zero variance)"
 					case testerr == stats.ErrSampleSize:
 						row.Note = "(too few samples)"
 					case testerr == stats.ErrSamplesEqual:
 						row.Note = "(all equal)"
 					case testerr != nil:
 						row.Note = fmt.Sprintf("(%s)", testerr)
 					case pval < threshold && after.Mean == before.Mean:
 						// Significant, yet the means are identical.
 						row.Delta = "0.00%"
 					case pval < threshold:
 						pct := ((after.Mean / before.Mean) - 1.0) * 100.0
 						row.PctDelta = pct
 						row.Delta = fmt.Sprintf("%+.2f%%", pct)
 						// Smaller is better, except for speeds.
 						row.Change = -1
 						if (pct < 0) == (tbl.Metric != "speed") {
 							row.Change = +1
 						}
 					}
 					// A pval of -1 suppresses the p-value note; presumably it is
 					// the delta test's "no test performed" marker (confirm
 					// against the DeltaTest implementations).
 					if row.Note == "" && pval != -1 {
 						row.Note = fmt.Sprintf("(p=%0.3f n=%d+%d)", pval, len(before.RValues), len(after.RValues))
 					}
 				}

 				tbl.Rows = append(tbl.Rows, row)
 			}
 		}

 		if len(tbl.Rows) == 0 {
 			continue
 		}
 		if c.Order != nil {
 			Sort(tbl, c.Order)
 		}
 		if c.AddGeoMean {
 			addGeomean(c, tbl, unit, tbl.OldNewDelta)
 		}
 		result = append(result, tbl)
 	}

 	return result
 }

 // metricSuffix maps a benchmark unit to the metric name used for it
 // in table output.
 var metricSuffix = map[string]string{
 	"ns/op": "time/op",
 	"ns/GC": "time/GC",
 	"B/op":  "alloc/op",
 	"MB/s":  "speed",
 }

 // metricOf returns the name of the metric with the given unit.
 //
 // A unit listed in metricSuffix maps directly to its metric name. A unit
 // of the form "<prefix>-<known unit>" keeps its prefix and has only the
 // trailing known unit translated (e.g. "user-ns/op" becomes
 // "user-time/op"). Any other unit is returned unchanged.
 func metricOf(unit string) string {
 	if name := metricSuffix[unit]; name != "" {
 		return name
 	}
 	for known, name := range metricSuffix {
 		tail := "-" + known
 		if !strings.HasSuffix(unit, tail) {
 			continue
 		}
 		// Drop the "-<known unit>" tail and re-attach the metric name.
 		return unit[:len(unit)-len(tail)] + "-" + name
 	}
 	return unit
 }

 // addGeomean adds a "geomean" row to the table,
 // showing the geometric mean of all the benchmarks.
 //
 // For every config in c.Configs it gathers the non-zero means recorded
 // for the given unit across all groups and benchmarks, and stores their
 // geometric mean as that config's column. If no config contributed more
 // than one benchmark, no row is added. When delta is true (Tables passes
 // the table's OldNewDelta flag) and every config produced a geomean, the
 // row also carries the percent change between the first two geomeans.
 func addGeomean(c *Collection, t *Table, unit string, delta bool) {
 	var (
 		perConfig []float64 // geomean of each config that had data
 		largest   int       // most benchmarks contributing to any one config
 	)
 	summary := &Row{Benchmark: "[Geo mean]"}
 	k := Key{Unit: unit}

 	for _, cfg := range c.Configs {
 		k.Config = cfg

 		var samples []float64
 		for _, grp := range c.Groups {
 			k.Group = grp
 			for _, bench := range c.Benchmarks[grp] {
 				k.Benchmark = bench
 				m := c.Metrics[k]
 				// Omit 0 values from the geomean calculation,
 				// as these either make the geomean undefined
 				// or zero (depending on who you ask). This
 				// typically comes up with things like
 				// allocation counts, where it's fine to just
 				// ignore the benchmark.
 				if m == nil || m.Mean == 0 {
 					continue
 				}
 				samples = append(samples, m.Mean)
 			}
 		}

 		if n := len(samples); n > largest {
 			largest = n
 		}
 		if len(samples) == 0 {
 			// Nothing to summarize for this config: keep the column
 			// but give up on reporting a delta.
 			summary.Metrics = append(summary.Metrics, new(Metrics))
 			delta = false
 			continue
 		}

 		gm := stats.GeoMean(samples)
 		perConfig = append(perConfig, gm)
 		if summary.Scaler == nil {
 			summary.Scaler = NewScaler(gm, unit)
 		}
 		summary.Metrics = append(summary.Metrics, &Metrics{
 			Unit: unit,
 			Mean: gm,
 		})
 	}

 	if largest <= 1 {
 		// Only one benchmark contributed to this geomean.
 		// Since the geomean is the same as the benchmark
 		// result, don't bother outputting it.
 		return
 	}
 	if delta {
 		pct := (perConfig[1]/perConfig[0] - 1.0) * 100.0
 		summary.PctDelta = pct
 		summary.Delta = fmt.Sprintf("%+.2f%%", pct)
 	}
 	t.Rows = append(t.Rows, summary)
 }
	// Copyright 2017 The Go Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style
	// license that can be found in the LICENSE file.

	package benchstat

	import (
	"fmt"
	"strings"

	"golang.org/x/perf/internal/stats"
	)

	// A Table is a table for display in the benchstat output.
	// Tables builds one Table per unit in the collection and only returns
	// those that ended up with at least one row.
	type Table struct {
	Metric string // metric name derived from the unit by metricOf
	OldNewDelta bool // is this an old-new-delta table?
	Configs []string // the collection's Configs (same slice, not a copy)
	Groups []string // the collection's Groups (same slice, not a copy)
	Rows []*Row // rows of the table; addGeomean may append a "[Geo mean]" row last
	}

	// A Row is a table row for display in the benchstat output.
	// Tables creates one Row per benchmark within each group; addGeomean
	// creates a summary Row whose Benchmark is "[Geo mean]".
	type Row struct {
	Benchmark string // benchmark name
	Group string // group name; Tables sets it only when there is more than one group
	Scaler Scaler // formatter for stats means
	Metrics []*Metrics // columns of statistics, one per config (an empty Metrics where data is missing)
	PctDelta float64 // unformatted percent change; Tables leaves it 0 when it reports no change
	Delta string // formatted percent change (e.g. "+1.23%"); Tables uses "~" when it reports no change
	Note string // additional information
	Change int // +1 better, -1 worse, 0 unchanged
	}

	// Tables returns tables comparing the benchmarks in the collection.
	func (c Collection) Tables() []Table {
	deltaTest := c.DeltaTest
	if deltaTest == nil {
	deltaTest = UTest
	}
	alpha := c.Alpha
	if alpha == 0 {
	alpha = 0.05
	}

	// Update statistics.
	for _, m := range c.Metrics {
	m.computeStats()
	}

	var tables []*Table
	key := Key{}
	for _, key.Unit = range c.Units {
	table := new(Table)
	table.Configs = c.Configs
	table.Groups = c.Groups
	table.Metric = metricOf(key.Unit)
	table.OldNewDelta = len(c.Configs) == 2
	for _, key.Group = range c.Groups {
	for _, key.Benchmark = range c.Benchmarks[key.Group] {
	row := &Row{Benchmark: key.Benchmark}
	if len(c.Groups) > 1 {
	// Show group headers if there is more than one group.
	row.Group = key.Group
	}

	for _, key.Config = range c.Configs {
	m := c.Metrics[key]
	if m == nil {
	row.Metrics = append(row.Metrics, new(Metrics))
	continue
	}
	row.Metrics = append(row.Metrics, m)
	if row.Scaler == nil {
	row.Scaler = NewScaler(m.Mean, m.Unit)
	}
	}

	// If there are only two configs being compared, add stats.
	if table.OldNewDelta {
	k0 := key
	k0.Config = c.Configs[0]
	k1 := key
	k1.Config = c.Configs[1]
	old := c.Metrics[k0]
	new := c.Metrics[k1]
	// If one is missing, omit row entirely.
	// TODO: Control this better.
	if old == nil \|\| new == nil {
	continue
	}
	pval, testerr := deltaTest(old, new)
	row.PctDelta = 0.00
	row.Delta = "~"
	if testerr == stats.ErrZeroVariance {
	row.Note = "(zero variance)"
	} else if testerr == stats.ErrSampleSize {
	row.Note = "(too few samples)"
	} else if testerr == stats.ErrSamplesEqual {
	row.Note = "(all equal)"
	} else if testerr != nil {
	row.Note = fmt.Sprintf("(%s)", testerr)
	} else if pval < alpha {
	if new.Mean == old.Mean {
	row.Delta = "0.00%"
	} else {
	pct := ((new.Mean / old.Mean) - 1.0) * 100.0
	row.PctDelta = pct
	row.Delta = fmt.Sprintf("%+.2f%%", pct)
	if pct < 0 == (table.Metric != "speed") { // smaller is better, except speeds
	row.Change = +1
	} else {
	row.Change = -1
	}
	}
	}
	if row.Note == "" && pval != -1 {
	row.Note = fmt.Sprintf("(p=%0.3f n=%d+%d)", pval, len(old.RValues), len(new.RValues))
	}
	}

	table.Rows = append(table.Rows, row)
	}
	}

	if len(table.Rows) > 0 {
	if c.Order != nil {
	Sort(table, c.Order)
	}
	if c.AddGeoMean {
	addGeomean(c, table, key.Unit, table.OldNewDelta)
	}
	tables = append(tables, table)
	}
	}

	return tables
	}

	// metricSuffix maps a benchmark unit to the metric name used for it
	// in table output.
	var metricSuffix = map[string]string{
		"ns/op": "time/op",
		"ns/GC": "time/GC",
		"B/op":  "alloc/op",
		"MB/s":  "speed",
	}

	// metricOf returns the name of the metric with the given unit.
	//
	// Units present in metricSuffix translate directly. A unit that ends in
	// "-" followed by a known unit keeps everything up to and including the
	// dash and has the known unit replaced by its metric name. All other
	// units are returned as they are.
	func metricOf(unit string) string {
		if direct := metricSuffix[unit]; direct != "" {
			return direct
		}
		for base, metric := range metricSuffix {
			if strings.HasSuffix(unit, "-"+base) {
				// Trimming only the known unit leaves the "<prefix>-" part in place.
				return strings.TrimSuffix(unit, base) + metric
			}
		}
		return unit
	}

	// addGeomean adds a "geomean" row to the table,
	// showing the geometric mean of all the benchmarks.
	//
	// For each config in c.Configs, the non-zero means recorded for unit
	// across every group and benchmark are combined into a geometric mean,
	// which becomes that config's column. No row is added when no config
	// had more than one contributing benchmark. When delta is true (Tables
	// passes the table's OldNewDelta flag) and every config yielded a
	// geomean, the row also reports the percent change between the first
	// two geomeans.
	//
	// t is a pointer so that the appended row is visible to the caller.
	func addGeomean(c *Collection, t *Table, unit string, delta bool) {
		row := &Row{Benchmark: "[Geo mean]"}
		key := Key{Unit: unit}
		var geomeans []float64
		maxCount := 0
		for _, key.Config = range c.Configs {
			var means []float64
			for _, key.Group = range c.Groups {
				for _, key.Benchmark = range c.Benchmarks[key.Group] {
					m := c.Metrics[key]
					// Omit 0 values from the geomean calculation,
					// as these either make the geomean undefined
					// or zero (depending on who you ask). This
					// typically comes up with things like
					// allocation counts, where it's fine to just
					// ignore the benchmark.
					if m != nil && m.Mean != 0 {
						means = append(means, m.Mean)
					}
				}
			}
			if len(means) > maxCount {
				maxCount = len(means)
			}
			if len(means) == 0 {
				// Keep the column, but a delta can no longer be reported.
				row.Metrics = append(row.Metrics, new(Metrics))
				delta = false
			} else {
				geomean := stats.GeoMean(means)
				geomeans = append(geomeans, geomean)
				if row.Scaler == nil {
					row.Scaler = NewScaler(geomean, unit)
				}
				row.Metrics = append(row.Metrics, &Metrics{
					Unit: unit,
					Mean: geomean,
				})
			}
		}
		if maxCount <= 1 {
			// Only one benchmark contributed to this geomean.
			// Since the geomean is the same as the benchmark
			// result, don't bother outputting it.
			return
		}
		if delta {
			pct := ((geomeans[1] / geomeans[0]) - 1.0) * 100.0
			row.PctDelta = pct
			row.Delta = fmt.Sprintf("%+.2f%%", pct)
		}
		t.Rows = append(t.Rows, row)
	}