mirror of
https://github.com/autc04/Retro68.git
synced 2024-12-01 11:52:47 +00:00
174 lines
4.6 KiB
Go
174 lines
4.6 KiB
Go
// Copyright 2009 The Go Authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style
|
|
// license that can be found in the LICENSE file.
|
|
|
|
// Calibration used to determine thresholds for using
|
|
// different algorithms. Ideally, this would be converted
|
|
// to go generate to create thresholds.go
|
|
|
|
// This file prints execution times for the Mul benchmark
|
|
// given different Karatsuba thresholds. The result may be
|
|
// used to manually fine-tune the threshold constant. The
|
|
// results are somewhat fragile; use repeated runs to get
|
|
// a clear picture.
|
|
|
|
// Calculates lower and upper thresholds for when basicSqr
|
|
// is faster than standard multiplication.
|
|
|
|
// Usage: go test -run=TestCalibrate -v -calibrate
|
|
|
|
package big
|
|
|
|
import (
|
|
"flag"
|
|
"fmt"
|
|
"testing"
|
|
"time"
|
|
)
|
|
|
|
var calibrate = flag.Bool("calibrate", false, "run calibration test")
|
|
|
|
const (
|
|
sqrModeMul = "mul(x, x)"
|
|
sqrModeBasic = "basicSqr(x)"
|
|
sqrModeKaratsuba = "karatsubaSqr(x)"
|
|
)
|
|
|
|
func TestCalibrate(t *testing.T) {
|
|
if !*calibrate {
|
|
return
|
|
}
|
|
|
|
computeKaratsubaThresholds()
|
|
|
|
// compute basicSqrThreshold where overhead becomes negligible
|
|
minSqr := computeSqrThreshold(10, 30, 1, 3, sqrModeMul, sqrModeBasic)
|
|
// compute karatsubaSqrThreshold where karatsuba is faster
|
|
maxSqr := computeSqrThreshold(200, 500, 10, 3, sqrModeBasic, sqrModeKaratsuba)
|
|
if minSqr != 0 {
|
|
fmt.Printf("found basicSqrThreshold = %d\n", minSqr)
|
|
} else {
|
|
fmt.Println("no basicSqrThreshold found")
|
|
}
|
|
if maxSqr != 0 {
|
|
fmt.Printf("found karatsubaSqrThreshold = %d\n", maxSqr)
|
|
} else {
|
|
fmt.Println("no karatsubaSqrThreshold found")
|
|
}
|
|
}
|
|
|
|
func karatsubaLoad(b *testing.B) {
|
|
BenchmarkMul(b)
|
|
}
|
|
|
|
// measureKaratsuba returns the time to run a Karatsuba-relevant benchmark
|
|
// given Karatsuba threshold th.
|
|
func measureKaratsuba(th int) time.Duration {
|
|
th, karatsubaThreshold = karatsubaThreshold, th
|
|
res := testing.Benchmark(karatsubaLoad)
|
|
karatsubaThreshold = th
|
|
return time.Duration(res.NsPerOp())
|
|
}
|
|
|
|
func computeKaratsubaThresholds() {
|
|
fmt.Printf("Multiplication times for varying Karatsuba thresholds\n")
|
|
fmt.Printf("(run repeatedly for good results)\n")
|
|
|
|
// determine Tk, the work load execution time using basic multiplication
|
|
Tb := measureKaratsuba(1e9) // th == 1e9 => Karatsuba multiplication disabled
|
|
fmt.Printf("Tb = %10s\n", Tb)
|
|
|
|
// thresholds
|
|
th := 4
|
|
th1 := -1
|
|
th2 := -1
|
|
|
|
var deltaOld time.Duration
|
|
for count := -1; count != 0 && th < 128; count-- {
|
|
// determine Tk, the work load execution time using Karatsuba multiplication
|
|
Tk := measureKaratsuba(th)
|
|
|
|
// improvement over Tb
|
|
delta := (Tb - Tk) * 100 / Tb
|
|
|
|
fmt.Printf("th = %3d Tk = %10s %4d%%", th, Tk, delta)
|
|
|
|
// determine break-even point
|
|
if Tk < Tb && th1 < 0 {
|
|
th1 = th
|
|
fmt.Print(" break-even point")
|
|
}
|
|
|
|
// determine diminishing return
|
|
if 0 < delta && delta < deltaOld && th2 < 0 {
|
|
th2 = th
|
|
fmt.Print(" diminishing return")
|
|
}
|
|
deltaOld = delta
|
|
|
|
fmt.Println()
|
|
|
|
// trigger counter
|
|
if th1 >= 0 && th2 >= 0 && count < 0 {
|
|
count = 10 // this many extra measurements after we got both thresholds
|
|
}
|
|
|
|
th++
|
|
}
|
|
}
|
|
|
|
func measureSqr(words, nruns int, mode string) time.Duration {
|
|
// more runs for better statistics
|
|
initBasicSqr, initKaratsubaSqr := basicSqrThreshold, karatsubaSqrThreshold
|
|
|
|
switch mode {
|
|
case sqrModeMul:
|
|
basicSqrThreshold = words + 1
|
|
case sqrModeBasic:
|
|
basicSqrThreshold, karatsubaSqrThreshold = words-1, words+1
|
|
case sqrModeKaratsuba:
|
|
karatsubaSqrThreshold = words - 1
|
|
}
|
|
|
|
var testval int64
|
|
for i := 0; i < nruns; i++ {
|
|
res := testing.Benchmark(func(b *testing.B) { benchmarkNatSqr(b, words) })
|
|
testval += res.NsPerOp()
|
|
}
|
|
testval /= int64(nruns)
|
|
|
|
basicSqrThreshold, karatsubaSqrThreshold = initBasicSqr, initKaratsubaSqr
|
|
|
|
return time.Duration(testval)
|
|
}
|
|
|
|
func computeSqrThreshold(from, to, step, nruns int, lower, upper string) int {
|
|
fmt.Printf("Calibrating threshold between %s and %s\n", lower, upper)
|
|
fmt.Printf("Looking for a timing difference for x between %d - %d words by %d step\n", from, to, step)
|
|
var initPos bool
|
|
var threshold int
|
|
for i := from; i <= to; i += step {
|
|
baseline := measureSqr(i, nruns, lower)
|
|
testval := measureSqr(i, nruns, upper)
|
|
pos := baseline > testval
|
|
delta := baseline - testval
|
|
percent := delta * 100 / baseline
|
|
fmt.Printf("words = %3d deltaT = %10s (%4d%%) is %s better: %v", i, delta, percent, upper, pos)
|
|
if i == from {
|
|
initPos = pos
|
|
}
|
|
if threshold == 0 && pos != initPos {
|
|
threshold = i
|
|
fmt.Printf(" threshold found")
|
|
}
|
|
fmt.Println()
|
|
|
|
}
|
|
if threshold != 0 {
|
|
fmt.Printf("Found threshold = %d between %d - %d\n", threshold, from, to)
|
|
} else {
|
|
fmt.Printf("Found NO threshold between %d - %d\n", from, to)
|
|
}
|
|
return threshold
|
|
}
|