~linaro-toolchain-dev/cortex-strings/trunk

« back to all changes in this revision

Viewing changes to scripts/bench.py

Committer: Michael Hope
Date: 2011-09-08 03:27:40 UTC
Revision ID: michael.hope@linaro.org-20110908032740-l0rx3olleapcwk6f

Benchmark more sizes and alignments. Make the figures bigger to make the text smaller. Put the 'this' results first.

files added:
scripts/trim.sh

files modified:
scripts/bench.py

scripts/libplot.py

scripts/plot-align.py

scripts/plot-sizes.py

scripts/plot-top.py

Show diffs side-by-side

Legend: added

Legend: removed

scripts/bench.py

# NOTE(review): this text is a side-by-side diff with indentation stripped, so
# removed and added lines are interleaved. Where a name or key appears twice
# below, the pair is presumably "old line, then its replacement" -- confirm
# against the real scripts/bench.py before relying on either.

# Prefix to the executables

build = '../build/try-'

# Space-separated names of the routines shared by the variants listed in HAS.
# The two assignments differ only in the order of the names.
DEFAULTS = 'memchr memcpy memset strchr strcmp strcpy strlen'

DEFAULTS = 'memcpy memset memchr strchr strcmp strcpy strlen'

# Maps a variant name to the space-separated routines that variant provides.
# run_many() splits these strings to decide which routines to benchmark.
HAS = {

# 'this' additionally provides 'bounce'; the first entry lists it last and
# the second lists it first.
'this': DEFAULTS + ' bounce',

'this': 'bounce ' + DEFAULTS,

'bionic': DEFAULTS,

'glibc': DEFAULTS,

'newlib': DEFAULTS,

# 'csl' provides only two of the routines.
'csl': 'memcpy memset'

}

# Evaluates to ['this']; no use of ORDER is visible in this excerpt.
ORDER = 'this'.split()

# NOTE(review): this text is a side-by-side diff with indentation stripped, so
# removed and added lines are interleaved and nesting cannot be read off the
# page. The two signatures below are presumably the old one followed by its
# replacement (which adds `quiet`) -- confirm against the real file.
def run(cache, variant, function, bytes, loops, alignment=8):

def run(cache, variant, function, bytes, loops, alignment=8, quiet=False):

"""Perform a single run, exercising the cache as appropriate."""

# Cache key: the five run parameters rendered as strings and joined with ':'.
key = ':'.join('%s' % x for x in (variant, function, bytes, loops, alignment))

if key in cache:

# presumably the removed line (print the cached record) ...
print cache[key]

# ... and its replacement (reuse the cached record as `got`) -- confirm.
got = cache[key]

else:

# Copied into a local so the '%(xbuild)s' lookup in locals() below can find it.
xbuild = build

# Command line: executable <build><variant>, with the routine passed via -t,
# the byte count via -c, the loop count via -l and the alignment via -a.
cmd = '%(xbuild)s%(variant)s -t %(function)s -c %(bytes)s -l %(loops)s -a %(alignment)s' % locals()

try:

# Run the benchmark and keep its whitespace-stripped standard output.
got = subprocess.check_output(cmd.split()).strip()

cache[key] = got

print got

# An OSError raised while running the command is turned into an assertion
# failure whose message names the error and the command.
except OSError, ex:

assert False, 'Error %s while running %s' % (ex, cmd)

sys.stdout.flush()

# The record is colon-separated; field index 5 is parsed as a float and is the
# function's return value. Presumably the elapsed time of the run -- confirm
# against the benchmark executable's output format.
parts = got.split(':')

took = float(parts[5])

cache[key] = got

# With quiet set, the record is not echoed (run_many uses this for its
# tracer run).
if not quiet:

print got

sys.stdout.flush()

return took

# Runs the benchmark for each requested alignment, routine, variant and size.
# NOTE(review): this text is a side-by-side diff with indentation stripped.
# Two loop nests are interleaved below: one ordered variant -> function ->
# alignment and one ordered alignment -> function -> variant. Presumably the
# first is the removed code and the second its replacement -- confirm against
# the real scripts/bench.py.
def run_many(cache, variants, bytes, alignments):

for variant in variants:

functions = HAS[variant].split()

for function in functions:

for alignment in alignments:

# We want the data to come out in a useful order. So fix an

# alignment and function, and do all sizes for a variant first

bytes = sorted(bytes)

# Middle element of the sorted sizes; used below as the size of the tracer
# run. The print statements elsewhere in this file indicate Python 2, where
# `/` on two ints is integer division, so the index is an int.
mid = bytes[len(bytes)/2]

# Use the ordering in 'this' as the default

all_functions = HAS['this'].split()

# Find all other functions

# Append any routine provided by another variant that 'this' does not list,
# keeping the first-seen order.
for functions in HAS.values():

for function in functions.split():

if function not in all_functions:

all_functions.append(function)

for alignment in alignments:

for function in all_functions:

for variant in variants:

# Skip variants that do not provide this routine.
if function not in HAS[variant].split():

continue

# Run a tracer through and see how long it takes and

# adjust the number of loops based on that. Not great

# for memchr() and similar which are O(n), but it will

# do

# f is the loop-count numerator (loops = f / sqrt(size)); `want` is the
# target that the tracer's measured value is compared against.
f = 50000000

want = 5.0

# max(1, ...) keeps the divisor non-zero when the size is 0.
loops = int(f / math.sqrt(max(1, mid)))

took = run(cache, variant, function, mid, loops, alignment, quiet=True)

# Keep it reasonable for silly routines like bounce

# Scale f by want/took, with the factor clamped to the range [0.05, 20].
factor = min(20, max(0.05, want/took))

f = f * factor

# Round f to a few significant figures

# Truncates f to its two leading digits, e.g. 123456 becomes 120000.
scale = 10**int(math.log10(f) - 1)

f = scale*int(f/scale)

for b in sorted(bytes):

# Figure out the number of loops to give a roughly consistent run

# Two formulas for `loops` follow: a fixed numerator (50000000*5) and the
# tracer-adjusted numerator f. Presumably the old line and its replacement.
loops = int(50000000*5 / math.sqrt(b))

loops = int(f / math.sqrt(max(1, b)))

run(cache, variant, function, b, loops, alignment)

# Builds the lists of variants, sizes and alignments and hands them to
# run_many().
# NOTE(review): this text is a side-by-side diff with indentation stripped.
# `bytes` and `alignments` are each assigned more than once below because old
# and new lines are interleaved; which assignments survive in the committed
# file cannot be determined from this page -- confirm against the real file.
# NOTE(review): the bare integers 100..111 between the later statements look
# like line-number residue from the diff page rather than part of bench.py.
def run_top(cache):

# Every variant named in HAS, in sorted order.
variants = sorted(HAS.keys())

# One way of building the sizes: 128 plus the powers of two 2**0 .. 2**13.
bytes = set([128])

bytes.update([2**x for x in range(0, 14)])

# bytes.extend([2**x - 1 for x in range(1, 14)])

# bytes.extend([int(1.3*x) for x in range(1, 45)])

alignments = [8, 16] #1, 2, 4, 8, 16, 32]

alignments = [16]

# Upper limit in bytes to test to

top = 512*1024

# Test all powers of 2

step1 = 2.0

# Test intermediate powers of 1.4

step2 = 1.4

100

101

# Figure out how many steps get us up to the top

102

# log(top)/log(step) is the exponent at which step**x reaches top; it is
# rounded to the nearest integer.
steps1 = int(round(math.log(top) / math.log(step1)))

103

steps2 = int(round(math.log(top) / math.log(step2)))

104

105

# The other way of building the sizes: truncated powers of each step, for
# exponents 0 through steps inclusive. The two lists are concatenated without
# de-duplication (both start with 1).
bytes = []

106

bytes.extend([int(step1**x) for x in range(0, steps1+1)])

107

bytes.extend([int(step2**x) for x in range(0, steps2+1)])

108

109

alignments = [8, 16, 4, 1, 2, 32]

110

111

run_many(cache, variants, bytes, alignments)

112

Older »