~linaro-toolchain-dev/cortex-strings/trunk

« back to all changes in this revision

Viewing changes to scripts/bench.py

Committer: Will Newton
Date: 2013-06-25 14:07:04 UTC
Revision ID: will.newton@linaro.org-20130625140704-jp1ad8y2p8d416qk

Support multiple runs of each benchmark.

files added:
.bzrignore

Makefile.am

README

autogen.sh

benchmarks

benchmarks/dhry

benchmarks/dhry/dhry.h

benchmarks/dhry/dhry_1.c

benchmarks/dhry/dhry_2.c

benchmarks/multi

benchmarks/multi/harness.c

configure.ac

reference/bionic-a15

reference/bionic-a15/memcmp.S

reference/bionic-a15/memcpy.S

reference/bionic-a15/memset.S

reference/bionic-a15/strcmp.S

reference/bionic-a15/strcpy.S

reference/bionic-a15/strlen.c

reference/bionic-a9

reference/bionic-a9/memcmp.S

reference/bionic-a9/memcpy.S

reference/bionic-a9/memset.S

reference/bionic-a9/strcmp.S

reference/bionic-a9/strcpy.S

reference/bionic-a9/strlen.c

reference/bionic-c

reference/bionic-c/bcopy.c

reference/bionic-c/memchr.c

reference/bionic-c/memcmp.c

reference/bionic-c/memcpy.c

reference/bionic-c/memset.c

reference/bionic-c/strchr.c

reference/bionic-c/strcmp.c

reference/bionic-c/strcpy.c

reference/bionic-c/strlen.c

reference/csl

reference/csl/arm_asm.h

reference/csl/memcpy.c

reference/csl/memset.c

reference/glibc-c

reference/glibc-c/bp-checks.h

reference/glibc-c/memchr.c

reference/glibc-c/memcmp.c

reference/glibc-c/memcopy.h

reference/glibc-c/memcpy.c

reference/glibc-c/memset.c

reference/glibc-c/pagecopy.h

reference/glibc-c/strchr.c

reference/glibc-c/strcmp.c

reference/glibc-c/strcpy.c

reference/glibc-c/strlen.c

reference/glibc-c/wordcopy.c

reference/newlib-c

reference/newlib-c/memchr.c

reference/newlib-c/memcmp.c

reference/newlib-c/memcpy.c

reference/newlib-c/memset.c

reference/newlib-c/shim.h

reference/newlib-c/strchr.c

reference/newlib-c/strcmp.c

reference/newlib-c/strcpy.c

reference/newlib-c/strlen.c

reference/newlib-xscale

reference/newlib-xscale/memchr.c

reference/newlib-xscale/memcpy.c

reference/newlib-xscale/memset.c

reference/newlib-xscale/strchr.c

reference/newlib-xscale/strcmp.c

reference/newlib-xscale/strcpy.c

reference/newlib-xscale/strlen.c

reference/newlib-xscale/xscale.h

reference/newlib/memcpy.S

reference/newlib/shim.h

reference/newlib/strcmp.S

reference/plain/memset.c

reference/plain/strcmp.c

reference/plain/strcpy.c

scripts

scripts/add-license.sh

scripts/bench.py

scripts/fixup.py

scripts/libplot.py

scripts/plot-align.py

scripts/plot-sizes.py

scripts/plot-top.py

scripts/plot.py

scripts/trim.sh

src/aarch64

src/aarch64/memcmp.S

src/aarch64/memcpy.S

src/aarch64/memmove.S

src/aarch64/memset.S

src/aarch64/strcmp.S

src/aarch64/strlen.S

src/aarch64/strncmp.S

src/aarch64/strnlen.S

src/linaro-a9

src/linaro-a9/memchr.S

src/linaro-a9/memcpy.S

src/linaro-a9/memset.S

src/linaro-a9/strchr.S

src/neon

src/thumb-2

src/thumb-2/strcpy.c

src/thumb-2/strlen.S

tests

tests/hp-timing.h

tests/test-memchr.c

tests/test-memcmp.c

tests/test-memcpy.c

tests/test-memmove.c

tests/test-memset.c

tests/test-skeleton.c

tests/test-strchr.c

tests/test-strcmp.c

tests/test-strcpy.c

tests/test-string.h

tests/test-strlen.c

tests/test-strncmp.c

tests/test-strnlen.c

files removed:
src/reference/Makefile.am

src/reference/bionic

src/reference/bionic/memcmp.S

src/reference/bionic/memcmp16.S

src/reference/bionic/memcpy.S

src/reference/bionic/memset.S

src/reference/bionic/strlen.c

src/reference/configure.ac

src/reference/glibc/memmove.S

src/reference/newlib/strcmp.c

src/reference/test.py

files renamed:
src/reference/ => reference/

files modified:
reference/glibc/memcpy.S

reference/glibc/memset.S

reference/glibc/strlen.S

reference/helpers/bounce.c

reference/helpers/spawn.c

reference/newlib/arm_asm.h

reference/newlib/strcpy.c

reference/newlib/strlen.c

reference/plain/memcpy.c

Show diffs side-by-side

added added

removed removed

scripts/bench.py

#!/usr/bin/env python

"""Simple harness that benchmarks different variants of the routines,

caches the results, and emits all of the records at the end.

Results are generated for different values of:

* Source

* Routine

* Length

* Alignment

"""

import subprocess

import math

import sys

# Common prefix of the benchmark executables; run() appends the variant
# name to it to form the program to execute.
build = '../build/try-'

# The full set of routines, as a space-separated string.
ALL = 'memchr memcmp memcpy memset strchr strcmp strcpy strlen'

# Variant name -> space-separated list of the routines it provides.
HAS = {
    'this': 'bounce memchr memcpy memset strchr strcpy strlen',
    'bionic-a9': 'memcmp memcpy memset strcmp strcpy strlen',
    'bionic-a15': 'memcmp memcpy memset strcmp strcpy strlen',
    'bionic-c': ALL,
    'csl': 'memcpy memset',
    'glibc': 'memcpy memset strlen',
    'glibc-c': ALL,
    'newlib': 'memcpy strcmp strcpy strlen',
    'newlib-c': ALL,
    'newlib-xscale': 'memchr memcpy memset strchr strcmp strcpy strlen',
    'plain': 'memset memcpy strcmp strcpy',
}

# Values passed to the executable's -a option.  Routines listed under the
# dual-buffer set use a pair written as 'first:second'.
BOUNCE_ALIGNMENTS = ['1']
SINGLE_BUFFER_ALIGNMENTS = ['1', '2', '4', '8', '16', '32']
DUAL_BUFFER_ALIGNMENTS = ['1:32', '2:32', '4:32', '8:32', '16:32', '32:32']

# Routine name -> list of alignments to benchmark it with.
ALIGNMENTS = {'bounce': BOUNCE_ALIGNMENTS}
ALIGNMENTS.update(dict.fromkeys(
    ('memchr', 'memset', 'strchr', 'strlen'), SINGLE_BUFFER_ALIGNMENTS))
ALIGNMENTS.update(dict.fromkeys(
    ('memcmp', 'memcpy', 'strcmp', 'strcpy'), DUAL_BUFFER_ALIGNMENTS))

# How many times each (variant, routine, size, alignment) point is measured.
NUM_RUNS = 5

def run(cache, variant, function, bytes, loops, alignment, run_id, quiet=False):
    """Perform a single run, exercising the cache as appropriate.

    The result is looked up in ``cache`` first; only on a miss is the
    benchmark executable for ``variant`` actually started.

    Args:
        cache: dict mapping a run key to the raw record line for that run.
            It is updated in place with the record used for this call.
        variant: name appended to the ``build`` prefix to find the executable.
        function: routine name, passed to the executable as ``-t``.
        bytes: block size, passed as ``-c``.
        loops: iteration count, passed as ``-l``.
        alignment: alignment specification, passed as ``-a``.
        run_id: identifier of this repetition, passed as ``-r``.
        quiet: when true, the record is not echoed to stdout.

    Returns:
        The eighth colon-separated field of the record as a float; callers
        treat it as the time the run took.

    Raises:
        RuntimeError: the executable could not be started.
        ValueError: the record has no parseable eighth field.
        subprocess.CalledProcessError: the executable exited with a
            non-zero status.
    """
    # NOTE(review): main() re-keys cached lines on their first seven
    # colon-separated fields, whereas this key has six fields, or seven when
    # ``alignment`` itself contains a ':'.  Confirm the two agree for the
    # single-buffer alignments.
    key = ':'.join('%s' % x for x in
                   (variant, function, bytes, loops, alignment, run_id))

    if key in cache:
        got = cache[key]
    else:
        # Build the argument vector directly instead of formatting a string
        # and splitting it again on whitespace.
        cmd = [
            '%s%s' % (build, variant),
            '-t', '%s' % function,
            '-c', '%s' % bytes,
            '-l', '%s' % loops,
            '-a', '%s' % alignment,
            '-r', '%s' % run_id,
        ]

        try:
            # universal_newlines makes the output text on Python 3 as well,
            # so the ':' split below works on either major version.
            got = subprocess.check_output(cmd, universal_newlines=True).strip()
        except OSError as ex:
            # A real exception rather than ``assert False``: asserts are
            # removed under -O, which would leave ``got`` unbound.
            raise RuntimeError(
                'Error %s while running %s' % (ex, ' '.join(cmd)))

    parts = got.split(':')

    try:
        took = float(parts[7])
    except (IndexError, ValueError):
        raise ValueError('Malformed benchmark record for %s: %r' % (key, got))

    # Only records that parsed successfully are remembered.
    cache[key] = got

    if not quiet:
        print(got)
        sys.stdout.flush()

    return took

def _calibrate(cache, variant, function, size, alignment):
    """Return the loop scale for one variant/function/alignment combination.

    A tracer run at ``size`` is timed and the starting scale is adjusted by
    the ratio of the wanted time to the measured one.  Not great for
    memchr() and similar which are O(n), but it will do.
    """
    f = 50000000
    want = 5.0  # target value for the time reported by run(); presumably seconds

    loops = int(f / math.sqrt(max(1, size)))
    took = run(cache, variant, function, size, loops, alignment, 0,
               quiet=True)

    if took == 0:
        # Too fast to register: use the upper clamp, which is what the ratio
        # below tends to, instead of dividing by zero.
        factor = 20
    else:
        # Keep it reasonable for silly routines like bounce
        factor = min(20, max(0.05, want / took))
    f = f * factor

    # Round f down to two significant figures
    scale = 10 ** int(math.log10(f) - 1)
    return scale * int(f / scale)


def run_many(cache, variants, bytes, all_functions):
    """Run every function/alignment/variant combination over all sizes.

    Args:
        cache: result cache handed through to run().
        variants: variant names; each must be a key of HAS.
        bytes: iterable of block sizes.  It is sorted before use and left
            unmodified; an empty iterable makes the call a no-op.
        all_functions: routine names to benchmark.  When empty, the
            routines of 'this' are used first, followed by any others that
            appear in HAS.

    Raises:
        KeyError: a routine has no entry in ALIGNMENTS, or a variant has no
            entry in HAS.
    """
    # We want the data to come out in a useful order.  So fix an
    # alignment and function, and do all sizes for a variant first
    sizes = sorted(bytes)
    if not sizes:
        # Nothing to measure, and there is no calibration size to pick.
        return

    # Size used for the tracer run: the entry two thirds of the way up.
    mid = sizes[int(len(sizes) / 1.5)]

    if not all_functions:
        # Use the ordering in 'this' as the default
        all_functions = HAS['this'].split()

        # Find all other functions
        for functions in HAS.values():
            for function in functions.split():
                if function not in all_functions:
                    all_functions.append(function)

    for function in all_functions:
        for alignment in ALIGNMENTS[function]:
            for variant in variants:
                if function not in HAS[variant].split():
                    continue

                f = _calibrate(cache, variant, function, mid, alignment)

                for b in sizes:
                    # Figure out the number of loops to give a roughly
                    # consistent run
                    loops = int(f / math.sqrt(max(1, b)))
                    for run_id in range(NUM_RUNS):
                        run(cache, variant, function, b, loops, alignment,
                            run_id)

126

127

def run_top(cache):
    """Benchmark all variants over the standard set of block sizes.

    The routines to run are taken from the command-line arguments; when
    there are none, run_many() falls back to its default list.  The sizes
    are the integer parts of successive powers of 2 and of 1.4, up to
    roughly 512 KiB.

    Args:
        cache: result cache handed through to run_many().
    """
    # Upper limit in bytes to test to
    limit = 512 * 1024
    # Test all powers of 2
    coarse_base = 2.0
    # Test intermediate powers of 1.4
    fine_base = 1.4

    sizes = []

    for base in (coarse_base, fine_base):
        if not base:
            # A base set to zero disables that series.
            continue

        # Figure out how many steps get us up to the top
        highest = int(round(math.log(limit) / math.log(base)))
        for exponent in range(highest + 1):
            sizes.append(int(base ** exponent))

    run_many(cache, sorted(HAS), sizes, sys.argv[1:])

147

148

def main():
    """Load the result cache, run the benchmarks, and save the cache again.

    The cache lives in 'cache.txt' in the current directory, one record per
    line, keyed on the first seven colon-separated fields of the record.
    The file is rewritten even when the benchmark run is interrupted or
    fails, so completed results are kept.
    """
    cachename = 'cache.txt'

    cache = {}

    try:
        with open(cachename) as f:
            for line in f:
                line = line.strip()
                if not line:
                    # A blank line would otherwise become an empty record
                    # that is written back on every run.
                    continue
                parts = line.split(':')
                cache[':'.join(parts[:7])] = line
    except IOError:
        # Best effort: a missing or unreadable cache just means starting
        # from scratch.  Anything else (e.g. Ctrl-C) is not swallowed.
        pass

    try:
        run_top(cache)
    finally:
        with open(cachename, 'w') as f:
            for line in sorted(cache.values()):
                f.write(line + '\n')


if __name__ == '__main__':
    main()

Older »