~linaro-toolchain-dev/cortex-strings/trunk

« back to all changes in this revision

Viewing changes to scripts/bench.py

Committer: Michael Hope
Date: 2010-09-13 07:53:58 UTC
Revision ID: michael.hope@linaro.org-20100913075358-386yj5lqacpw2hh5

Minor readme update before 0.1.1

files added:
benchmarks/dhry/Makefile

benchmarks/multi/Makefile

reference/Makefile.am

reference/bionic/memcmp16.S

reference/configure.ac

reference/glibc/memmove.S

reference/newlib/strcmp.c

reference/test.py

src/neon/memcpy.S

src/neon/memset.S

src/thumb-2/strcmp.c

src/thumb-2/strlen.c

files removed:
autogen.sh

reference/bionic-c

reference/bionic-c/bcopy.c

reference/bionic-c/memchr.c

reference/bionic-c/memcmp.c

reference/bionic-c/memcpy.c

reference/bionic-c/memset.c

reference/bionic-c/strchr.c

reference/bionic-c/strcmp.c

reference/bionic-c/strcpy.c

reference/bionic-c/strlen.c

reference/bionic/strcmp.S

reference/bionic/strcpy.S

reference/glibc-c

reference/glibc-c/bp-checks.h

reference/glibc-c/memchr.c

reference/glibc-c/memcmp.c

reference/glibc-c/memcopy.h

reference/glibc-c/memcpy.c

reference/glibc-c/memset.c

reference/glibc-c/pagecopy.h

reference/glibc-c/strchr.c

reference/glibc-c/strcmp.c

reference/glibc-c/strcpy.c

reference/glibc-c/strlen.c

reference/glibc-c/wordcopy.c

reference/newlib-c

reference/newlib-c/memchr.c

reference/newlib-c/memcmp.c

reference/newlib-c/memcpy.c

reference/newlib-c/memset.c

reference/newlib-c/shim.h

reference/newlib-c/strchr.c

reference/newlib-c/strcmp.c

reference/newlib-c/strcpy.c

reference/newlib-c/strlen.c

reference/newlib-xscale

reference/newlib-xscale/memchr.c

reference/newlib-xscale/memcpy.c

reference/newlib-xscale/memset.c

reference/newlib-xscale/strchr.c

reference/newlib-xscale/strcmp.c

reference/newlib-xscale/strcpy.c

reference/newlib-xscale/strlen.c

reference/newlib-xscale/xscale.h

reference/newlib/memcpy.S

reference/newlib/shim.h

reference/newlib/strcmp.S

scripts/add-license.sh

scripts/bench.py

scripts/libplot.py

scripts/plot-align.py

scripts/plot-sizes.py

scripts/plot-top.py

scripts/plot.py

scripts/trim.sh

src/aarch64

src/aarch64/memcpy.S

src/aarch64/memmove.S

src/aarch64/memset.S

src/aarch64/strcmp.S

src/linaro-a9

src/linaro-a9/memchr.S

src/linaro-a9/memcpy-hybrid.S

src/linaro-a9/memcpy.S

src/linaro-a9/memset.S

src/linaro-a9/strchr.S

src/linaro-a9/strlen.S

tests/test-memchr.c

tests/test-memcmp.c

tests/test-memmove.c

tests/test-strchr.c

tests/test-strncmp.c

files modified:
.bzrignore

Makefile.am

NOTES

README

benchmarks/multi/harness.c

configure.ac

reference/bionic/memcmp.S

reference/bionic/memcpy.S

reference/bionic/strlen.c

reference/glibc/memcpy.S

reference/glibc/memset.S

reference/glibc/strlen.S

reference/helpers/bounce.c

reference/helpers/spawn.c

reference/newlib/arm_asm.h

reference/plain/memcpy.c

reference/plain/memset.c

reference/plain/strcmp.c

reference/plain/strcpy.c

tests/test-string.h

Show diffs side-by-side

added added

removed removed

scripts/bench.py

#!/usr/bin/env python

"""Simple harness that benchmarks different variants of the routines,

caches the results, and emits all of the records at the end.

Results are generated for different values of:

* Source

* Routine

* Length

* Alignment

"""

import subprocess

import math

import sys

# Path prefix of the benchmark executables; the variant name is
# appended to this to form the program that gets run
build = '../build/try-'

# Space separated names of every routine that can be benchmarked
ALL = 'memchr memcmp memcpy memset strchr strcmp strcpy strlen'

# Maps each variant name to the space separated routines it provides
HAS = {
    'this': 'bounce memchr memcpy memset strchr strcpy strlen',
    'bionic': 'memcmp memcpy memset strcmp strcpy strlen',
    'bionic-c': ALL,
    'csl': 'memcpy memset',
    'glibc': 'memcpy memset strlen',
    'glibc-c': ALL,
    'newlib': 'memcpy strcmp strcpy strlen',
    'newlib-c': ALL,
    'newlib-xscale': 'memchr memcpy memset strchr strcmp strcpy strlen',
    'plain': 'memset memcpy strcmp strcpy',
}

def run(cache, variant, function, bytes, loops, alignment=8, quiet=False):
    """Perform a single run, exercising the cache as appropriate.

    A run is identified by the colon separated key
    'variant:function:bytes:loops:alignment'.  If that key is already
    in `cache` the stored record is reused.  Otherwise the executable
    named by `build` + `variant` is run and its stripped output
    becomes the record.  Either way the record is stored in `cache`.

    Arguments:
    cache -- dict mapping run keys to result records; updated in place
    variant -- name appended to `build` to pick the executable
    function -- routine name, passed to the executable as -t
    bytes -- passed to the executable as -c
    loops -- passed to the executable as -l
    alignment -- passed to the executable as -a
    quiet -- if true, don't echo the record to stdout

    Returns the sixth colon separated field of the record as a float
    (presumably the elapsed time; confirm against the harness).

    Raises RuntimeError if the executable can't be started.
    """
    key = ':'.join(str(x) for x in (variant, function, bytes, loops, alignment))

    if key in cache:
        got = cache[key]
    else:
        # Build the argument list directly instead of formatting a
        # string and splitting it on whitespace
        argv = ['%s%s' % (build, variant),
                '-t', str(function),
                '-c', str(bytes),
                '-l', str(loops),
                '-a', str(alignment)]

        try:
            # universal_newlines gives text rather than bytes under
            # Python 3, so the record can be split on ':' below
            got = subprocess.check_output(argv, universal_newlines=True).strip()
        except OSError as ex:
            # A real exception: an assert would vanish under -O
            raise RuntimeError('Error %s while running %s' % (ex, ' '.join(argv)))

    parts = got.split(':')
    took = float(parts[5])

    cache[key] = got

    if not quiet:
        sys.stdout.write(got + '\n')
        sys.stdout.flush()

    return took

def run_many(cache, variants, bytes, alignments):
    """Benchmark every supported routine of each variant.

    The runs are ordered so the data comes out in a useful order: an
    alignment and function are fixed, then all sizes are done for one
    variant before moving to the next.

    Arguments:
    cache -- dict of result records, passed through to run()
    variants -- names of the variants to run; each must be a key of HAS
    bytes -- iterable of block sizes to test
    alignments -- iterable of alignments to test

    Does nothing if `bytes` is empty.
    """
    bytes = sorted(bytes)

    if not bytes:
        # No sizes means no median to calibrate against
        return

    # Floor division so the index stays an integer under Python 3
    mid = bytes[len(bytes) // 2]

    # Use the ordering in 'this' as the default
    all_functions = HAS['this'].split()

    # Find all other functions
    for functions in HAS.values():
        for function in functions.split():
            if function not in all_functions:
                all_functions.append(function)

    for alignment in alignments:
        for function in all_functions:
            for variant in variants:
                if function not in HAS[variant].split():
                    continue

                # Run a tracer through and see how long it takes and
                # adjust the number of loops based on that.  Not great
                # for memchr() and similar which are O(n), but it will
                # do
                f = 50000000
                want = 5.0

                loops = int(f / math.sqrt(max(1, mid)))
                took = run(cache, variant, function, mid, loops, alignment, quiet=True)

                # Keep it reasonable for silly routines like bounce.
                # A tracer that reports no time at all gets the
                # largest factor instead of dividing by zero
                if took > 0:
                    factor = min(20, max(0.05, want/took))
                else:
                    factor = 20
                f = f * factor

                # Round f to a few significant figures
                scale = 10**int(math.log10(f) - 1)
                f = scale*int(f/scale)

                # bytes is already sorted above
                for b in bytes:
                    # Figure out the number of loops to give a roughly
                    # consistent run
                    loops = int(f / math.sqrt(max(1, b)))
                    run(cache, variant, function, b, loops, alignment)

103

104

def run_top(cache):
    """Benchmark all variants in HAS over a geometric spread of sizes.

    The sizes are the truncated powers of 2 and of 1.4, from 1 up to
    roughly 512 KiB, and each is run at alignments of 8, 16, 4, 1, 2
    and 32.  `cache` is handed straight through to run_many().
    """
    # Upper limit in bytes to test to
    limit = 512*1024
    # Powers of 2, then intermediate powers of 1.4
    ratios = (2.0, 1.4)

    sizes = []

    for ratio in ratios:
        if not ratio:
            continue

        # How many multiplications by ratio it takes to reach the limit
        count = int(round(math.log(limit) / math.log(ratio)))

        for exponent in range(count + 1):
            sizes.append(int(ratio**exponent))

    run_many(cache, sorted(HAS.keys()), sizes, [8, 16, 4, 1, 2, 32])

125

126

def main():
    """Load the cached records, run the benchmarks, and save the cache.

    Records are read from 'cache.txt' in the current directory, one
    per line, keyed by their first five colon separated fields.  The
    cache is written back, sorted, even if the benchmark run fails or
    is interrupted, so finished runs are not lost.
    """
    cachename = 'cache.txt'

    cache = {}

    try:
        with open(cachename) as f:
            for line in f:
                line = line.strip()

                if not line:
                    # A blank line holds no record
                    continue

                parts = line.split(':')
                cache[':'.join(parts[:5])] = line
    except IOError:
        # No readable cache, such as on the first run.  Start empty
        pass

    try:
        run_top(cache)
    finally:
        with open(cachename, 'w') as f:
            for line in sorted(cache.values()):
                f.write(line + '\n')

146

147

# Run the benchmarks only when executed as a script, not when imported
if __name__ == '__main__':
    main()

Older »