~linaro-toolchain-dev/cortex-strings/trunk

« back to all changes in this revision

Viewing changes to scripts/bench.py

Committer: Michael Hope
Date: 2012-06-12 03:19:48 UTC
Revision ID: michael.hope@linaro.org-20120612031948-4ii8jicywtzjprak

Added the C only routines from GLIBC 2.16+20120607~git24a6dbe

files added:
Makefile.am

NOTES

README

autogen.sh

benchmarks/multi

benchmarks/multi/harness.c

configure.ac

reference/bionic-c

reference/bionic-c/bcopy.c

reference/bionic-c/memchr.c

reference/bionic-c/memcmp.c

reference/bionic-c/memcpy.c

reference/bionic-c/memset.c

reference/bionic-c/strchr.c

reference/bionic-c/strcmp.c

reference/bionic-c/strcpy.c

reference/bionic-c/strlen.c

reference/bionic/memchr.c

reference/bionic/strchr.c

reference/bionic/strcmp.c

reference/bionic/strcpy.c

reference/csl

reference/csl/arm_asm.h

reference/csl/memcpy.c

reference/csl/memset.c

reference/glibc-c

reference/glibc-c/bp-checks.h

reference/glibc-c/memchr.c

reference/glibc-c/memcmp.c

reference/glibc-c/memcopy.h

reference/glibc-c/memcpy.c

reference/glibc-c/memset.c

reference/glibc-c/pagecopy.h

reference/glibc-c/strchr.c

reference/glibc-c/strcmp.c

reference/glibc-c/strcpy.c

reference/glibc-c/strlen.c

reference/glibc-c/wordcopy.c

reference/glibc/memchr.c

reference/glibc/strchr.c

reference/glibc/strcmp.c

reference/glibc/strcpy.c

reference/newlib-c

reference/newlib-c/memchr.c

reference/newlib-c/memcpy.c

reference/newlib-c/memset.c

reference/newlib-c/shim.h

reference/newlib-c/strchr.c

reference/newlib-xscale

reference/newlib-xscale/memchr.c

reference/newlib-xscale/memcpy.c

reference/newlib-xscale/memset.c

reference/newlib-xscale/strchr.c

reference/newlib-xscale/strcmp.c

reference/newlib-xscale/strcpy.c

reference/newlib-xscale/strlen.c

reference/newlib-xscale/xscale.h

reference/newlib/memcpy.S

reference/newlib/shim.h

reference/newlib/strcmp.S

reference/plain/memset.c

reference/plain/strcmp.c

reference/plain/strcpy.c

scripts

scripts/add-license.sh

scripts/bench.py

scripts/fixup.py

scripts/libplot.py

scripts/plot-align.py

scripts/plot-sizes.py

scripts/plot-top.py

scripts/plot.py

scripts/trim.sh

src/linaro-a9

src/linaro-a9/memchr.S

src/linaro-a9/memcpy-hybrid.S

src/linaro-a9/memcpy.S

src/linaro-a9/memset.S

src/linaro-a9/strchr.S

src/linaro-a9/strlen.S

src/neon

src/thumb-2

src/thumb-2/strcpy.c

tests

tests/hp-timing.h

tests/test-memchr.c

tests/test-memcpy.c

tests/test-memset.c

tests/test-skeleton.c

tests/test-strchr.c

tests/test-strcmp.c

tests/test-strcpy.c

tests/test-string.h

tests/test-strlen.c

files removed:
benchmarks/dhry/Makefile

src/reference/Makefile.am

src/reference/bionic/memcmp16.S

src/reference/configure.ac

src/reference/glibc/memmove.S

src/reference/newlib/strcmp.c

src/reference/test.py

files renamed:
src/reference/ => reference/

files modified:
.bzrignore

reference/bionic/memcmp.S

reference/bionic/memcpy.S

reference/bionic/strlen.c

reference/glibc/memset.S

reference/helpers/bounce.c

reference/helpers/spawn.c

reference/newlib/arm_asm.h

reference/plain/memcpy.c

Show diffs side-by-side

added added

removed removed

scripts/bench.py

#!/usr/bin/env python

"""Simple harness that benchmarks different variants of the routines,

caches the results, and emits all of the records at the end.

Results are generated for different values of:

* Source

* Routine

* Length

* Alignment

"""

import subprocess

import math

import sys

# Path prefix shared by the benchmark executables; the variant name is
# appended to it to form the program that gets run.
build = '../build/try-'

# The routines that most variants implement.
DEFAULTS = 'memcpy memset memchr strchr strcmp strcpy strlen'

# Variant name -> space separated list of the routines that variant has.
HAS = {
    'this': 'bounce ' + DEFAULTS,
    'bionic': DEFAULTS,
    'glibc': DEFAULTS,
    'newlib': DEFAULTS,
    'newlib-xscale': DEFAULTS,
    'plain': 'memset memcpy strcmp strcpy',
    'csl': 'memcpy memset',
}

def run(cache, variant, function, bytes, loops, alignment=8, quiet=False):
    """Perform a single run, exercising the cache as appropriate.

    The record for the run is looked up in `cache` under the key
    'variant:function:bytes:loops:alignment'.  On a miss the benchmark
    executable for `variant` is started and its stripped output becomes
    the record.  Either way the record is stored back into `cache` and,
    unless `quiet` is true, printed to stdout.

    Returns the sixth ':'-separated field of the record as a float
    (presumably the elapsed time reported by the harness -- confirm
    against the harness output format).

    Raises AssertionError if the executable could not be started.
    """
    key = ':'.join('%s' % x for x in (variant, function, bytes, loops, alignment))

    if key in cache:
        got = cache[key]
    else:
        # Build the argument vector directly instead of splitting a
        # formatted string, so a prefix containing spaces still works.
        cmd = [
            build + str(variant),
            '-t', str(function),
            '-c', str(bytes),
            '-l', str(loops),
            '-a', str(alignment),
        ]

        try:
            # universal_newlines makes the output text rather than bytes
            # on Python 3, so it can be split and joined with str.
            got = subprocess.check_output(cmd, universal_newlines=True).strip()
        except OSError as ex:
            # Raise explicitly: an assert statement is removed under -O,
            # which would leave `got` unbound further down.
            raise AssertionError(
                'Error %s while running %s' % (ex, ' '.join(cmd)))

    parts = got.split(':')
    took = float(parts[5])

    # Only cache records whose timing field parsed successfully.
    cache[key] = got

    if not quiet:
        print(got)
        sys.stdout.flush()

    return took

def run_many(cache, variants, bytes, alignments):
    """Run every available routine of every variant over all sizes.

    For each alignment, routine and variant (in that nesting order) a
    tracer run at the median size is used to scale the loop count, then
    every size in `bytes` is run in ascending order through run().

    cache      -- dict of cached records, passed through to run()
    variants   -- iterable of variant names; each must be a key of HAS
    bytes      -- iterable of sizes to test; may contain duplicates
    alignments -- iterable of alignments to test

    Returns None.  Does nothing when `bytes` is empty.
    """
    # We want the data to come out in a useful order.  So fix an
    # alignment and function, and do all sizes for a variant first
    sizes = sorted(bytes)

    if not sizes:
        # Nothing to benchmark; avoids indexing into an empty list.
        return

    # Floor division keeps the index an int on Python 3 as well.
    mid = sizes[len(sizes) // 2]

    # Use the ordering in 'this' as the default
    all_functions = HAS['this'].split()

    # Find all other functions
    for functions in HAS.values():
        for function in functions.split():
            if function not in all_functions:
                all_functions.append(function)

    for alignment in alignments:
        for function in all_functions:
            for variant in variants:
                if function not in HAS[variant].split():
                    continue

                # Run a tracer through and see how long it takes and
                # adjust the number of loops based on that.  Not great
                # for memchr() and similar which are O(n), but it will
                # do
                f = 50000000
                want = 5.0

                loops = int(f / math.sqrt(max(1, mid)))
                took = run(cache, variant, function, mid, loops, alignment, quiet=True)

                # A tracer that reports zero elapsed time would divide
                # by zero; treat it as infinitely fast so the factor is
                # capped at the upper limit below.
                ratio = want / took if took else float('inf')

                # Keep it reasonable for silly routines like bounce
                factor = min(20, max(0.05, ratio))
                f = f * factor

                # Round f to a few significant figures
                scale = 10**int(math.log10(f) - 1)
                f = scale*int(f/scale)

                for b in sizes:
                    # Figure out the number of loops to give a roughly consistent run
                    loops = int(f / math.sqrt(max(1, b)))
                    run(cache, variant, function, b, loops, alignment)

100

101

def run_top(cache):
    """Benchmark all variants over the standard sweep.

    The sizes are the integer parts of every power of 2.0 and every
    power of 1.4 up to roughly 512 KiB; the list is passed on unsorted
    and may contain duplicates.  Every variant named in HAS is tested at
    each of the alignments 8, 16, 4, 1, 2 and 32 via run_many().

    cache -- dict of cached records, passed through to run_many()
    """
    # Upper limit in bytes to test to
    top = 512*1024

    sizes = []

    # Test all powers of 2, then the intermediate powers of 1.4
    for base in (2.0, 1.4):
        # Figure out how many steps get us up to the top
        count = int(round(math.log(top) / math.log(base)))
        sizes.extend(int(base**exponent) for exponent in range(count + 1))

    run_many(cache, sorted(HAS.keys()), sizes, [8, 16, 4, 1, 2, 32])

122

123

def main():
    """Run the benchmarks, keeping results in 'cache.txt' between runs.

    Records from a previous run are loaded from the cache file in the
    current directory, keyed on their first five ':'-separated fields.
    The cache file is rewritten with every record on exit, even if the
    benchmark run is interrupted or fails.
    """
    cachename = 'cache.txt'

    cache = {}

    try:
        with open(cachename) as f:
            for line in f:
                line = line.strip()
                parts = line.split(':')

                if len(parts) < 6:
                    # Blank or truncated record (e.g. from an interrupted
                    # write); run() needs the sixth field, so skip it
                    # rather than poisoning the cache.
                    continue

                cache[':'.join(parts[:5])] = line
    except IOError:
        # A missing or unreadable cache just means starting from
        # scratch.  Other exceptions, such as KeyboardInterrupt, are no
        # longer swallowed.
        pass

    try:
        run_top(cache)
    finally:
        # Always save what has been measured so far.
        with open(cachename, 'w') as f:
            for line in cache.values():
                f.write(line + '\n')

143

144

# Only start the benchmarks when executed as a script, not on import.
if __name__ == '__main__':
    main()

Older »