~nataliabidart/+junk/memusage

« back to all changes in this revision

Viewing changes to parse.py

Committer: Natalia Bidart
Date: 2014-08-20 15:51:09 UTC
Revision ID: natalia.bidart@ubuntu.com-20140820155109-khs5tt8uchggwrhe

Utilities to parse sca test suite memusage.

files added:

fullrun-dummy.txt

fullrun-regular.txt

memusage-tests-all-dummy-cache

memusage-tests-all-regular-cache

memusage-tests-devportal-dummy-cache

memusage-tests-devportal-regular-cache

memusage-tests-exhibits-dummy-cache

memusage-tests-exhibits-regular-cache

memusage-tests-sca-dummy-cache

memusage-tests-sca-regular-cache

memusage-tests-webservices-dummy-cache

memusage-tests-webservices-regular-cache

parse.py

Show diffs side-by-side

added added

removed removed

parse.py

# -*- coding: utf-8 -*-

import os

import re

import sys

from collections import OrderedDict, defaultdict, namedtuple

from matplotlib import pyplot

# Bytes per memory page; mem_stats() multiplies a page count by this value.
PAGE_SIZE_BYTES = 4096

# --- Raw regex fragments -------------------------------------------------
# A test identifier such as "test_name (dotted.path)", captured as one group.
TEST_NAME = r'(\w+ \([\w\.]+\))'
# Free-form text (the first line of a test docstring); nothing is captured.
TEST_DOCSTRING = r'[/#,=\(\)\[\]\+\:\.\-\'\w\s]+'
# The literal " ... " that separates a test description from what follows.
TEST_SEP = r' \.\.\. '
# The outcome keywords recognised after the separator.
TEST_RESULT = r'(?:ok|ERROR|FAIL)'
# Five whitespace-separated numbers: four integers and one decimal, each
# captured in its own group.
MEM_USAGE = r'(\d+)\s+(\d+)\s+(\d+)\s+(\d+)\s+(\d+\.\d+)'

# --- Compiled patterns ---------------------------------------------------
_TEST_WITH_RESULT = TEST_NAME + TEST_SEP + TEST_RESULT

TEST_RESULT_ONLY = re.compile(TEST_RESULT)
TEST_PLUS_MEM = re.compile(TEST_NAME + TEST_SEP + MEM_USAGE)
TEST_DOCSTRING_PLUS_MEM = re.compile(TEST_DOCSTRING + TEST_SEP + MEM_USAGE)
# Either "name (path) ... result" or a bare "name (path)"; only one of the
# two capture groups is filled, depending on which alternative matched.
TEST_ONLY = re.compile(r'%s|%s' % (_TEST_WITH_RESULT, TEST_NAME))
DOCSTRING_PLUS_RESULT = re.compile(TEST_DOCSTRING + TEST_SEP + TEST_RESULT)
MEM_ONLY = re.compile(MEM_USAGE)

# One parsed memory sample: the four integer counters, the decimal
# percentage, and the resident size in megabytes derived from them.
Stats = namedtuple('Stats', ['usage', 'percentage', 'res_megs'])

def mem_stats(groups):
    """Convert the five captured MEM_USAGE fields into a ``Stats`` record.

    :param groups: sequence of five strings -- four integers followed by
        one decimal number, in the order captured by ``MEM_USAGE``.  The
        sequence is only read; it is not modified.
    :returns: ``Stats(usage, percentage, res_megs)`` where ``usage`` is the
        list of the four integers, ``percentage`` is the decimal as a
        float, and ``res_megs`` is the second integer multiplied by
        ``PAGE_SIZE_BYTES`` and expressed in megabytes.
    :raises ValueError: if ``groups`` does not hold exactly five values or
        a value cannot be converted to a number.
    """
    if len(groups) != 5:
        raise ValueError(
            'expected 5 memory usage fields, got %d' % len(groups))

    # A real list (not map()) so that indexing works on Python 3 as well.
    usage = [int(value) for value in groups[:4]]
    percentage = float(groups[4])

    # usage[1] is treated as a page count: pages -> bytes -> KB -> MB.
    res_megs = ((usage[1] * PAGE_SIZE_BYTES) / 1024.) / 1024.
    return Stats(usage, percentage, res_megs)

def parse_individual(filename):
    """Read a file of bare memory-usage lines and return resident sizes.

    Every line is matched against ``MEM_ONLY`` from its first character.
    Matching lines contribute their ``res_megs`` value (as computed by
    ``mem_stats``) to the result; any other line is reported on stdout
    and skipped.

    :param filename: path of the file to read.
    :returns: list of resident-memory values in megabytes, in file order.
    """
    result = []
    with open(filename) as f:
        # Stream the file instead of loading every line up front.
        for line in f:
            match = MEM_ONLY.match(line)
            if match:
                stats = mem_stats(list(match.groups()))
                result.append(stats.res_megs)
            else:
                # Single pre-formatted argument: prints the same text under
                # both the Python 2 print statement and Python 3 print().
                print('no match! %s' % line)
    return result

def parse_test_id(test_id):
    """Rewrite ``'name (dotted.path)'`` as ``'dotted.path.name'``.

    ``test_id`` must contain exactly one space; otherwise the unpacking
    below raises ``ValueError``.
    """
    pieces = test_id.split(' ')
    name, wrapped_path = pieces
    # Drop the parentheses that surround the dotted path.
    dotted_path = wrapped_path.strip('(').strip(')')
    return '%s.%s' % (dotted_path, name)

def parse_mem_stats(groups, stats, test_id):
    """Parse one memory sample and file it under the test's application.

    The application name is the part of ``test_id`` before its first dot.
    The sample's ``res_megs`` value is appended to ``stats[application]``
    (the list is created on first use), and the full ``Stats`` record
    built by ``mem_stats`` is returned.
    """
    parsed = mem_stats(groups)
    app_name = test_id.split('.')[0]
    stats.setdefault(app_name, []).append(parsed.res_megs)
    return parsed

def parse(filename):
    """Parse a full test-run log into per-application and per-test samples.

    Each stripped line is classified by the first rule that applies:

    1. Blank lines, lines starting with a result keyword, and
       "docstring ... result" lines are skipped.
    2. "name (path) ... <memory numbers>" starts a new test and records
       its first sample.  The test must not have been seen before
       (enforced with an ``assert``).
    3. "name (path)" (optionally followed by " ... result") starts a new
       test with no samples yet.
    4. "docstring ... <memory numbers>" or bare memory numbers add a
       sample to the most recently started test.

    Lines matching none of the rules are ignored.  Samples seen before
    any test is started are attributed to the pseudo test ``init.init``.

    :param filename: path of the log file to read.
    :returns: ``(memory_stats, combined_stats)``; ``memory_stats`` is an
        ``OrderedDict`` mapping application name to a list of resident
        sizes in megabytes, ``combined_stats`` an ``OrderedDict`` mapping
        test id to a list of ``Stats`` records.
    """
    memory_stats = OrderedDict()
    last_test_id = 'init.init'
    combined_stats = OrderedDict()
    combined_stats[last_test_id] = []

    with open(filename) as f:
        for raw_line in f:
            line = raw_line.strip()
            if (not line or TEST_RESULT_ONLY.match(line) or
                    DOCSTRING_PLUS_RESULT.match(line)):
                continue

            match = TEST_PLUS_MEM.match(line)
            if match:
                groups = list(match.groups())
                last_test_id = parse_test_id(groups.pop(0))
                stats = parse_mem_stats(groups, memory_stats, last_test_id)
                assert last_test_id not in combined_stats
                combined_stats[last_test_id] = [stats]
                continue

            match = TEST_ONLY.match(line)
            if match:
                # Exactly one of the two alternatives captured the test
                # name.  Build a real list: filter() is lazy on Python 3.
                names = [group for group in match.groups() if group]
                last_test_id = parse_test_id(names[0])
                combined_stats[last_test_id] = []
                continue

            # Both remaining patterns capture just the five memory fields
            # and are handled identically.
            match = (TEST_DOCSTRING_PLUS_MEM.match(line) or
                     MEM_ONLY.match(line))
            if match:
                groups = list(match.groups())
                stats = parse_mem_stats(groups, memory_stats, last_test_id)
                combined_stats[last_test_id].append(stats)
                continue

            # Anything else is deliberately ignored.

    return memory_stats, combined_stats

def annotate(legend, x, y, color='white', alpha=0.5):
    """Attach the text ``legend`` to the point ``(x, y)`` via pyplot.

    The label is offset by (-10, 10) points from the data point, drawn in
    a rounded box filled with ``color`` at opacity ``alpha``, and joined
    to the point by an arrow.
    """
    box_style = dict(boxstyle='round,pad=0.5', fc=color, alpha=alpha)
    arrow_style = dict(arrowstyle='->', connectionstyle='arc3,rad=0')
    pyplot.annotate(
        legend, (x, y),
        xytext=(-10, 10), textcoords='offset points',
        ha='right', va='bottom',
        bbox=box_style, arrowprops=arrow_style)

def regular_vs_dummy():
    """Plot the regular-cache and dummy-cache full runs on one figure.

    For each of ``fullrun-regular.txt`` and ``fullrun-dummy.txt`` the
    per-application samples returned by ``parse`` are concatenated and
    plotted as one line labelled with the file name up to its first dot.
    The first sample of every application is annotated with the
    application name.
    """
    filenames = ('fullrun-regular.txt', 'fullrun-dummy.txt')
    for filename in filenames:
        memory_stats, _ = parse(filename)
        all_stats = []
        # items() works on both Python 2 and 3 (iteritems() is 2-only).
        for app, stats in memory_stats.items():
            if stats:
                # len(all_stats) is the x position where this app starts.
                annotate(app, len(all_stats), stats[0], alpha=1.0)
            all_stats.extend(stats)

        pyplot.plot(all_stats, label=filename.split('.')[0])

    pyplot.ylabel('Resident memory (MB)')
    pyplot.xlabel('ticks')
    pyplot.legend(loc='upper left', shadow=True)
    pyplot.show()

def dummy_annotated():
    """Plot the dummy-cache full run and label tests with many samples.

    Parses ``fullrun-dummy.txt``, plots every resident-memory sample
    grouped application by application, and annotates each test that
    produced more than five samples with the last two components of its
    dotted id and its sample count.
    """
    memory_stats, combined_stats = parse('fullrun-dummy.txt')
    all_stats = []
    # values()/items() work on both Python 2 and 3.
    for app_samples in memory_stats.values():
        all_stats.extend(app_samples)
    pyplot.plot(all_stats, '.-')

    # NOTE: an earlier, disabled variant also highlighted the test that
    # preceded a drop in memory usage; it is not implemented here.
    for test, stats in combined_stats.items():
        ticks = len(stats)
        if ticks <= 5:
            continue
        legend = '%s\n%s' % tuple(test.split('.')[-2:])
        y = stats[0].res_megs
        # NOTE(review): index() returns the first sample equal to y, so
        # the label lands on an earlier tick whenever the same value was
        # already recorded -- confirm whether that is acceptable.
        x = all_stats.index(y)
        annotate(legend + ' (%s ticks)' % ticks, x, y, 'grey')

    pyplot.ylabel('Resident memory (MB)')
    pyplot.xlabel('ticks')
    pyplot.show()

def app_individuals():
    """Plot every ``memusage-tests*`` file in the current directory.

    Each file is parsed with ``parse_individual`` and drawn as one line.
    The label is built from the third and fourth dash-separated parts of
    the file name (``memusage-tests-all-dummy-cache`` -> ``all-dummy``).
    """
    # os.listdir() returns names in arbitrary order; sorting keeps the
    # legend order and colour assignment stable between runs.
    filenames = sorted(
        name for name in os.listdir('.')
        if name.startswith('memusage-tests'))
    for filename in filenames:
        stats = parse_individual(filename)
        pyplot.plot(stats, label='-'.join(filename.split('-')[2:4]))

    pyplot.ylabel('Resident memory (MB)')
    pyplot.xlabel('ticks')
    pyplot.legend(loc='upper left')
    pyplot.show()

if __name__ == '__main__':
    # Choose the plot by name on the command line instead of editing the
    # source; with no argument the previous default (app_individuals) runs.
    plots = {
        'regular_vs_dummy': regular_vs_dummy,
        'dummy_annotated': dummy_annotated,
        'app_individuals': app_individuals,
    }
    chosen = sys.argv[1] if len(sys.argv) > 1 else 'app_individuals'
    if chosen not in plots:
        sys.exit('usage: %s [%s]' % (sys.argv[0], '|'.join(sorted(plots))))
    plots[chosen]()

Older »