~andrewjbeach/juju-ci-tools/make-local-patcher

« back to all changes in this revision

Viewing changes to generate_perfscale_results.py

Committer: Aaron Bentley
Date: 2016-07-08 14:26:06 UTC
mfrom: (1465.1.14 client-from-config-5)
mto: This revision was merged to the branch mainline in revision 1509.
Revision ID: aaron.bentley@canonical.com-20160708142606-4x5rpd5c9jw9bn6n

Merged client-from-config-5 into client-from-config.

files removed:
assess_constraints.py

assess_controller_permissions.py

assess_log_forward.py

assess_model_config_tree.py

assess_ssh_keys.py

certificates.py

example-collectd.conf

fakejuju.py

generate_perfscale_results.py

log_check.py

logbreakdown.py

maas-p8

maas-p8/add-virtual-maas-nodes.bash

maas-p8/cloud-config.txt

maas-p8/maas-network.xml

maas-p8/maas-node-1.xml

maas-p8/maaspool1.xml

maas-p8/readme.txt

perf_graphing.py

perf_report_template.html

perf_static

perf_static/collectd.conf

perf_static/setup-perf-monitoring.sh

streams-from-local.bash

tests/test_assess_constraints.py

tests/test_assess_controller_permissions.py

tests/test_assess_log_forward.py

tests/test_assess_model_config_tree.py

tests/test_assess_ssh_keys.py

tests/test_generate_perfscale_results.py

tests/test_gotestwin.py

tests/test_log_check.py

tests/test_logbreakdown.py

tests/test_perf_graphing.py

files modified:
Makefile

assemble-parallel-streams.bash

assess_autoload_credentials.py

assess_block.py

assess_bootstrap.py

assess_container_networking.py

assess_heterogeneous_control.py

assess_jes_deploy.py

assess_log_rotation.py

assess_model_migration.py

assess_recovery.py

assess_storage.py

assess_unregister.py

assess_user_grant_revoke.py

assess_win_client.py

candidate.py

check_blockers.py

concurrently.py

deploy_stack.py

git_gate.py

gotesttarfile.py

gotestwin.py

industrial_test.py

juju-ci-tools-common

jujucharm.py

jujupy.py

remove-manual-juju.bash

run-reliability-test.bash

run-unit-tests

run_chaos_monkey.py

run_deployer.py

scale_out.py

schedule_chaos_tests.py

schedule_hetero_control.py

schedule_reliability_tests.py

substrate.py

template_test.py.tmpl

tests/test_assess_autoload_credentials.py

tests/test_assess_block.py

tests/test_assess_bootstrap.py

tests/test_assess_container_networking.py

tests/test_assess_cs_staging.py

tests/test_assess_heterogeneous_control.py

tests/test_assess_jes_deploy.py

tests/test_assess_log_rotation.py

tests/test_assess_min_version.py

tests/test_assess_mixed_images.py

tests/test_assess_model_migration.py

tests/test_assess_multi_series_charms.py

tests/test_assess_recovery.py

tests/test_assess_resources.py

tests/test_assess_storage.py

tests/test_assess_unregister.py

tests/test_assess_update_mongo.py

tests/test_assess_user_grant_revoke.py

tests/test_candidate.py

tests/test_chaos.py

tests/test_check_blockers.py

tests/test_concurrently.py

tests/test_deploy_stack.py

tests/test_git_gate.py

tests/test_gotesttarfile.py

tests/test_industrial_test.py

tests/test_jujucharm.py

tests/test_jujupy.py

tests/test_quickstart_deploy.py

tests/test_run_chaos_monkey.py

tests/test_run_deployer.py

tests/test_scale_out.py

tests/test_schedule_chaos_tests.py

tests/test_schedule_hetero_control.py

tests/test_schedule_reliability_tests.py

tests/test_substrate.py

tests/test_utility.py

tests/test_verify_mediawiki_bundle.py

tests/test_winazurearm.py

update-jenkins-branches.bash

utility.py

winazurearm.py

Show diffs side-by-side

added added

removed removed

generate_perfscale_results.py

#!/usr/bin/env python

"""Simple performance and scale tests."""

from __future__ import print_function

import argparse

from collections import defaultdict, namedtuple

from datetime import datetime

import logging

import os

import sys

import subprocess

try:

import rrdtool

except ImportError:

# rddtool requires the cairo/pango libs that are difficult to install

# on non-linux.

rrdtool = object()

from jinja2 import Template

from deploy_stack import (

BootstrapManager,

)

from logbreakdown import (

_render_ds_string,

breakdown_log_by_timeframes,

)

import perf_graphing

from utility import (

add_basic_testing_arguments,

configure_logging,

)

__metaclass__ = type

class TimingData:

strf_format = '%F %H:%M:%S'

# Log breakdown uses the start/end too. Perhaps have a property for string

# rep and a ds for the datetime.

def __init__(self, start, end):

self.start = start.strftime(self.strf_format)

self.end = end.strftime(self.strf_format)

self.seconds = int((end - start).total_seconds())

DeployDetails = namedtuple(

'DeployDetails', ['name', 'applications', 'timings'])

SETUP_SCRIPT_PATH = 'perf_static/setup-perf-monitoring.sh'

COLLECTD_CONFIG_PATH = 'perf_static/collectd.conf'

log = logging.getLogger("assess_perf_test_simple")

def assess_perf_test_simple(bs_manager, upload_tools):

# XXX

# Find the actual cause for this!! (Something to do with the template and

# the logs.)

import sys

reload(sys) # NOQA

sys.setdefaultencoding('utf-8')

# XXX

bs_start = datetime.utcnow()

with bs_manager.booted_context(upload_tools):

client = bs_manager.client

admin_client = client.get_controller_client()

admin_client.wait_for_started()

bs_end = datetime.utcnow()

try:

apply_any_workarounds(client)

bootstrap_timing = TimingData(bs_start, bs_end)

setup_system_monitoring(admin_client)

deploy_details = assess_deployment_perf(client)

finally:

results_dir = os.path.join(

os.path.abspath(bs_manager.log_dir), 'performance_results/')

os.makedirs(results_dir)

admin_client.juju(

'scp',

('--', '-r', '0:/var/lib/collectd/rrd/localhost/*',

results_dir)

)

try:

admin_client.juju(

'scp', ('0:/tmp/mongodb-stats.log', results_dir)

)

except subprocess.CalledProcessError as e:

log.error('Failed to copy mongodb stats: {}'.format(e))

cleanup_start = datetime.utcnow()

100

# Cleanup happens when we move out of context

101

cleanup_end = datetime.utcnow()

102

cleanup_timing = TimingData(cleanup_start, cleanup_end)

103

deployments = dict(

104

bootstrap=bootstrap_timing,

105

deploys=[deploy_details],

106

cleanup=cleanup_timing,

107

)

108

109

# Could be smarter about this.

110

controller_log_file = os.path.join(

111

bs_manager.log_dir,

112

'controller',

113

'machine-0',

114

'machine-0.log.gz')

115

116

generate_reports(controller_log_file, results_dir, deployments)

117

118

119

def apply_any_workarounds(client):

120

# Work around mysql charm wanting 80% memory.

121

if client.env.get_cloud() == 'lxd':

122

constraint_cmd = [

123

'lxc',

124

'profile',

125

'set',

126

'juju-{}'.format(client.env.environment),

127

'limits.memory',

128

'2GB'

129

]

130

subprocess.check_output(constraint_cmd)

131

132

133

def generate_reports(controller_log, results_dir, deployments):

134

"""Generate reports and graphs from run results."""

135

cpu_image = generate_cpu_graph_image(results_dir)

136

memory_image = generate_memory_graph_image(results_dir)

137

network_image = generate_network_graph_image(results_dir)

138

139

destination_dir = os.path.join(results_dir, 'mongodb')

140

os.mkdir(destination_dir)

141

try:

142

perf_graphing.create_mongodb_rrd_files(results_dir, destination_dir)

143

except perf_graphing.SourceFileNotFound:

144

log.error(

145

'Failed to create the MongoDB RRD file. Source file not found.'

146

)

147

148

# Sometimes mongostats fails to startup and start logging. Unsure yet

149

# why this is. For now generate the report without the mongodb details,

150

# the rest of the report is still useful.

151

mongo_query_image = None

152

mongo_memory_image = None

153

else:

154

mongo_query_image = generate_mongo_query_graph_image(results_dir)

155

mongo_memory_image = generate_mongo_memory_graph_image(results_dir)

156

157

log_message_chunks = get_log_message_in_timed_chunks(

158

controller_log, deployments)

159

160

details = dict(

161

cpu_graph=cpu_image,

162

memory_graph=memory_image,

163

network_graph=network_image,

164

mongo_graph=mongo_query_image,

165

mongo_memory_graph=mongo_memory_image,

166

deployments=deployments,

167

log_message_chunks=log_message_chunks

168

)

169

170

create_html_report(results_dir, details)

171

172

173

def get_log_message_in_timed_chunks(log_file, deployments):

174

"""Breakdown log into timechunks based on event timeranges in 'deployments'

175

176

"""

177

deploy_timings = [d.timings for d in deployments['deploys']]

178

179

bootstrap = deployments['bootstrap']

180

cleanup = deployments['cleanup']

181

all_event_timings = [bootstrap] + deploy_timings + [cleanup]

182

183

raw_details = breakdown_log_by_timeframes(log_file, all_event_timings)

184

185

bs_name = _render_ds_string(bootstrap.start, bootstrap.end)

186

cleanup_name = _render_ds_string(cleanup.start, cleanup.end)

187

188

name_lookup = {

189

bs_name: 'Bootstrap',

190

cleanup_name: 'Kill-Controller',

191

}

192

for dep in deployments['deploys']:

193

name_range = _render_ds_string(

194

dep.timings.start, dep.timings.end)

195

name_lookup[name_range] = dep.name

196

197

event_details = defaultdict(defaultdict)

198

# Outer-layer (i.e. event)

199

for event_range in raw_details.keys():

200

event_details[event_range]['name'] = name_lookup[event_range]

201

event_details[event_range]['logs'] = []

202

203

for log_range in raw_details[event_range].keys():

204

timeframe = log_range

205

message = '<br/>'.join(raw_details[event_range][log_range])

206

event_details[event_range]['logs'].append(

207

dict(

208

timeframe=timeframe,

209

message=message))

210

211

return event_details

212

213

214

def create_html_report(results_dir, details):

215

# render the html file to the results dir

216

with open('./perf_report_template.html', 'rt') as f:

217

template = Template(f.read())

218

219

results_output = os.path.join(results_dir, 'report.html')

220

with open(results_output, 'wt') as f:

221

f.write(template.render(details))

222

223

224

def generate_graph_image(base_dir, results_dir, name, generator):

225

metric_files_dir = os.path.join(os.path.abspath(base_dir), results_dir)

226

return create_report_graph(metric_files_dir, base_dir, name, generator)

227

228

229

def create_report_graph(rrd_dir, output_dir, name, generator):

230

any_file = os.listdir(rrd_dir)[0]

231

start, end = get_duration_points(os.path.join(rrd_dir, any_file))

232

output_file = os.path.join(

233

os.path.abspath(output_dir), '{}.png'.format(name))

234

generator(start, end, rrd_dir, output_file)

235

print('Created: {}'.format(output_file))

236

return output_file

237

238

239

def generate_cpu_graph_image(results_dir):

240

return generate_graph_image(

241

results_dir, 'aggregation-cpu-average', 'cpu', perf_graphing.cpu_graph)

242

243

244

def generate_memory_graph_image(results_dir):

245

return generate_graph_image(

246

results_dir, 'memory', 'memory', perf_graphing.memory_graph)

247

248

249

def generate_network_graph_image(results_dir):

250

return generate_graph_image(

251

results_dir, 'interface-eth0', 'network', perf_graphing.network_graph)

252

253

254

def generate_mongo_query_graph_image(results_dir):

255

return generate_graph_image(

256

results_dir, 'mongodb', 'mongodb', perf_graphing.mongodb_graph)

257

258

259

def generate_mongo_memory_graph_image(results_dir):

260

return generate_graph_image(

261

results_dir,

262

'mongodb',

263

'mongodb_memory',

264

perf_graphing.mongodb_memory_graph)

265

266

267

def get_duration_points(rrd_file):

268

start = rrdtool.first(rrd_file)

269

end = rrdtool.last(rrd_file)

270

271

# Start gives us the start timestamp in the data but it might be null/empty

272

# (i.e no data entered for that time.)

273

# Find the timestamp in which data was first entered.

274

command = [

275

'rrdtool', 'fetch', rrd_file, 'AVERAGE',

276

'--start', str(start), '--end', str(end)]

277

output = subprocess.check_output(command)

278

279

actual_start = find_actual_start(output)

280

281

return actual_start, end

282

283

284

def find_actual_start(fetch_output):

285

# Gets a start timestamp this isn't a NaN.

286

for line in fetch_output.splitlines():

287

try:

288

timestamp, value = line.split(':', 1)

289

if not value.startswith(' -nan'):

290

return timestamp

291

except ValueError:

292

pass

293

294

295

def assess_deployment_perf(client, bundle_name='cs:ubuntu'):

296

# This is where multiple services are started either at the same time

297

# or one after the other etc.

298

deploy_start = datetime.utcnow()

299

300

# We possibly want 2 timing details here, one for started (i.e. agents

301

# ready) and the other for the workloads to be complete.

302

client.deploy(bundle_name)

303

client.wait_for_started()

304

client.wait_for_workloads()

305

306

deploy_end = datetime.utcnow()

307

deploy_timing = TimingData(deploy_start, deploy_end)

308

309

client_details = get_client_details(client)

310

311

return DeployDetails(bundle_name, client_details, deploy_timing)

312

313

314

def get_client_details(client):

315

status = client.get_status()

316

units = dict()

317

for name in status.get_applications().keys():

318

units[name] = status.get_service_unit_count(name)

319

return units

320

321

322

def setup_system_monitoring(admin_client):

323

# Using ssh get into the machine-0 (or all api/state servers)

324

# Install the required packages and start up logging of systems collections

325

# and mongodb details.

326

327

installer_script_path = _get_static_script_path(SETUP_SCRIPT_PATH)

328

collectd_config_path = _get_static_script_path(COLLECTD_CONFIG_PATH)

329

installer_script_dest_path = '/tmp/installer.sh'

330

runner_script_dest_path = '/tmp/runner.sh'

331

collectd_config_dest_file = '/tmp/collectd.config'

332

333

admin_client.juju(

334

'scp',

335

(collectd_config_path, '0:{}'.format(collectd_config_dest_file)))

336

337

admin_client.juju(

338

'scp',

339

(installer_script_path, '0:{}'.format(installer_script_dest_path)))

340

admin_client.juju('ssh', ('0', 'chmod +x {}'.format(

341

installer_script_dest_path)))

342

admin_client.juju(

343

'ssh',

344

('0', '{installer} {config_file} {output_file}'.format(

345

installer=installer_script_dest_path,

346

config_file=collectd_config_dest_file,

347

output_file=runner_script_dest_path)))

348

349

# Start collection

350

# Respawn incase the initial execution fails for whatever reason.

351

admin_client.juju('ssh', ('0', '--', 'daemon --respawn {}'.format(

352

runner_script_dest_path)))

353

354

355

def _get_static_script_path(script_path):

356

full_path = os.path.abspath(__file__)

357

current_dir = os.path.dirname(full_path)

358

return os.path.join(current_dir, script_path)

359

360

361

def parse_args(argv):

362

"""Parse all arguments."""

363

parser = argparse.ArgumentParser(description="Simple perf/scale testing")

364

add_basic_testing_arguments(parser)

365

return parser.parse_args(argv)

366

367

368

def main(argv=None):

369

args = parse_args(argv)

370

configure_logging(args.verbose)

371

bs_manager = BootstrapManager.from_args(args)

372

assess_perf_test_simple(bs_manager, args.upload_tools)

373

374

return 0

375

376

377

if __name__ == '__main__':

378

sys.exit(main())

Older »