framework_test.py 38 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902
  1. from benchmark.fortune_html_parser import FortuneHTMLParser
  2. from setup.linux import setup_util
  3. from benchmark.test_types import *
  4. import importlib
  5. import os
  6. import subprocess
  7. import time
  8. import re
  9. from pprint import pprint
  10. import sys
  11. import traceback
  12. import json
  13. import logging
  14. import csv
  15. import shlex
  16. import math
  17. from collections import OrderedDict
  18. from threading import Thread
  19. from threading import Event
  20. from utils import header
  21. from datetime import datetime
  22. from datetime import timedelta
  23. class FrameworkTest:
  24. headers_template = "-H 'Host: localhost' -H '{accept}' -H 'Connection: keep-alive'"
  25. # Used for test types that require no pipelining or query string params.
  26. concurrency_template = """
  27. echo ""
  28. echo "---------------------------------------------------------"
  29. echo " Running Primer {name}"
  30. echo " {wrk} {headers} --latency -d 5 -c 8 --timeout 8 -t 8 \"http://{server_host}:{port}{url}\""
  31. echo "---------------------------------------------------------"
  32. echo ""
  33. {wrk} {headers} --latency -d 5 -c 8 --timeout 8 -t 8 "http://{server_host}:{port}{url}"
  34. sleep 5
  35. echo ""
  36. echo "---------------------------------------------------------"
  37. echo " Running Warmup {name}"
  38. echo " {wrk} {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} \"http://{server_host}:{port}{url}\""
  39. echo "---------------------------------------------------------"
  40. echo ""
  41. {wrk} {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} "http://{server_host}:{port}{url}"
  42. sleep 5
  43. echo ""
  44. echo "---------------------------------------------------------"
  45. echo " Synchronizing time"
  46. echo "---------------------------------------------------------"
  47. echo ""
  48. ntpdate -s pool.ntp.org
  49. for c in {levels}
  50. do
  51. echo ""
  52. echo "---------------------------------------------------------"
  53. echo " Concurrency: $c for {name}"
  54. echo " {wrk} {headers} --latency -d {duration} -c $c --timeout $c -t $(($c>{max_threads}?{max_threads}:$c)) \"http://{server_host}:{port}{url}\""
  55. echo "---------------------------------------------------------"
  56. echo ""
  57. STARTTIME=$(date +"%s")
  58. {wrk} {headers} --latency -d {duration} -c $c --timeout $c -t "$(($c>{max_threads}?{max_threads}:$c))" http://{server_host}:{port}{url}
  59. echo "STARTTIME $STARTTIME"
  60. echo "ENDTIME $(date +"%s")"
  61. sleep 2
  62. done
  63. """
  64. # Used for test types that require pipelining.
  65. pipeline_template = """
  66. echo ""
  67. echo "---------------------------------------------------------"
  68. echo " Running Primer {name}"
  69. echo " {wrk} {headers} --latency -d 5 -c 8 --timeout 8 -t 8 \"http://{server_host}:{port}{url}\""
  70. echo "---------------------------------------------------------"
  71. echo ""
  72. {wrk} {headers} --latency -d 5 -c 8 --timeout 8 -t 8 "http://{server_host}:{port}{url}"
  73. sleep 5
  74. echo ""
  75. echo "---------------------------------------------------------"
  76. echo " Running Warmup {name}"
  77. echo " {wrk} {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} \"http://{server_host}:{port}{url}\""
  78. echo "---------------------------------------------------------"
  79. echo ""
  80. {wrk} {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} "http://{server_host}:{port}{url}"
  81. sleep 5
  82. echo ""
  83. echo "---------------------------------------------------------"
  84. echo " Synchronizing time"
  85. echo "---------------------------------------------------------"
  86. echo ""
  87. ntpdate -s pool.ntp.org
  88. for c in {levels}
  89. do
  90. echo ""
  91. echo "---------------------------------------------------------"
  92. echo " Concurrency: $c for {name}"
  93. echo " {wrk} {headers} --latency -d {duration} -c $c --timeout $c -t $(($c>{max_threads}?{max_threads}:$c)) \"http://{server_host}:{port}{url}\" -s ~/pipeline.lua -- {pipeline}"
  94. echo "---------------------------------------------------------"
  95. echo ""
  96. STARTTIME=$(date +"%s")
  97. {wrk} {headers} --latency -d {duration} -c $c --timeout $c -t "$(($c>{max_threads}?{max_threads}:$c))" http://{server_host}:{port}{url} -s ~/pipeline.lua -- {pipeline}
  98. echo "STARTTIME $STARTTIME"
  99. echo "ENDTIME $(date +"%s")"
  100. sleep 2
  101. done
  102. """
  103. # Used for test types that require a database -
  104. # These tests run at a static concurrency level and vary the size of
  105. # the query sent with each request
  106. query_template = """
  107. echo ""
  108. echo "---------------------------------------------------------"
  109. echo " Running Primer {name}"
  110. echo " wrk {headers} --latency -d 5 -c 8 --timeout 8 -t 8 \"http://{server_host}:{port}{url}2\""
  111. echo "---------------------------------------------------------"
  112. echo ""
  113. wrk {headers} --latency -d 5 -c 8 --timeout 8 -t 8 "http://{server_host}:{port}{url}2"
  114. sleep 5
  115. echo ""
  116. echo "---------------------------------------------------------"
  117. echo " Running Warmup {name}"
  118. echo " wrk {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} \"http://{server_host}:{port}{url}2\""
  119. echo "---------------------------------------------------------"
  120. echo ""
  121. wrk {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} "http://{server_host}:{port}{url}2"
  122. sleep 5
  123. echo ""
  124. echo "---------------------------------------------------------"
  125. echo " Synchronizing time"
  126. echo "---------------------------------------------------------"
  127. echo ""
  128. ntpdate -s pool.ntp.org
  129. for c in {levels}
  130. do
  131. echo ""
  132. echo "---------------------------------------------------------"
  133. echo " Queries: $c for {name}"
  134. echo " wrk {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} \"http://{server_host}:{port}{url}$c\""
  135. echo "---------------------------------------------------------"
  136. echo ""
  137. STARTTIME=$(date +"%s")
  138. wrk {headers} --latency -d {duration} -c {max_concurrency} --timeout {max_concurrency} -t {max_threads} "http://{server_host}:{port}{url}$c"
  139. echo "STARTTIME $STARTTIME"
  140. echo "ENDTIME $(date +"%s")"
  141. sleep 2
  142. done
  143. """
  144. ############################################################
  145. # start(benchmarker)
  146. # Start the test using it's setup file
  147. ############################################################
  148. def start(self, out, err):
  149. # Setup environment variables
  150. logDir = os.path.join(self.fwroot, self.benchmarker.latest_results_directory, 'logs', self.name.lower())
  151. bash_functions_path= os.path.join(self.fwroot, 'toolset/setup/linux/bash_functions.sh')
  152. setup_util.replace_environ(config='$FWROOT/config/benchmark_profile',
  153. command='''\
  154. export TROOT=%s && \
  155. export IROOT=%s && \
  156. export DBHOST=%s && \
  157. export LOGDIR=%s && \
  158. export MAX_THREADS=%s \
  159. ''' % (
  160. self.directory,
  161. self.install_root,
  162. self.database_host,
  163. logDir,
  164. self.benchmarker.threads))
  165. # Run the module start inside parent of TROOT
  166. # - we use the parent as a historical accident, a number of tests
  167. # refer to their TROOT maually still
  168. previousDir = os.getcwd()
  169. os.chdir(os.path.dirname(self.troot))
  170. logging.info("Running setup module start (cwd=%s)", self.directory)
  171. # Run the start script for the test as the "testrunner" user
  172. #
  173. # `sudo` - Switching user requires superuser privs
  174. # -u [username] The username
  175. # -E Preserves the current environment variables
  176. # -H Forces the home var (~) to be reset to the user specified
  177. # `stdbuf` - Disable buffering, send output to python ASAP
  178. # -o0 zero-sized buffer for stdout
  179. # -e0 zero-sized buffer for stderr
  180. # `bash` - Run the setup.sh script using bash
  181. # -e Force bash to exit on first error
  182. # -x Turn on bash tracing e.g. print commands before running
  183. #
  184. # Most servers do not output to stdout/stderr while serving
  185. # requests so there is no performance hit from disabling
  186. # output buffering. This disabling is necessary to
  187. # a) allow TFB to show output in real time and b) avoid loosing
  188. # output in the buffer when the testrunner processes are forcibly
  189. # killed
  190. #
  191. # See http://www.pixelbeat.org/programming/stdio_buffering/
  192. # See https://blogs.gnome.org/markmc/2013/06/04/async-io-and-python/
  193. # See http://eyalarubas.com/python-subproc-nonblock.html
  194. command = 'cat %s %s.sh > /tmp/command.sh && sudo -u %s -E -H stdbuf -o0 -e0 bash -ex /tmp/command.sh' % (
  195. bash_functions_path,
  196. os.path.join(self.troot, self.setup_file),
  197. self.benchmarker.runner_user)
  198. debug_command = '''\
  199. export FWROOT=%s && \\
  200. export TROOT=%s && \\
  201. export IROOT=%s && \\
  202. export DBHOST=%s && \\
  203. export LOGDIR=%s && \\
  204. export MAX_THREADS=%s && \\
  205. cd %s && \\
  206. %s''' % (self.fwroot,
  207. self.directory,
  208. self.install_root,
  209. self.database_host,
  210. logDir,
  211. self.benchmarker.threads,
  212. self.directory,
  213. command)
  214. logging.info("To run %s manually, copy/paste this:\n%s", self.name, debug_command)
  215. def tee_output(prefix, line):
  216. # Needs to be one atomic write
  217. # Explicitly use UTF-8 as it's the most common framework output
  218. # TODO improve encoding handling
  219. line = prefix.encode('utf-8') + line
  220. # Log to current terminal
  221. sys.stdout.write(line)
  222. sys.stdout.flush()
  223. # logging.error("".join([prefix, line]))
  224. out.write(line)
  225. out.flush()
  226. # Start the setup.sh command
  227. p = subprocess.Popen(command, cwd=self.directory,
  228. shell=True, stdout=subprocess.PIPE,
  229. stderr=subprocess.STDOUT,
  230. executable='/bin/bash')
  231. nbsr = setup_util.NonBlockingStreamReader(p.stdout,
  232. "%s: %s.sh and framework processes have terminated" % (self.name, self.setup_file))
  233. # Set a limit on total execution time of setup.sh
  234. timeout = datetime.now() + timedelta(minutes = 20)
  235. time_remaining = timeout - datetime.now()
  236. # Need to print to stdout once every 10 minutes or Travis-CI will abort
  237. travis_timeout = datetime.now() + timedelta(minutes = 5)
  238. # Flush output until setup.sh work is finished. This is
  239. # either a) when setup.sh exits b) when the port is bound
  240. # c) when we run out of time. Note that 'finished' doesn't
  241. # guarantee setup.sh process is dead - the OS may choose to make
  242. # setup.sh a zombie process if it still has living children
  243. #
  244. # Note: child processes forked (using &) will remain alive
  245. # after setup.sh has exited. The will have inherited the
  246. # stdout/stderr descriptors and will be directing their
  247. # output to the pipes.
  248. #
  249. prefix = "Setup %s: " % self.name
  250. while not (p.poll()
  251. or self.benchmarker.is_port_bound(self.port)
  252. or time_remaining.total_seconds() < 0):
  253. # The conditions above are slow to check, so
  254. # we will delay output substantially if we only
  255. # print one line per condition check.
  256. # Adding a tight loop here mitigates the effect,
  257. # ensuring that most of the output directly from
  258. # setup.sh is sent to tee_output before the outer
  259. # loop exits and prints things like "setup.sh exited"
  260. #
  261. for i in xrange(10):
  262. try:
  263. line = nbsr.readline(0.05)
  264. if line:
  265. tee_output(prefix, line)
  266. # Reset Travis-CI timer
  267. travis_timeout = datetime.now() + timedelta(minutes = 5)
  268. except setup_util.EndOfStream:
  269. tee_output(prefix, "Setup has terminated\n")
  270. break
  271. time_remaining = timeout - datetime.now()
  272. if (travis_timeout - datetime.now()).total_seconds() < 0:
  273. sys.stdout.write(prefix + 'Printing so Travis-CI does not time out\n')
  274. sys.stdout.flush()
  275. travis_timeout = datetime.now() + timedelta(minutes = 5)
  276. # Did we time out?
  277. if time_remaining.total_seconds() < 0:
  278. tee_output(prefix, "%s.sh timed out!! Aborting...\n" % self.setup_file)
  279. p.kill()
  280. return 1
  281. # What's our return code?
  282. # If setup.sh has terminated, use that code
  283. # Otherwise, detect if the port was bound
  284. retcode = (p.poll() or 0 if self.benchmarker.is_port_bound(self.port) else 1)
  285. if p.poll():
  286. tee_output(prefix, "%s.sh process exited naturally with %s\n" % (self.setup_file, p.poll()))
  287. elif self.benchmarker.is_port_bound(self.port):
  288. tee_output(prefix, "Bound port detected on %s\n" % self.port)
  289. # Before we return control to the benchmarker, spin up a
  290. # thread to keep an eye on the pipes in case the running
  291. # framework uses stdout/stderr. Once all processes accessing
  292. # the subprocess.PIPEs are dead, this thread will terminate.
  293. # Use a different prefix to indicate this is the framework
  294. # speaking
  295. prefix = "Server %s: " % self.name
  296. def watch_child_pipes(nbsr, prefix):
  297. while True:
  298. try:
  299. line = nbsr.readline(60)
  300. if line:
  301. tee_output(prefix, line)
  302. except setup_util.EndOfStream:
  303. tee_output(prefix, "Framework processes have terminated\n")
  304. return
  305. watch_thread = Thread(target = watch_child_pipes,
  306. args = (nbsr, prefix))
  307. watch_thread.daemon = True
  308. watch_thread.start()
  309. logging.info("Executed %s.sh, returning %s", self.setup_file, retcode)
  310. os.chdir(previousDir)
  311. return retcode
  312. ############################################################
  313. # End start
  314. ############################################################
  315. ############################################################
  316. # verify_urls
  317. # Verifys each of the URLs for this test. THis will sinply
  318. # curl the URL and check for it's return status.
  319. # For each url, a flag will be set on this object for whether
  320. # or not it passed
  321. # Returns True if all verifications succeeded
  322. ############################################################
  323. def verify_urls(self, out, err):
  324. result = True
  325. def verify_type(test_type):
  326. test = self.runTests[test_type]
  327. test.setup_out_err(out, err)
  328. out.write(header("VERIFYING %s" % test_type.upper()))
  329. base_url = "http://%s:%s" % (self.benchmarker.server_host, self.port)
  330. try:
  331. results = test.verify(base_url)
  332. except Exception as e:
  333. results = [('fail',"""Caused Exception in TFB
  334. This almost certainly means your return value is incorrect,
  335. but also that you have found a bug. Please submit an issue
  336. including this message: %s\n%s""" % (e, traceback.format_exc()),
  337. base_url)]
  338. logging.warning("Verifying test %s for %s caused an exception: %s", test_type, self.name, e)
  339. traceback.format_exc()
  340. test.failed = any(result is 'fail' for (result, reason, url) in results)
  341. test.warned = any(result is 'warn' for (result, reason, url) in results)
  342. test.passed = all(result is 'pass' for (result, reason, url) in results)
  343. def output_result(result, reason, url):
  344. out.write(" %s for %s\n" % (result.upper(), url))
  345. print " %s for %s" % (result.upper(), url)
  346. if reason is not None and len(reason) != 0:
  347. for line in reason.splitlines():
  348. out.write(" " + line + '\n')
  349. print " " + line
  350. [output_result(r1,r2,url) for (r1, r2, url) in results]
  351. if test.failed:
  352. self.benchmarker.report_verify_results(self, test_type, 'fail')
  353. elif test.warned:
  354. self.benchmarker.report_verify_results(self, test_type, 'warn')
  355. elif test.passed:
  356. self.benchmarker.report_verify_results(self, test_type, 'pass')
  357. else:
  358. raise Exception("Unknown error - test did not pass,warn,or fail")
  359. result = True
  360. for test_type in self.runTests:
  361. verify_type(test_type)
  362. if self.runTests[test_type].failed:
  363. result = False
  364. return result
  365. ############################################################
  366. # End verify_urls
  367. ############################################################
  368. ############################################################
  369. # benchmark
  370. # Runs the benchmark for each type of test that it implements
  371. # JSON/DB/Query.
  372. ############################################################
  373. def benchmark(self, out, err):
  374. def benchmark_type(test_type):
  375. out.write("BENCHMARKING %s ... " % test_type.upper())
  376. test = self.runTests[test_type]
  377. test.setup_out_err(out, err)
  378. output_file = self.benchmarker.output_file(self.name, test_type)
  379. if not os.path.exists(output_file):
  380. # Open to create the empty file
  381. with open(output_file, 'w'):
  382. pass
  383. if not test.failed:
  384. if test_type == 'plaintext': # One special case
  385. remote_script = self.__generate_pipeline_script(test.get_url(), self.port, test.accept_header)
  386. elif test_type == 'query' or test_type == 'update':
  387. remote_script = self.__generate_query_script(test.get_url(), self.port, test.accept_header)
  388. else:
  389. remote_script = self.__generate_concurrency_script(test.get_url(), self.port, test.accept_header)
  390. # Begin resource usage metrics collection
  391. self.__begin_logging(test_type)
  392. # Run the benchmark
  393. with open(output_file, 'w') as raw_file:
  394. p = subprocess.Popen(self.benchmarker.client_ssh_string.split(" "), stdin=subprocess.PIPE, stdout=raw_file, stderr=err)
  395. p.communicate(remote_script)
  396. err.flush()
  397. # End resource usage metrics collection
  398. self.__end_logging()
  399. results = self.__parse_test(test_type)
  400. print "Benchmark results:"
  401. pprint(results)
  402. self.benchmarker.report_benchmark_results(framework=self, test=test_type, results=results['results'])
  403. out.write( "Complete\n" )
  404. out.flush()
  405. for test_type in self.runTests:
  406. benchmark_type(test_type)
  407. ############################################################
  408. # End benchmark
  409. ############################################################
  410. ############################################################
  411. # parse_all
  412. # Method meant to be run for a given timestamp
  413. ############################################################
  414. def parse_all(self):
  415. for test_type in self.runTests:
  416. if os.path.exists(self.benchmarker.get_output_file(self.name, test_type)):
  417. results = self.__parse_test(test_type)
  418. self.benchmarker.report_benchmark_results(framework=self, test=test_type, results=results['results'])
  419. ##########################################################################################
  420. # Private Methods
  421. ##########################################################################################
  422. ############################################################
  423. # __parse_test(test_type)
  424. ############################################################
  425. def __parse_test(self, test_type):
  426. try:
  427. results = dict()
  428. results['results'] = []
  429. stats = []
  430. if os.path.exists(self.benchmarker.get_output_file(self.name, test_type)):
  431. with open(self.benchmarker.output_file(self.name, test_type)) as raw_data:
  432. is_warmup = True
  433. rawData = None
  434. for line in raw_data:
  435. if "Queries:" in line or "Concurrency:" in line:
  436. is_warmup = False
  437. rawData = None
  438. continue
  439. if "Warmup" in line or "Primer" in line:
  440. is_warmup = True
  441. continue
  442. if not is_warmup:
  443. if rawData == None:
  444. rawData = dict()
  445. results['results'].append(rawData)
  446. #if "Requests/sec:" in line:
  447. # m = re.search("Requests/sec:\s+([0-9]+)", line)
  448. # rawData['reportedResults'] = m.group(1)
  449. # search for weighttp data such as succeeded and failed.
  450. if "Latency" in line:
  451. m = re.findall("([0-9]+\.*[0-9]*[us|ms|s|m|%]+)", line)
  452. if len(m) == 4:
  453. rawData['latencyAvg'] = m[0]
  454. rawData['latencyStdev'] = m[1]
  455. rawData['latencyMax'] = m[2]
  456. # rawData['latencyStdevPercent'] = m[3]
  457. #if "Req/Sec" in line:
  458. # m = re.findall("([0-9]+\.*[0-9]*[k|%]*)", line)
  459. # if len(m) == 4:
  460. # rawData['requestsAvg'] = m[0]
  461. # rawData['requestsStdev'] = m[1]
  462. # rawData['requestsMax'] = m[2]
  463. # rawData['requestsStdevPercent'] = m[3]
  464. #if "requests in" in line:
  465. # m = re.search("requests in ([0-9]+\.*[0-9]*[ms|s|m|h]+)", line)
  466. # if m != None:
  467. # # parse out the raw time, which may be in minutes or seconds
  468. # raw_time = m.group(1)
  469. # if "ms" in raw_time:
  470. # rawData['total_time'] = float(raw_time[:len(raw_time)-2]) / 1000.0
  471. # elif "s" in raw_time:
  472. # rawData['total_time'] = float(raw_time[:len(raw_time)-1])
  473. # elif "m" in raw_time:
  474. # rawData['total_time'] = float(raw_time[:len(raw_time)-1]) * 60.0
  475. # elif "h" in raw_time:
  476. # rawData['total_time'] = float(raw_time[:len(raw_time)-1]) * 3600.0
  477. if "requests in" in line:
  478. m = re.search("([0-9]+) requests in", line)
  479. if m != None:
  480. rawData['totalRequests'] = int(m.group(1))
  481. if "Socket errors" in line:
  482. if "connect" in line:
  483. m = re.search("connect ([0-9]+)", line)
  484. rawData['connect'] = int(m.group(1))
  485. if "read" in line:
  486. m = re.search("read ([0-9]+)", line)
  487. rawData['read'] = int(m.group(1))
  488. if "write" in line:
  489. m = re.search("write ([0-9]+)", line)
  490. rawData['write'] = int(m.group(1))
  491. if "timeout" in line:
  492. m = re.search("timeout ([0-9]+)", line)
  493. rawData['timeout'] = int(m.group(1))
  494. if "Non-2xx" in line:
  495. m = re.search("Non-2xx or 3xx responses: ([0-9]+)", line)
  496. if m != None:
  497. rawData['5xx'] = int(m.group(1))
  498. if "STARTTIME" in line:
  499. m = re.search("[0-9]+", line)
  500. rawData["startTime"] = int(m.group(0))
  501. if "ENDTIME" in line:
  502. m = re.search("[0-9]+", line)
  503. rawData["endTime"] = int(m.group(0))
  504. test_stats = self.__parse_stats(test_type, rawData["startTime"], rawData["endTime"], 1)
  505. # rawData["averageStats"] = self.__calculate_average_stats(test_stats)
  506. stats.append(test_stats)
  507. with open(self.benchmarker.stats_file(self.name, test_type) + ".json", "w") as stats_file:
  508. json.dump(stats, stats_file, indent=2)
  509. return results
  510. except IOError:
  511. return None
  512. ############################################################
  513. # End benchmark
  514. ############################################################
  515. ############################################################
  516. # __generate_concurrency_script(url, port)
  517. # Generates the string containing the bash script that will
  518. # be run on the client to benchmark a single test. This
  519. # specifically works for the variable concurrency tests (JSON
  520. # and DB)
  521. ############################################################
  522. def __generate_concurrency_script(self, url, port, accept_header, wrk_command="wrk"):
  523. headers = self.headers_template.format(accept=accept_header)
  524. return self.concurrency_template.format(max_concurrency=max(self.benchmarker.concurrency_levels),
  525. max_threads=self.benchmarker.threads, name=self.name, duration=self.benchmarker.duration,
  526. levels=" ".join("{}".format(item) for item in self.benchmarker.concurrency_levels),
  527. server_host=self.benchmarker.server_host, port=port, url=url, headers=headers, wrk=wrk_command)
  528. ############################################################
  529. # __generate_pipeline_script(url, port)
  530. # Generates the string containing the bash script that will
  531. # be run on the client to benchmark a single pipeline test.
  532. ############################################################
  533. def __generate_pipeline_script(self, url, port, accept_header, wrk_command="wrk"):
  534. headers = self.headers_template.format(accept=accept_header)
  535. return self.pipeline_template.format(max_concurrency=16384,
  536. max_threads=self.benchmarker.threads, name=self.name, duration=self.benchmarker.duration,
  537. levels=" ".join("{}".format(item) for item in [256,1024,4096,16384]),
  538. server_host=self.benchmarker.server_host, port=port, url=url, headers=headers, wrk=wrk_command,
  539. pipeline=16)
  540. ############################################################
  541. # __generate_query_script(url, port)
  542. # Generates the string containing the bash script that will
  543. # be run on the client to benchmark a single test. This
  544. # specifically works for the variable query tests (Query)
  545. ############################################################
  546. def __generate_query_script(self, url, port, accept_header):
  547. headers = self.headers_template.format(accept=accept_header)
  548. return self.query_template.format(max_concurrency=max(self.benchmarker.concurrency_levels),
  549. max_threads=self.benchmarker.threads, name=self.name, duration=self.benchmarker.duration,
  550. levels=" ".join("{}".format(item) for item in self.benchmarker.query_levels),
  551. server_host=self.benchmarker.server_host, port=port, url=url, headers=headers)
  552. ############################################################
  553. # Returns True if any test type this this framework test will use a DB
  554. ############################################################
  555. def requires_database(self):
  556. '''Returns True/False if this test requires a database'''
  557. return any(tobj.requires_db for (ttype,tobj) in self.runTests.iteritems())
  558. ############################################################
  559. # __begin_logging
  560. # Starts a thread to monitor the resource usage, to be synced with the client's time
  561. # TODO: MySQL and InnoDB are possible. Figure out how to implement them.
  562. ############################################################
  563. def __begin_logging(self, test_type):
  564. output_file = "{file_name}".format(file_name=self.benchmarker.get_stats_file(self.name, test_type))
  565. dstat_string = "dstat -afilmprsT --aio --fs --ipc --lock --raw --socket --tcp \
  566. --raw --socket --tcp --udp --unix --vm --disk-util \
  567. --rpc --rpcd --output {output_file}".format(output_file=output_file)
  568. cmd = shlex.split(dstat_string)
  569. dev_null = open(os.devnull, "w")
  570. self.subprocess_handle = subprocess.Popen(cmd, stdout=dev_null)
  571. ##############################################################
  572. # Begin __end_logging
  573. # Stops the logger thread and blocks until shutdown is complete.
  574. ##############################################################
  575. def __end_logging(self):
  576. self.subprocess_handle.terminate()
  577. self.subprocess_handle.communicate()
  578. ##############################################################
  579. # Begin __parse_stats
  580. # For each test type, process all the statistics, and return a multi-layered dictionary
  581. # that has a structure as follows:
  582. # (timestamp)
  583. # | (main header) - group that the stat is in
  584. # | | (sub header) - title of the stat
  585. # | | | (stat) - the stat itself, usually a floating point number
  586. ##############################################################
  587. def __parse_stats(self, test_type, start_time, end_time, interval):
  588. stats_dict = dict()
  589. stats_file = self.benchmarker.stats_file(self.name, test_type)
  590. with open(stats_file) as stats:
  591. while(stats.next() != "\n"): # dstat doesn't output a completely compliant CSV file - we need to strip the header
  592. pass
  593. stats_reader = csv.reader(stats)
  594. main_header = stats_reader.next()
  595. sub_header = stats_reader.next()
  596. time_row = sub_header.index("epoch")
  597. int_counter = 0
  598. for row in stats_reader:
  599. time = float(row[time_row])
  600. int_counter+=1
  601. if time < start_time:
  602. continue
  603. elif time > end_time:
  604. return stats_dict
  605. if int_counter % interval != 0:
  606. continue
  607. row_dict = dict()
  608. for nextheader in main_header:
  609. if nextheader != "":
  610. row_dict[nextheader] = dict()
  611. header = ""
  612. for item_num, column in enumerate(row):
  613. if(len(main_header[item_num]) != 0):
  614. header = main_header[item_num]
  615. row_dict[header][sub_header[item_num]] = float(column) # all the stats are numbers, so we want to make sure that they stay that way in json
  616. stats_dict[time] = row_dict
  617. return stats_dict
  618. ##############################################################
  619. # End __parse_stats
  620. ##############################################################
  621. def __getattr__(self, name):
  622. """For backwards compatibility, we used to pass benchmarker
  623. as the argument to the setup.sh files"""
  624. try:
  625. x = getattr(self.benchmarker, name)
  626. except AttributeError:
  627. print "AttributeError: %s not a member of FrameworkTest or Benchmarker" % name
  628. print "This is probably a bug"
  629. raise
  630. return x
  631. ##############################################################
  632. # Begin __calculate_average_stats
  633. # We have a large amount of raw data for the statistics that
  634. # may be useful for the stats nerds, but most people care about
  635. # a couple of numbers. For now, we're only going to supply:
  636. # * Average CPU
  637. # * Average Memory
  638. # * Total network use
  639. # * Total disk use
  640. # More may be added in the future. If they are, please update
  641. # the above list.
  642. # Note: raw_stats is directly from the __parse_stats method.
  643. # Recall that this consists of a dictionary of timestamps,
  644. # each of which contain a dictionary of stat categories which
  645. # contain a dictionary of stats
  646. ##############################################################
  647. def __calculate_average_stats(self, raw_stats):
  648. raw_stat_collection = dict()
  649. for timestamp, time_dict in raw_stats.items():
  650. for main_header, sub_headers in time_dict.items():
  651. item_to_append = None
  652. if 'cpu' in main_header:
  653. # We want to take the idl stat and subtract it from 100
  654. # to get the time that the CPU is NOT idle.
  655. item_to_append = sub_headers['idl'] - 100.0
  656. elif main_header == 'memory usage':
  657. item_to_append = sub_headers['used']
  658. elif 'net' in main_header:
  659. # Network stats have two parts - recieve and send. We'll use a tuple of
  660. # style (recieve, send)
  661. item_to_append = (sub_headers['recv'], sub_headers['send'])
  662. elif 'dsk' or 'io' in main_header:
  663. # Similar for network, except our tuple looks like (read, write)
  664. item_to_append = (sub_headers['read'], sub_headers['writ'])
  665. if item_to_append is not None:
  666. if main_header not in raw_stat_collection:
  667. raw_stat_collection[main_header] = list()
  668. raw_stat_collection[main_header].append(item_to_append)
  669. # Simple function to determine human readable size
  670. # http://stackoverflow.com/questions/1094841/reusable-library-to-get-human-readable-version-of-file-size
  671. def sizeof_fmt(num):
  672. # We'll assume that any number we get is convertable to a float, just in case
  673. num = float(num)
  674. for x in ['bytes','KB','MB','GB']:
  675. if num < 1024.0 and num > -1024.0:
  676. return "%3.1f%s" % (num, x)
  677. num /= 1024.0
  678. return "%3.1f%s" % (num, 'TB')
  679. # Now we have our raw stats in a readable format - we need to format it for display
  680. # We need a floating point sum, so the built in sum doesn't cut it
  681. display_stat_collection = dict()
  682. for header, values in raw_stat_collection.items():
  683. display_stat = None
  684. if 'cpu' in header:
  685. display_stat = sizeof_fmt(math.fsum(values) / len(values))
  686. elif main_header == 'memory usage':
  687. display_stat = sizeof_fmt(math.fsum(values) / len(values))
  688. elif 'net' in main_header:
  689. receive, send = zip(*values) # unzip
  690. display_stat = {'receive': sizeof_fmt(math.fsum(receive)), 'send': sizeof_fmt(math.fsum(send))}
  691. else: # if 'dsk' or 'io' in header:
  692. read, write = zip(*values) # unzip
  693. display_stat = {'read': sizeof_fmt(math.fsum(read)), 'write': sizeof_fmt(math.fsum(write))}
  694. display_stat_collection[header] = display_stat
  695. return display_stat
  696. ###########################################################################################
  697. # End __calculate_average_stats
  698. #########################################################################################
  699. ##########################################################################################
  700. # Constructor
  701. ##########################################################################################
  702. def __init__(self, name, directory, benchmarker, runTests, args):
  703. self.name = name
  704. self.directory = directory
  705. self.benchmarker = benchmarker
  706. self.runTests = runTests
  707. self.fwroot = benchmarker.fwroot
  708. self.approach = ""
  709. self.classification = ""
  710. self.database = ""
  711. self.framework = ""
  712. self.language = ""
  713. self.orm = ""
  714. self.platform = ""
  715. self.webserver = ""
  716. self.os = ""
  717. self.database_os = ""
  718. self.display_name = ""
  719. self.notes = ""
  720. self.versus = ""
  721. # setup logging
  722. logging.basicConfig(stream=sys.stderr, level=logging.INFO)
  723. self.install_root="%s/%s" % (self.fwroot, "installs")
  724. if benchmarker.install_strategy is 'pertest':
  725. self.install_root="%s/pertest/%s" % (self.install_root, name)
  726. # Used in setup.sh scripts for consistency with
  727. # the bash environment variables
  728. self.troot = self.directory
  729. self.iroot = self.install_root
  730. self.__dict__.update(args)
  731. ############################################################
  732. # End __init__
  733. ############################################################
  734. ############################################################
  735. # End FrameworkTest
  736. ############################################################
  737. ##########################################################################################
  738. # Static methods
  739. ##########################################################################################
  740. ##############################################################
  741. # parse_config(config, directory, benchmarker)
  742. # parses a config file and returns a list of FrameworkTest
  743. # objects based on that config file.
  744. ##############################################################
  745. def parse_config(config, directory, benchmarker):
  746. tests = []
  747. # This sort ordering is set up specifically to return the length
  748. # of the test name. There were SO many problems involved with
  749. # 'plaintext' being run first (rather, just not last) that we
  750. # needed to ensure that it was run last for every framework.
  751. def testOrder(type_name):
  752. return len(type_name)
  753. # The config object can specify multiple tests
  754. # Loop over them and parse each into a FrameworkTest
  755. for test in config['tests']:
  756. names = [name for (name,keys) in test.iteritems()]
  757. if "default" not in names:
  758. logging.warn("Framework %s does not define a default test in benchmark_config.json", config['framework'])
  759. for test_name, test_keys in test.iteritems():
  760. # Prefix all test names with framework except 'default' test
  761. if test_name == 'default':
  762. test_name = config['framework']
  763. else:
  764. test_name = "%s-%s" % (config['framework'], test_name)
  765. # Ensure FrameworkTest.framework is available
  766. if not test_keys['framework']:
  767. test_keys['framework'] = config['framework']
  768. #if test_keys['framework'].lower() != config['framework'].lower():
  769. # print Exception("benchmark_config.json for test %s is invalid - test framework '%s' must match benchmark_config.json framework '%s'" %
  770. # (test_name, test_keys['framework'], config['framework']))
  771. # Confirm required keys are present
  772. # TODO have a TechEmpower person confirm this list - I don't know what the website requires....
  773. required = ['language','webserver','classification','database','approach','orm','framework','os','database_os']
  774. if not all (key in test_keys for key in required):
  775. raise Exception("benchmark_config.json for test %s is invalid - missing required keys" % test_name)
  776. # Map test type to a parsed FrameworkTestType object
  777. runTests = dict()
  778. for type_name, type_obj in benchmarker.types.iteritems():
  779. try:
  780. runTests[type_name] = type_obj.copy().parse(test_keys)
  781. except AttributeError as ae:
  782. # This is quite common - most tests don't support all types
  783. # Quitely log it and move on (debug logging is on in travis and this causes
  784. # ~1500 lines of debug, so I'm totally ignoring it for now
  785. # logging.debug("Missing arguments for test type %s for framework test %s", type_name, test_name)
  786. pass
  787. # We need to sort by test_type to run
  788. sortedTestKeys = sorted(runTests.keys(), key=testOrder)
  789. sortedRunTests = OrderedDict()
  790. for sortedTestKey in sortedTestKeys:
  791. sortedRunTests[sortedTestKey] = runTests[sortedTestKey]
  792. # By passing the entire set of keys, each FrameworkTest will have a member for each key
  793. tests.append(FrameworkTest(test_name, directory, benchmarker, sortedRunTests, test_keys))
  794. return tests
  795. ##############################################################
  796. # End parse_config
  797. ##############################################################