benchmarker.py 22 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657
  1. from installer import Installer
  2. from framework_test import FrameworkTest
  3. import framework_test
  4. import os
  5. import json
  6. import subprocess
  7. import time
  8. import textwrap
  9. import pprint
  10. import csv
  11. import sys
  12. from datetime import datetime
  13. class Benchmarker:
  14. ##########################################################################################
  15. # Public methods
  16. ##########################################################################################
  17. ############################################################
  18. # Prints all the available tests
  19. ############################################################
  20. def run_list_tests(self):
  21. all_tests = self.__gather_tests()
  22. for test in all_tests:
  23. print str(test.sort) + ": " + test.name
  24. self.__finish()
  25. ############################################################
  26. # End run_list_tests
  27. ############################################################
  28. ############################################################
  # next_sort_value
  30. # Prints the next available sort number that should be used
  31. # for any new tests
  32. ############################################################
  33. def next_sort_value(self):
  34. all_tests = self.__gather_tests()
  35. # all_tests is already sorted by sort, so we can just get
  36. # the last one and add one to it.
  37. print " Next sort number is: " + str(all_tests[-1].sort + 1)
  38. self.__finish()
  39. ############################################################
  40. # End next_sort_value
  41. ############################################################
  42. ############################################################
  43. # parse_timestamp
  44. # Re-parses the raw data for a given timestamp
  45. ############################################################
  def parse_timestamp(self):
    """Re-parse every gathered test and rewrite the aggregated result files."""
    gathered = self.__gather_tests()

    # Let each test re-read its own raw data first ...
    for framework_entry in gathered:
      framework_entry.parse_all()

    # ... then regenerate the aggregate files and print the summary.
    self.__parse_results(gathered)
    self.__finish()
  52. ############################################################
  # End parse_timestamp
  54. ############################################################
  55. ############################################################
  56. # Run the tests:
  57. # This process involves setting up the client/server machines
  58. # with any necessary change. Then going through each test,
  59. # running their setup script, verifying the URLs, and
  60. # running benchmarks against them.
  61. ############################################################
  62. def run(self):
  63. ##########################
  64. # Get a list of all known
  65. # tests that we can run.
  66. ##########################
  67. all_tests = self.__gather_tests()
  68. ##########################
  69. # Setup client/server
  70. ##########################
  71. print textwrap.dedent("""
  72. =====================================================
  73. Preparing up Server and Client ...
  74. =====================================================
  75. """)
  76. self.__setup_server()
  77. self.__setup_client()
  78. ##########################
  79. # Run tests
  80. ##########################
  81. self.__run_tests(all_tests)
  82. ##########################
  83. # Parse results
  84. ##########################
  85. if self.mode == "benchmark":
  86. print textwrap.dedent("""
  87. =====================================================
  88. Parsing Results ...
  89. =====================================================
  90. """)
  91. self.__parse_results(all_tests)
  92. self.__finish()
  93. ############################################################
  94. # End run
  95. ############################################################
  96. ############################################################
  97. # sftp_string(batch_file)
  # generates the sftp command line used to connect to the client
  99. ############################################################
  100. def sftp_string(self, batch_file):
  101. sftp_string = "sftp -oStrictHostKeyChecking=no "
  102. if batch_file != None: sftp_string += " -b " + batch_file + " "
  103. if self.identity_file != None:
  104. sftp_string += " -i " + self.identity_file + " "
  105. return sftp_string + self.client_user + "@" + self.client_host
  106. ############################################################
  107. # End sftp_string
  108. ############################################################
  109. ############################################################
  110. # generate_url(url, port)
  111. # generates a fully qualified URL for accessing a test url
  112. ############################################################
  113. def generate_url(self, url, port):
  114. return self.server_host + ":" + str(port) + url
  115. ############################################################
  116. # End generate_url
  117. ############################################################
  118. ############################################################
  119. # output_file(test_name, test_type)
  120. # returns the output file for this test_name and test_type
  121. # timestamp/test_type/test_name/raw
  122. ############################################################
  123. def output_file(self, test_name, test_type):
  124. path = os.path.join(self.result_directory, self.timestamp, test_type, test_name, "raw")
  125. try:
  126. os.makedirs(os.path.dirname(path))
  127. except OSError:
  128. pass
  129. return path
  130. ############################################################
  131. # End output_file
  132. ############################################################
  133. ############################################################
  134. # full_results_directory
  135. ############################################################
  136. def full_results_directory(self):
  137. path = os.path.join(self.result_directory, self.timestamp)
  138. try:
  139. os.makedirs(path)
  140. except OSError:
  141. pass
  142. return path
  143. ############################################################
  # End full_results_directory
  145. ############################################################
  146. ############################################################
  147. # report_results
  148. ############################################################
  149. def report_results(self, framework, test, results):
  150. if test not in self.results['rawData'].keys():
  151. self.results['rawData'][test] = dict()
  152. self.results['rawData'][test][framework.sort] = results
  153. ############################################################
  154. # End report_results
  155. ############################################################
  156. ##########################################################################################
  157. # Private methods
  158. ##########################################################################################
  159. ############################################################
  160. # Gathers all the tests
  161. ############################################################
  162. def __gather_tests(self):
  163. tests = []
  164. # Loop through each directory (we assume we're being run from the benchmarking root)
  165. # and look for the files that signify a benchmark test
  166. for dirname, dirnames, filenames in os.walk('.'):
  167. # Look for the benchmark_config file, this will set up our tests
  168. # It's format looks like this:
  169. #
  170. # {
  171. # "framework": "nodejs",
  172. # "tests": [{
  173. # "default": {
  174. # "setup_file": "setup",
  175. # "json_url": "/json"
  176. # },
  177. # "mysql": {
  178. # "setup_file": "setup",
  179. # "db_url": "/mysql",
  180. # "query_url": "/mysql?queries="
  181. # },
  182. # ...
  183. # }]
  184. # }
  185. if 'benchmark_config' in filenames:
  186. config = None
  187. with open(os.path.join(dirname, 'benchmark_config'), 'r') as config_file:
  188. # Load json file into config object
  189. config = json.load(config_file)
  190. if config == None:
  191. continue
  192. tests = tests + framework_test.parse_config(config, dirname[2:], self)
  193. tests.sort(key=lambda x: x.sort)
  194. return tests
  195. ############################################################
  196. # End __gather_tests
  197. ############################################################
  198. ############################################################
  # Makes any necessary changes to the server that should be
  # made before running the tests. This involves setting kernel
  # settings to allow for more connections, or more file
  # descriptors
  203. #
  204. # http://redmine.lighttpd.net/projects/weighttp/wiki#Troubleshooting
  205. ############################################################
  def __setup_server(self):
    """Apply the kernel/limit settings used for benchmarking on this machine.

    Returns True when nothing had to be done (os.name == 'nt') or when every
    command succeeded, and False as soon as one command exits with a
    non-zero status (the remaining commands are then not run).
    """
    if os.name == 'nt':
      return True

    # Passed as argument lists so no string splitting is involved.
    # NOTE(review): "sudo -s ulimit" runs ulimit in a shell started by sudo;
    # it presumably does not change the limit of this process - confirm.
    commands = [
      ["sudo", "sysctl", "-w", "net.core.somaxconn=5000"],
      ["sudo", "-s", "ulimit", "-n", "16384"],
      ["sudo", "sysctl", "net.ipv4.tcp_tw_reuse=1"],
      ["sudo", "sysctl", "net.ipv4.tcp_tw_recycle=1"],
      ["sudo", "sysctl", "-w", "kernel.shmmax=134217728"],
      ["sudo", "sysctl", "-w", "kernel.shmall=2097152"],
    ]

    try:
      for command in commands:
        subprocess.check_call(command)
    except subprocess.CalledProcessError:
      return False

    # Previously the success path fell off the end and returned None, which
    # a caller could not tell apart from the False failure result by truthiness.
    return True
  218. ############################################################
  219. # End __setup_server
  220. ############################################################
  221. ############################################################
  222. # Makes any necessary changes to the client machine that
  223. # should be made before running the tests. Is very similar
  224. # to the server setup, but may also include client specific
  225. # changes.
  226. ############################################################
  def __setup_client(self):
    """Send the kernel/limit tuning commands to the client over ssh.

    The commands are written to the stdin of the process started from
    self.ssh_string; their exit statuses are not checked.
    """
    tuning_script = textwrap.dedent("""
      sudo sysctl -w net.core.somaxconn=5000
      sudo -s ulimit -n 16384
      sudo sysctl net.ipv4.tcp_tw_reuse=1
      sudo sysctl net.ipv4.tcp_tw_recycle=1
      sudo sysctl -w kernel.shmmax=2147483648
      sudo sysctl -w kernel.shmall=2097152
      """)
    remote_shell = subprocess.Popen(self.ssh_string, stdin=subprocess.PIPE, shell=True)
    remote_shell.communicate(tuning_script)
  237. ############################################################
  238. # End __setup_client
  239. ############################################################
  240. ############################################################
  # __run_tests
  # Goes through the given tests, skipping the ones ruled out by
  # the operating system, the requested/excluded test names or
  # the test type. Every remaining test is started, has its URLs
  # verified, is benchmarked (in benchmark mode) and is stopped.
  246. ############################################################
  247. def __run_tests(self, tests):
  248. for test in tests:
  249. if test.os == 'nt' and os.name != 'nt':
  250. # this is a windows only test, but we're not on windows. abort.
  251. continue
  252. # If the user specified which tests to run, then
  253. # we can skip over tests that are not in that list
  254. if self.test != None and test.name not in self.test:
  255. continue
  256. # If the test is in the excludes list, we skip it
  257. if self.exclude != None and test.name in self.exclude:
  258. continue
  259. # If the test does not contain an implementation of the current test-type, skip it
  260. if self.type != 'all' and not test.contains_type(self.type):
  261. continue
  262. print textwrap.dedent("""
  263. =====================================================
  264. Beginning {name}
  265. -----------------------------------------------------
  266. """.format(name=test.name))
  267. ##########################
  268. # Start this test
  269. ##########################
  270. print textwrap.dedent("""
  271. -----------------------------------------------------
  272. Starting {name}
  273. -----------------------------------------------------
  274. """.format(name=test.name))
  275. try:
  276. p = subprocess.Popen(self.ssh_string, stdin=subprocess.PIPE, shell=True)
  277. p.communicate("""
  278. sudo restart mysql
  279. sudo restart mongodb
  280. """)
  281. time.sleep(10)
  282. result = test.start()
  283. if result != 0:
  284. test.stop()
  285. time.sleep(5)
  286. print "ERROR: Problem starting " + test.name
  287. print textwrap.dedent("""
  288. -----------------------------------------------------
  289. Stopped {name}
  290. -----------------------------------------------------
  291. """.format(name=test.name))
  292. continue
  293. time.sleep(self.sleep)
  294. ##########################
  295. # Verify URLs
  296. ##########################
  297. print textwrap.dedent("""
  298. -----------------------------------------------------
  299. Verifying URLs for {name}
  300. -----------------------------------------------------
  301. """.format(name=test.name))
  302. test.verify_urls()
  303. ##########################
  304. # Benchmark this test
  305. ##########################
  306. if self.mode == "benchmark":
  307. print textwrap.dedent("""
  308. -----------------------------------------------------
  309. Benchmarking {name} ...
  310. -----------------------------------------------------
  311. """.format(name=test.name))
  312. test.benchmark()
  313. ##########################
  314. # Stop this test
  315. ##########################
  316. test.stop()
  317. time.sleep(5)
  318. print textwrap.dedent("""
  319. -----------------------------------------------------
  320. Stopped {name}
  321. -----------------------------------------------------
  322. """.format(name=test.name))
  323. time.sleep(5)
  324. except (KeyboardInterrupt, SystemExit):
  325. test.stop()
  326. print """
  327. -----------------------------------------------------
  328. Cleaning up....
  329. -----------------------------------------------------
  330. """
  331. self.__finish()
  332. sys.exit()
  333. ############################################################
  334. # End __run_tests
  335. ############################################################
  336. ############################################################
  # __parse_results
  # Writes the aggregated results to results.json and the
  # commit count of each framework to commits.json, both in
  # the full results directory.
  342. ############################################################
  def __parse_results(self, tests):
    """Write results.json and commits.json into the full results directory.

    tests -- accepted for the callers' sake; not used by this method.
    """
    # Aggregate JSON file
    results_path = os.path.join(self.full_results_directory(), "results.json")
    with open(results_path, "w") as results_file:
      results_file.write(json.dumps(self.results))

    # Refresh self.commits with the commit count of each framework.
    self.__count_commits()

    commits_path = os.path.join(self.full_results_directory(), "commits.json")
    with open(commits_path, "w") as commits_file:
      commits_file.write(json.dumps(self.commits))

    # NOTE: the per-test-type CSV exports (json.csv, db.csv, query.csv and
    # fortune.csv) that used to be written here are currently disabled.
  381. ############################################################
  382. # End __parse_results
  383. ############################################################
  384. ############################################################
  385. # __count_commits
  386. ############################################################
  387. def __count_commits(self):
  388. all_folders = [
  389. "aspnet",
  390. "aspnet-stripped",
  391. "beego",
  392. "bottle",
  393. "cake",
  394. "compojure",
  395. "cowboy",
  396. "cpoll_cppsp",
  397. "dancer",
  398. "dart",
  399. "django",
  400. "django-stripped",
  401. "dropwizard",
  402. "elli",
  403. "express",
  404. "finagle",
  405. "flask",
  406. "gemini",
  407. "go",
  408. "grails",
  409. "grizzly-bm",
  410. "grizzly-jersey",
  411. "hapi",
  412. "http-kit",
  413. "HttpListener",
  414. "jester",
  415. "kelp",
  416. "lapis",
  417. "lift-stateless",
  418. "luminus",
  419. "mojolicious",
  420. "nancy",
  421. "netty",
  422. "nodejs",
  423. "onion",
  424. "openresty",
  425. "php",
  426. "php-codeigniter",
  427. "php-fuel",
  428. "php-kohana",
  429. "php-laravel",
  430. "php-lithium",
  431. "php-micromvc",
  432. "php-phalcon",
  433. "php-phalcon-micro",
  434. "php-silex",
  435. "php-silex-orm",
  436. "php-silica",
  437. "php-slim",
  438. "php-symfony2",
  439. "php-yaf",
  440. "phreeze",
  441. "plack",
  442. "plain",
  443. "play1",
  444. "play1siena",
  445. "play-java",
  446. "play-java-jpa",
  447. "play-scala",
  448. "play-scala-mongodb",
  449. "play-slick",
  450. "rack",
  451. "rails",
  452. "rails-stripped",
  453. "restexpress",
  454. "revel",
  455. "revel-jet",
  456. "revel-qbs",
  457. "ringojs",
  458. "ringojs-convenient",
  459. "scalatra",
  460. "servicestack",
  461. "servlet",
  462. "sinatra",
  463. "snap",
  464. "spark",
  465. "spray",
  466. "spring",
  467. "tapestry",
  468. "tornado",
  469. "treefrog",
  470. "undertow",
  471. "unfiltered",
  472. "vertx",
  473. "wai",
  474. "webgo",
  475. "web-simple",
  476. "wicket",
  477. "wsgi",
  478. "yesod"
  479. ]
  480. jsonResult = {"commitCount":{}}
  481. for framework in all_folders:
  482. try:
  483. command = "echo $(git rev-list --count HEAD -- " + framework + ")"
  484. commitCount = subprocess.check_output(command, shell=True)
  485. jsonResult["commitCount"][framework] = int(commitCount)
  486. except:
  487. continue
  488. self.commits = jsonResult
  489. ############################################################
  490. # End __count_commits
  491. ############################################################
  492. ############################################################
  493. # __finish
  494. ############################################################
  495. def __finish(self):
  496. print "Time to complete: " + str(int(time.time() - self.start_time)) + " seconds"
  497. print "Results are saved in " + os.path.join(self.result_directory, self.timestamp)
  498. ############################################################
  499. # End __finish
  500. ############################################################
  501. ##########################################################################################
  502. # Constructor
  503. ##########################################################################################
  504. ############################################################
  505. # Initialize the benchmarker. The args are the arguments
  506. # parsed via argparser.
  507. ############################################################
  508. def __init__(self, args):
  509. self.__dict__.update(args)
  510. self.start_time = time.time()
  511. # setup some additional variables
  512. if self.database_host == None: self.database_host = self.client_host
  513. self.result_directory = os.path.join("results", self.name)
  514. if self.parse != None:
  515. self.timestamp = self.parse
  516. else:
  517. self.timestamp = time.strftime("%Y%m%d%H%M%S", time.localtime())
  518. # Setup the concurrency levels array. This array goes from
  519. # starting_concurrency to max concurrency, doubling each time
  520. self.concurrency_levels = []
  521. concurrency = self.starting_concurrency
  522. while concurrency <= self.max_concurrency:
  523. self.concurrency_levels.append(concurrency)
  524. concurrency = concurrency * 2
  525. # Setup query interval array
  526. # starts at 1, and goes up to max_queries, using the query_interval
  527. self.query_intervals = []
  528. queries = 1
  529. while queries <= self.max_queries:
  530. self.query_intervals.append(queries)
  531. if queries == 1:
  532. queries = 0
  533. queries = queries + self.query_interval
  534. # Load the latest data
  535. self.latest = None
  536. try:
  537. with open('latest.json', 'r') as f:
  538. # Load json file into config object
  539. self.latest = json.load(f)
  540. except IOError:
  541. pass
  542. self.results = None
  543. try:
  544. if self.latest != None and self.name in self.latest.keys():
  545. with open(os.path.join(self.result_directory, str(self.latest[self.name]), 'results.json'), 'r') as f:
  546. # Load json file into config object
  547. self.results = json.load(f)
  548. except IOError:
  549. pass
  550. if self.results == None:
  551. self.results = dict()
  552. self.results['concurrencyLevels'] = self.concurrency_levels
  553. self.results['queryIntervals'] = self.query_intervals
  554. self.results['frameworks'] = [t.name for t in self.__gather_tests()]
  555. self.results['duration'] = self.duration
  556. self.results['rawData'] = dict()
  557. self.results['rawData']['json'] = dict()
  558. self.results['rawData']['db'] = dict()
  559. self.results['rawData']['query'] = dict()
  560. self.results['rawData']['fortune'] = dict()
  561. self.results['rawData']['update'] = dict()
  562. self.results['rawData']['plaintext'] = dict()
  563. else:
  564. #for x in self.__gather_tests():
  565. # if x.name not in self.results['frameworks']:
  566. # self.results['frameworks'] = self.results['frameworks'] + [x.name]
  567. # Always overwrite framework list
  568. self.results['frameworks'] = [t.name for t in self.__gather_tests()]
  569. # Setup the ssh command string
  570. self.ssh_string = "ssh -T -o StrictHostKeyChecking=no " + self.client_user + "@" + self.client_host
  571. if self.identity_file != None:
  572. self.ssh_string = self.ssh_string + " -i " + self.identity_file
  573. if self.install_software:
  574. install = Installer(self)
  575. install.install_software()
  576. ############################################################
  577. # End __init__
  578. ############################################################