stress.py 7.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273
  1. #!/usr/bin/env python
  2. from __future__ import absolute_import, print_function
  3. import os
  4. import platform
  5. import random
  6. import signal
  7. import sys
  8. from time import time, sleep
  9. from kombu.utils.compat import OrderedDict
  10. from celery import Celery, group, VERSION_BANNER
  11. from celery.bin.base import Command, Option
  12. from celery.exceptions import TimeoutError, SoftTimeLimitExceeded
  13. from celery.five import range, values
  14. from celery.utils.debug import blockdetection
  15. from celery.utils.text import indent, pluralize
# The suite should be run against workers started with these options:
#
# 1) celery -A stress worker -c 1 --maxtasksperchild=1
# 2) celery -A stress worker -c 8 --maxtasksperchild=1
#
# 3) celery -A stress worker -c 1
# 4) celery -A stress worker -c 8
#
# 5) celery -A stress worker --autoscale=8,0
#
# 6) celery -A stress worker --time-limit=1
#
# 7) celery -A stress worker -c1 --maxtasksperchild=1 -- celery.acks_late=1
  29. BIG = 'x' * 2 ** 20 * 8
  30. SMALL = 'e' * 1024
  31. BANNER = """\
  32. Celery stress-suite v{version}
  33. {platform}
  34. [config]
  35. .> broker: {conninfo}
  36. [toc: {total} {TESTS} total]
  37. {toc}
  38. """
  39. app = Celery(
  40. 'stress', broker='amqp://', backend='redis://',
  41. set_as_current=False,
  42. )
  43. app.conf.update(
  44. CELERYD_PREFETCH_MULTIPLIER=10,
  45. )
  46. @app.task
  47. def _marker(s, sep='-'):
  48. print('{0} {1} {2}'.format(sep * 3, s, sep * 3))
  49. @app.task
  50. def add(x, y):
  51. return x + y
  52. @app.task
  53. def any_(*args, **kwargs):
  54. wait = kwargs.get('sleep')
  55. if wait:
  56. sleep(wait)
  57. @app.task
  58. def exiting(status=0):
  59. sys.exit(status)
  60. @app.task
  61. def kill(sig=signal.SIGKILL):
  62. os.kill(os.getpid(), sig)
  63. @app.task
  64. def sleeping(i):
  65. sleep(i)
  66. @app.task
  67. def sleeping_ignore_limits(i):
  68. try:
  69. sleep(i)
  70. except SoftTimeLimitExceeded:
  71. sleep(i)
  72. @app.task
  73. def segfault():
  74. import ctypes
  75. ctypes.memset(0, 0, 1)
  76. assert False, 'should not get here'
  77. def marker(s, sep='-'):
  78. print('{0}{1}'.format(sep, s))
  79. _marker.delay(s, sep)
  80. class Stress(Command):
  81. def run(self, *names, **options):
  82. try:
  83. return Suite(self.app,
  84. block_timeout=options.get('block_timeout'),
  85. ).run(names, **options)
  86. except KeyboardInterrupt:
  87. pass
  88. def get_options(self):
  89. return (
  90. Option('-i', '--iterations', type='int', default=50,
  91. help='Number of iterations for each test'),
  92. Option('-n', '--numtests', type='int', default=None,
  93. help='Number of tests to execute'),
  94. Option('-o', '--offset', type='int', default=0,
  95. help='Start at custom offset'),
  96. Option('--block-timeout', type='int', default=30 * 60),
  97. Option('-l', '--list', action='store_true', dest='list_all',
  98. help='List all tests'),
  99. )
  100. class Suite(object):
  101. def __init__(self, app, block_timeout=30 * 60):
  102. self.app = app
  103. self.connerrors = self.app.connection().recoverable_connection_errors
  104. self.block_timeout = block_timeout
  105. self.tests = OrderedDict(
  106. (fun.__name__, fun) for fun in [
  107. self.manyshort,
  108. self.termbysig,
  109. self.bigtasks,
  110. self.smalltasks,
  111. self.timelimits,
  112. self.timelimits_soft,
  113. self.revoketermfast,
  114. self.revoketermslow,
  115. self.alwayskilled,
  116. ]
  117. )
  118. def run(self, names=None, iterations=50, offset=0,
  119. numtests=None, list_all=False, **kw):
  120. tests = self.filtertests(names)[offset:numtests or None]
  121. if list_all:
  122. return print(self.testlist(tests))
  123. print(self.banner(tests))
  124. marker('Stresstest suite start', '+')
  125. for i, test in enumerate(tests):
  126. self.runtest(test, iterations, i + 1)
  127. marker('Stresstest suite end', '+')
  128. def filtertests(self, names):
  129. try:
  130. return ([self.tests[n] for n in names] if names
  131. else list(values(self.tests)))
  132. except KeyError as exc:
  133. raise KeyError('Unknown test name: {0}'.format(exc))
  134. def testlist(self, tests):
  135. return ',\n'.join(
  136. '.> {0}) {1}'.format(i + 1, t.__name__)
  137. for i, t in enumerate(tests)
  138. )
  139. def banner(self, tests):
  140. app = self.app
  141. return BANNER.format(
  142. app='{0}:0x{1:x}'.format(app.main or '__main__', id(app)),
  143. version=VERSION_BANNER,
  144. conninfo=app.connection().as_uri(),
  145. platform=platform.platform(),
  146. toc=self.testlist(tests),
  147. TESTS=pluralize(len(tests), 'test'),
  148. total=len(tests),
  149. )
  150. def manyshort(self):
  151. self.join(group(add.s(i, i) for i in xrange(1000))())
  152. def runtest(self, fun, n=50, index=0):
  153. with blockdetection(self.block_timeout):
  154. t = time()
  155. i = 0
  156. failed = False
  157. marker('{0}: {1}({2})'.format(index, fun.__name__, n))
  158. try:
  159. for i in range(n):
  160. print(i)
  161. fun()
  162. except Exception:
  163. failed = True
  164. raise
  165. finally:
  166. print('{0} {1} iterations in {2}s'.format(
  167. 'failed after' if failed else 'completed',
  168. i + 1, time() - t,
  169. ))
  170. def termbysig(self):
  171. self._evil_groupmember(kill)
  172. def termbysegfault(self):
  173. self._evil_groupmember(segfault)
  174. def timelimits(self):
  175. self._evil_groupmember(sleeping, 2, timeout=1)
  176. def timelimits_soft(self):
  177. self._evil_groupmember(sleeping_ignore_limits, 2,
  178. soft_timeout=1, timeout=1.1)
  179. def alwayskilled(self):
  180. g = group(kill.s() for _ in range(10))
  181. self.join(g(), timeout=10)
  182. def _evil_groupmember(self, evil_t, *eargs, **opts):
  183. g1 = group(add.s(2, 2).set(**opts), evil_t.s(*eargs).set(**opts),
  184. add.s(4, 4).set(**opts), add.s(8, 8).set(**opts))
  185. g2 = group(add.s(3, 3).set(**opts), add.s(5, 5).set(**opts),
  186. evil_t.s(*eargs).set(**opts), add.s(7, 7).set(**opts))
  187. self.join(g1(), timeout=10)
  188. self.join(g2(), timeout=10)
  189. def bigtasks(self, wait=None):
  190. self._revoketerm(wait, False, False, BIG)
  191. def smalltasks(self, wait=None):
  192. self._revoketerm(wait, False, False, SMALL)
  193. def revoketermfast(self, wait=None):
  194. self._revoketerm(wait, True, False, SMALL)
  195. def revoketermslow(self, wait=5):
  196. self._revoketerm(wait, True, True, BIG)
  197. def _revoketerm(self, wait=None, terminate=True,
  198. joindelay=True, data=BIG):
  199. g = group(any_.s(data, sleep=wait) for i in range(8))
  200. r = g()
  201. if terminate:
  202. if joindelay:
  203. sleep(random.choice(range(4)))
  204. r.revoke(terminate=True)
  205. self.join(r, timeout=100)
  206. def join(self, r, **kwargs):
  207. while 1:
  208. try:
  209. return r.get(propagate=False, **kwargs)
  210. except TimeoutError as exc:
  211. print('join timed out: %s' % (exc, ))
  212. except self.connerrors as exc:
  213. print('join: connection lost: %r' % (exc, ))
  214. if __name__ == '__main__':
  215. Stress(app=app).execute_from_commandline()