suite.py 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340
  1. from __future__ import absolute_import, print_function, unicode_literals
  2. import inspect
  3. import platform
  4. import random
  5. import socket
  6. import sys
  7. from collections import OrderedDict, defaultdict, namedtuple
  8. from itertools import count
  9. from time import sleep
  10. from celery import group, VERSION_BANNER
  11. from celery.exceptions import TimeoutError
  12. from celery.five import items, monotonic, range, values
  13. from celery.utils.debug import blockdetection
  14. from celery.utils.text import pluralize, truncate
  15. from celery.utils.timeutils import humanize_seconds
  16. from .app import (
  17. marker, _marker, add, any_, exiting, kill, sleeping,
  18. sleeping_ignore_limits, any_returning,
  19. )
  20. from .data import BIG, SMALL
  21. from .fbi import FBI
# Header template printed before a run; ``BaseSuite.banner`` fills the
# placeholders with ``str.format``.
BANNER = """\
Celery stress-suite v{version}
{platform}
[config]
.> broker: {conninfo}
[toc: {total} {TESTS} total]
{toc}
"""
# Progress line template; ``pstatus`` formats it with a ``Progress`` tuple
# as positional argument 0 and humanized ``runtime``/``elapsed`` keywords.
# The trailing backslashes join the lines of the literal into a single line.
F_PROGRESS = """\
{0.index}: {0.test.__name__}({0.iteration}/{0.total_iterations}) \
rep#{0.repeats} runtime: {runtime}/{elapsed} \
"""
# Snapshot of the test currently being run, as built by
# ``BaseSuite.runtest``:
#   test             -- the test callable
#   iteration        -- 1-based number of the current iteration
#   total_iterations -- number of iterations requested
#   index            -- position of the test within the run
#   repeats          -- number of the current suite repetition
#   runtime          -- ``monotonic()`` reading taken when the iteration began
#   elapsed          -- ``monotonic()`` reading taken when the test began
#   completed        -- 0 while running, 1 once the test ended without failure
Progress = namedtuple('Progress', (
    'test', 'iteration', 'total_iterations',
    'index', 'repeats', 'runtime', 'elapsed', 'completed',
))
# ``BaseSuite.run`` compares ``repeat`` against this value to decide whether
# to repeat the suite without end.
Inf = float('Inf')
  39. class StopSuite(Exception):
  40. pass
  41. def pstatus(p):
  42. return F_PROGRESS.format(
  43. p,
  44. runtime=humanize_seconds(monotonic() - p.runtime, now='0 seconds'),
  45. elapsed=humanize_seconds(monotonic() - p.elapsed, now='0 seconds'),
  46. )
  47. class Speaker(object):
  48. def __init__(self, gap=5.0):
  49. self.gap = gap
  50. self.last_noise = monotonic() - self.gap * 2
  51. def beep(self):
  52. now = monotonic()
  53. if now - self.last_noise >= self.gap:
  54. self.emit()
  55. self.last_noise = now
  56. def emit(self):
  57. print('\a', file=sys.stderr, end='')
  58. def testgroup(*funs):
  59. return OrderedDict((fun.__name__, fun) for fun in funs)
  60. class BaseSuite(object):
  61. def __init__(self, app, block_timeout=30 * 60):
  62. self.app = app
  63. self.connerrors = self.app.connection().recoverable_connection_errors
  64. self.block_timeout = block_timeout
  65. self.progress = None
  66. self.speaker = Speaker()
  67. self.fbi = FBI(app)
  68. self.init_groups()
  69. def init_groups(self):
  70. acc = defaultdict(list)
  71. for attr in dir(self):
  72. if not _is_descriptor(self, attr):
  73. meth = getattr(self, attr)
  74. try:
  75. groups = meth.__func__.__testgroup__
  76. except AttributeError:
  77. pass
  78. else:
  79. for group in groups:
  80. acc[group].append(meth)
  81. # sort the tests by the order in which they are defined in the class
  82. for group in values(acc):
  83. group[:] = sorted(group, key=lambda m: m.__func__.__testsort__)
  84. self.groups = dict(
  85. (name, testgroup(*tests)) for name, tests in items(acc)
  86. )
  87. def run(self, names=None, iterations=50, offset=0,
  88. numtests=None, list_all=False, repeat=0, group='all',
  89. diag=False, no_join=False, **kw):
  90. self.no_join = no_join
  91. self.fbi.enable(diag)
  92. tests = self.filtertests(group, names)[offset:numtests or None]
  93. if list_all:
  94. return print(self.testlist(tests))
  95. print(self.banner(tests))
  96. print('+ Enabling events')
  97. self.app.control.enable_events()
  98. it = count() if repeat == Inf else range(int(repeat) or 1)
  99. for i in it:
  100. marker(
  101. 'Stresstest suite start (repetition {0})'.format(i + 1),
  102. '+',
  103. )
  104. for j, test in enumerate(tests):
  105. self.runtest(test, iterations, j + 1, i + 1)
  106. marker(
  107. 'Stresstest suite end (repetition {0})'.format(i + 1),
  108. '+',
  109. )
  110. def filtertests(self, group, names):
  111. tests = self.groups[group]
  112. try:
  113. return ([tests[n] for n in names] if names
  114. else list(values(tests)))
  115. except KeyError as exc:
  116. raise KeyError('Unknown test name: {0}'.format(exc))
  117. def testlist(self, tests):
  118. return ',\n'.join(
  119. '.> {0}) {1}'.format(i + 1, t.__name__)
  120. for i, t in enumerate(tests)
  121. )
  122. def banner(self, tests):
  123. app = self.app
  124. return BANNER.format(
  125. app='{0}:0x{1:x}'.format(app.main or '__main__', id(app)),
  126. version=VERSION_BANNER,
  127. conninfo=app.connection().as_uri(),
  128. platform=platform.platform(),
  129. toc=self.testlist(tests),
  130. TESTS=pluralize(len(tests), 'test'),
  131. total=len(tests),
  132. )
  133. def runtest(self, fun, n=50, index=0, repeats=1):
  134. print('{0}: [[[{1}({2})]]]'.format(repeats, fun.__name__, n))
  135. with blockdetection(self.block_timeout):
  136. with self.fbi.investigation():
  137. runtime = elapsed = monotonic()
  138. i = 0
  139. failed = False
  140. self.progress = Progress(
  141. fun, i, n, index, repeats, elapsed, runtime, 0,
  142. )
  143. _marker.delay(pstatus(self.progress))
  144. try:
  145. for i in range(n):
  146. runtime = monotonic()
  147. self.progress = Progress(
  148. fun, i + 1, n, index, repeats, runtime, elapsed, 0,
  149. )
  150. try:
  151. fun()
  152. except StopSuite:
  153. raise
  154. except Exception as exc:
  155. print('-> {0!r}'.format(exc))
  156. print(pstatus(self.progress))
  157. else:
  158. print(pstatus(self.progress))
  159. except Exception:
  160. failed = True
  161. self.speaker.beep()
  162. raise
  163. finally:
  164. print('{0} {1} iterations in {2}s'.format(
  165. 'failed after' if failed else 'completed',
  166. i + 1, humanize_seconds(monotonic() - elapsed),
  167. ))
  168. if not failed:
  169. self.progress = Progress(
  170. fun, i + 1, n, index, repeats, runtime, elapsed, 1,
  171. )
  172. def missing_results(self, r):
  173. return [res.id for res in r if res.id not in res.backend._cache]
  174. def join(self, r, propagate=False, max_retries=10, **kwargs):
  175. if self.no_join:
  176. return
  177. received = []
  178. def on_result(task_id, value):
  179. received.append(task_id)
  180. for i in range(max_retries) if max_retries else count(0):
  181. received[:] = []
  182. try:
  183. return r.get(callback=on_result, propagate=propagate, **kwargs)
  184. except (socket.timeout, TimeoutError) as exc:
  185. waiting_for = self.missing_results(r)
  186. self.speaker.beep()
  187. marker(
  188. 'Still waiting for {0}/{1}: [{2}]: {3!r}'.format(
  189. len(r) - len(received), len(r),
  190. truncate(', '.join(waiting_for)), exc), '!',
  191. )
  192. self.fbi.diag(waiting_for)
  193. except self.connerrors as exc:
  194. self.speaker.beep()
  195. marker('join: connection lost: {0!r}'.format(exc), '!')
  196. raise StopSuite('Test failed: Missing task results')
  197. def dump_progress(self):
  198. return pstatus(self.progress) if self.progress else 'No test running'
  199. _creation_counter = count(0)
  200. def testcase(*groups):
  201. if not groups:
  202. raise ValueError('@testcase requires at least one group name')
  203. def _mark_as_case(fun):
  204. fun.__testgroup__ = groups
  205. fun.__testsort__ = next(_creation_counter)
  206. return fun
  207. return _mark_as_case
  208. def _is_descriptor(obj, attr):
  209. try:
  210. cattr = getattr(obj.__class__, attr)
  211. except AttributeError:
  212. pass
  213. else:
  214. return not inspect.ismethod(cattr) and hasattr(cattr, '__get__')
  215. return False
  216. class Suite(BaseSuite):
  217. @testcase('all', 'green')
  218. def manyshort(self):
  219. self.join(group(add.s(i, i) for i in range(1000))(),
  220. timeout=10, propagate=True)
  221. @testcase('all')
  222. def termbysig(self):
  223. self._evil_groupmember(kill)
  224. @testcase('green')
  225. def group_with_exit(self):
  226. self._evil_groupmember(exiting)
  227. @testcase('all')
  228. def timelimits(self):
  229. self._evil_groupmember(sleeping, 2, time_limit=1)
  230. @testcase('all')
  231. def timelimits_soft(self):
  232. self._evil_groupmember(sleeping_ignore_limits, 2,
  233. soft_time_limit=1, time_limit=1.1)
  234. @testcase('all')
  235. def alwayskilled(self):
  236. g = group(kill.s() for _ in range(10))
  237. self.join(g(), timeout=10)
  238. @testcase('all', 'green')
  239. def alwaysexits(self):
  240. g = group(exiting.s() for _ in range(10))
  241. self.join(g(), timeout=10)
  242. def _evil_groupmember(self, evil_t, *eargs, **opts):
  243. g1 = group(add.s(2, 2).set(**opts), evil_t.s(*eargs).set(**opts),
  244. add.s(4, 4).set(**opts), add.s(8, 8).set(**opts))
  245. g2 = group(add.s(3, 3).set(**opts), add.s(5, 5).set(**opts),
  246. evil_t.s(*eargs).set(**opts), add.s(7, 7).set(**opts))
  247. self.join(g1(), timeout=10)
  248. self.join(g2(), timeout=10)
  249. @testcase('all', 'green')
  250. def bigtasksbigvalue(self):
  251. g = group(any_returning.s(BIG, sleep=0.3) for i in range(8))
  252. r = g()
  253. try:
  254. self.join(r, timeout=10)
  255. finally:
  256. # very big values so remove results from backend
  257. try:
  258. r.forget()
  259. except NotImplementedError:
  260. pass
  261. @testcase('all', 'green')
  262. def bigtasks(self, wait=None):
  263. self._revoketerm(wait, False, False, BIG)
  264. @testcase('all', 'green')
  265. def smalltasks(self, wait=None):
  266. self._revoketerm(wait, False, False, SMALL)
  267. @testcase('all')
  268. def revoketermfast(self, wait=None):
  269. self._revoketerm(wait, True, False, SMALL)
  270. @testcase('all')
  271. def revoketermslow(self, wait=5):
  272. self._revoketerm(wait, True, True, BIG)
  273. def _revoketerm(self, wait=None, terminate=True,
  274. joindelay=True, data=BIG):
  275. g = group(any_.s(data, sleep=wait) for i in range(8))
  276. r = g()
  277. if terminate:
  278. if joindelay:
  279. sleep(random.choice(range(4)))
  280. r.revoke(terminate=True)
  281. self.join(r, timeout=10)