suite.py 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342
  1. from __future__ import absolute_import, print_function, unicode_literals
  2. import inspect
  3. import platform
  4. import random
  5. import socket
  6. import sys
  7. from collections import defaultdict, namedtuple
  8. from itertools import count
  9. from time import sleep
  10. from kombu.utils.compat import OrderedDict
  11. from celery import group, VERSION_BANNER
  12. from celery.exceptions import TimeoutError
  13. from celery.five import items, monotonic, range, values
  14. from celery.utils.debug import blockdetection
  15. from celery.utils.text import pluralize, truncate
  16. from celery.utils.timeutils import humanize_seconds
  17. from .app import (
  18. marker, _marker, add, any_, exiting, kill, sleeping,
  19. sleeping_ignore_limits, any_returning,
  20. )
  21. from .data import BIG, SMALL
  22. from .fbi import FBI
# Banner template printed once at the start of a run; its placeholders are
# filled in by ``BaseSuite.banner``.
BANNER = """\
Celery stress-suite v{version}
{platform}
[config]
.> broker: {conninfo}
[toc: {total} {TESTS} total]
{toc}
"""

# Progress template rendered by ``pstatus``; ``{0}`` is a ``Progress`` tuple.
# The trailing backslashes join the physical lines, so the rendered string
# is a single line without a newline.
F_PROGRESS = """\
{0.index}: {0.test.__name__}({0.iteration}/{0.total_iterations}) \
rep#{0.repeats} runtime: {runtime}/{elapsed} \
"""

# Snapshot of the test currently being run, stored on ``BaseSuite.progress``.
# ``runtime`` and ``elapsed`` hold ``monotonic()`` start timestamps (of the
# current iteration and of the whole test respectively), not durations;
# ``pstatus`` converts them to durations when rendering.
Progress = namedtuple('Progress', (
    'test', 'iteration', 'total_iterations',
    'index', 'repeats', 'runtime', 'elapsed', 'completed',
))

# Positive infinity; ``BaseSuite.run`` repeats forever when ``repeat == Inf``.
Inf = float('Inf')
  40. class StopSuite(Exception):
  41. pass
  42. def pstatus(p):
  43. return F_PROGRESS.format(
  44. p,
  45. runtime=humanize_seconds(monotonic() - p.runtime, now='0 seconds'),
  46. elapsed=humanize_seconds(monotonic() - p.elapsed, now='0 seconds'),
  47. )
  48. class Speaker(object):
  49. def __init__(self, gap=5.0):
  50. self.gap = gap
  51. self.last_noise = monotonic() - self.gap * 2
  52. def beep(self):
  53. now = monotonic()
  54. if now - self.last_noise >= self.gap:
  55. self.emit()
  56. self.last_noise = now
  57. def emit(self):
  58. print('\a', file=sys.stderr, end='')
  59. def testgroup(*funs):
  60. return OrderedDict((fun.__name__, fun) for fun in funs)
  61. class BaseSuite(object):
  62. def __init__(self, app, block_timeout=30 * 60):
  63. self.app = app
  64. self.connerrors = self.app.connection().recoverable_connection_errors
  65. self.block_timeout = block_timeout
  66. self.progress = None
  67. self.speaker = Speaker()
  68. self.fbi = FBI(app)
  69. self.init_groups()
  70. def init_groups(self):
  71. acc = defaultdict(list)
  72. for attr in dir(self):
  73. if not _is_descriptor(self, attr):
  74. meth = getattr(self, attr)
  75. try:
  76. groups = meth.__func__.__testgroup__
  77. except AttributeError:
  78. pass
  79. else:
  80. for group in groups:
  81. acc[group].append(meth)
  82. # sort the tests by the order in which they are defined in the class
  83. for group in values(acc):
  84. group[:] = sorted(group, key=lambda m: m.__func__.__testsort__)
  85. self.groups = dict(
  86. (name, testgroup(*tests)) for name, tests in items(acc)
  87. )
  88. def run(self, names=None, iterations=50, offset=0,
  89. numtests=None, list_all=False, repeat=0, group='all',
  90. diag=False, no_join=False, **kw):
  91. self.no_join = no_join
  92. self.fbi.enable(diag)
  93. tests = self.filtertests(group, names)[offset:numtests or None]
  94. if list_all:
  95. return print(self.testlist(tests))
  96. print(self.banner(tests))
  97. print('+ Enabling events')
  98. self.app.control.enable_events()
  99. it = count() if repeat == Inf else range(int(repeat) or 1)
  100. for i in it:
  101. marker(
  102. 'Stresstest suite start (repetition {0})'.format(i + 1),
  103. '+',
  104. )
  105. for j, test in enumerate(tests):
  106. self.runtest(test, iterations, j + 1, i + 1)
  107. marker(
  108. 'Stresstest suite end (repetition {0})'.format(i + 1),
  109. '+',
  110. )
  111. def filtertests(self, group, names):
  112. tests = self.groups[group]
  113. try:
  114. return ([tests[n] for n in names] if names
  115. else list(values(tests)))
  116. except KeyError as exc:
  117. raise KeyError('Unknown test name: {0}'.format(exc))
  118. def testlist(self, tests):
  119. return ',\n'.join(
  120. '.> {0}) {1}'.format(i + 1, t.__name__)
  121. for i, t in enumerate(tests)
  122. )
  123. def banner(self, tests):
  124. app = self.app
  125. return BANNER.format(
  126. app='{0}:0x{1:x}'.format(app.main or '__main__', id(app)),
  127. version=VERSION_BANNER,
  128. conninfo=app.connection().as_uri(),
  129. platform=platform.platform(),
  130. toc=self.testlist(tests),
  131. TESTS=pluralize(len(tests), 'test'),
  132. total=len(tests),
  133. )
  134. def runtest(self, fun, n=50, index=0, repeats=1):
  135. print('{0}: [[[{1}({2})]]]'.format(repeats, fun.__name__, n))
  136. with blockdetection(self.block_timeout):
  137. with self.fbi.investigation():
  138. runtime = elapsed = monotonic()
  139. i = 0
  140. failed = False
  141. self.progress = Progress(
  142. fun, i, n, index, repeats, elapsed, runtime, 0,
  143. )
  144. _marker.delay(pstatus(self.progress))
  145. try:
  146. for i in range(n):
  147. runtime = monotonic()
  148. self.progress = Progress(
  149. fun, i + 1, n, index, repeats, runtime, elapsed, 0,
  150. )
  151. try:
  152. fun()
  153. except StopSuite:
  154. raise
  155. except Exception as exc:
  156. print('-> {0!r}'.format(exc))
  157. print(pstatus(self.progress))
  158. else:
  159. print(pstatus(self.progress))
  160. except Exception:
  161. failed = True
  162. self.speaker.beep()
  163. raise
  164. finally:
  165. print('{0} {1} iterations in {2}s'.format(
  166. 'failed after' if failed else 'completed',
  167. i + 1, humanize_seconds(monotonic() - elapsed),
  168. ))
  169. if not failed:
  170. self.progress = Progress(
  171. fun, i + 1, n, index, repeats, runtime, elapsed, 1,
  172. )
  173. def missing_results(self, r):
  174. return [res.id for res in r if res.id not in res.backend._cache]
  175. def join(self, r, propagate=False, max_retries=10, **kwargs):
  176. if self.no_join:
  177. return
  178. received = []
  179. def on_result(task_id, value):
  180. received.append(task_id)
  181. for i in range(max_retries) if max_retries else count(0):
  182. received[:] = []
  183. try:
  184. return r.get(callback=on_result, propagate=propagate, **kwargs)
  185. except (socket.timeout, TimeoutError) as exc:
  186. waiting_for = self.missing_results(r)
  187. self.speaker.beep()
  188. marker(
  189. 'Still waiting for {0}/{1}: [{2}]: {3!r}'.format(
  190. len(r) - len(received), len(r),
  191. truncate(', '.join(waiting_for)), exc), '!',
  192. )
  193. self.fbi.diag(waiting_for)
  194. except self.connerrors as exc:
  195. self.speaker.beep()
  196. marker('join: connection lost: {0!r}'.format(exc), '!')
  197. raise StopSuite('Test failed: Missing task results')
  198. def dump_progress(self):
  199. return pstatus(self.progress) if self.progress else 'No test running'
  200. _creation_counter = count(0)
  201. def testcase(*groups):
  202. if not groups:
  203. raise ValueError('@testcase requires at least one group name')
  204. def _mark_as_case(fun):
  205. fun.__testgroup__ = groups
  206. fun.__testsort__ = next(_creation_counter)
  207. return fun
  208. return _mark_as_case
  209. def _is_descriptor(obj, attr):
  210. try:
  211. cattr = getattr(obj.__class__, attr)
  212. except AttributeError:
  213. pass
  214. else:
  215. return not inspect.ismethod(cattr) and hasattr(cattr, '__get__')
  216. return False
  217. class Suite(BaseSuite):
  218. @testcase('all', 'green')
  219. def manyshort(self):
  220. self.join(group(add.s(i, i) for i in range(1000))(),
  221. timeout=10, propagate=True)
  222. @testcase('all')
  223. def termbysig(self):
  224. self._evil_groupmember(kill)
  225. @testcase('green')
  226. def group_with_exit(self):
  227. self._evil_groupmember(exiting)
  228. @testcase('all')
  229. def timelimits(self):
  230. self._evil_groupmember(sleeping, 2, time_limit=1)
  231. @testcase('all')
  232. def timelimits_soft(self):
  233. self._evil_groupmember(sleeping_ignore_limits, 2,
  234. soft_time_limit=1, time_limit=1.1)
  235. @testcase('all')
  236. def alwayskilled(self):
  237. g = group(kill.s() for _ in range(10))
  238. self.join(g(), timeout=10)
  239. @testcase('all', 'green')
  240. def alwaysexits(self):
  241. g = group(exiting.s() for _ in range(10))
  242. self.join(g(), timeout=10)
  243. def _evil_groupmember(self, evil_t, *eargs, **opts):
  244. g1 = group(add.s(2, 2).set(**opts), evil_t.s(*eargs).set(**opts),
  245. add.s(4, 4).set(**opts), add.s(8, 8).set(**opts))
  246. g2 = group(add.s(3, 3).set(**opts), add.s(5, 5).set(**opts),
  247. evil_t.s(*eargs).set(**opts), add.s(7, 7).set(**opts))
  248. self.join(g1(), timeout=10)
  249. self.join(g2(), timeout=10)
  250. @testcase('all', 'green')
  251. def bigtasksbigvalue(self):
  252. g = group(any_returning.s(BIG, sleep=0.3) for i in range(8))
  253. r = g()
  254. try:
  255. self.join(r, timeout=10)
  256. finally:
  257. # very big values so remove results from backend
  258. try:
  259. r.forget()
  260. except NotImplementedError:
  261. pass
  262. @testcase('all', 'green')
  263. def bigtasks(self, wait=None):
  264. self._revoketerm(wait, False, False, BIG)
  265. @testcase('all', 'green')
  266. def smalltasks(self, wait=None):
  267. self._revoketerm(wait, False, False, SMALL)
  268. @testcase('all')
  269. def revoketermfast(self, wait=None):
  270. self._revoketerm(wait, True, False, SMALL)
  271. @testcase('all')
  272. def revoketermslow(self, wait=5):
  273. self._revoketerm(wait, True, True, BIG)
  274. def _revoketerm(self, wait=None, terminate=True,
  275. joindelay=True, data=BIG):
  276. g = group(any_.s(data, sleep=wait) for i in range(8))
  277. r = g()
  278. if terminate:
  279. if joindelay:
  280. sleep(random.choice(range(4)))
  281. r.revoke(terminate=True)
  282. self.join(r, timeout=10)