base.py 15 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415
  1. # -*- coding: utf-8 -*-
  2. """celery.backends.base"""
  3. from __future__ import absolute_import
  4. import time
  5. import sys
  6. from datetime import timedelta
  7. from kombu import serialization
  8. from .. import states
  9. from ..datastructures import LRUCache
  10. from ..exceptions import TimeoutError, TaskRevokedError
  11. from ..utils import timeutils
  12. from ..utils.encoding import ensure_bytes, from_utf8
  13. from ..utils.serialization import (get_pickled_exception,
  14. get_pickleable_exception,
  15. create_exception_cls)
  16. EXCEPTION_ABLE_CODECS = frozenset(["pickle", "yaml"])
  17. is_py3k = sys.version_info >= (3, 0)
  18. def unpickle_backend(cls, args, kwargs):
  19. """Returns an unpickled backend."""
  20. return cls(*args, **kwargs)
  21. class BaseBackend(object):
  22. """Base backend class."""
  23. READY_STATES = states.READY_STATES
  24. UNREADY_STATES = states.UNREADY_STATES
  25. EXCEPTION_STATES = states.EXCEPTION_STATES
  26. TimeoutError = TimeoutError
  27. #: Time to sleep between polling each individual item
  28. #: in `ResultSet.iterate`. as opposed to the `interval`
  29. #: argument which is for each pass.
  30. subpolling_interval = None
  31. #: If true the backend must implement :meth:`get_many`.
  32. supports_native_join = False
  33. def __init__(self, *args, **kwargs):
  34. from ..app import app_or_default
  35. self.app = app_or_default(kwargs.get("app"))
  36. self.serializer = kwargs.get("serializer",
  37. self.app.conf.CELERY_RESULT_SERIALIZER)
  38. (self.content_type,
  39. self.content_encoding,
  40. self.encoder) = serialization.registry._encoders[self.serializer]
  41. def encode(self, data):
  42. _, _, payload = serialization.encode(data, serializer=self.serializer)
  43. return payload
  44. def decode(self, payload):
  45. payload = is_py3k and payload or str(payload)
  46. return serialization.decode(payload,
  47. content_type=self.content_type,
  48. content_encoding=self.content_encoding)
  49. def prepare_expires(self, value, type=None):
  50. if value is None:
  51. value = self.app.conf.CELERY_TASK_RESULT_EXPIRES
  52. if isinstance(value, timedelta):
  53. value = timeutils.timedelta_seconds(value)
  54. if value is not None and type:
  55. return type(value)
  56. return value
  57. def encode_result(self, result, status):
  58. if status in self.EXCEPTION_STATES and isinstance(result, Exception):
  59. return self.prepare_exception(result)
  60. else:
  61. return self.prepare_value(result)
  62. def store_result(self, task_id, result, status, traceback=None):
  63. """Store the result and status of a task."""
  64. raise NotImplementedError(
  65. "store_result is not supported by this backend.")
  66. def mark_as_started(self, task_id, **meta):
  67. """Mark a task as started"""
  68. return self.store_result(task_id, meta, status=states.STARTED)
  69. def mark_as_done(self, task_id, result):
  70. """Mark task as successfully executed."""
  71. return self.store_result(task_id, result, status=states.SUCCESS)
  72. def mark_as_failure(self, task_id, exc, traceback=None):
  73. """Mark task as executed with failure. Stores the execption."""
  74. return self.store_result(task_id, exc, status=states.FAILURE,
  75. traceback=traceback)
  76. def mark_as_retry(self, task_id, exc, traceback=None):
  77. """Mark task as being retries. Stores the current
  78. exception (if any)."""
  79. return self.store_result(task_id, exc, status=states.RETRY,
  80. traceback=traceback)
  81. def mark_as_revoked(self, task_id):
  82. return self.store_result(task_id, TaskRevokedError(),
  83. status=states.REVOKED, traceback=None)
  84. def prepare_exception(self, exc):
  85. """Prepare exception for serialization."""
  86. if self.serializer in EXCEPTION_ABLE_CODECS:
  87. return get_pickleable_exception(exc)
  88. return {"exc_type": type(exc).__name__, "exc_message": str(exc)}
  89. def exception_to_python(self, exc):
  90. """Convert serialized exception to Python exception."""
  91. if self.serializer in EXCEPTION_ABLE_CODECS:
  92. return get_pickled_exception(exc)
  93. return create_exception_cls(from_utf8(exc["exc_type"]),
  94. sys.modules[__name__])
  95. def prepare_value(self, result):
  96. """Prepare value for storage."""
  97. return result
  98. def forget(self, task_id):
  99. raise NotImplementedError("%s does not implement forget." % (
  100. self.__class__))
  101. def wait_for(self, task_id, timeout=None, propagate=True, interval=0.5):
  102. """Wait for task and return its result.
  103. If the task raises an exception, this exception
  104. will be re-raised by :func:`wait_for`.
  105. If `timeout` is not :const:`None`, this raises the
  106. :class:`celery.exceptions.TimeoutError` exception if the operation
  107. takes longer than `timeout` seconds.
  108. """
  109. time_elapsed = 0.0
  110. while True:
  111. status = self.get_status(task_id)
  112. if status == states.SUCCESS:
  113. return self.get_result(task_id)
  114. elif status in states.PROPAGATE_STATES:
  115. result = self.get_result(task_id)
  116. if propagate:
  117. raise result
  118. return result
  119. # avoid hammering the CPU checking status.
  120. time.sleep(interval)
  121. time_elapsed += interval
  122. if timeout and time_elapsed >= timeout:
  123. raise TimeoutError("The operation timed out.")
  124. def cleanup(self):
  125. """Backend cleanup. Is run by
  126. :class:`celery.task.DeleteExpiredTaskMetaTask`."""
  127. pass
  128. def process_cleanup(self):
  129. """Cleanup actions to do at the end of a task worker process."""
  130. pass
  131. def get_status(self, task_id):
  132. """Get the status of a task."""
  133. raise NotImplementedError(
  134. "get_status is not supported by this backend.")
  135. def get_result(self, task_id):
  136. """Get the result of a task."""
  137. raise NotImplementedError(
  138. "get_result is not supported by this backend.")
  139. def get_traceback(self, task_id):
  140. """Get the traceback for a failed task."""
  141. raise NotImplementedError(
  142. "get_traceback is not supported by this backend.")
  143. def save_taskset(self, taskset_id, result):
  144. """Store the result and status of a task."""
  145. raise NotImplementedError(
  146. "save_taskset is not supported by this backend.")
  147. def restore_taskset(self, taskset_id, cache=True):
  148. """Get the result of a taskset."""
  149. raise NotImplementedError(
  150. "restore_taskset is not supported by this backend.")
  151. def delete_taskset(self, taskset_id):
  152. raise NotImplementedError(
  153. "delete_taskset is not supported by this backend.")
  154. def reload_task_result(self, task_id):
  155. """Reload task result, even if it has been previously fetched."""
  156. raise NotImplementedError(
  157. "reload_task_result is not supported by this backend.")
  158. def reload_taskset_result(self, task_id):
  159. """Reload taskset result, even if it has been previously fetched."""
  160. raise NotImplementedError(
  161. "reload_taskset_result is not supported by this backend.")
  162. def on_chord_part_return(self, task, propagate=False):
  163. pass
  164. def on_chord_apply(self, setid, body, result=None, **kwargs):
  165. from ..registry import tasks
  166. kwargs["result"] = [r.task_id for r in result]
  167. tasks["celery.chord_unlock"].apply_async((setid, body, ), kwargs,
  168. countdown=1)
  169. def __reduce__(self, args=(), kwargs={}):
  170. return (unpickle_backend, (self.__class__, args, kwargs))
  171. class BaseDictBackend(BaseBackend):
  172. def __init__(self, *args, **kwargs):
  173. super(BaseDictBackend, self).__init__(*args, **kwargs)
  174. self._cache = LRUCache(limit=kwargs.get("max_cached_results") or
  175. self.app.conf.CELERY_MAX_CACHED_RESULTS)
  176. def store_result(self, task_id, result, status, traceback=None, **kwargs):
  177. """Store task result and status."""
  178. result = self.encode_result(result, status)
  179. return self._store_result(task_id, result, status, traceback, **kwargs)
  180. def forget(self, task_id):
  181. self._cache.pop(task_id, None)
  182. self._forget(task_id)
  183. def _forget(self, task_id):
  184. raise NotImplementedError("%s does not implement forget." % (
  185. self.__class__))
  186. def get_status(self, task_id):
  187. """Get the status of a task."""
  188. return self.get_task_meta(task_id)["status"]
  189. def get_traceback(self, task_id):
  190. """Get the traceback for a failed task."""
  191. return self.get_task_meta(task_id).get("traceback")
  192. def get_result(self, task_id):
  193. """Get the result of a task."""
  194. meta = self.get_task_meta(task_id)
  195. if meta["status"] in self.EXCEPTION_STATES:
  196. return self.exception_to_python(meta["result"])
  197. else:
  198. return meta["result"]
  199. def get_task_meta(self, task_id, cache=True):
  200. if cache:
  201. try:
  202. return self._cache[task_id]
  203. except KeyError:
  204. pass
  205. meta = self._get_task_meta_for(task_id)
  206. if cache and meta.get("status") == states.SUCCESS:
  207. self._cache[task_id] = meta
  208. return meta
  209. def reload_task_result(self, task_id):
  210. self._cache[task_id] = self.get_task_meta(task_id, cache=False)
  211. def reload_taskset_result(self, taskset_id):
  212. self._cache[taskset_id] = self.get_taskset_meta(taskset_id,
  213. cache=False)
  214. def get_taskset_meta(self, taskset_id, cache=True):
  215. if cache:
  216. try:
  217. return self._cache[taskset_id]
  218. except KeyError:
  219. pass
  220. meta = self._restore_taskset(taskset_id)
  221. if cache and meta is not None:
  222. self._cache[taskset_id] = meta
  223. return meta
  224. def restore_taskset(self, taskset_id, cache=True):
  225. """Get the result for a taskset."""
  226. meta = self.get_taskset_meta(taskset_id, cache=cache)
  227. if meta:
  228. return meta["result"]
  229. def save_taskset(self, taskset_id, result):
  230. """Store the result of an executed taskset."""
  231. return self._save_taskset(taskset_id, result)
  232. def delete_taskset(self, taskset_id):
  233. self._cache.pop(taskset_id, None)
  234. return self._delete_taskset(taskset_id)
  235. class KeyValueStoreBackend(BaseDictBackend):
  236. task_keyprefix = "celery-task-meta-"
  237. taskset_keyprefix = "celery-taskset-meta-"
  238. chord_keyprefix = "chord-unlock-"
  239. def get(self, key):
  240. raise NotImplementedError("Must implement the get method.")
  241. def mget(self, keys):
  242. raise NotImplementedError("Does not support get_many")
  243. def set(self, key, value):
  244. raise NotImplementedError("Must implement the set method.")
  245. def delete(self, key):
  246. raise NotImplementedError("Must implement the delete method")
  247. def get_key_for_task(self, task_id):
  248. """Get the cache key for a task by id."""
  249. return ensure_bytes(self.task_keyprefix) + ensure_bytes(task_id)
  250. def get_key_for_taskset(self, taskset_id):
  251. """Get the cache key for a taskset by id."""
  252. return ensure_bytes(self.taskset_keyprefix) + ensure_bytes(taskset_id)
  253. def get_key_for_chord(self, taskset_id):
  254. """Get the cache key for the chord waiting on taskset with given id."""
  255. return ensure_bytes(self.chord_keyprefix) + ensure_bytes(taskset_id)
  256. def _strip_prefix(self, key):
  257. for prefix in self.task_keyprefix, self.taskset_keyprefix:
  258. if key.startswith(prefix):
  259. return key[len(prefix):]
  260. return key
  261. def _mget_to_results(self, values, keys):
  262. if hasattr(values, "items"):
  263. # client returns dict so mapping preserved.
  264. return dict((self._strip_prefix(k), self.decode(v))
  265. for k, v in values.iteritems()
  266. if v is not None)
  267. else:
  268. # client returns list so need to recreate mapping.
  269. return dict((keys[i], self.decode(value))
  270. for i, value in enumerate(values)
  271. if value is not None)
  272. def get_many(self, task_ids, timeout=None, interval=0.5):
  273. ids = set(task_ids)
  274. cached_ids = set()
  275. for task_id in ids:
  276. try:
  277. cached = self._cache[task_id]
  278. except KeyError:
  279. pass
  280. else:
  281. if cached["status"] in states.READY_STATES:
  282. yield task_id, cached
  283. cached_ids.add(task_id)
  284. ids ^= cached_ids
  285. iterations = 0
  286. while ids:
  287. keys = list(ids)
  288. r = self._mget_to_results(self.mget([self.get_key_for_task(k)
  289. for k in keys]), keys)
  290. self._cache.update(r)
  291. ids ^= set(r)
  292. for key, value in r.iteritems():
  293. yield key, value
  294. if timeout and iterations * interval >= timeout:
  295. raise TimeoutError("Operation timed out (%s)" % (timeout, ))
  296. time.sleep(interval) # don't busy loop.
  297. iterations += 0
  298. def _forget(self, task_id):
  299. self.delete(self.get_key_for_task(task_id))
  300. def _store_result(self, task_id, result, status, traceback=None):
  301. meta = {"status": status, "result": result, "traceback": traceback}
  302. self.set(self.get_key_for_task(task_id), self.encode(meta))
  303. return result
  304. def _save_taskset(self, taskset_id, result):
  305. self.set(self.get_key_for_taskset(taskset_id),
  306. self.encode({"result": result}))
  307. return result
  308. def _delete_taskset(self, taskset_id):
  309. self.delete(self.get_key_for_taskset(taskset_id))
  310. def _get_task_meta_for(self, task_id):
  311. """Get task metadata for a task by id."""
  312. meta = self.get(self.get_key_for_task(task_id))
  313. if not meta:
  314. return {"status": states.PENDING, "result": None}
  315. return self.decode(meta)
  316. def _restore_taskset(self, taskset_id):
  317. """Get task metadata for a task by id."""
  318. meta = self.get(self.get_key_for_taskset(taskset_id))
  319. if meta:
  320. return self.decode(meta)
  321. class DisabledBackend(BaseBackend):
  322. _cache = {} # need this attribute to reset cache in tests.
  323. def store_result(self, *args, **kwargs):
  324. pass
  325. def _is_disabled(self, *args, **kwargs):
  326. raise NotImplementedError("No result backend configured. "
  327. "Please see the documentation for more information.")
  328. wait_for = get_status = get_result = get_traceback = _is_disabled