Development of an internal social media platform with personalised dashboards for students
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

base.py 22KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623
  1. # -*- coding: utf-8 -*-
  2. """
  3. celery.backends.base
  4. ~~~~~~~~~~~~~~~~~~~~
  5. Result backend base classes.
  6. - :class:`BaseBackend` defines the interface.
  7. - :class:`KeyValueStoreBackend` is a common base class
  8. using K/V semantics like _get and _put.
  9. """
  10. from __future__ import absolute_import
  11. import time
  12. import sys
  13. from datetime import timedelta
  14. from billiard.einfo import ExceptionInfo
  15. from kombu.serialization import (
  16. dumps, loads, prepare_accept_content,
  17. registry as serializer_registry,
  18. )
  19. from kombu.utils.encoding import bytes_to_str, ensure_bytes, from_utf8
  20. from kombu.utils.url import maybe_sanitize_url
  21. from celery import states
  22. from celery import current_app, maybe_signature
  23. from celery.app import current_task
  24. from celery.exceptions import ChordError, TimeoutError, TaskRevokedError
  25. from celery.five import items
  26. from celery.result import (
  27. GroupResult, ResultBase, allow_join_result, result_from_tuple,
  28. )
  29. from celery.utils import timeutils
  30. from celery.utils.functional import LRUCache
  31. from celery.utils.log import get_logger
  32. from celery.utils.serialization import (
  33. get_pickled_exception,
  34. get_pickleable_exception,
  35. create_exception_cls,
  36. )
  37. __all__ = ['BaseBackend', 'KeyValueStoreBackend', 'DisabledBackend']
  38. EXCEPTION_ABLE_CODECS = frozenset(['pickle'])
  39. PY3 = sys.version_info >= (3, 0)
  40. logger = get_logger(__name__)
  41. def unpickle_backend(cls, args, kwargs):
  42. """Return an unpickled backend."""
  43. return cls(*args, app=current_app._get_current_object(), **kwargs)
  44. class _nulldict(dict):
  45. def ignore(self, *a, **kw):
  46. pass
  47. __setitem__ = update = setdefault = ignore
  48. class BaseBackend(object):
  49. READY_STATES = states.READY_STATES
  50. UNREADY_STATES = states.UNREADY_STATES
  51. EXCEPTION_STATES = states.EXCEPTION_STATES
  52. TimeoutError = TimeoutError
  53. #: Time to sleep between polling each individual item
  54. #: in `ResultSet.iterate`. as opposed to the `interval`
  55. #: argument which is for each pass.
  56. subpolling_interval = None
  57. #: If true the backend must implement :meth:`get_many`.
  58. supports_native_join = False
  59. #: If true the backend must automatically expire results.
  60. #: The daily backend_cleanup periodic task will not be triggered
  61. #: in this case.
  62. supports_autoexpire = False
  63. #: Set to true if the backend is peristent by default.
  64. persistent = True
  65. retry_policy = {
  66. 'max_retries': 20,
  67. 'interval_start': 0,
  68. 'interval_step': 1,
  69. 'interval_max': 1,
  70. }
  71. def __init__(self, app,
  72. serializer=None, max_cached_results=None, accept=None,
  73. url=None, **kwargs):
  74. self.app = app
  75. conf = self.app.conf
  76. self.serializer = serializer or conf.CELERY_RESULT_SERIALIZER
  77. (self.content_type,
  78. self.content_encoding,
  79. self.encoder) = serializer_registry._encoders[self.serializer]
  80. cmax = max_cached_results or conf.CELERY_MAX_CACHED_RESULTS
  81. self._cache = _nulldict() if cmax == -1 else LRUCache(limit=cmax)
  82. self.accept = prepare_accept_content(
  83. conf.CELERY_ACCEPT_CONTENT if accept is None else accept,
  84. )
  85. self.url = url
  86. def as_uri(self, include_password=False):
  87. """Return the backend as an URI, sanitizing the password or not"""
  88. # when using maybe_sanitize_url(), "/" is added
  89. # we're stripping it for consistency
  90. if include_password:
  91. return self.url
  92. url = maybe_sanitize_url(self.url or '')
  93. return url[:-1] if url.endswith(':///') else url
  94. def mark_as_started(self, task_id, **meta):
  95. """Mark a task as started"""
  96. return self.store_result(task_id, meta, status=states.STARTED)
  97. def mark_as_done(self, task_id, result, request=None):
  98. """Mark task as successfully executed."""
  99. return self.store_result(task_id, result,
  100. status=states.SUCCESS, request=request)
  101. def mark_as_failure(self, task_id, exc, traceback=None, request=None):
  102. """Mark task as executed with failure. Stores the exception."""
  103. return self.store_result(task_id, exc, status=states.FAILURE,
  104. traceback=traceback, request=request)
  105. def chord_error_from_stack(self, callback, exc=None):
  106. from celery import group
  107. app = self.app
  108. backend = app._tasks[callback.task].backend
  109. try:
  110. group(
  111. [app.signature(errback)
  112. for errback in callback.options.get('link_error') or []],
  113. app=app,
  114. ).apply_async((callback.id, ))
  115. except Exception as eb_exc:
  116. return backend.fail_from_current_stack(callback.id, exc=eb_exc)
  117. else:
  118. return backend.fail_from_current_stack(callback.id, exc=exc)
  119. def fail_from_current_stack(self, task_id, exc=None):
  120. type_, real_exc, tb = sys.exc_info()
  121. try:
  122. exc = real_exc if exc is None else exc
  123. ei = ExceptionInfo((type_, exc, tb))
  124. self.mark_as_failure(task_id, exc, ei.traceback)
  125. return ei
  126. finally:
  127. del(tb)
  128. def mark_as_retry(self, task_id, exc, traceback=None, request=None):
  129. """Mark task as being retries. Stores the current
  130. exception (if any)."""
  131. return self.store_result(task_id, exc, status=states.RETRY,
  132. traceback=traceback, request=request)
  133. def mark_as_revoked(self, task_id, reason='', request=None):
  134. return self.store_result(task_id, TaskRevokedError(reason),
  135. status=states.REVOKED, traceback=None,
  136. request=request)
  137. def prepare_exception(self, exc, serializer=None):
  138. """Prepare exception for serialization."""
  139. serializer = self.serializer if serializer is None else serializer
  140. if serializer in EXCEPTION_ABLE_CODECS:
  141. return get_pickleable_exception(exc)
  142. return {'exc_type': type(exc).__name__, 'exc_message': str(exc)}
  143. def exception_to_python(self, exc):
  144. """Convert serialized exception to Python exception."""
  145. if exc:
  146. if not isinstance(exc, BaseException):
  147. exc = create_exception_cls(
  148. from_utf8(exc['exc_type']), __name__)(exc['exc_message'])
  149. if self.serializer in EXCEPTION_ABLE_CODECS:
  150. exc = get_pickled_exception(exc)
  151. return exc
  152. def prepare_value(self, result):
  153. """Prepare value for storage."""
  154. if self.serializer != 'pickle' and isinstance(result, ResultBase):
  155. return result.as_tuple()
  156. return result
  157. def encode(self, data):
  158. _, _, payload = dumps(data, serializer=self.serializer)
  159. return payload
  160. def meta_from_decoded(self, meta):
  161. if meta['status'] in self.EXCEPTION_STATES:
  162. meta['result'] = self.exception_to_python(meta['result'])
  163. return meta
  164. def decode_result(self, payload):
  165. return self.meta_from_decoded(self.decode(payload))
  166. def decode(self, payload):
  167. payload = PY3 and payload or str(payload)
  168. return loads(payload,
  169. content_type=self.content_type,
  170. content_encoding=self.content_encoding,
  171. accept=self.accept)
  172. def wait_for(self, task_id,
  173. timeout=None, interval=0.5, no_ack=True, on_interval=None):
  174. """Wait for task and return its result.
  175. If the task raises an exception, this exception
  176. will be re-raised by :func:`wait_for`.
  177. If `timeout` is not :const:`None`, this raises the
  178. :class:`celery.exceptions.TimeoutError` exception if the operation
  179. takes longer than `timeout` seconds.
  180. """
  181. time_elapsed = 0.0
  182. while 1:
  183. meta = self.get_task_meta(task_id)
  184. if meta['status'] in states.READY_STATES:
  185. return meta
  186. if on_interval:
  187. on_interval()
  188. # avoid hammering the CPU checking status.
  189. time.sleep(interval)
  190. time_elapsed += interval
  191. if timeout and time_elapsed >= timeout:
  192. raise TimeoutError('The operation timed out.')
  193. def prepare_expires(self, value, type=None):
  194. if value is None:
  195. value = self.app.conf.CELERY_TASK_RESULT_EXPIRES
  196. if isinstance(value, timedelta):
  197. value = timeutils.timedelta_seconds(value)
  198. if value is not None and type:
  199. return type(value)
  200. return value
  201. def prepare_persistent(self, enabled=None):
  202. if enabled is not None:
  203. return enabled
  204. p = self.app.conf.CELERY_RESULT_PERSISTENT
  205. return self.persistent if p is None else p
  206. def encode_result(self, result, status):
  207. if isinstance(result, ExceptionInfo):
  208. result = result.exception
  209. if status in self.EXCEPTION_STATES and isinstance(result, Exception):
  210. return self.prepare_exception(result)
  211. else:
  212. return self.prepare_value(result)
  213. def is_cached(self, task_id):
  214. return task_id in self._cache
  215. def store_result(self, task_id, result, status,
  216. traceback=None, request=None, **kwargs):
  217. """Update task state and result."""
  218. result = self.encode_result(result, status)
  219. self._store_result(task_id, result, status, traceback,
  220. request=request, **kwargs)
  221. return result
  222. def forget(self, task_id):
  223. self._cache.pop(task_id, None)
  224. self._forget(task_id)
  225. def _forget(self, task_id):
  226. raise NotImplementedError('backend does not implement forget.')
  227. def get_status(self, task_id):
  228. """Get the status of a task."""
  229. return self.get_task_meta(task_id)['status']
  230. def get_traceback(self, task_id):
  231. """Get the traceback for a failed task."""
  232. return self.get_task_meta(task_id).get('traceback')
  233. def get_result(self, task_id):
  234. """Get the result of a task."""
  235. return self.get_task_meta(task_id).get('result')
  236. def get_children(self, task_id):
  237. """Get the list of subtasks sent by a task."""
  238. try:
  239. return self.get_task_meta(task_id)['children']
  240. except KeyError:
  241. pass
  242. def get_task_meta(self, task_id, cache=True):
  243. if cache:
  244. try:
  245. return self._cache[task_id]
  246. except KeyError:
  247. pass
  248. meta = self._get_task_meta_for(task_id)
  249. if cache and meta.get('status') == states.SUCCESS:
  250. self._cache[task_id] = meta
  251. return meta
  252. def reload_task_result(self, task_id):
  253. """Reload task result, even if it has been previously fetched."""
  254. self._cache[task_id] = self.get_task_meta(task_id, cache=False)
  255. def reload_group_result(self, group_id):
  256. """Reload group result, even if it has been previously fetched."""
  257. self._cache[group_id] = self.get_group_meta(group_id, cache=False)
  258. def get_group_meta(self, group_id, cache=True):
  259. if cache:
  260. try:
  261. return self._cache[group_id]
  262. except KeyError:
  263. pass
  264. meta = self._restore_group(group_id)
  265. if cache and meta is not None:
  266. self._cache[group_id] = meta
  267. return meta
  268. def restore_group(self, group_id, cache=True):
  269. """Get the result for a group."""
  270. meta = self.get_group_meta(group_id, cache=cache)
  271. if meta:
  272. return meta['result']
  273. def save_group(self, group_id, result):
  274. """Store the result of an executed group."""
  275. return self._save_group(group_id, result)
  276. def delete_group(self, group_id):
  277. self._cache.pop(group_id, None)
  278. return self._delete_group(group_id)
  279. def cleanup(self):
  280. """Backend cleanup. Is run by
  281. :class:`celery.task.DeleteExpiredTaskMetaTask`."""
  282. pass
  283. def process_cleanup(self):
  284. """Cleanup actions to do at the end of a task worker process."""
  285. pass
  286. def on_task_call(self, producer, task_id):
  287. return {}
  288. def on_chord_part_return(self, task, state, result, propagate=False):
  289. pass
  290. def fallback_chord_unlock(self, group_id, body, result=None,
  291. countdown=1, **kwargs):
  292. kwargs['result'] = [r.as_tuple() for r in result]
  293. self.app.tasks['celery.chord_unlock'].apply_async(
  294. (group_id, body, ), kwargs, countdown=countdown,
  295. )
  296. def apply_chord(self, header, partial_args, group_id, body, **options):
  297. result = header(*partial_args, task_id=group_id)
  298. self.fallback_chord_unlock(group_id, body, **options)
  299. return result
  300. def current_task_children(self, request=None):
  301. request = request or getattr(current_task(), 'request', None)
  302. if request:
  303. return [r.as_tuple() for r in getattr(request, 'children', [])]
  304. def __reduce__(self, args=(), kwargs={}):
  305. return (unpickle_backend, (self.__class__, args, kwargs))
  306. BaseDictBackend = BaseBackend # XXX compat
  307. class KeyValueStoreBackend(BaseBackend):
  308. key_t = ensure_bytes
  309. task_keyprefix = 'celery-task-meta-'
  310. group_keyprefix = 'celery-taskset-meta-'
  311. chord_keyprefix = 'chord-unlock-'
  312. implements_incr = False
  313. def __init__(self, *args, **kwargs):
  314. if hasattr(self.key_t, '__func__'):
  315. self.key_t = self.key_t.__func__ # remove binding
  316. self._encode_prefixes()
  317. super(KeyValueStoreBackend, self).__init__(*args, **kwargs)
  318. if self.implements_incr:
  319. self.apply_chord = self._apply_chord_incr
  320. def _encode_prefixes(self):
  321. self.task_keyprefix = self.key_t(self.task_keyprefix)
  322. self.group_keyprefix = self.key_t(self.group_keyprefix)
  323. self.chord_keyprefix = self.key_t(self.chord_keyprefix)
  324. def get(self, key):
  325. raise NotImplementedError('Must implement the get method.')
  326. def mget(self, keys):
  327. raise NotImplementedError('Does not support get_many')
  328. def set(self, key, value):
  329. raise NotImplementedError('Must implement the set method.')
  330. def delete(self, key):
  331. raise NotImplementedError('Must implement the delete method')
  332. def incr(self, key):
  333. raise NotImplementedError('Does not implement incr')
  334. def expire(self, key, value):
  335. pass
  336. def get_key_for_task(self, task_id, key=''):
  337. """Get the cache key for a task by id."""
  338. key_t = self.key_t
  339. return key_t('').join([
  340. self.task_keyprefix, key_t(task_id), key_t(key),
  341. ])
  342. def get_key_for_group(self, group_id, key=''):
  343. """Get the cache key for a group by id."""
  344. key_t = self.key_t
  345. return key_t('').join([
  346. self.group_keyprefix, key_t(group_id), key_t(key),
  347. ])
  348. def get_key_for_chord(self, group_id, key=''):
  349. """Get the cache key for the chord waiting on group with given id."""
  350. key_t = self.key_t
  351. return key_t('').join([
  352. self.chord_keyprefix, key_t(group_id), key_t(key),
  353. ])
  354. def _strip_prefix(self, key):
  355. """Takes bytes, emits string."""
  356. key = self.key_t(key)
  357. for prefix in self.task_keyprefix, self.group_keyprefix:
  358. if key.startswith(prefix):
  359. return bytes_to_str(key[len(prefix):])
  360. return bytes_to_str(key)
  361. def _filter_ready(self, values, READY_STATES=states.READY_STATES):
  362. for k, v in values:
  363. if v is not None:
  364. v = self.decode_result(v)
  365. if v['status'] in READY_STATES:
  366. yield k, v
  367. def _mget_to_results(self, values, keys):
  368. if hasattr(values, 'items'):
  369. # client returns dict so mapping preserved.
  370. return dict((self._strip_prefix(k), v)
  371. for k, v in self._filter_ready(items(values)))
  372. else:
  373. # client returns list so need to recreate mapping.
  374. return dict((bytes_to_str(keys[i]), v)
  375. for i, v in self._filter_ready(enumerate(values)))
  376. def get_many(self, task_ids, timeout=None, interval=0.5, no_ack=True,
  377. READY_STATES=states.READY_STATES):
  378. interval = 0.5 if interval is None else interval
  379. ids = task_ids if isinstance(task_ids, set) else set(task_ids)
  380. cached_ids = set()
  381. cache = self._cache
  382. for task_id in ids:
  383. try:
  384. cached = cache[task_id]
  385. except KeyError:
  386. pass
  387. else:
  388. if cached['status'] in READY_STATES:
  389. yield bytes_to_str(task_id), cached
  390. cached_ids.add(task_id)
  391. ids.difference_update(cached_ids)
  392. iterations = 0
  393. while ids:
  394. keys = list(ids)
  395. r = self._mget_to_results(self.mget([self.get_key_for_task(k)
  396. for k in keys]), keys)
  397. cache.update(r)
  398. ids.difference_update(set(bytes_to_str(v) for v in r))
  399. for key, value in items(r):
  400. yield bytes_to_str(key), value
  401. if timeout and iterations * interval >= timeout:
  402. raise TimeoutError('Operation timed out ({0})'.format(timeout))
  403. time.sleep(interval) # don't busy loop.
  404. iterations += 1
  405. def _forget(self, task_id):
  406. self.delete(self.get_key_for_task(task_id))
  407. def _store_result(self, task_id, result, status,
  408. traceback=None, request=None, **kwargs):
  409. meta = {'status': status, 'result': result, 'traceback': traceback,
  410. 'children': self.current_task_children(request)}
  411. self.set(self.get_key_for_task(task_id), self.encode(meta))
  412. return result
  413. def _save_group(self, group_id, result):
  414. self.set(self.get_key_for_group(group_id),
  415. self.encode({'result': result.as_tuple()}))
  416. return result
  417. def _delete_group(self, group_id):
  418. self.delete(self.get_key_for_group(group_id))
  419. def _get_task_meta_for(self, task_id):
  420. """Get task metadata for a task by id."""
  421. meta = self.get(self.get_key_for_task(task_id))
  422. if not meta:
  423. return {'status': states.PENDING, 'result': None}
  424. return self.decode_result(meta)
  425. def _restore_group(self, group_id):
  426. """Get task metadata for a task by id."""
  427. meta = self.get(self.get_key_for_group(group_id))
  428. # previously this was always pickled, but later this
  429. # was extended to support other serializers, so the
  430. # structure is kind of weird.
  431. if meta:
  432. meta = self.decode(meta)
  433. result = meta['result']
  434. meta['result'] = result_from_tuple(result, self.app)
  435. return meta
  436. def _apply_chord_incr(self, header, partial_args, group_id, body,
  437. result=None, **options):
  438. self.save_group(group_id, self.app.GroupResult(group_id, result))
  439. return header(*partial_args, task_id=group_id)
  440. def on_chord_part_return(self, task, state, result, propagate=None):
  441. if not self.implements_incr:
  442. return
  443. app = self.app
  444. if propagate is None:
  445. propagate = app.conf.CELERY_CHORD_PROPAGATES
  446. gid = task.request.group
  447. if not gid:
  448. return
  449. key = self.get_key_for_chord(gid)
  450. try:
  451. deps = GroupResult.restore(gid, backend=task.backend)
  452. except Exception as exc:
  453. callback = maybe_signature(task.request.chord, app=app)
  454. logger.error('Chord %r raised: %r', gid, exc, exc_info=1)
  455. return self.chord_error_from_stack(
  456. callback,
  457. ChordError('Cannot restore group: {0!r}'.format(exc)),
  458. )
  459. if deps is None:
  460. try:
  461. raise ValueError(gid)
  462. except ValueError as exc:
  463. callback = maybe_signature(task.request.chord, app=app)
  464. logger.error('Chord callback %r raised: %r', gid, exc,
  465. exc_info=1)
  466. return self.chord_error_from_stack(
  467. callback,
  468. ChordError('GroupResult {0} no longer exists'.format(gid)),
  469. )
  470. val = self.incr(key)
  471. size = len(deps)
  472. if val > size:
  473. logger.warning('Chord counter incremented too many times for %r',
  474. gid)
  475. elif val == size:
  476. callback = maybe_signature(task.request.chord, app=app)
  477. j = deps.join_native if deps.supports_native_join else deps.join
  478. try:
  479. with allow_join_result():
  480. ret = j(timeout=3.0, propagate=propagate)
  481. except Exception as exc:
  482. try:
  483. culprit = next(deps._failed_join_report())
  484. reason = 'Dependency {0.id} raised {1!r}'.format(
  485. culprit, exc,
  486. )
  487. except StopIteration:
  488. reason = repr(exc)
  489. logger.error('Chord %r raised: %r', gid, reason, exc_info=1)
  490. self.chord_error_from_stack(callback, ChordError(reason))
  491. else:
  492. try:
  493. callback.delay(ret)
  494. except Exception as exc:
  495. logger.error('Chord %r raised: %r', gid, exc, exc_info=1)
  496. self.chord_error_from_stack(
  497. callback,
  498. ChordError('Callback error: {0!r}'.format(exc)),
  499. )
  500. finally:
  501. deps.delete()
  502. self.client.delete(key)
  503. else:
  504. self.expire(key, 86400)
  505. class DisabledBackend(BaseBackend):
  506. _cache = {} # need this attribute to reset cache in tests.
  507. def store_result(self, *args, **kwargs):
  508. pass
  509. def _is_disabled(self, *args, **kwargs):
  510. raise NotImplementedError(
  511. 'No result backend configured. '
  512. 'Please see the documentation for more information.')
  513. def as_uri(self, *args, **kwargs):
  514. return 'disabled://'
  515. get_state = get_status = get_result = get_traceback = _is_disabled
  516. wait_for = get_many = _is_disabled