state.py 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234
# -*- coding: utf-8 -*-
"""
    celery.worker.state
    ~~~~~~~~~~~~~~~~~~~

    Internal worker state (global).

    This includes the currently active and reserved tasks,
    statistics, and revoked tasks.

"""
  9. from __future__ import absolute_import
  10. import os
  11. import sys
  12. import platform
  13. import shelve
  14. import zlib
  15. from kombu.serialization import pickle, pickle_protocol
  16. from kombu.utils import cached_property
  17. from celery import __version__
  18. from celery.datastructures import LimitedSet
  19. from celery.exceptions import SystemTerminate
  20. from celery.five import Counter
  21. __all__ = ['SOFTWARE_INFO', 'reserved_requests', 'active_requests',
  22. 'total_count', 'revoked', 'task_reserved', 'maybe_shutdown',
  23. 'task_accepted', 'task_ready', 'task_reserved', 'task_ready',
  24. 'Persistent']
  25. #: Worker software/platform information.
  26. SOFTWARE_INFO = {'sw_ident': 'py-celery',
  27. 'sw_ver': __version__,
  28. 'sw_sys': platform.system()}
  29. #: maximum number of revokes to keep in memory.
  30. REVOKES_MAX = 50000
  31. #: how many seconds a revoke will be active before
  32. #: being expired when the max limit has been exceeded.
  33. REVOKE_EXPIRES = 10800
  34. #: set of all reserved :class:`~celery.worker.job.Request`'s.
  35. reserved_requests = set()
  36. #: set of currently active :class:`~celery.worker.job.Request`'s.
  37. active_requests = set()
  38. #: count of tasks accepted by the worker, sorted by type.
  39. total_count = Counter()
  40. #: the list of currently revoked tasks. Persistent if statedb set.
  41. revoked = LimitedSet(maxlen=REVOKES_MAX, expires=REVOKE_EXPIRES)
  42. #: Update global state when a task has been reserved.
  43. task_reserved = reserved_requests.add
  44. should_stop = False
  45. should_terminate = False
  46. def maybe_shutdown():
  47. if should_stop:
  48. raise SystemExit()
  49. elif should_terminate:
  50. raise SystemTerminate()
  51. def task_accepted(request):
  52. """Updates global state when a task has been accepted."""
  53. active_requests.add(request)
  54. total_count[request.name] += 1
  55. def task_ready(request):
  56. """Updates global state when a task is ready."""
  57. active_requests.discard(request)
  58. reserved_requests.discard(request)
  59. C_BENCH = os.environ.get('C_BENCH') or os.environ.get('CELERY_BENCH')
  60. C_BENCH_EVERY = int(os.environ.get('C_BENCH_EVERY') or
  61. os.environ.get('CELERY_BENCH_EVERY') or 1000)
  62. if C_BENCH: # pragma: no cover
  63. import atexit
  64. from billiard import current_process
  65. from celery.five import monotonic
  66. from celery.utils.debug import memdump, sample_mem
  67. all_count = 0
  68. bench_first = None
  69. bench_start = None
  70. bench_last = None
  71. bench_every = C_BENCH_EVERY
  72. bench_sample = []
  73. __reserved = task_reserved
  74. __ready = task_ready
  75. if current_process()._name == 'MainProcess':
  76. @atexit.register
  77. def on_shutdown():
  78. if bench_first is not None and bench_last is not None:
  79. print('- Time spent in benchmark: {0!r}'.format(
  80. bench_last - bench_first))
  81. print('- Avg: {0}'.format(
  82. sum(bench_sample) / len(bench_sample)))
  83. memdump()
  84. def task_reserved(request): # noqa
  85. global bench_start
  86. global bench_first
  87. now = None
  88. if bench_start is None:
  89. bench_start = now = monotonic()
  90. if bench_first is None:
  91. bench_first = now
  92. return __reserved(request)
  93. def task_ready(request): # noqa
  94. global all_count
  95. global bench_start
  96. global bench_last
  97. all_count += 1
  98. if not all_count % bench_every:
  99. now = monotonic()
  100. diff = now - bench_start
  101. print('- Time spent processing {0} tasks (since first '
  102. 'task received): ~{1:.4f}s\n'.format(bench_every, diff))
  103. sys.stdout.flush()
  104. bench_start = bench_last = now
  105. bench_sample.append(diff)
  106. sample_mem()
  107. return __ready(request)
  108. class Persistent(object):
  109. """This is the persistent data stored by the worker when
  110. :option:`--statedb` is enabled.
  111. It currently only stores revoked task id's.
  112. """
  113. storage = shelve
  114. protocol = pickle_protocol
  115. compress = zlib.compress
  116. decompress = zlib.decompress
  117. _is_open = False
  118. def __init__(self, state, filename, clock=None):
  119. self.state = state
  120. self.filename = filename
  121. self.clock = clock
  122. self.merge()
  123. def open(self):
  124. return self.storage.open(
  125. self.filename, protocol=self.protocol, writeback=True,
  126. )
  127. def merge(self):
  128. self._merge_with(self.db)
  129. def sync(self):
  130. self._sync_with(self.db)
  131. self.db.sync()
  132. def close(self):
  133. if self._is_open:
  134. self.db.close()
  135. self._is_open = False
  136. def save(self):
  137. self.sync()
  138. self.close()
  139. def _merge_with(self, d):
  140. self._merge_revoked(d)
  141. self._merge_clock(d)
  142. return d
  143. def _sync_with(self, d):
  144. self._revoked_tasks.purge()
  145. d.update(
  146. __proto__=3,
  147. zrevoked=self.compress(self._dumps(self._revoked_tasks)),
  148. clock=self.clock.forward() if self.clock else 0,
  149. )
  150. return d
  151. def _merge_clock(self, d):
  152. if self.clock:
  153. d['clock'] = self.clock.adjust(d.get('clock') or 0)
  154. def _merge_revoked(self, d):
  155. try:
  156. self._merge_revoked_v3(d['zrevoked'])
  157. except KeyError:
  158. try:
  159. self._merge_revoked_v2(d.pop('revoked'))
  160. except KeyError:
  161. pass
  162. # purge expired items at boot
  163. self._revoked_tasks.purge()
  164. def _merge_revoked_v3(self, zrevoked):
  165. if zrevoked:
  166. self._revoked_tasks.update(pickle.loads(self.decompress(zrevoked)))
  167. def _merge_revoked_v2(self, saved):
  168. if not isinstance(saved, LimitedSet):
  169. # (pre 3.0.18) used to be stored as a dict
  170. return self._merge_revoked_v1(saved)
  171. self._revoked_tasks.update(saved)
  172. def _merge_revoked_v1(self, saved):
  173. add = self._revoked_tasks.add
  174. for item in saved:
  175. add(item)
  176. def _dumps(self, obj):
  177. return pickle.dumps(obj, protocol=self.protocol)
  178. @property
  179. def _revoked_tasks(self):
  180. return self.state.revoked
  181. @cached_property
  182. def db(self):
  183. self._is_open = True
  184. return self.open()