13 years ago · 5a22319a92
--- a/docs/getting-started/next-steps.rst
+++ b/docs/getting-started/next-steps.rst
@@ -6,6 +6,9 @@ The :ref:`first-steps` guide is intentionally minimal.  In this guide
 
															 we will demonstrate what Celery offers in more detail, including
														
 
															 how to add Celery support for your application and library.
														
 
															+.. contents::
														
 
															+    :local:
														
 
															+
														
 
															 Our Project
														
 
															 ===========
														
@@ -17,38 +20,218 @@ Project layout::
 
															         /tasks.py
														
 
															 :file:`proj/celery.py`
														
 
															+----------------------
														
 
															 .. literalinclude:: ../../examples/next-steps/proj/celery.py
														
 
															-    :language python:
														
 
															+    :language: python
														
 
															+
														
 
															+In this module we created our :class:`@Celery` instance.  This is something
														
 
															+referred to as the celery *app*.  Your project
														
 
															+imports celery from this module to access Celery's features.
														
 
															+It's possible to use several app instances at once, but that
														
 
															+will not be covered in this tutorial.
														
 
															+
														
 
															+- The ``broker`` argument specifies the URL of the broker to use.
														
 
															+
														
 
															+    See :ref:`celerytut-broker` for more information.
														
 
															+
														
 
															+- The ``backend`` argument specifies the result backend to use,
														
 
															+    It's used to keep track of task state and results.
														
 
															+    While results are disabled by default we use the amqp backend here
														
 
															+    to demonstrate how retrieving the results work, you may want to use
														
 
															+    a different backend for your application, as they all have different
														
 
															+    strenghts and weaknesses.  If you don't need results it's best
														
 
															+    to disable them.  Results can also be disabled for individual tasks
														
 
															+    by setting the ``@task(ignore_result=True)`` option.
														
 
															+
														
 
															+    See :ref:`celerytut-keeping-results` for more information.
														
 
															+
														
 
															+- The ``include`` argument is a list of modules to import when
														
 
															+  the worker starts.  We need to add our tasks module here so
														
 
															+  that the worker is able to find our tasks.
														
 
															 :file:`proj/tasks.py`
														
 
															+---------------------
														
 
															 .. literalinclude:: ../../examples/next-steps/proj/tasks.py
														
 
															-    :language python:
														
 
															+    :language: python
														
 
															+
														
 
															+
														
 
															+Starting the worker
														
 
															+===================
														
 
															+The :program:`celery` program can be used to start the worker::
														
 
															+
														
 
															+   $ celery worker --app=proj -l info
														
 
															+
														
 
															+The :option:`--app` argument specifies the Celery app instance to use,
														
 
															+it must be in the form of ``module.path:celery``, where the part before the colon
														
 
															+is the name of the module, and the attribute name comes last.
														
 
															+If a package name is specified instead it will automatically
														
 
															+try to find a ``celery`` module in that package, and if the name
														
 
															+is a module it will try to find a ``celery`` attribute in that module.
														
 
															+This means that the following all results in the same::
														
 
															+
														
 
															+    $ celery --app=proj
														
 
															+    $ celery --app=proj.celery:
														
 
															+    $ celery --app=proj.celery:celery
														
 
															 Subtasks
														
 
															 ========
														
 
															+A :func:`~celery.subtask` wraps the signature of a single task invocation:
														
 
															+arguments, keyword arguments and execution options.
														
 
															-group
														
 
															------
														
 
															+A subtask for the ``add`` task can be created like this::
														
 
															-.. code-block:: python
														
 
															+    >>> from celery import subtask
														
 
															+    >>> subtask(add.name, args=(4, 4))
														
 
															+
														
 
															+or you can create one from the task itself::
														
 
															+
														
 
															+    >>> from proj.tasks import add
														
 
															+    >>> add.subtask(args=(4, 4))
														
 
															+
														
 
															+It takes the same arguments as the :meth:`~@Task.apply_async` method::
														
 
															+
														
 
															+    >>> add.apply_async(args, kwargs, **options)
														
 
															+    >>> add.subtask(args, kwargs, **options)
														
 
															+
														
 
															+    >>> add.apply_async((2, 2), countdown=1)
														
 
															+    >>> add.subtask((2, 2), countdown=1)
														
 
															+
														
 
															+And like there is a :meth:`~@Task.delay` shortcut for `apply_async`
														
 
															+there is a :meth:`~@Task.s` shortcut for subtask::
														
 
															+
														
 
															+    >>> add.s(*args, **kwargs)
														
 
															+
														
 
															+    >>> add.s(2, 2)
														
 
															+    proj.tasks.add(2, 2)
														
 
															+
														
 
															+    >>> add.s(2, 2) == add.subtask((2, 2))
														
 
															+    True
														
 
															+
														
 
															+You can't define options with :meth:`~@Task.s`, but a chaining
														
 
															+``set`` call takes care of that::
														
 
															+
														
 
															+    >>> add.s(2, 2).set(countdown=1)
														
 
															+    proj.tasks.add(2, 2)
														
 
															+
														
 
															+Partials
														
 
															+--------
														
 
															+
														
 
															+A subtask can be applied too::
														
 
															+
														
 
															+    >>> add.s(2, 2).delay()
														
 
															+    >>> add.s(2, 2).apply_async(countdown=1)
														
 
															+
														
 
															+Specifying additional args, kwargs or options to ``apply_async``/``delay``
														
 
															+creates partials:
														
 
															+
														
 
															+- Any arguments added will be prepended to the args in the signature::
														
 
															+
														
 
															+    >>> partial = add.s(2)          # incomplete signature
														
 
															+    >>> partial.delay(4)            # 2 + 4
														
 
															+    >>> partial.apply_async((4, ))  # same
														
 
															+
														
 
															+- Any keyword arguments added will be merged with the kwargs in the signature,
														
 
															+  with the new keyword arguments taking precedence::
														
 
															+
														
 
															+    >>> s = add.s(2, 2)
														
 
															+    >>> s.delay(debug=True)                    # -> add(2, 2, debug=True)
														
 
															+    >>> s.apply_async(kwargs={"debug": True})  # same
														
 
															+
														
 
															+- Any options added will be merged with the options in the signature,
														
 
															+  with the new options taking precedence::
														
 
															+
														
 
															+    >>> s = add.subtask((2, 2), countdown=10)
														
 
															+    >>> s.apply_async(countdown=1)  # countdown is now 1
														
 
															+
														
 
															+You can also clone subtasks to augment these::
														
 
															+
														
 
															+    >>> s = add.s(2)
														
 
															+    proj.tasks.add(2)
														
 
															+
														
 
															+    >>> s.clone(args=(4, ), kwargs={"debug": True})
														
 
															+    proj.tasks.add(2, 4, debug=True)
														
 
															+
														
 
															+Partials are meant to be used with callbacks, any tasks linked or chord
														
 
															+callbacks will be applied with the result of the parent task.
														
 
															+Sometimes you want to specify a callback that does not take
														
 
															+additional arguments, and in that case you can set the subtask
														
 
															+to be immutable::
														
 
															+
														
 
															+    >>> add.s(2, 2).link( reset_buffers.subtask(immutable=True) )
														
 
															+
														
 
															+Only the execution options can be set when a subtask is immutable,
														
 
															+and it's not possible to apply the subtask with partial args/kwargs.
														
 
															+
														
 
															+.. note::
														
 
															+
														
 
															+    In this tutorial we use the prefix operator `~` to subtasks.
														
 
															+    You probably shouldn't use it in your production code, but it's a handy shortcut
														
 
															+    when testing with the Python shell::
														
 
															+
														
 
															+        >>> ~subtask
														
 
															+
														
 
															+        >>> # is the same as
														
 
															+        >>> subtask.delay().get()
														
 
															+
														
 
															+Groups
														
 
															+------
														
 
															+
														
 
															+A group can be used to execute several tasks in parallel.
														
 
															+
														
 
															+The :class:`~celery.group` function takes a list of subtasks::
														
 
															     >>> from celery import group
														
 
															     >>> from proj.tasks import add
														
 
															-    >>> ~group(add.s(i, i) for i in xrange(10))
														
 
															-    [0, 2, 4, 6, 8, 10, 12, 14, 16, 18]
														
 
															+    >>> group(add.s(2, 2), add.s(4, 4))
														
 
															+    (proj.tasks.add(2, 2), proj.tasks.add(4, 4))
														
 
															+
														
 
															+If you **call** the group, the tasks will be applied
														
 
															+one after one in the current process, and a :class:`~@TaskSetResult`
														
 
															+instance is returned which can be used to keep track of the results,
														
 
															+or tell how many tasks are ready and so on::
														
 
															+
														
 
															+    >>> g = group(add.s(2, 2), add.s(4, 4))
														
 
															+    >>> res = g()
														
 
															+    >>> res.get()
														
 
															+    [4, 8]
														
 
															-    >>> group(add.s(i, i) for i in xrange(10)).skew(1, 10)
														
 
															+However, if you call ``apply_async`` on the group it will
														
 
															+send a special grouping task, so that the action of applying
														
 
															+the tasks happens in a worker instead of the current process::
														
 
															-map/starmap
														
 
															+    >>> res = g.apply_async()
														
 
															+    >>> res.get()
														
 
															+    [4, 8]
														
 
															+
														
 
															+Group also supports iterators::
														
 
															+
														
 
															+    >>> group(add.s(i, i) for i in xrange(100))()
														
 
															+
														
 
															+
														
 
															+A group is a subclass instance, so it can be used in combination
														
 
															+with other subtasks.
														
 
															+
														
 
															+Map & Starmap
														
 
															 -------------
														
 
															+:class:`~celery.map` and :class:`~celery.starmap` are built-in tasks
														
 
															+that calls the task for every element in a sequence.
														
 
															+
														
 
															+They differ from group in that
														
 
															+
														
 
															+- only one task message is sent
														
 
															+
														
 
															+- the operation is sequential.
														
 
															+
														
 
															+For example using ``map``:
														
 
															+
														
 
															 .. code-block:: python
														
 
															     >>> from proj.tasks import add
														
@@ -56,19 +239,233 @@ map/starmap
 
															     >>> ~xsum.map([range(10), range(100)])
														
 
															     [45, 4950]
														
 
															+is the same as having a task doing:
														
 
															+
														
 
															+.. code-block:: python
														
 
															+
														
 
															+    @celery.task
														
 
															+    def temp():
														
 
															+        return [xsum(range(10)), xsum(range(100))]
														
 
															+
														
 
															+and using ``starmap``::
														
 
															+
														
 
															     >>> ~add.starmap(zip(range(10), range(10)))
														
 
															     [0, 2, 4, 6, 8, 10, 12, 14, 16, 18]
														
 
															+is the same as having a task doing:
														
 
															+
														
 
															+.. code-block:: python
														
 
															+
														
 
															+    @celery.task
														
 
															+    def temp():
														
 
															+        return [add(i, i) for i in range(10)]
														
 
															+
														
 
															+Both ``map`` and ``starmap`` are subtasks, so they can be used as
														
 
															+other subtasks and combined in groups etc., for example
														
 
															+to apply the starmap after 10 seconds::
														
 
															+
														
 
															     >>> add.starmap(zip(range(10), range(10))).apply_async(countdown=10)
														
 
															-chunks
														
 
															-------
														
 
															+Chunking
														
 
															+--------
														
 
															+
														
 
															+-- Chunking lets you divide a iterable of work into pieces,
														
 
															+   so that if you have one million objects, you can create
														
 
															+   10 tasks with hundred thousand objects each.
														
 
															+
														
 
															+Some may worry that chunking your tasks results in a degradation
														
 
															+of parallelism, but this is rarely true for a busy cluster
														
 
															+and in practice since you are avoiding the overhead  of messaging
														
 
															+it may considerably increase performance.
														
 
															+
														
 
															+To create a chunks subtask you can use :meth:`@Task.chunks`:
														
 
															+
														
 
															+.. code-block:: python
														
 
															+
														
 
															+    >>> add.chunks(zip(range(100), range(100)), 10)
														
 
															+
														
 
															+As with :class:`~celery.group` the act of **calling**
														
 
															+the chunks will apply the tasks in the current process:
														
 
															 .. code-block:: python
														
 
															     >>> from proj.tasks import add
														
 
															-    >>> ~add.chunks(zip(range(100), range(100)), 10)
														
 
															+    >>> res = add.chunks(zip(range(100), range(100)), 10)()
														
 
															+    >>> res.get()
														
 
															+    [[0, 2, 4, 6, 8, 10, 12, 14, 16, 18],
														
 
															+     [20, 22, 24, 26, 28, 30, 32, 34, 36, 38],
														
 
															+     [40, 42, 44, 46, 48, 50, 52, 54, 56, 58],
														
 
															+     [60, 62, 64, 66, 68, 70, 72, 74, 76, 78],
														
 
															+     [80, 82, 84, 86, 88, 90, 92, 94, 96, 98],
														
 
															+     [100, 102, 104, 106, 108, 110, 112, 114, 116, 118],
														
 
															+     [120, 122, 124, 126, 128, 130, 132, 134, 136, 138],
														
 
															+     [140, 142, 144, 146, 148, 150, 152, 154, 156, 158],
														
 
															+     [160, 162, 164, 166, 168, 170, 172, 174, 176, 178],
														
 
															+     [180, 182, 184, 186, 188, 190, 192, 194, 196, 198]]
														
 
															+
														
 
															+while calling ``.apply_async`` will create a dedicated
														
 
															+task so that the individual tasks are applied in a worker
														
 
															+instead::
														
 
															+
														
 
															+    >>> add.chunks(zip(range(100), range(100), 10)).apply_async()
														
 
															+
														
 
															+You can also convert chunks to a group::
														
 
															+
														
 
															+    >>> group = add.chunks(zip(range(100), range(100), 10)).group()
														
 
															+
														
 
															+and with the group skew the countdown of each task by increments
														
 
															+of one::
														
 
															+
														
 
															+    >>> group.skew(start=1, stop=10)()
														
 
															+
														
 
															+which means that the first task will have a countdown of 1, the second
														
 
															+a countdown of 2 and so on.
														
 
															+Chaining tasks
														
 
															+--------------
														
 
															+Tasks can be linked together, which in practice means adding
														
 
															+a callback task::
														
 
															+
														
 
															+    >>> res = add.apply_async((2, 2), link=mul.s(16))
														
 
															+    >>> res.get()
														
 
															+    4
														
 
															+
														
 
															+The linked task will be applied with the result of its parent
														
 
															+task as the first argument, which in the above case will result
														
 
															+in ``mul(4, 16)`` since the result is 4.
														
 
															+
														
 
															+The results will keep track of what subtasks a task applies,
														
 
															+and this can be accessed from the result instance::
														
 
															+
														
 
															+    >>> res.children
														
 
															+    [<AsyncResult: 8c350acf-519d-4553-8a53-4ad3a5c5aeb4>]
														
 
															+
														
 
															+    >>> res.children[0].get()
														
 
															+    64
														
 
															+
														
 
															+The result instance also has a :meth:`~@AsyncResult.collect` method
														
 
															+that treats the result as a graph, enabling you to iterate over
														
 
															+the results::
														
 
															+
														
 
															+    >>> list(res.collect())
														
 
															+    [(<AsyncResult: 7b720856-dc5f-4415-9134-5c89def5664e>, 4),
														
 
															+     (<AsyncResult: 8c350acf-519d-4553-8a53-4ad3a5c5aeb4>, 64)]
														
 
															+
														
 
															+By default :meth:`~@AsyncResult.collect` will raise an
														
 
															+:exc:`~@IncompleteStream` exception if the graph is not fully
														
 
															+formed (one of the tasks has not completed yet),
														
 
															+but you can get an intermediate representation of the graph
														
 
															+too::
														
 
															+
														
 
															+    >>> for result, value in res.collect(intermediate=True)):
														
 
															+    ....
														
 
															+
														
 
															+You can link together as many tasks as you like,
														
 
															+and subtasks can be linked too::
														
 
															+
														
 
															+    >>> s = add.s(2, 2)
														
 
															+    >>> s.link(mul.s(4))
														
 
															+    >>> s.link(log_result.s())
														
 
															+
														
 
															+You can also add *error callbacks* using the ``link_error`` argument::
														
 
															+
														
 
															+    >>> add.apply_async((2, 2), link_error=log_error.s())
														
 
															+
														
 
															+    >>> add.subtask((2, 2), link_error=log_error.s())
														
 
															+
														
 
															+Since exceptions can only be serialized when pickle is used
														
 
															+the error callbacks take the id of the parent task as argument instead:
														
 
															+
														
 
															+.. code-block:: python
														
 
															+
														
 
															+    from proj.celery import celery
														
 
															+
														
 
															+    @celery.task
														
 
															+    def log_error(task_id):
														
 
															+        result = celery.AsyncResult(task_id)
														
 
															+        result.get(propagate=False)  # make sure result written.
														
 
															+        with open("/var/errors/%s" % (task_id, )) as fh:
														
 
															+            fh.write("--\n\n%s %s %s" % (
														
 
															+                task_id, result.result, result.traceback))
														
 
															+
														
 
															+To make it even easier to link tasks together there is
														
 
															+a special subtask called :class:`~celery.chain` that lets
														
 
															+you chain tasks together:
														
 
															+
														
 
															+.. code-block:: python
														
 
															+
														
 
															+    >>> from celery import chain
														
 
															+    >>> from proj.tasks import add, mul
														
 
															+
														
 
															+    # (4 + 4) * 8 * 10
														
 
															+    >>> res = chain(add.s(4, 4), mul.s(8), mul.s(10))
														
 
															+    proj.tasks.add(4, 4) | proj.tasks.mul(8)
														
 
															+
														
 
															+
														
 
															+Calling the chain will apply the tasks in the current process
														
 
															+and return the result of the last task in the chain::
														
 
															+
														
 
															+    >>> res = chain(add.s(4, 4), mul.s(8), mul.s(10))
														
 
															+    >>> res.get()
														
 
															+    640
														
 
															+
														
 
															+And calling ``apply_async`` will create a dedicated
														
 
															+task so that the act of applying the chain happens
														
 
															+in a worker::
														
 
															+
														
 
															+    >>> res = chain(add.s(4, 4), mul.s(8), mul.s(10))
														
 
															+    >>> res.get()
														
 
															+    640
														
 
															+
														
 
															+It also sets ``parent`` attributes so that you can
														
 
															+work your way up the chain to get intermediate results::
														
 
															+
														
 
															+    >>> res.parent.get()
														
 
															+    64
														
 
															+
														
 
															+    >>> res.parent.parent.get()
														
 
															+    8
														
 
															+
														
 
															+    >>> res.parent.parent
														
 
															+    <AsyncResult: eeaad925-6778-4ad1-88c8-b2a63d017933>
														
 
															+
														
 
															+
														
 
															+Chains can also be made using the ``|`` (pipe) operator::
														
 
															+
														
 
															+    >>> (add.s(2, 2) | mul.s(8) | mul.s(10)).apply_async()
														
 
															+
														
 
															+Graphs
														
 
															+~~~~~~
														
 
															+
														
 
															+In addition you can work with the result graph as a
														
 
															+:class:`~celery.datastructures.DependencyGraph`:
														
 
															+
														
 
															+.. code-block:: python
														
 
															+
														
 
															+    >>> res = chain(add.s(4, 4), mul.s(8), mul.s(10))()
														
 
															+
														
 
															+    >>> res.parent.parent.graph
														
 
															+    285fa253-fcf8-42ef-8b95-0078897e83e6(1)
														
 
															+        463afec2-5ed4-4036-b22d-ba067ec64f52(0)
														
 
															+    872c3995-6fa0-46ca-98c2-5a19155afcf0(2)
														
 
															+        285fa253-fcf8-42ef-8b95-0078897e83e6(1)
														
 
															+            463afec2-5ed4-4036-b22d-ba067ec64f52(0)
														
 
															+
														
 
															+You can even convert these graphs to *dot* format::
														
 
															+
														
 
															+    >>> with open("graph.dot", "w") as fh:
														
 
															+    ...     res.parent.parent.graph.to_dot(fh)
														
 
															+
														
 
															+
														
 
															+and create images::
														
 
															+
														
 
															+    $ dot -Tpng graph.dot -o graph.png
														
 
															+
														
 
															+.. image:: ../images/graph.png
														
 
															+
														
 
															+
														
 
															+Chords
														
 
															+------
														
--- a/docs/images/graph.png
+++ b/docs/images/graph.png
--- a/examples/app/myapp.py
+++ b/examples/app/myapp.py
@@ -2,7 +2,7 @@
 
															 Usage:
														
 
															-   (window1)$ python myapp.py -l info
														
 
															+   (window1)$ python myapp.py worker -l info
														
 
															    (window2)$ python
														
 
															    >>> from myapp import add
														
@@ -27,4 +27,4 @@ def add(x, y):
 
															     return x + y
														
 
															 if __name__ == "__main__":
														
 
															-    celery.worker_main()
														
 
															+    celery.start()
														
--- a/examples/next-steps/proj/celery.py
+++ b/examples/next-steps/proj/celery.py
@@ -2,10 +2,6 @@ from __future__ import absolute_import
 
															 from celery import Celery
														
 
															-celery = Celery("proj", broker="amqp://", backend="amqp")
														
 
															-celery.conf.CELERY_IMPORTS = ("proj.tasks", )
														
 
															-
														
 
															-if __name__ == "__main__":
														
 
															-    from billiard import freeze_support
														
 
															-    freeze_support()
														
 
															-    celery.start()
														
 
															+celery = Celery(broker="amqp://",
														
 
															+                backend="amqp://",
														
 
															+                include=["proj.tasks"])